npm - @oh-my-pi/pi-coding-agent - Versions diffs - 14.5.14 → 14.6.0 - Mend

@oh-my-pi/pi-coding-agent 14.5.14 → 14.6.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (70)

package/CHANGELOG.md +39 -0
package/package.json +7 -7
package/src/autoresearch/command-resume.md +5 -8
package/src/autoresearch/git.ts +41 -51
package/src/autoresearch/helpers.ts +43 -359
package/src/autoresearch/index.ts +281 -273
package/src/autoresearch/prompt-setup.md +43 -0
package/src/autoresearch/prompt.md +52 -193
package/src/autoresearch/resume-message.md +2 -8
package/src/autoresearch/state.ts +59 -166
package/src/autoresearch/storage.ts +687 -0
package/src/autoresearch/tools/init-experiment.ts +201 -290
package/src/autoresearch/tools/log-experiment.ts +304 -517
package/src/autoresearch/tools/run-experiment.ts +117 -296
package/src/autoresearch/tools/update-notes.ts +116 -0
package/src/autoresearch/types.ts +16 -66
package/src/config/settings-schema.ts +1 -1
package/src/config/settings.ts +20 -1
package/src/cursor.ts +1 -1
package/src/edit/index.ts +9 -31
package/src/edit/line-hash.ts +70 -43
package/src/edit/modes/hashline.lark +26 -0
package/src/edit/modes/hashline.ts +898 -1099
package/src/edit/modes/patch.ts +0 -7
package/src/edit/modes/replace.ts +0 -4
package/src/edit/renderer.ts +22 -20
package/src/edit/streaming.ts +8 -28
package/src/eval/eval.lark +24 -30
package/src/eval/js/context-manager.ts +5 -162
package/src/eval/js/prelude.txt +0 -12
package/src/eval/parse.ts +129 -129
package/src/eval/py/prelude.py +1 -219
package/src/export/html/template.generated.ts +1 -1
package/src/export/html/template.js +2 -2
package/src/internal-urls/docs-index.generated.ts +1 -1
package/src/modes/components/session-observer-overlay.ts +5 -2
package/src/modes/components/status-line/segments.ts +1 -1
package/src/modes/components/status-line.ts +3 -5
package/src/modes/components/tree-selector.ts +4 -5
package/src/modes/components/welcome.ts +11 -1
package/src/modes/controllers/command-controller.ts +2 -6
package/src/modes/controllers/event-controller.ts +1 -2
package/src/modes/controllers/extension-ui-controller.ts +3 -15
package/src/modes/controllers/input-controller.ts +0 -1
package/src/modes/controllers/selector-controller.ts +1 -1
package/src/modes/interactive-mode.ts +5 -7
package/src/prompts/system/system-prompt.md +14 -38
package/src/prompts/tools/ast-edit.md +8 -8
package/src/prompts/tools/ast-grep.md +10 -10
package/src/prompts/tools/eval.md +13 -31
package/src/prompts/tools/find.md +2 -1
package/src/prompts/tools/hashline.md +66 -57
package/src/prompts/tools/search.md +2 -2
package/src/session/session-manager.ts +17 -13
package/src/tools/ast-edit.ts +141 -44
package/src/tools/ast-grep.ts +112 -36
package/src/tools/eval.ts +2 -53
package/src/tools/find.ts +16 -15
package/src/tools/path-utils.ts +36 -196
package/src/tools/search.ts +56 -35
package/src/utils/edit-mode.ts +2 -11
package/src/utils/file-display-mode.ts +1 -1
package/src/utils/git.ts +17 -0
package/src/utils/session-color.ts +0 -12
package/src/utils/title-generator.ts +22 -38
package/src/autoresearch/apply-contract-to-state.ts +0 -24
package/src/autoresearch/contract.ts +0 -288
package/src/edit/modes/atom.lark +0 -29
package/src/edit/modes/atom.ts +0 -1773
package/src/prompts/tools/atom.md +0 -150

package/src/autoresearch/tools/run-experiment.ts (changed)

@@ -7,48 +7,25 @@ import { Type } from "@sinclair/typebox";
 import type { ToolDefinition } from "../../extensibility/extensions";
 import type { Theme } from "../../modes/theme/theme";
 import { DEFAULT_MAX_BYTES, DEFAULT_MAX_LINES, truncateTail } from "../../session/streaming-output";
-import { replaceTabs, shortenPath, truncateToWidth } from "../../tools/render-utils";
+import { replaceTabs, shortenPath } from "../../tools/render-utils";
 import * as git from "../../utils/git";
 import { parseWorkDirDirtyPaths } from "../git";
 import {
-	collectLoggedRunNumbers,
 	EXPERIMENT_MAX_BYTES,
 	EXPERIMENT_MAX_LINES,
 	formatElapsed,
 	formatNum,
-	getAutoresearchRunDirectory,
-	getNextAutoresearchRunNumber,
-	isAutoresearchLocalStatePath,
-	isAutoresearchShCommand,
 	killTree,
 	parseAsiLines,
 	parseMetricLines,
-	readPendingRunSummary,
-	resolveWorkDir,
-	validateWorkDir,
 } from "../helpers";
+import { buildExperimentState } from "../state";
+import { openAutoresearchStorageIfExists } from "../storage";
 import type { AutoresearchToolFactoryOptions, RunDetails, RunExperimentProgressDetails } from "../types";
+import { DEFAULT_HARNESS_COMMAND } from "./init-experiment";
 const runExperimentSchema = Type.Object({
-	command: Type.String({
-		description: "Shell command to run for this experiment.",
-	}),
-	timeout_seconds: Type.Optional(
-		Type.Number({
-			description: "Timeout in seconds. Defaults to 600.",
-		}),
-	),
-	checks_timeout_seconds: Type.Optional(
-		Type.Number({
-			description: "Timeout in seconds for autoresearch.checks.sh. Defaults to 300.",
-		}),
-	),
-	force: Type.Optional(
-		Type.Boolean({
-			description:
-				"When true, allow a command that differs from the segment benchmark command and skip the rule that autoresearch.sh must be invoked directly when that script exists.",
-		}),
-	),
+	timeout_seconds: Type.Optional(Type.Number({ description: "Timeout in seconds. Defaults to 600." })),
 });
 interface ProcessExecutionResult {
@@ -58,13 +35,6 @@ interface ProcessExecutionResult {
 	output: string;
 }
-interface ChecksExecutionResult {
-	code: number | null;
-	killed: boolean;
-	logPath: string;
-	output: string;
-}
 interface ProgressSnapshot {
 	elapsed: string;
 	runDirectory: string;
@@ -80,136 +50,73 @@ export function createRunExperimentTool(
 		name: "run_experiment",
 		label: "Run Experiment",
 		description:
-			"Run an experiment command with timing, output capture, structured metric parsing, durable run artifacts, and optional autoresearch.checks.sh validation.",
+			"Run any benchmark command. Output is captured automatically; `METRIC name=value` and `ASI key=value` lines printed by the command are parsed.",
 		parameters: runExperimentSchema,
 		defaultInactive: true,
 		async execute(_toolCallId, params, signal, onUpdate, ctx) {
-			const workDirError = validateWorkDir(ctx.cwd);
-			if (workDirError) {
-				return {
-					content: [{ type: "text", text: `Error: ${workDirError}` }],
-				};
-			}
-			const runtime = options.getRuntime(ctx);
-			const state = runtime.state;
-			const workDir = resolveWorkDir(ctx.cwd);
-			const checksPath = path.join(workDir, "autoresearch.checks.sh");
-			const autoresearchScriptPath = path.join(workDir, "autoresearch.sh");
-			const forceCommand = params.force === true;
-			if (!forceCommand && state.benchmarkCommand && params.command.trim() !== state.benchmarkCommand) {
+			const storage = await openAutoresearchStorageIfExists(ctx.cwd);
+			const currentBranch = (await git.branch.current(ctx.cwd)) ?? null;
+			const session = storage?.getActiveSessionForBranch(currentBranch) ?? null;
+			if (!storage || !session) {
 				return {
 					content: [
 						{
 							type: "text",
-							text:
-								"Error: command does not match the benchmark command recorded for this segment.\n" +
-								`Expected: ${state.benchmarkCommand}\nReceived: ${params.command}`,
+							text: "Error: no active autoresearch session for the current branch. Call init_experiment first.",
 						},
 					],
 				};
 			}
-			if (!forceCommand && fs.existsSync(autoresearchScriptPath) && !isAutoresearchShCommand(params.command)) {
-				return {
-					content: [
-						{
-							type: "text",
-							text:
-								`Error: autoresearch.sh exists. Run it directly instead of using a different command.\n` +
-								`Expected something like: bash autoresearch.sh\n` +
-								`Received: ${params.command}`,
-						},
-					],
-				};
-			}
+			const runtime = options.getRuntime(ctx);
-			if (state.maxExperiments !== null) {
-				const segmentRuns = state.results.filter(result => result.segment === state.currentSegment).length;
-				if (segmentRuns >= state.maxExperiments) {
-					return {
-						content: [
-							{
-								type: "text",
-								text: `Maximum experiments reached (${state.maxExperiments}). Re-initialize to start a new segment.`,
-							},
-						],
-					};
-				}
-			}
+			const abandonedPriorRun = (() => {
+				const pending = storage.getPendingRun(session.id);
+				if (!pending) return null;
+				storage.abandonPendingRuns(session.id);
+				return pending.id;
+			})();
-			const pendingRun =
-				runtime.lastRunSummary ?? (await readPendingRunSummary(workDir, collectLoggedRunNumbers(state.results)));
-			if (pendingRun) {
-				return {
-					content: [
-						{
-							type: "text",
-							text:
-								`Error: run #${pendingRun.runNumber} has not been logged yet. ` +
-								"Call log_experiment before starting another benchmark run.",
-						},
-					],
-				};
-			}
+			const resolvedCommand = DEFAULT_HARNESS_COMMAND;
+			const preRunStatus = await tryGitStatus(ctx.cwd);
+			const workDirPrefix = await tryGitPrefix(ctx.cwd);
+			const preRunDirtyPaths = parseWorkDirDirtyPaths(preRunStatus, workDirPrefix);
-			const runNumber = getNextAutoresearchRunNumber(workDir, runtime.lastRunNumber);
-			const runDirectory = getAutoresearchRunDirectory(workDir, runNumber);
-			const benchmarkLogPath = path.join(runDirectory, "benchmark.log");
-			const checksLogPath = path.join(runDirectory, "checks.log");
-			const runJsonPath = path.join(runDirectory, "run.json");
-			await fs.promises.mkdir(runDirectory, { recursive: true });
-			const preRunStatus = await git.status(workDir, {
-				porcelainV1: true,
-				untrackedFiles: "all",
-				z: true,
+			const startedAt = Date.now();
+			const insertedRun = storage.insertRun({
+				sessionId: session.id,
+				segment: session.currentSegment,
+				command: resolvedCommand,
+				logPath: "", // patched after we know the run id
+				preRunDirtyPaths,
+				startedAt,
 			});
-			const workDirPrefix = await git.show.prefix(workDir);
-			const preRunDirtyPaths = parseWorkDirDirtyPaths(preRunStatus, workDirPrefix).filter(
-				p => !isAutoresearchLocalStatePath(p),
-			);
-			runtime.lastRunChecks = null;
+			const runDirectory = path.join(storage.projectDir, "runs", String(insertedRun.id).padStart(4, "0"));
+			const benchmarkLogPath = path.join(runDirectory, "benchmark.log");
+			fs.mkdirSync(runDirectory, { recursive: true });
+			storage.updateRunLogPath(insertedRun.id, benchmarkLogPath);
 			runtime.lastRunDuration = null;
 			runtime.lastRunAsi = null;
 			runtime.lastRunArtifactDir = runDirectory;
-			runtime.lastRunNumber = runNumber;
+			runtime.lastRunNumber = insertedRun.id;
 			runtime.lastRunSummary = null;
-			await Bun.write(
-				runJsonPath,
-				JSON.stringify(
-					{
-						runNumber,
-						runDirectory,
-						benchmarkLogPath,
-						checksLogPath,
-						command: params.command,
-						preRunDirtyPaths,
-						startedAt: new Date().toISOString(),
-					},
-					null,
-					2,
-				),
-			);
 			runtime.runningExperiment = {
-				startedAt: Date.now(),
-				command: params.command,
+				startedAt,
+				command: resolvedCommand,
 				runDirectory,
-				runNumber,
+				runNumber: insertedRun.id,
 			};
 			options.dashboard.updateWidget(ctx, runtime);
 			options.dashboard.requestRender();
 			const timeoutMs = Math.max(0, Math.floor((params.timeout_seconds ?? 600) * 1000));
-			const startedAt = Date.now();
 			let execution: ProcessExecutionResult;
 			try {
 				execution = await executeProcess({
-					command: ["bash", "-lc", params.command],
-					cwd: workDir,
+					command: ["bash", "-lc", resolvedCommand],
+					cwd: ctx.cwd,
 					logPath: benchmarkLogPath,
 					timeoutMs,
 					signal,
@@ -232,41 +139,11 @@ export function createRunExperimentTool(
 				options.dashboard.requestRender();
 			}
-			const durationSeconds = (Date.now() - startedAt) / 1000;
+			const completedAt = Date.now();
+			const durationMs = completedAt - startedAt;
+			const durationSeconds = durationMs / 1000;
 			runtime.lastRunDuration = durationSeconds;
-			const benchmarkPassed = execution.exitCode === 0 && !execution.killed;
-			let checksPass: boolean | null = null;
-			let checksTimedOut = false;
-			let checksOutput = "";
-			let checksDuration = 0;
-			let checksLogPathValue: string | undefined;
-			if (benchmarkPassed && fs.existsSync(checksPath)) {
-				const checksStartedAt = Date.now();
-				const checksResult = await runChecks({
-					cwd: workDir,
-					pathToChecks: checksPath,
-					logPath: checksLogPath,
-					timeoutMs: Math.max(0, Math.floor((params.checks_timeout_seconds ?? 300) * 1000)),
-					signal,
-				});
-				checksDuration = (Date.now() - checksStartedAt) / 1000;
-				checksTimedOut = checksResult.killed;
-				checksPass = checksResult.code === 0 && !checksResult.killed;
-				checksOutput = checksResult.output;
-				checksLogPathValue = checksResult.logPath;
-			}
-			runtime.lastRunChecks =
-				checksPass === null
-					? null
-					: {
-							pass: checksPass,
-							output: checksOutput,
-							duration: checksDuration,
-						};
 			const llmTruncation = truncateTail(execution.output, {
 				maxBytes: EXPERIMENT_MAX_BYTES,
 				maxLines: EXPERIMENT_MAX_LINES,
@@ -278,113 +155,87 @@ export function createRunExperimentTool(
 			const parsedMetricsMap = parseMetricLines(execution.output);
 			const parsedMetrics = parsedMetricsMap.size > 0 ? Object.fromEntries(parsedMetricsMap.entries()) : null;
-			const parsedPrimary = parsedMetricsMap.get(state.metricName) ?? null;
+			const parsedPrimary = parsedMetricsMap.get(session.primaryMetric) ?? null;
 			const parsedAsi = parseAsiLines(execution.output);
 			runtime.lastRunAsi = parsedAsi;
+			storage.markRunCompleted({
+				runId: insertedRun.id,
+				completedAt,
+				durationMs,
+				exitCode: execution.exitCode,
+				timedOut: execution.killed,
+				parsedPrimary,
+				parsedMetrics,
+				parsedAsi,
+			});
+			const passed = execution.exitCode === 0 && !execution.killed;
 			const resultDetails: RunDetails = {
-				runNumber,
+				runNumber: insertedRun.id,
 				runDirectory,
 				benchmarkLogPath,
-				checksLogPath: checksLogPathValue,
-				command: params.command,
+				command: resolvedCommand,
 				exitCode: execution.exitCode,
 				durationSeconds,
-				passed: benchmarkPassed && (checksPass === null || checksPass),
-				crashed: execution.exitCode !== 0 || execution.killed || checksPass === false,
+				passed,
+				crashed: execution.exitCode !== 0 || execution.killed,
 				timedOut: execution.killed,
 				tailOutput: displayTruncation.content,
-				checksPass,
-				checksTimedOut,
-				checksOutput: checksOutput.split("\n").slice(-80).join("\n"),
-				checksDuration,
 				parsedMetrics,
 				parsedPrimary,
 				parsedAsi,
-				metricName: state.metricName,
-				metricUnit: state.metricUnit,
+				metricName: session.primaryMetric,
+				metricUnit: session.metricUnit,
 				preRunDirtyPaths,
+				abandonedPriorRun,
 				truncation: llmTruncation.truncated ? llmTruncation : undefined,
 				fullOutputPath: execution.logPath,
 			};
 			runtime.lastRunSummary = {
-				checksDurationSeconds: checksDuration,
-				checksPass,
-				checksTimedOut,
-				command: params.command,
+				command: resolvedCommand,
 				durationSeconds,
 				parsedAsi,
 				parsedMetrics,
 				parsedPrimary,
-				passed: resultDetails.passed,
+				passed,
 				preRunDirtyPaths,
 				runDirectory,
-				runNumber,
+				runNumber: insertedRun.id,
+				exitCode: execution.exitCode,
+				timedOut: execution.killed,
 			};
 			runtime.autoResumeArmed = true;
 			runtime.lastAutoResumePendingRunNumber = null;
+			// Refresh state to reflect any prior abandonment changes (logged set unchanged).
+			const refreshedSession = storage.getSessionById(session.id);
+			if (refreshedSession) {
+				runtime.state = buildExperimentState(refreshedSession, storage.listLoggedRuns(session.id));
+			}
 			options.dashboard.updateWidget(ctx, runtime);
 			options.dashboard.requestRender();
-			await Bun.write(
-				runJsonPath,
-				JSON.stringify(
-					{
-						runNumber,
-						runDirectory,
-						benchmarkLogPath,
-						checksLogPath: checksLogPathValue,
-						command: params.command,
-						completedAt: new Date().toISOString(),
-						durationSeconds,
-						exitCode: execution.exitCode,
-						timedOut: execution.killed,
-						checks: {
-							durationSeconds: checksDuration,
-							passed: checksPass,
-							timedOut: checksTimedOut,
-						},
-						parsedMetrics,
-						parsedPrimary,
-						parsedAsi,
-						preRunDirtyPaths,
-						truncation: resultDetails.truncation,
-						fullOutputPath: resultDetails.fullOutputPath,
-					},
-					null,
-					2,
-				),
-			);
-			const commandWarnings: string[] = [];
-			if (forceCommand) {
-				if (state.benchmarkCommand && params.command.trim() !== state.benchmarkCommand) {
-					commandWarnings.push(
-						`Warning: command override (force=true). Segment benchmark is ${state.benchmarkCommand}; ran ${params.command}.`,
-					);
-				}
-				if (fs.existsSync(autoresearchScriptPath) && !isAutoresearchShCommand(params.command)) {
-					commandWarnings.push(
-						"Warning: autoresearch.sh exists but the command was not a direct autoresearch.sh invocation (force=true).",
-					);
-				}
+			const headerLines: string[] = [];
+			if (abandonedPriorRun !== null) {
+				headerLines.push(`Note: abandoned prior pending run #${abandonedPriorRun} before starting this run.`);
 			}
-			const warningPrefix = commandWarnings.length > 0 ? `${commandWarnings.join("\n")}\n\n` : "";
+			const warningPrefix = headerLines.length > 0 ? `${headerLines.join("\n")}\n\n` : "";
 			return {
 				content: [
 					{
 						type: "text",
-						text: warningPrefix + buildRunText(resultDetails, llmTruncation.content, state.bestMetric),
+						text: warningPrefix + buildRunText(resultDetails, llmTruncation.content, runtime.state.bestMetric),
 					},
 				],
 				details: resultDetails,
 			};
 		},
-		renderCall(args, _options, theme): Text {
-			const commandPreview = truncateToWidth(replaceTabs(args.command), 100);
+		renderCall(_args, _options, theme): Text {
 			return new Text(
-				`${theme.fg("toolTitle", theme.bold("run_experiment"))} ${theme.fg("muted", commandPreview)}`,
+				`${theme.fg("toolTitle", theme.bold("run_experiment"))} ${theme.fg("muted", DEFAULT_HARNESS_COMMAND)}`,
 				0,
 				0,
 			);
@@ -395,17 +246,14 @@ export function createRunExperimentTool(
 				const preview = replaceTabs(result.content.find(part => part.type === "text")?.text ?? "");
 				return new Text(preview ? `${header}\n${theme.fg("dim", preview)}` : header, 0, 0);
 			}
 			const details = result.details;
 			if (!details || !isRunDetails(details)) {
 				return new Text(replaceTabs(result.content.find(part => part.type === "text")?.text ?? ""), 0, 0);
 			}
 			const statusText = renderStatus(details, theme);
 			if (!options.expanded && details.tailOutput.trim().length === 0) {
 				return new Text(statusText, 0, 0);
 			}
 			const preview = replaceTabs(
 				options.expanded ? details.tailOutput : details.tailOutput.split("\n").slice(-5).join("\n"),
 			);
@@ -418,7 +266,23 @@ export function createRunExperimentTool(
 	};
 }
-async function executeProcess(options: {
+async function tryGitStatus(cwd: string): Promise<string> {
+	try {
+		return await git.status(cwd, { porcelainV1: true, untrackedFiles: "all", z: true });
+	} catch {
+		return "";
+	}
+}
+async function tryGitPrefix(cwd: string): Promise<string> {
+	try {
+		return await git.show.prefix(cwd);
+	} catch {
+		return "";
+	}
+}
+async function executeProcess(opts: {
 	command: string[];
 	cwd: string;
 	logPath: string;
@@ -427,8 +291,8 @@ async function executeProcess(options: {
 	onProgress?(details: ProgressSnapshot): void;
 }): Promise<ProcessExecutionResult> {
 	const { promise, resolve, reject } = Promise.withResolvers<ProcessExecutionResult>();
-	const child = childProcess.spawn(options.command[0] ?? "bash", options.command.slice(1), {
-		cwd: options.cwd,
+	const child = childProcess.spawn(opts.command[0] ?? "bash", opts.command.slice(1), {
+		cwd: opts.cwd,
 		detached: true,
 		stdio: ["ignore", "pipe", "pipe"],
 	});
@@ -437,7 +301,7 @@ async function executeProcess(options: {
 	let chunksBytes = 0;
 	let killedByTimeout = false;
 	let resolved = false;
-	let writeStream: fs.WriteStream | undefined = fs.createWriteStream(options.logPath);
+	let writeStream: fs.WriteStream | undefined = fs.createWriteStream(opts.logPath);
 	let forceKillTimeout: NodeJS.Timeout | undefined;
 	const closeWriteStream = (): Promise<void> => {
@@ -459,7 +323,7 @@ async function executeProcess(options: {
 		if (progressTimer) clearInterval(progressTimer);
 		if (timeoutHandle) clearTimeout(timeoutHandle);
 		if (forceKillTimeout) clearTimeout(forceKillTimeout);
-		options.signal?.removeEventListener("abort", abortHandler);
+		opts.signal?.removeEventListener("abort", abortHandler);
 	};
 	const finish = (callback: () => void): void => {
@@ -486,8 +350,8 @@ async function executeProcess(options: {
 		});
 		return {
 			elapsed: formatElapsed(Date.now() - startedAt),
-			runDirectory: path.dirname(options.logPath),
-			fullOutputPath: options.logPath,
+			runDirectory: path.dirname(opts.logPath),
+			fullOutputPath: opts.logPath,
 			tailOutput: tail.content,
 			truncation: tail.truncated ? tail : undefined,
 		};
@@ -503,26 +367,26 @@ async function executeProcess(options: {
 	};
 	const startedAt = Date.now();
-	const progressTimer = options.onProgress
+	const progressTimer = opts.onProgress
 		? setInterval(() => {
-				options.onProgress?.(snapshot());
+				opts.onProgress?.(snapshot());
 			}, 1000)
 		: undefined;
 	const timeoutHandle =
-		options.timeoutMs > 0
+		opts.timeoutMs > 0
 			? setTimeout(() => {
 					killedByTimeout = true;
 					killTreeWithEscalation();
-				}, options.timeoutMs)
+				}, opts.timeoutMs)
 			: undefined;
 	const abortHandler = (): void => {
 		killTreeWithEscalation();
 	};
-	if (options.signal?.aborted) {
+	if (opts.signal?.aborted) {
 		abortHandler();
 	} else {
-		options.signal?.addEventListener("abort", abortHandler, { once: true });
+		opts.signal?.addEventListener("abort", abortHandler, { once: true });
 	}
 	child.stdout?.on("data", data => {
@@ -539,16 +403,16 @@ async function executeProcess(options: {
 	child.on("close", async code => {
 		try {
 			await closeWriteStream();
-			if (options.signal?.aborted) {
+			if (opts.signal?.aborted) {
 				finish(() => reject(new Error("aborted")));
 				return;
 			}
-			const output = await fs.promises.readFile(options.logPath, "utf8");
+			const output = await fs.promises.readFile(opts.logPath, "utf8");
 			finish(() =>
 				resolve({
 					exitCode: code,
 					killed: killedByTimeout,
-					logPath: options.logPath,
+					logPath: opts.logPath,
 					output,
 				}),
 			);
@@ -560,31 +424,9 @@ async function executeProcess(options: {
 	return promise;
 }
-async function runChecks(options: {
-	cwd: string;
-	pathToChecks: string;
-	logPath: string;
-	timeoutMs: number;
-	signal?: AbortSignal;
-}): Promise<ChecksExecutionResult> {
-	const result = await executeProcess({
-		command: ["bash", options.pathToChecks],
-		cwd: options.cwd,
-		logPath: options.logPath,
-		timeoutMs: options.timeoutMs,
-		signal: options.signal,
-	});
-	return {
-		code: result.exitCode,
-		killed: result.killed,
-		logPath: result.logPath,
-		output: result.output.trim(),
-	};
-}
 function buildRunText(details: RunDetails, outputPreview: string, bestMetric: number | null): string {
 	const lines: string[] = [];
-	lines.push(`Run directory: ${details.runDirectory}`);
+	lines.push(`Run #${details.runNumber} directory: ${details.runDirectory}`);
 	if (details.timedOut) {
 		lines.push(`TIMEOUT after ${details.durationSeconds.toFixed(1)}s`);
 	} else if (details.exitCode !== 0) {
@@ -592,13 +434,6 @@ function buildRunText(details: RunDetails, outputPreview: string, bestMetric: nu
 	} else {
 		lines.push(`PASSED in ${details.durationSeconds.toFixed(1)}s`);
 	}
-	if (details.checksTimedOut) {
-		lines.push(`Checks timed out after ${details.checksDuration.toFixed(1)}s`);
-	} else if (details.checksPass === false) {
-		lines.push(`Checks failed in ${details.checksDuration.toFixed(1)}s`);
-	} else if (details.checksPass === true) {
-		lines.push(`Checks passed in ${details.checksDuration.toFixed(1)}s`);
-	}
 	if (bestMetric !== null) {
 		lines.push(`Current baseline ${details.metricName}: ${formatNum(bestMetric, details.metricUnit)}`);
 	}
@@ -627,14 +462,6 @@ function buildRunText(details: RunDetails, outputPreview: string, bestMetric: nu
 			`Output truncated (${formatBytes(EXPERIMENT_MAX_BYTES)} limit). Full output: ${details.fullOutputPath}`,
 		);
 	}
-	if (details.checksLogPath) {
-		lines.push(`Checks log: ${details.checksLogPath}`);
-	}
-	if (details.checksPass === false && details.checksOutput.length > 0) {
-		lines.push("");
-		lines.push("Checks output:");
-		lines.push(details.checksOutput);
-	}
 	return lines.join("\n").trimEnd();
 }
@@ -642,12 +469,6 @@ function renderStatus(details: RunDetails, theme: Theme): string {
 	if (details.timedOut) {
 		return theme.fg("error", `TIMEOUT ${details.durationSeconds.toFixed(1)}s`);
 	}
-	if (details.checksTimedOut) {
-		return theme.fg("warning", `Checks timeout ${details.checksDuration.toFixed(1)}s`);
-	}
-	if (details.checksPass === false) {
-		return theme.fg("error", `Checks failed ${details.checksDuration.toFixed(1)}s`);
-	}
 	if (details.exitCode !== 0) {
 		return theme.fg("error", `FAIL exit=${details.exitCode} ${details.durationSeconds.toFixed(1)}s`);
 	}
@@ -665,5 +486,5 @@ function isRunDetails(value: unknown): value is RunDetails {
 function isProgressDetails(value: unknown): value is RunExperimentProgressDetails {
 	if (typeof value !== "object" || value === null) return false;
-	return "phase" in value && value.phase === "running";
+	return "phase" in value && (value as { phase: unknown }).phase === "running";
 }