npm - @oh-my-pi/pi-coding-agent - Versions diffs - 13.18.0 → 14.0.2 - Mend

@oh-my-pi/pi-coding-agent 13.18.0 → 14.0.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (235)

package/CHANGELOG.md +316 -1
package/package.json +86 -24
package/scripts/format-prompts.ts +2 -2
package/src/autoresearch/apply-contract-to-state.ts +24 -0
package/src/autoresearch/contract.ts +0 -44
package/src/autoresearch/dashboard.ts +1 -2
package/src/autoresearch/git.ts +116 -30
package/src/autoresearch/helpers.ts +49 -0
package/src/autoresearch/index.ts +28 -187
package/src/autoresearch/prompt.md +26 -9
package/src/autoresearch/state.ts +0 -6
package/src/autoresearch/tools/init-experiment.ts +202 -117
package/src/autoresearch/tools/log-experiment.ts +123 -178
package/src/autoresearch/tools/run-experiment.ts +48 -10
package/src/autoresearch/types.ts +2 -2
package/src/capability/index.ts +4 -2
package/src/cli/file-processor.ts +3 -3
package/src/cli/grep-cli.ts +8 -8
package/src/cli/grievances-cli.ts +78 -0
package/src/cli/read-cli.ts +67 -0
package/src/cli/setup-cli.ts +4 -4
package/src/cli/update-cli.ts +3 -3
package/src/cli.ts +2 -0
package/src/commands/grep.ts +6 -1
package/src/commands/grievances.ts +20 -0
package/src/commands/read.ts +33 -0
package/src/commit/agentic/agent.ts +5 -8
package/src/commit/agentic/index.ts +22 -26
package/src/commit/agentic/tools/analyze-file.ts +3 -3
package/src/commit/agentic/tools/git-file-diff.ts +3 -6
package/src/commit/agentic/tools/git-hunk.ts +3 -3
package/src/commit/agentic/tools/git-overview.ts +6 -9
package/src/commit/agentic/tools/index.ts +6 -8
package/src/commit/agentic/tools/propose-commit.ts +4 -7
package/src/commit/agentic/tools/recent-commits.ts +3 -3
package/src/commit/agentic/tools/split-commit.ts +4 -4
package/src/commit/agentic/validation.ts +1 -1
package/src/commit/analysis/conventional.ts +4 -4
package/src/commit/analysis/summary.ts +3 -3
package/src/commit/changelog/generate.ts +4 -4
package/src/commit/changelog/index.ts +5 -9
package/src/commit/map-reduce/map-phase.ts +4 -4
package/src/commit/map-reduce/reduce-phase.ts +4 -4
package/src/commit/pipeline.ts +13 -16
package/src/config/keybindings.ts +7 -6
package/src/config/prompt-templates.ts +44 -226
package/src/config/resolve-config-value.ts +4 -2
package/src/config/settings-schema.ts +98 -2
package/src/config/settings.ts +25 -26
package/src/dap/client.ts +674 -0
package/src/dap/config.ts +150 -0
package/src/dap/defaults.json +211 -0
package/src/dap/index.ts +4 -0
package/src/dap/session.ts +1255 -0
package/src/dap/types.ts +600 -0
package/src/debug/log-viewer.ts +3 -2
package/src/discovery/builtin.ts +1 -2
package/src/discovery/codex.ts +2 -2
package/src/discovery/github.ts +2 -1
package/src/discovery/helpers.ts +2 -2
package/src/discovery/opencode.ts +2 -2
package/src/edit/diff.ts +818 -0
package/src/edit/index.ts +309 -0
package/src/edit/line-hash.ts +67 -0
package/src/edit/modes/chunk.ts +454 -0
package/src/{patch → edit/modes}/hashline.ts +741 -361
package/src/{patch/applicator.ts → edit/modes/patch.ts} +420 -117
package/src/{patch/fuzzy.ts → edit/modes/replace.ts} +519 -197
package/src/{patch → edit}/normalize.ts +97 -76
package/src/{patch/shared.ts → edit/renderer.ts} +181 -108
package/src/exec/bash-executor.ts +4 -2
package/src/exec/idle-timeout-watchdog.ts +126 -0
package/src/exec/non-interactive-env.ts +5 -0
package/src/extensibility/custom-commands/bundled/ci-green/index.ts +6 -18
package/src/extensibility/custom-commands/bundled/review/index.ts +45 -43
package/src/extensibility/custom-commands/loader.ts +1 -2
package/src/extensibility/custom-tools/loader.ts +34 -11
package/src/extensibility/custom-tools/types.ts +1 -1
package/src/extensibility/extensions/loader.ts +9 -4
package/src/extensibility/extensions/runner.ts +24 -1
package/src/extensibility/extensions/types.ts +4 -2
package/src/extensibility/hooks/loader.ts +5 -6
package/src/extensibility/hooks/types.ts +2 -2
package/src/extensibility/plugins/doctor.ts +2 -1
package/src/extensibility/plugins/marketplace/fetcher.ts +2 -57
package/src/extensibility/plugins/marketplace/source-resolver.ts +4 -4
package/src/extensibility/slash-commands.ts +3 -7
package/src/index.ts +3 -1
package/src/internal-urls/docs-index.generated.ts +11 -11
package/src/ipy/executor.ts +58 -17
package/src/ipy/gateway-coordinator.ts +6 -4
package/src/ipy/kernel.ts +45 -22
package/src/ipy/runtime.ts +2 -2
package/src/lsp/client.ts +7 -4
package/src/lsp/clients/lsp-linter-client.ts +4 -4
package/src/lsp/config.ts +2 -2
package/src/lsp/defaults.json +688 -154
package/src/lsp/index.ts +234 -45
package/src/lsp/lspmux.ts +2 -2
package/src/lsp/startup-events.ts +13 -0
package/src/lsp/types.ts +12 -1
package/src/lsp/utils.ts +8 -1
package/src/main.ts +125 -47
package/src/memories/index.ts +4 -5
package/src/modes/acp/acp-agent.ts +563 -163
package/src/modes/acp/acp-event-mapper.ts +9 -1
package/src/modes/acp/acp-mode.ts +4 -2
package/src/modes/components/agent-dashboard.ts +3 -4
package/src/modes/components/diff.ts +6 -7
package/src/modes/components/footer.ts +9 -29
package/src/modes/components/hook-editor.ts +3 -3
package/src/modes/components/hook-selector.ts +6 -1
package/src/modes/components/read-tool-group.ts +6 -12
package/src/modes/components/session-observer-overlay.ts +472 -0
package/src/modes/components/settings-defs.ts +24 -0
package/src/modes/components/status-line.ts +15 -61
package/src/modes/components/tool-execution.ts +1 -1
package/src/modes/components/welcome.ts +1 -1
package/src/modes/controllers/btw-controller.ts +2 -2
package/src/modes/controllers/command-controller.ts +4 -2
package/src/modes/controllers/event-controller.ts +59 -2
package/src/modes/controllers/extension-ui-controller.ts +1 -0
package/src/modes/controllers/input-controller.ts +15 -8
package/src/modes/controllers/selector-controller.ts +26 -0
package/src/modes/index.ts +20 -2
package/src/modes/interactive-mode.ts +278 -69
package/src/modes/rpc/host-tools.ts +186 -0
package/src/modes/rpc/rpc-client.ts +178 -13
package/src/modes/rpc/rpc-mode.ts +73 -3
package/src/modes/rpc/rpc-types.ts +53 -1
package/src/modes/session-observer-registry.ts +146 -0
package/src/modes/shared.ts +0 -42
package/src/modes/theme/theme.ts +80 -8
package/src/modes/types.ts +4 -2
package/src/modes/utils/keybinding-matchers.ts +9 -0
package/src/prompts/system/custom-system-prompt.md +5 -0
package/src/prompts/system/system-prompt.md +8 -1
package/src/prompts/tools/chunk-edit.md +219 -0
package/src/prompts/tools/debug.md +43 -0
package/src/prompts/tools/grep.md +3 -0
package/src/prompts/tools/lsp.md +5 -5
package/src/prompts/tools/read-chunk.md +17 -0
package/src/prompts/tools/read.md +19 -5
package/src/sdk.ts +216 -165
package/src/secrets/index.ts +1 -1
package/src/secrets/obfuscator.ts +25 -17
package/src/session/agent-session.ts +381 -286
package/src/session/agent-storage.ts +12 -12
package/src/session/compaction/branch-summarization.ts +3 -3
package/src/session/compaction/compaction.ts +5 -6
package/src/session/compaction/utils.ts +3 -3
package/src/session/history-storage.ts +62 -19
package/src/session/messages.ts +3 -3
package/src/session/session-dump-format.ts +203 -0
package/src/session/session-manager.ts +15 -5
package/src/session/session-storage.ts +4 -2
package/src/session/streaming-output.ts +1 -1
package/src/session/tool-choice-queue.ts +213 -0
package/src/slash-commands/builtin-registry.ts +56 -8
package/src/ssh/connection-manager.ts +2 -2
package/src/ssh/sshfs-mount.ts +5 -5
package/src/stt/downloader.ts +4 -4
package/src/stt/recorder.ts +4 -4
package/src/stt/transcriber.ts +2 -2
package/src/system-prompt.ts +25 -13
package/src/task/agents.ts +5 -6
package/src/task/commands.ts +2 -5
package/src/task/executor.ts +32 -4
package/src/task/index.ts +91 -82
package/src/task/template.ts +2 -2
package/src/task/types.ts +25 -0
package/src/task/worktree.ts +131 -149
package/src/tools/ask.ts +2 -3
package/src/tools/ast-edit.ts +7 -7
package/src/tools/ast-grep.ts +7 -7
package/src/tools/auto-generated-guard.ts +36 -41
package/src/tools/await-tool.ts +2 -2
package/src/tools/bash.ts +5 -23
package/src/tools/browser.ts +4 -5
package/src/tools/calculator.ts +2 -3
package/src/tools/cancel-job.ts +2 -2
package/src/tools/checkpoint.ts +3 -3
package/src/tools/debug.ts +1007 -0
package/src/tools/exit-plan-mode.ts +3 -3
package/src/tools/fetch.ts +67 -3
package/src/tools/find.ts +4 -5
package/src/tools/fs-cache-invalidation.ts +5 -0
package/src/tools/gemini-image.ts +13 -5
package/src/tools/gh.ts +130 -308
package/src/tools/grep.ts +57 -9
package/src/tools/index.ts +44 -22
package/src/tools/inspect-image.ts +4 -4
package/src/tools/output-meta.ts +1 -1
package/src/tools/python.ts +19 -6
package/src/tools/read.ts +211 -146
package/src/tools/render-mermaid.ts +2 -3
package/src/tools/render-utils.ts +20 -6
package/src/tools/renderers.ts +3 -1
package/src/tools/report-tool-issue.ts +80 -0
package/src/tools/resolve.ts +70 -39
package/src/tools/search-tool-bm25.ts +2 -2
package/src/tools/ssh.ts +2 -2
package/src/tools/todo-write.ts +2 -2
package/src/tools/tool-timeouts.ts +1 -0
package/src/tools/write.ts +5 -6
package/src/tui/tree-list.ts +3 -1
package/src/utils/clipboard.ts +80 -0
package/src/utils/commit-message-generator.ts +2 -3
package/src/utils/edit-mode.ts +49 -0
package/src/utils/external-editor.ts +11 -5
package/src/utils/file-display-mode.ts +6 -5
package/src/utils/file-mentions.ts +8 -7
package/src/utils/git.ts +1400 -0
package/src/utils/image-loading.ts +98 -0
package/src/utils/title-generator.ts +2 -3
package/src/utils/tools-manager.ts +6 -6
package/src/web/scrapers/choosealicense.ts +1 -1
package/src/web/search/index.ts +3 -3
package/src/web/search/render.ts +6 -4
package/src/autoresearch/command-initialize.md +0 -34
package/src/commit/git/errors.ts +0 -9
package/src/commit/git/index.ts +0 -210
package/src/commit/git/operations.ts +0 -54
package/src/patch/diff.ts +0 -433
package/src/patch/index.ts +0 -888
package/src/patch/parser.ts +0 -532
package/src/patch/types.ts +0 -292
package/src/prompts/agents/oracle.md +0 -77
package/src/tools/gh-cli.ts +0 -125
package/src/tools/pending-action.ts +0 -49
package/src/utils/child-process.ts +0 -88
package/src/utils/frontmatter.ts +0 -117
package/src/utils/image-input.ts +0 -274
package/src/utils/mime.ts +0 -53
package/src/utils/prompt-format.ts +0 -170

package/src/autoresearch/prompt.md CHANGED

@@ -8,7 +8,11 @@ Autoresearch mode is active.
 Primary goal:
 {{goal}}
 {{else}}
+{{#if has_autoresearch_md}}
 Primary goal is documented in `autoresearch.md` for this session.
+{{else}}
+There is no `autoresearch.md` yet. Infer what to optimize from the latest user message and the conversation; after you create `autoresearch.md`, keep it as the durable source of truth for goal and benchmark contract.
+{{/if}}
 {{/if}}
 Working directory:
@@ -63,7 +67,7 @@ An unlogged run artifact exists at `{{pending_run_directory}}`.
 - `init_experiment` — initialize or reset the experiment session for the current optimization target.
 - `run_experiment` — run a benchmark or experiment command with timing, output capture, structured metric parsing, and optional backpressure checks.
-- `log_experiment` — record the result, update the dashboard, persist JSONL history, auto-commit kept experiments, and auto-revert discarded or failed experiments.
+- `log_experiment` — record the result, update the dashboard, persist JSONL history, auto-commit kept experiments, and revert only run-modified files for discarded or failed experiments (pre-existing uncommitted changes are preserved).
 ### Operating protocol
@@ -83,6 +87,8 @@ An unlogged run artifact exists at `{{pending_run_directory}}`.
    - Use the same workload every run unless you intentionally re-initialize with a new segment.
    - Keep the measurement harness, evaluator, and fixed benchmark inputs stable unless you intentionally start a new segment and document the change.
 4. Initialize the loop with `init_experiment` before the first logged run of a segment.
+   - Pass `from_autoresearch_md: true` with only `name` to load the benchmark contract from `autoresearch.md` without mirroring every field in the tool call.
+   - Use `abandon_unlogged_runs: true` only when you intentionally discard unlogged run artifacts and need a fresh segment (for example after a bad or obsolete benchmark directory).
 5. Run a baseline first.
    - Establish the baseline metric before attempting optimizations.
    - Track secondary metrics only when they matter to correctness, quality, or obvious regressions.
@@ -90,7 +96,9 @@ An unlogged run artifact exists at `{{pending_run_directory}}`.
    - Make one coherent experiment at a time.
    - Run `run_experiment`.
    - Interpret the result honestly.
-   - Call `log_experiment` after every run.
+   - Call `log_experiment` after every run (it refreshes benchmark/scope fields from `autoresearch.md` before logging so keep validation matches the file on disk).
+   - Use `run_experiment` with `force: true` only when you must override the segment benchmark command or skip the direct-`autoresearch.sh` rule.
+   - On `log_experiment`, `force: true` relaxes ASI requirements and allows keeping a primary-metric regression; prefer normal logging when possible.
 7. Keep the primary metric as the decision maker.
    - `keep` when the primary metric improves.
    - `discard` when it regresses or stays flat.
@@ -137,7 +145,11 @@ Suggested structure:
 {{#if has_goal}}
 - {{goal}}
 {{else}}
+{{#if has_autoresearch_md}}
 - document the active target here before the first benchmark
+{{else}}
+- (derive from the user's messages, then record here)
+{{/if}}
 {{/if}}
 ## Benchmark
@@ -194,15 +206,20 @@ Resume from the existing notes:
 {{else}}
 ### Initial setup
-`autoresearch.md` does not exist yet.
+`autoresearch.md` does not exist yet. You decide the benchmark contract, harness, and scope from the user's messages and the repository—do not ask the user to re-type benchmark commands or metric names in a separate UI prompt.
+Before the first benchmark:
-Create the experiment workspace before the first benchmark:
+- Write `autoresearch.md` with goal, benchmark command (must be a **direct** invocation of `autoresearch.sh`, e.g. `bash autoresearch.sh`), primary metric name and unit, direction (`lower` or `higher`), tradeoff metrics if relevant, files in scope, off limits, and constraints.
+- Add a short preflight section: prerequisites, one-time setup, and the comparability invariant that must stay fixed across runs.
+- Mark ground-truth evaluators, fixed datasets, and other measurement-critical files as off limits or hard constraints when they define the benchmark contract.
+- Write or update `autoresearch.program.md` when you learn durable heuristics, failure patterns, or repo-specific strategy for later resume turns.
+- Create `autoresearch.sh` as the canonical benchmark entrypoint; print the primary metric as `METRIC <name>=<number>` and optional secondary metrics as additional `METRIC` lines.
+- Optionally add `autoresearch.checks.sh` if correctness or quality needs a hard gate.
+- Call `init_experiment` with arguments that match `autoresearch.md` exactly (benchmark command, metric, unit, direction, scope paths, off limits, constraints).
+- Run and log the baseline.
-- write `autoresearch.md`
-- write `autoresearch.sh`
-- optionally write `autoresearch.checks.sh`
-- run `init_experiment`
-- run and log the baseline
+Until `init_experiment` succeeds, only autoresearch control files (`autoresearch.md`, `autoresearch.sh`, `autoresearch.program.md`, `autoresearch.ideas.md`, `autoresearch.checks.sh`) may be edited; after initialization, respect Files in Scope from the contract.
 {{/if}}
 {{#if has_checks}}

package/src/autoresearch/state.ts CHANGED

@@ -34,7 +34,6 @@ export function createExperimentState(): ExperimentState {
 		scopePaths: [],
 		offLimits: [],
 		constraints: [],
-		segmentFingerprint: null,
 	};
 }
@@ -203,8 +202,6 @@ export function reconstructStateFromJsonl(workDir: string): ReconstructedExperim
 			state.scopePaths = cloneStringArray(configEntry.scopePaths);
 			state.offLimits = cloneStringArray(configEntry.offLimits);
 			state.constraints = cloneStringArray(configEntry.constraints);
-			state.segmentFingerprint =
-				typeof configEntry.segmentFingerprint === "string" ? configEntry.segmentFingerprint : null;
 			state.secondaryMetrics = hydrateMetricDefs(configEntry.secondaryMetrics);
 			continue;
 		}
@@ -322,9 +319,6 @@ function parseConfigEntry(value: unknown): AutoresearchJsonConfigEntry | null {
 			candidate.constraints.filter((item): item is string => typeof item === "string"),
 		);
 	}
-	if (typeof candidate.segmentFingerprint === "string" && candidate.segmentFingerprint.trim().length > 0) {
-		config.segmentFingerprint = candidate.segmentFingerprint;
-	}
 	return config;
 }

package/src/autoresearch/tools/init-experiment.ts CHANGED

@@ -6,15 +6,15 @@ import { Type } from "@sinclair/typebox";
 import type { ToolDefinition } from "../../extensibility/extensions";
 import type { Theme } from "../../modes/theme/theme";
 import { replaceTabs, truncateToWidth } from "../../tools/render-utils";
+import { applyAutoresearchContractToExperimentState } from "../apply-contract-to-state";
 import {
-	buildAutoresearchSegmentFingerprint,
 	contractListsEqual,
 	contractPathListsEqual,
 	loadAutoresearchScriptSnapshot,
 	readAutoresearchContract,
 } from "../contract";
 import {
-	inferMetricUnitFromName,
+	abandonUnloggedAutoresearchRuns,
 	isAutoresearchShCommand,
 	readMaxExperiments,
 	readPendingRunSummary,
@@ -28,9 +28,29 @@ const initExperimentSchema = Type.Object({
 	name: Type.String({
 		description: "Human-readable experiment name.",
 	}),
-	metric_name: Type.String({
-		description: "Primary metric name shown in the dashboard.",
-	}),
+	from_autoresearch_md: Type.Optional(
+		Type.Boolean({
+			description:
+				"When true, load benchmark command, metrics, scope, off-limits, and constraints from autoresearch.md instead of passing mirrored fields below.",
+		}),
+	),
+	abandon_unlogged_runs: Type.Optional(
+		Type.Boolean({
+			description:
+				"When true, mark all completed but unlogged run artifacts as abandoned so initialization can proceed without logging them first.",
+		}),
+	),
+	new_segment: Type.Optional(
+		Type.Boolean({
+			description:
+				"When true, force a new segment even when the contract fields have not changed. Without this, re-initialization with matching contract is a no-op.",
+		}),
+	),
+	metric_name: Type.Optional(
+		Type.String({
+			description: "Primary metric name shown in the dashboard. Required when from_autoresearch_md is false.",
+		}),
+	),
 	metric_unit: Type.Optional(
 		Type.String({
 			description: "Unit for the primary metric, for example µs, ms, s, kb, or empty.",
@@ -41,13 +61,17 @@ const initExperimentSchema = Type.Object({
 			description: "Whether lower or higher values are better. Defaults to lower.",
 		}),
 	),
-	benchmark_command: Type.String({
-		description: "Benchmark command recorded in autoresearch.md.",
-	}),
-	scope_paths: Type.Array(Type.String(), {
-		description: "Files in Scope from autoresearch.md. Must be non-empty.",
-		minItems: 1,
-	}),
+	benchmark_command: Type.Optional(
+		Type.String({
+			description: "Benchmark command recorded in autoresearch.md. Required when from_autoresearch_md is false.",
+		}),
+	),
+	scope_paths: Type.Optional(
+		Type.Array(Type.String(), {
+			description: "Files in Scope from autoresearch.md. Required when from_autoresearch_md is false.",
+			minItems: 1,
+		}),
+	),
 	off_limits: Type.Optional(
 		Type.Array(Type.String(), {
 			description: "Off Limits paths from autoresearch.md.",
@@ -86,25 +110,43 @@ export function createInitExperimentTool(
 			const state = runtime.state;
 			const isReinitializing = state.results.length > 0;
 			const workDir = resolveWorkDir(ctx.cwd);
-			const pendingRun = await readPendingRunSummary(workDir, collectLoggedRunNumbers(state.results));
+			const loggedRunNumbers = collectLoggedRunNumbers(state.results);
+			let abandonSummary = "";
+			if (params.abandon_unlogged_runs === true) {
+				const abandoned = await abandonUnloggedAutoresearchRuns(workDir, loggedRunNumbers);
+				if (abandoned > 0) {
+					abandonSummary =
+						abandoned === 1
+							? "Abandoned 1 unlogged run artifact.\n"
+							: `Abandoned ${abandoned} unlogged run artifacts.\n`;
+				}
+			}
+			const pendingRun = await readPendingRunSummary(workDir, loggedRunNumbers);
 			if (pendingRun) {
+				const metricInfo = pendingRun.parsedPrimary !== null ? `, metric=${pendingRun.parsedPrimary}` : "";
+				const passedInfo = pendingRun.passed ? "passed" : "failed";
 				return {
 					content: [
 						{
 							type: "text",
 							text:
-								`Error: run #${pendingRun.runNumber} has not been logged yet. ` +
-								"Call log_experiment before re-initializing the current segment.",
+								abandonSummary +
+								`Error: run #${pendingRun.runNumber} has not been logged yet.\n` +
+								`Pending: command="${pendingRun.command}"${metricInfo}, ${passedInfo}\n` +
+								"Call log_experiment before re-initializing, or pass abandon_unlogged_runs=true.",
 						},
 					],
 				};
 			}
 			const contractResult = readAutoresearchContract(workDir);
 			const scriptSnapshot = loadAutoresearchScriptSnapshot(workDir);
 			const errors = [...contractResult.errors, ...scriptSnapshot.errors];
 			if (errors.length > 0) {
 				return {
-					content: [{ type: "text", text: `Error: ${errors.join(" ")}` }],
+					content: [{ type: "text", text: `${abandonSummary}Error: ${errors.join(" ")}` }],
 				};
 			}
@@ -117,118 +159,161 @@ export function createInitExperimentTool(
 						{
 							type: "text",
 							text:
+								abandonSummary +
 								"Error: Benchmark.command in autoresearch.md must invoke `autoresearch.sh` directly. " +
 								"Move the real workload into `autoresearch.sh` and re-run init_experiment.",
 						},
 					],
 				};
 			}
-			if (benchmarkContract.command !== params.benchmark_command.trim()) {
-				return {
-					content: [
-						{
-							type: "text",
-							text:
-								"Error: benchmark_command does not match autoresearch.md. " +
-								`Expected: ${benchmarkContract.command ?? "(missing)"}\nReceived: ${params.benchmark_command}`,
-						},
-					],
-				};
-			}
-			if (benchmarkContract.primaryMetric !== params.metric_name.trim()) {
-				return {
-					content: [
-						{
-							type: "text",
-							text:
-								"Error: metric_name does not match autoresearch.md. " +
-								`Expected: ${benchmarkContract.primaryMetric ?? "(missing)"}\nReceived: ${params.metric_name}`,
-						},
-					],
-				};
-			}
-			if ((params.metric_unit ?? "") !== expectedMetricUnit) {
-				return {
-					content: [
-						{
-							type: "text",
-							text:
-								"Error: metric_unit does not match autoresearch.md. " +
-								`Expected: ${expectedMetricUnit || "(empty)"}\nReceived: ${params.metric_unit ?? "(empty)"}`,
-						},
-					],
-				};
-			}
-			if ((params.direction ?? "lower") !== expectedDirection) {
-				return {
-					content: [
-						{
-							type: "text",
-							text:
-								"Error: direction does not match autoresearch.md. " +
-								`Expected: ${expectedDirection}\nReceived: ${params.direction ?? "lower"}`,
-						},
-					],
-				};
-			}
-			if (!contractPathListsEqual(params.scope_paths, contractResult.contract.scopePaths)) {
-				return {
-					content: [
-						{
-							type: "text",
-							text:
-								"Error: scope_paths do not match autoresearch.md. " +
-								`Expected: ${contractResult.contract.scopePaths.join(", ")}`,
-						},
-					],
-				};
-			}
-			if (!contractPathListsEqual(params.off_limits ?? [], contractResult.contract.offLimits)) {
-				return {
-					content: [
-						{
-							type: "text",
-							text:
-								"Error: off_limits do not match autoresearch.md. " +
-								`Expected: ${contractResult.contract.offLimits.join(", ") || "(empty)"}`,
-						},
-					],
-				};
-			}
-			if (!contractListsEqual(params.constraints ?? [], contractResult.contract.constraints)) {
-				return {
-					content: [
-						{
-							type: "text",
-							text:
-								"Error: constraints do not match autoresearch.md. " +
-								`Expected: ${contractResult.contract.constraints.join(", ") || "(empty)"}`,
-						},
-					],
-				};
+			const fromMd = params.from_autoresearch_md === true;
+			if (!fromMd) {
+				const metricName = params.metric_name?.trim();
+				const benchmarkCommand = params.benchmark_command?.trim();
+				const scopePaths = params.scope_paths;
+				if (!metricName || !benchmarkCommand || !scopePaths || scopePaths.length === 0) {
+					return {
+						content: [
+							{
+								type: "text",
+								text:
+									abandonSummary +
+									"Error: when from_autoresearch_md is false or omitted, metric_name, benchmark_command, and scope_paths are required and must match autoresearch.md. " +
+									"Alternatively pass from_autoresearch_md=true with only name (plus optional flags).",
+							},
+						],
+					};
+				}
+				if (benchmarkContract.command !== benchmarkCommand) {
+					return {
+						content: [
+							{
+								type: "text",
+								text:
+									abandonSummary +
+									"Error: benchmark_command does not match autoresearch.md. " +
+									`Expected: ${benchmarkContract.command ?? "(missing)"}\nReceived: ${params.benchmark_command}`,
+							},
+						],
+					};
+				}
+				if (benchmarkContract.primaryMetric !== metricName) {
+					return {
+						content: [
+							{
+								type: "text",
+								text:
+									abandonSummary +
+									"Error: metric_name does not match autoresearch.md. " +
+									`Expected: ${benchmarkContract.primaryMetric ?? "(missing)"}\nReceived: ${params.metric_name}`,
+							},
+						],
+					};
+				}
+				if ((params.metric_unit ?? "") !== expectedMetricUnit) {
+					return {
+						content: [
+							{
+								type: "text",
+								text:
+									abandonSummary +
+									"Error: metric_unit does not match autoresearch.md. " +
+									`Expected: ${expectedMetricUnit || "(empty)"}\nReceived: ${params.metric_unit ?? "(empty)"}`,
+							},
+						],
+					};
+				}
+				if ((params.direction ?? "lower") !== expectedDirection) {
+					return {
+						content: [
+							{
+								type: "text",
+								text:
+									abandonSummary +
+									"Error: direction does not match autoresearch.md. " +
+									`Expected: ${expectedDirection}\nReceived: ${params.direction ?? "lower"}`,
+							},
+						],
+					};
+				}
+				if (!contractPathListsEqual(scopePaths, contractResult.contract.scopePaths)) {
+					return {
+						content: [
+							{
+								type: "text",
+								text:
+									abandonSummary +
+									"Error: scope_paths do not match autoresearch.md. " +
+									`Expected: ${contractResult.contract.scopePaths.join(", ")}`,
+							},
+						],
+					};
+				}
+				if (!contractPathListsEqual(params.off_limits ?? [], contractResult.contract.offLimits)) {
+					return {
+						content: [
+							{
+								type: "text",
+								text:
+									abandonSummary +
+									"Error: off_limits do not match autoresearch.md. " +
+									`Expected: ${contractResult.contract.offLimits.join(", ") || "(empty)"}`,
+							},
+						],
+					};
+				}
+				if (!contractListsEqual(params.constraints ?? [], contractResult.contract.constraints)) {
+					return {
+						content: [
+							{
+								type: "text",
+								text:
+									abandonSummary +
+									"Error: constraints do not match autoresearch.md. " +
+									`Expected: ${contractResult.contract.constraints.join(", ") || "(empty)"}`,
+							},
+						],
+					};
+				}
 			}
-			const segmentFingerprint = buildAutoresearchSegmentFingerprint(contractResult.contract, {
-				benchmarkScript: scriptSnapshot.benchmarkScript,
-				checksScript: scriptSnapshot.checksScript,
-			});
+			// Check if contract matches current state — if so, re-init is a no-op
+			if (isReinitializing && params.new_segment !== true) {
+				const contract = contractResult.contract;
+				const bm = contract.benchmark;
+				const contractMatches =
+					(bm.primaryMetric ?? "metric") === state.metricName &&
+					bm.metricUnit === state.metricUnit &&
+					(bm.direction ?? "lower") === state.bestDirection &&
+					(bm.command ?? null) === state.benchmarkCommand &&
+					contractPathListsEqual(contract.scopePaths, state.scopePaths) &&
+					contractPathListsEqual(contract.offLimits, state.offLimits) &&
+					contractListsEqual(contract.constraints, state.constraints);
+				if (contractMatches) {
+					runtime.autoresearchMode = true;
+					runtime.autoResumeArmed = true;
+					options.dashboard.updateWidget(ctx, runtime);
+					options.dashboard.requestRender();
+					return {
+						content: [
+							{
+								type: "text",
+								text:
+									abandonSummary +
+									`Experiment session already initialized with matching contract. Continuing segment ${state.currentSegment}.`,
+							},
+						],
+						details: { state: cloneExperimentState(state) },
+					};
+				}
+			}
+			applyAutoresearchContractToExperimentState(contractResult.contract, state);
 			state.name = params.name;
-			state.metricName = params.metric_name;
-			state.metricUnit = params.metric_unit ?? "";
-			state.bestDirection = params.direction ?? "lower";
 			state.maxExperiments = readMaxExperiments(ctx.cwd);
 			state.bestMetric = null;
 			state.confidence = null;
-			state.secondaryMetrics = benchmarkContract.secondaryMetrics.map(name => ({
-				name,
-				unit: inferMetricUnitFromName(name),
-			}));
-			state.benchmarkCommand = params.benchmark_command.trim();
-			state.scopePaths = [...contractResult.contract.scopePaths];
-			state.offLimits = [...contractResult.contract.offLimits];
-			state.constraints = [...contractResult.contract.constraints];
-			state.segmentFingerprint = segmentFingerprint;
 			if (isReinitializing) {
 				state.currentSegment += 1;
 			}
@@ -245,7 +330,6 @@ export function createInitExperimentTool(
 				scopePaths: state.scopePaths,
 				offLimits: state.offLimits,
 				constraints: state.constraints,
-				segmentFingerprint,
 			});
 			if (isReinitializing) {
@@ -267,6 +351,7 @@ export function createInitExperimentTool(
 			options.dashboard.requestRender();
 			const lines = [
+				abandonSummary.trimEnd(),
 				`Experiment initialized: ${state.name}`,
 				`Metric: ${state.metricName} (${state.metricUnit || "unitless"}, ${state.bestDirection} is better)`,
 				`Benchmark command: ${state.benchmarkCommand}`,
@@ -275,7 +360,7 @@ export function createInitExperimentTool(
 				isReinitializing
 					? "Previous results remain in history. This starts a new segment and requires a fresh baseline."
 					: "Now run the baseline experiment and log it.",
-			];
+			].filter(line => line.length > 0);
 			if (state.maxExperiments !== null) {
 				lines.push(`Max iterations: ${state.maxExperiments}`);
 			}