npm - @oh-my-pi/pi-coding-agent - Versions diffs - 16.0.4 → 16.0.6 - Mend

@oh-my-pi/pi-coding-agent 16.0.4 → 16.0.6

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (270)

package/CHANGELOG.md +94 -0
package/dist/cli.js +2027 -1396
package/dist/types/advisor/advise-tool.d.ts +31 -19
package/dist/types/autoresearch/tools/init-experiment.d.ts +13 -17
package/dist/types/autoresearch/tools/log-experiment.d.ts +17 -19
package/dist/types/autoresearch/tools/run-experiment.d.ts +3 -4
package/dist/types/autoresearch/tools/update-notes.d.ts +4 -5
package/dist/types/cli/args.d.ts +1 -0
package/dist/types/cli/bench-cli.d.ts +6 -0
package/dist/types/cli/ttsr-cli.d.ts +39 -0
package/dist/types/commands/launch.d.ts +3 -0
package/dist/types/commands/ttsr.d.ts +57 -0
package/dist/types/commit/agentic/tools/analyze-file.d.ts +4 -5
package/dist/types/commit/agentic/tools/git-file-diff.d.ts +4 -5
package/dist/types/commit/agentic/tools/git-hunk.d.ts +5 -6
package/dist/types/commit/agentic/tools/git-overview.d.ts +4 -5
package/dist/types/commit/agentic/tools/propose-changelog.d.ts +23 -24
package/dist/types/commit/agentic/tools/propose-commit.d.ts +11 -32
package/dist/types/commit/agentic/tools/recent-commits.d.ts +3 -4
package/dist/types/commit/agentic/tools/schemas.d.ts +6 -27
package/dist/types/commit/agentic/tools/split-commit.d.ts +28 -49
package/dist/types/commit/changelog/generate.d.ts +12 -13
package/dist/types/commit/shared-llm.d.ts +10 -37
package/dist/types/config/config-file.d.ts +4 -4
package/dist/types/config/keybindings.d.ts +5 -0
package/dist/types/config/models-config-schema.d.ts +625 -990
package/dist/types/config/models-config.d.ts +229 -217
package/dist/types/config/settings-schema.d.ts +144 -25
package/dist/types/edit/hashline/params.d.ts +7 -11
package/dist/types/edit/index.d.ts +2 -1
package/dist/types/edit/modes/apply-patch.d.ts +4 -5
package/dist/types/edit/modes/patch.d.ts +15 -24
package/dist/types/edit/modes/replace.d.ts +16 -17
package/dist/types/eval/js/index.d.ts +1 -0
package/dist/types/extensibility/custom-commands/types.d.ts +6 -3
package/dist/types/extensibility/custom-tools/types.d.ts +8 -5
package/dist/types/extensibility/extensions/runner.d.ts +5 -2
package/dist/types/extensibility/extensions/types.d.ts +14 -10
package/dist/types/extensibility/hooks/types.d.ts +7 -4
package/dist/types/extensibility/legacy-pi-ai-shim.d.ts +13 -5
package/dist/types/extensibility/legacy-pi-coding-agent-shim.d.ts +17 -0
package/dist/types/extensibility/shared-events.d.ts +22 -1
package/dist/types/extensibility/typebox.d.ts +80 -58
package/dist/types/goals/tools/goal-tool.d.ts +11 -24
package/dist/types/index.d.ts +2 -0
package/dist/types/lsp/index.d.ts +11 -26
package/dist/types/lsp/types.d.ts +12 -28
package/dist/types/main.d.ts +1 -0
package/dist/types/mcp/client.d.ts +8 -0
package/dist/types/modes/components/btw-panel.d.ts +1 -0
package/dist/types/modes/components/custom-editor.d.ts +3 -1
package/dist/types/modes/components/status-line/component.d.ts +1 -1
package/dist/types/modes/components/status-line/context-thresholds.d.ts +0 -1
package/dist/types/modes/controllers/btw-controller.d.ts +2 -0
package/dist/types/modes/controllers/input-controller.d.ts +1 -0
package/dist/types/modes/interactive-mode.d.ts +3 -0
package/dist/types/modes/rpc/rpc-types.d.ts +1 -1
package/dist/types/modes/setup-wizard/index.d.ts +1 -0
package/dist/types/modes/setup-wizard/startup-splash.d.ts +7 -0
package/dist/types/modes/theme/theme.d.ts +1 -1
package/dist/types/modes/types.d.ts +3 -0
package/dist/types/modes/utils/context-usage.d.ts +12 -0
package/dist/types/sdk.d.ts +8 -1
package/dist/types/session/agent-session.d.ts +24 -0
package/dist/types/session/session-persistence.d.ts +4 -0
package/dist/types/startup-splash.d.ts +12 -0
package/dist/types/task/types.d.ts +47 -48
package/dist/types/tools/ask.d.ts +26 -27
package/dist/types/tools/ast-edit.d.ts +17 -17
package/dist/types/tools/ast-grep.d.ts +12 -13
package/dist/types/tools/bash.d.ts +20 -17
package/dist/types/tools/browser.d.ts +46 -71
package/dist/types/tools/checkpoint.d.ts +14 -15
package/dist/types/tools/debug.d.ts +82 -145
package/dist/types/tools/eval.d.ts +30 -40
package/dist/types/tools/find.d.ts +17 -18
package/dist/types/tools/gh.d.ts +49 -78
package/dist/types/tools/image-gen.d.ts +20 -36
package/dist/types/tools/inspect-image.d.ts +10 -11
package/dist/types/tools/irc.d.ts +22 -33
package/dist/types/tools/job.d.ts +11 -12
package/dist/types/tools/learn.d.ts +21 -28
package/dist/types/tools/manage-skill.d.ts +13 -22
package/dist/types/tools/memory-edit.d.ts +15 -24
package/dist/types/tools/memory-recall.d.ts +7 -8
package/dist/types/tools/memory-reflect.d.ts +9 -10
package/dist/types/tools/memory-retain.d.ts +13 -14
package/dist/types/tools/read.d.ts +8 -8
package/dist/types/tools/resolve.d.ts +11 -18
package/dist/types/tools/review.d.ts +9 -15
package/dist/types/tools/search-tool-bm25.d.ts +9 -10
package/dist/types/tools/search.d.ts +16 -17
package/dist/types/tools/ssh.d.ts +14 -15
package/dist/types/tools/todo.d.ts +27 -43
package/dist/types/tools/tts.d.ts +8 -9
package/dist/types/tools/write.d.ts +9 -10
package/dist/types/tui/code-cell.d.ts +2 -0
package/dist/types/tui/index.d.ts +1 -0
package/dist/types/tui/width-aware-text.d.ts +23 -0
package/dist/types/utils/image-vision-fallback.d.ts +28 -0
package/dist/types/utils/markit.d.ts +10 -1
package/dist/types/web/search/index.d.ts +17 -28
package/dist/types/web/search/providers/base.d.ts +1 -0
package/dist/types/web/search/providers/gemini.d.ts +1 -0
package/dist/types/web/search/providers/perplexity.d.ts +0 -2
package/dist/types/web/search/types.d.ts +32 -26
package/package.json +14 -13
package/scripts/omp +1 -1
package/src/advisor/__tests__/advisor.test.ts +103 -1
package/src/advisor/advise-tool.ts +47 -11
package/src/autoresearch/tools/init-experiment.ts +13 -16
package/src/autoresearch/tools/log-experiment.ts +15 -18
package/src/autoresearch/tools/run-experiment.ts +3 -3
package/src/autoresearch/tools/update-notes.ts +4 -4
package/src/cli/args.ts +1 -0
package/src/cli/bench-cli.ts +30 -7
package/src/cli/flag-tables.ts +8 -0
package/src/cli/ttsr-cli.ts +995 -0
package/src/cli-commands.ts +1 -0
package/src/cli.ts +7 -1
package/src/collab/host.ts +2 -2
package/src/commands/launch.ts +3 -0
package/src/commands/ttsr.ts +125 -0
package/src/commit/agentic/tools/analyze-file.ts +4 -4
package/src/commit/agentic/tools/git-file-diff.ts +4 -4
package/src/commit/agentic/tools/git-hunk.ts +7 -5
package/src/commit/agentic/tools/git-overview.ts +4 -4
package/src/commit/agentic/tools/propose-changelog.ts +18 -15
package/src/commit/agentic/tools/propose-commit.ts +6 -6
package/src/commit/agentic/tools/recent-commits.ts +3 -3
package/src/commit/agentic/tools/schemas.ts +8 -20
package/src/commit/agentic/tools/split-commit.ts +19 -23
package/src/commit/analysis/summary.ts +7 -5
package/src/commit/changelog/generate.ts +15 -11
package/src/commit/shared-llm.ts +17 -24
package/src/config/config-file.ts +13 -15
package/src/config/keybindings.ts +6 -0
package/src/config/models-config-schema.ts +206 -179
package/src/config/settings-schema.ts +118 -2
package/src/discovery/builtin-rules/index.ts +2 -0
package/src/discovery/builtin-rules/ts-import-type.md +2 -2
package/src/discovery/builtin-rules/ts-no-any.md +11 -2
package/src/discovery/builtin-rules/ts-no-inline-cast-access.md +55 -0
package/src/edit/hashline/params.ts +12 -11
package/src/edit/index.ts +5 -4
package/src/edit/modes/apply-patch.ts +4 -4
package/src/edit/modes/patch.ts +15 -18
package/src/edit/modes/replace.ts +13 -17
package/src/edit/renderer.ts +0 -1
package/src/eval/agent-bridge.ts +11 -13
package/src/eval/completion-bridge.ts +25 -17
package/src/eval/js/context-manager.ts +17 -2
package/src/eval/js/index.ts +1 -1
package/src/eval/py/executor.ts +2 -2
package/src/eval/py/runner.py +44 -0
package/src/extensibility/custom-commands/loader.ts +5 -3
package/src/extensibility/custom-commands/types.ts +6 -3
package/src/extensibility/custom-tools/loader.ts +4 -2
package/src/extensibility/custom-tools/types.ts +8 -5
package/src/extensibility/extensions/loader.ts +4 -2
package/src/extensibility/extensions/runner.ts +20 -2
package/src/extensibility/extensions/types.ts +22 -8
package/src/extensibility/hooks/loader.ts +5 -2
package/src/extensibility/hooks/types.ts +7 -4
package/src/extensibility/legacy-pi-ai-shim.ts +42 -5
package/src/extensibility/legacy-pi-coding-agent-shim.ts +113 -0
package/src/extensibility/plugins/legacy-pi-compat.ts +13 -13
package/src/extensibility/shared-events.ts +24 -0
package/src/extensibility/tool-proxy.ts +4 -1
package/src/extensibility/typebox.ts +778 -251
package/src/goals/guided-setup.ts +12 -3
package/src/goals/tools/goal-tool.ts +6 -6
package/src/index.ts +2 -0
package/src/internal-urls/docs-index.generated.ts +15 -13
package/src/lsp/types.ts +13 -27
package/src/main.ts +29 -21
package/src/mcp/client.ts +38 -13
package/src/mcp/render.ts +102 -89
package/src/modes/components/agent-hub.ts +11 -4
package/src/modes/components/branch-summary-message.ts +1 -0
package/src/modes/components/btw-panel.ts +5 -1
package/src/modes/components/collab-prompt-message.ts +9 -7
package/src/modes/components/compaction-summary-message.ts +1 -0
package/src/modes/components/custom-editor.ts +18 -0
package/src/modes/components/custom-message.ts +1 -0
package/src/modes/components/footer.ts +6 -5
package/src/modes/components/hook-message.ts +1 -0
package/src/modes/components/read-tool-group.ts +9 -3
package/src/modes/components/skill-message.ts +1 -0
package/src/modes/components/status-line/component.ts +139 -15
package/src/modes/components/status-line/context-thresholds.ts +0 -1
package/src/modes/components/todo-reminder.ts +1 -0
package/src/modes/components/tool-execution.ts +17 -10
package/src/modes/components/ttsr-notification.ts +1 -0
package/src/modes/components/user-message.ts +6 -6
package/src/modes/controllers/btw-controller.ts +69 -1
package/src/modes/controllers/event-controller.ts +2 -7
package/src/modes/controllers/input-controller.ts +29 -0
package/src/modes/controllers/selector-controller.ts +10 -3
package/src/modes/interactive-mode.ts +42 -10
package/src/modes/rpc/rpc-types.ts +1 -1
package/src/modes/setup-wizard/index.ts +1 -0
package/src/modes/setup-wizard/scenes/sign-in.ts +77 -5
package/src/modes/setup-wizard/startup-splash.ts +107 -0
package/src/modes/theme/theme.ts +133 -143
package/src/modes/types.ts +3 -0
package/src/modes/utils/context-usage.ts +37 -20
package/src/modes/utils/hotkeys-markdown.ts +1 -0
package/src/prompts/system/system-prompt.md +1 -0
package/src/prompts/tools/image-attachment-describe-system.md +8 -0
package/src/prompts/tools/image-attachment-describe.md +10 -0
package/src/sdk.ts +35 -22
package/src/session/agent-session.ts +715 -255
package/src/session/session-history-format.ts +11 -2
package/src/session/session-loader.ts +19 -32
package/src/session/session-persistence.ts +27 -11
package/src/session/snapcompact-inline.ts +1 -1
package/src/slash-commands/builtin-registry.ts +4 -11
package/src/ssh/connection-manager.ts +3 -2
package/src/startup-splash.ts +19 -0
package/src/task/executor.ts +12 -7
package/src/task/types.ts +44 -41
package/src/tool-discovery/tool-index.ts +17 -4
package/src/tools/ask.ts +14 -14
package/src/tools/ast-edit.ts +17 -14
package/src/tools/ast-grep.ts +10 -9
package/src/tools/bash.ts +15 -10
package/src/tools/browser/launch.ts +13 -0
package/src/tools/browser.ts +26 -32
package/src/tools/checkpoint.ts +7 -7
package/src/tools/debug.ts +72 -69
package/src/tools/eval.ts +18 -19
package/src/tools/find.ts +20 -13
package/src/tools/gh.ts +29 -49
package/src/tools/image-gen.ts +94 -57
package/src/tools/inspect-image.ts +8 -9
package/src/tools/irc.ts +12 -12
package/src/tools/job.ts +6 -6
package/src/tools/learn.ts +11 -14
package/src/tools/manage-skill.ts +19 -23
package/src/tools/memory-edit.ts +8 -8
package/src/tools/memory-recall.ts +4 -4
package/src/tools/memory-reflect.ts +5 -5
package/src/tools/memory-retain.ts +9 -11
package/src/tools/puppeteer/02_stealth_hairline.txt +1 -1
package/src/tools/puppeteer/04_stealth_iframe.txt +4 -4
package/src/tools/puppeteer/05_stealth_webgl.txt +1 -1
package/src/tools/puppeteer/10_stealth_plugins.txt +6 -4
package/src/tools/puppeteer/12_stealth_codecs.txt +2 -2
package/src/tools/puppeteer/13_stealth_worker.txt +1 -1
package/src/tools/read.ts +197 -19
package/src/tools/report-tool-issue.ts +6 -6
package/src/tools/resolve.ts +6 -6
package/src/tools/review.ts +10 -12
package/src/tools/search-tool-bm25.ts +5 -5
package/src/tools/search.ts +20 -29
package/src/tools/ssh.ts +8 -8
package/src/tools/todo.ts +16 -19
package/src/tools/tts.ts +16 -15
package/src/tools/write.ts +5 -5
package/src/tui/code-cell.ts +44 -3
package/src/tui/index.ts +1 -0
package/src/tui/width-aware-text.ts +58 -0
package/src/utils/image-vision-fallback.ts +197 -0
package/src/utils/markit.ts +17 -2
package/src/web/search/index.ts +21 -9
package/src/web/search/providers/base.ts +1 -0
package/src/web/search/providers/gemini.ts +56 -18
package/src/web/search/providers/perplexity.ts +373 -126
package/src/web/search/types.ts +28 -48

package/src/advisor/__tests__/advisor.test.ts CHANGED

@@ -1,5 +1,6 @@
 import { describe, expect, it, vi } from "bun:test";
-import type { AgentMessage } from "@oh-my-pi/pi-agent-core";
+import type { AgentMessage, AgentTelemetryConfig } from "@oh-my-pi/pi-agent-core";
+import { type } from "arktype";
 import { createAdvisorMessageCard } from "../../modes/components/advisor-message";
 import { getThemeByName } from "../../modes/theme/theme";
 import { formatSessionHistoryMarkdown } from "../../session/session-history-format";
@@ -11,7 +12,9 @@ import {
 	type AdvisorNote,
 	AdvisorRuntime,
 	type AdvisorRuntimeHost,
+	deriveAdvisorTelemetry,
 	formatAdvisorBatchContent,
+	isAdvisorInterruptImmuneTurnActive,
 	isInterruptingSeverity,
 	resolveAdvisorDeliveryChannel,
 } from "..";
@@ -114,6 +117,16 @@ describe("advisor", () => {
 			expect(result.details).toEqual({ note: "x", severity: "concern" });
 			expect(result.useless).toBe(true);
 		});
+		it("validates parameters using ArkType", () => {
+			const onAdvice = vi.fn();
+			const tool = new AdviseTool(onAdvice);
+			const valid = tool.parameters({ note: "x", severity: "concern" });
+			expect(valid instanceof type.errors).toBe(false);
+			const invalid = tool.parameters({ note: 123, severity: "invalid" as any });
+			expect(invalid instanceof type.errors).toBe(true);
+		});
 	});
 	describe("advice delivery policy", () => {
@@ -124,6 +137,44 @@ describe("advisor", () => {
 			expect(isInterruptingSeverity(undefined)).toBe(false);
 		});
+		it("keeps the interrupt-immune turn fence half-open for the configured window", () => {
+			expect(
+				isAdvisorInterruptImmuneTurnActive({
+					completedTurns: 4,
+					immuneTurnStart: undefined,
+					immuneTurns: 2,
+				}),
+			).toBe(false);
+			expect(
+				isAdvisorInterruptImmuneTurnActive({
+					completedTurns: 4,
+					immuneTurnStart: 5,
+					immuneTurns: 0,
+				}),
+			).toBe(false);
+			expect(
+				isAdvisorInterruptImmuneTurnActive({
+					completedTurns: 4,
+					immuneTurnStart: 5,
+					immuneTurns: 2,
+				}),
+			).toBe(true);
+			expect(
+				isAdvisorInterruptImmuneTurnActive({
+					completedTurns: 6,
+					immuneTurnStart: 5,
+					immuneTurns: 2,
+				}),
+			).toBe(true);
+			expect(
+				isAdvisorInterruptImmuneTurnActive({
+					completedTurns: 7,
+					immuneTurnStart: 5,
+					immuneTurns: 2,
+				}),
+			).toBe(false);
+		});
 		it("wraps each note in an advisory tag with severity as an attribute and escapes the body", () => {
 			const content = formatAdvisorBatchContent([
 				{ note: "first note" },
@@ -142,6 +193,37 @@ describe("advisor", () => {
 		});
 	});
+	describe("deriveAdvisorTelemetry", () => {
+		it("returns undefined when the primary has no telemetry so the advisor stays a no-op", () => {
+			expect(deriveAdvisorTelemetry(undefined, { id: "s-advisor", name: "Advisor" })).toBeUndefined();
+		});
+		it("inherits the primary's usage/cost hooks but restamps identity and clears the conversation", () => {
+			const onChatUsage = vi.fn();
+			const costEstimator = vi.fn();
+			const primary: AgentTelemetryConfig = {
+				agent: { id: "main", name: "Main" },
+				conversationId: "session-1",
+				attributes: { "deployment.id": "prod" },
+				onChatUsage,
+				costEstimator,
+			};
+			const identity = { id: "session-1-advisor", name: "Advisor", description: "anthropic/claude-sonnet-4-5" };
+			const derived = deriveAdvisorTelemetry(primary, identity);
+			// Usage/cost hooks are inherited so the advisor model's calls report through
+			// the same pipeline as the primary — the whole point of the fix.
+			expect(derived?.onChatUsage).toBe(onChatUsage);
+			expect(derived?.costEstimator).toBe(costEstimator);
+			expect(derived?.attributes).toEqual({ "deployment.id": "prod" });
+			// Advisor identity replaces the primary's so spans are attributable to the advisor.
+			expect(derived?.agent).toEqual(identity);
+			// Conversation cleared so the advisor loop falls back to its own `-advisor` session id.
+			expect(derived?.conversationId).toBeUndefined();
+		});
+	});
 	describe("AdvisorRuntime", () => {
 		function makeAgent(promptInputs: string[]): AdvisorAgent {
 			return {
@@ -688,6 +770,26 @@ describe("advisor", () => {
 			}
 		});
+		it("routes interrupting notes to the aside queue during immune turns without overriding preservation", () => {
+			expect(
+				resolveAdvisorDeliveryChannel({
+					severity: "concern",
+					autoResumeSuppressed: false,
+					streaming: true,
+					aborting: false,
+					interruptImmuneTurnActive: true,
+				}),
+			).toBe("aside");
+			expect(
+				resolveAdvisorDeliveryChannel({
+					severity: "blocker",
+					autoResumeSuppressed: true,
+					streaming: false,
+					aborting: false,
+					interruptImmuneTurnActive: true,
+				}),
+			).toBe("preserve");
+		});
 		it("preserves an interrupting note while suppressed AND idle (no auto-resume of a stopped run)", () => {
 			for (const severity of ["concern", "blocker"] as const) {
 				expect(

package/src/advisor/advise-tool.ts CHANGED

@@ -1,19 +1,23 @@
-import type { AgentTool, AgentToolContext, AgentToolResult, AgentToolUpdateCallback } from "@oh-my-pi/pi-agent-core";
+import type {
+	AgentIdentity,
+	AgentTelemetryConfig,
+	AgentTool,
+	AgentToolContext,
+	AgentToolResult,
+	AgentToolUpdateCallback,
+} from "@oh-my-pi/pi-agent-core";
 import { escapeXmlText } from "@oh-my-pi/pi-utils";
-import { z } from "zod/v4";
+import { type } from "arktype";
 import adviseDescription from "../prompts/advisor/advise-tool.md" with { type: "text" };
-const adviseSchema = z.object({
-	note: z
-		.string()
-		.describe("One concrete piece of advice for the agent you are watching. Terse, specific, actionable."),
-	severity: z
-		.enum(["nit", "concern", "blocker"])
-		.optional()
-		.describe("How strongly to weigh this. Omit for a plain nit."),
+const adviseSchema = type({
+	note: type("string").describe(
+		"One concrete piece of advice for the agent you are watching. Terse, specific, actionable.",
+	),
+	"severity?": type("'nit' | 'concern' | 'blocker'").describe("How strongly to weigh this. Omit for a plain nit."),
 });
-export type AdviseParams = z.infer<typeof adviseSchema>;
+export type AdviseParams = typeof adviseSchema.infer;
 export type AdvisorSeverity = "nit" | "concern" | "blocker";
@@ -68,6 +72,15 @@ export function isInterruptingSeverity(severity: AdvisorSeverity | undefined): b
 /** How an advisor note is routed to the primary. */
 export type AdvisorDeliveryChannel = "aside" | "steer" | "preserve";
+/** Half-open turn-count fence for the post-interrupt cooldown. */
+export function isAdvisorInterruptImmuneTurnActive(opts: {
+	completedTurns: number;
+	immuneTurnStart: number | undefined;
+	immuneTurns: number;
+}): boolean {
+	if (opts.immuneTurnStart === undefined || opts.immuneTurns <= 0) return false;
+	return opts.completedTurns < opts.immuneTurnStart + opts.immuneTurns;
+}
 /**
  * Decide how one advisor note reaches the primary agent.
@@ -84,18 +97,41 @@ export type AdvisorDeliveryChannel = "aside" | "steer" | "preserve";
  *   auto-resume anything, so it is delivered live. Parking it during an active
  *   run instead strands it (it never reaches the running agent) and the withheld
  *   notes dump as one burst at the next user prompt — the bug this guards.
+ * - During the post-interrupt immune-turn window, further `concern`/`blocker`
+ *   notes are downgraded to asides; suppression preservation still wins.
  */
 export function resolveAdvisorDeliveryChannel(opts: {
 	severity: AdvisorSeverity | undefined;
 	autoResumeSuppressed: boolean;
 	streaming: boolean;
 	aborting: boolean;
+	interruptImmuneTurnActive?: boolean;
 }): AdvisorDeliveryChannel {
 	if (!isInterruptingSeverity(opts.severity)) return "aside";
 	if (opts.autoResumeSuppressed && (opts.aborting || !opts.streaming)) return "preserve";
+	if (opts.interruptImmuneTurnActive) return "aside";
 	return "steer";
 }
+/**
+ * Derive the advisor loop's telemetry from the primary session's config so the
+ * advisor model's GenAI spans and usage/cost hooks (onChatUsage, onCostDelta,
+ * costEstimator) fire under the same pipeline as every other model call —
+ * stamped with the advisor's own agent identity. `conversationId` is cleared so
+ * the advisor loop falls back to its own `-advisor` session id for
+ * `gen_ai.conversation.id` instead of inheriting the primary's conversation.
+ *
+ * Returns undefined when the primary has no telemetry (instrumentation off), so
+ * the advisor `Agent` stays a zero-overhead no-op as well.
+ */
+export function deriveAdvisorTelemetry(
+	primaryTelemetry: AgentTelemetryConfig | undefined,
+	identity: AgentIdentity,
+): AgentTelemetryConfig | undefined {
+	if (!primaryTelemetry) return undefined;
+	return { ...primaryTelemetry, agent: identity, conversationId: undefined };
+}
 /**
  * Side-effect-free investigation tools handed to the advisor agent so it can
  * inspect the workspace before weighing in. Names match the primary session's

package/src/autoresearch/tools/init-experiment.ts CHANGED

@@ -1,7 +1,7 @@
 import * as path from "node:path";
 import { Text } from "@oh-my-pi/pi-tui";
-import { z } from "zod/v4";
+import { type } from "arktype";
 import type { ToolDefinition } from "../../extensibility/extensions";
 import type { Theme } from "../../modes/theme/theme";
 import { replaceTabs, truncateToWidth } from "../../tools/render-utils";
@@ -16,21 +16,18 @@ export const HARNESS_FILENAME = "autoresearch.sh";
 export const DEFAULT_HARNESS_COMMAND = `bash ${HARNESS_FILENAME}`;
 const HARNESS_COMMIT_TITLE = "autoresearch: harness setup";
-const initExperimentSchema = z.object({
-	name: z.string().describe("experiment name"),
-	goal: z.string().describe("session goal").optional(),
-	primary_metric: z.string().describe("primary metric name"),
-	metric_unit: z.string().describe("metric unit (e.g. ms, µs, mb)").optional(),
-	direction: z
-		.enum(["lower", "higher"] as const)
-		.describe("better direction (default lower)")
-		.optional(),
-	secondary_metrics: z.array(z.string()).describe("secondary metric names").optional(),
-	scope_paths: z.array(z.string()).describe("expected-to-modify paths").optional(),
-	off_limits: z.array(z.string()).describe("off-limits paths").optional(),
-	constraints: z.array(z.string()).describe("free-form constraints").optional(),
-	max_iterations: z.number().describe("soft iteration cap per segment").optional(),
-	new_segment: z.boolean().describe("bump to a new segment in existing session").optional(),
+const initExperimentSchema = type({
+	name: type("string").describe("experiment name"),
+	"goal?": type("string").describe("session goal"),
+	primary_metric: type("string").describe("primary metric name"),
+	"metric_unit?": type("string").describe("metric unit (e.g. ms, µs, mb)"),
+	"direction?": type("'lower' | 'higher'").describe("better direction (default lower)"),
+	"secondary_metrics?": type("string[]").describe("secondary metric names"),
+	"scope_paths?": type("string[]").describe("expected-to-modify paths"),
+	"off_limits?": type("string[]").describe("off-limits paths"),
+	"constraints?": type("string[]").describe("free-form constraints"),
+	"max_iterations?": type("number").describe("soft iteration cap per segment"),
+	"new_segment?": type("boolean").describe("bump to a new segment in existing session"),
 });
 interface InitExperimentDetails {

package/src/autoresearch/tools/log-experiment.ts CHANGED

@@ -2,7 +2,7 @@ import * as fs from "node:fs";
 import * as path from "node:path";
 import { Text } from "@oh-my-pi/pi-tui";
-import { z } from "zod/v4";
+import { type } from "arktype";
 import type { ToolDefinition } from "../../extensibility/extensions";
 import type { Theme } from "../../modes/theme/theme";
 import { replaceTabs, truncateToWidth } from "../../tools/render-utils";
@@ -36,23 +36,20 @@ import type {
 const EXPERIMENT_TOOL_NAMES = ["init_experiment", "run_experiment", "log_experiment", "update_notes"];
-const logExperimentSchema = z.object({
-	metric: z.number().describe("primary metric value"),
-	status: z.enum(["keep", "discard", "crash", "checks_failed"] as const).describe("run outcome"),
-	description: z.string().describe("short run description"),
-	metrics: z.record(z.string(), z.number()).describe("secondary metrics").optional(),
-	asi: z.object({}).passthrough().describe("free-form structured metadata").optional(),
-	commit: z.string().describe("override recorded commit hash").optional(),
-	justification: z.string().describe("required when keeping a scope-deviating run").optional(),
-	flag_runs: z
-		.array(
-			z.object({
-				run_id: z.number().describe("run id to flag"),
-				reason: z.string().describe("why this run is suspect"),
-			}),
-		)
-		.describe("flag earlier runs as suspect")
-		.optional(),
+const logExperimentSchema = type({
+	metric: type("number").describe("primary metric value"),
+	status: type("'keep'|'discard'|'crash'|'checks_failed'").describe("run outcome"),
+	description: type("string").describe("short run description"),
+	"metrics?": type({ "[string]": "number" }).describe("secondary metrics"),
+	"asi?": type({ "[string]": "unknown" }).describe("free-form structured metadata"),
+	"commit?": type("string").describe("override recorded commit hash"),
+	"justification?": type("string").describe("required when keeping a scope-deviating run"),
+	"flag_runs?": type({
+		run_id: type("number.integer").describe("run id to flag"),
+		reason: type("string").describe("why this run is suspect"),
+	})
+		.array()
+		.describe("flag earlier runs as suspect"),
 });
 export function createLogExperimentTool(

package/src/autoresearch/tools/run-experiment.ts CHANGED

@@ -2,7 +2,7 @@ import * as fs from "node:fs";
 import * as path from "node:path";
 import { Text } from "@oh-my-pi/pi-tui";
 import { formatBytes } from "@oh-my-pi/pi-utils";
-import { z } from "zod/v4";
+import { type } from "arktype";
 import { executeBash } from "../../exec/bash-executor";
 import type { ToolDefinition } from "../../extensibility/extensions";
 import type { Theme } from "../../modes/theme/theme";
@@ -25,8 +25,8 @@ import { openAutoresearchStorageIfExists } from "../storage";
 import type { AutoresearchToolFactoryOptions, RunDetails, RunExperimentProgressDetails } from "../types";
 import { DEFAULT_HARNESS_COMMAND } from "./init-experiment";
-const runExperimentSchema = z.object({
-	timeout_seconds: z.number().describe("timeout in seconds (default 600)").optional(),
+const runExperimentSchema = type({
+	"timeout_seconds?": type("number").describe("timeout in seconds (default 600)"),
 });
 interface ProcessExecutionResult {

package/src/autoresearch/tools/update-notes.ts CHANGED

@@ -1,5 +1,5 @@
 import { Text } from "@oh-my-pi/pi-tui";
-import { z } from "zod/v4";
+import { type } from "arktype";
 import type { ToolDefinition } from "../../extensibility/extensions";
 import type { Theme } from "../../modes/theme/theme";
 import { replaceTabs, truncateToWidth } from "../../tools/render-utils";
@@ -8,9 +8,9 @@ import { buildExperimentState } from "../state";
 import { openAutoresearchStorageIfExists } from "../storage";
 import type { AutoresearchToolFactoryOptions } from "../types";
-const updateNotesSchema = z.object({
-	body: z.string().describe("replacement notes body"),
-	append_idea: z.string().describe("append as bullet under Ideas instead of replacing body").optional(),
+const updateNotesSchema = type({
+	body: type("string").describe("replacement notes body"),
+	"append_idea?": type("string").describe("append as bullet under Ideas instead of replacing body"),
 });
 interface UpdateNotesDetails {

package/src/cli/args.ts CHANGED

@@ -28,6 +28,7 @@ export interface Args {
 	smol?: string;
 	slow?: string;
 	plan?: string;
+	maxTime?: number;
 	apiKey?: string;
 	systemPrompt?: string;
 	appendSystemPrompt?: string;

package/src/cli/bench-cli.ts CHANGED

@@ -17,7 +17,12 @@ import { formatDuration, getProjectDir } from "@oh-my-pi/pi-utils";
 import chalk from "chalk";
 import type { ApiKeyResolverModel } from "../config/api-key-resolver";
 import { type CanonicalModelQueryOptions, ModelRegistry } from "../config/model-registry";
-import { formatModelString, getModelMatchPreferences, resolveCliModel } from "../config/model-resolver";
+import {
+	formatModelSelectorValue,
+	formatModelString,
+	getModelMatchPreferences,
+	resolveCliModel,
+} from "../config/model-resolver";
 import { Settings } from "../config/settings";
 import benchPrompt from "../prompts/bench.md" with { type: "text" };
 import { discoverAuthStorage } from "../sdk";
@@ -144,9 +149,15 @@ function isFirstTokenEvent(event: AssistantMessageEvent): boolean {
  * latency does not dilute throughput. Falls back to total duration when the
  * response arrived as a single chunk (TTFT ~ duration).
  */
-function computeTokensPerSecond(outputTokens: number, durationMs: number, ttftMs: number): number {
+export function computeTokensPerSecond(
+	outputTokens: number,
+	durationMs: number,
+	ttftMs: number,
+	deltaChunkCount: number,
+): number {
 	const decodeMs = durationMs - ttftMs;
-	const windowMs = decodeMs > 0 ? decodeMs : durationMs;
+	// Fall back to total duration when the response arrived as a single chunk/non-streaming.
+	const windowMs = decodeMs > 0 && deltaChunkCount >= 2 ? decodeMs : durationMs;
 	return windowMs > 0 ? (outputTokens * 1000) / windowMs : 0;
 }
@@ -193,10 +204,17 @@ async function runBenchRequest(
 			headers: model.provider === "openrouter" ? { "X-OpenRouter-Cache": "false" } : undefined,
 		});
 		let message: AssistantMessage | undefined;
+		let deltaChunkCount = 0;
 		for await (const event of stream) {
 			if (firstTokenAt === undefined && isFirstTokenEvent(event)) {
 				firstTokenAt = now();
 			}
+			if (
+				(event.type === "text_delta" || event.type === "thinking_delta" || event.type === "toolcall_delta") &&
+				event.delta.length > 0
+			) {
+				deltaChunkCount++;
+			}
 			if (event.type === "error") {
 				return { ok: false, error: event.error.errorMessage ?? "request failed" };
 			}
@@ -218,7 +236,7 @@ async function runBenchRequest(
 			ttftMs,
 			durationMs,
 			outputTokens,
-			tokensPerSecond: computeTokensPerSecond(outputTokens, durationMs, ttftMs),
+			tokensPerSecond: computeTokensPerSecond(outputTokens, durationMs, ttftMs, deltaChunkCount),
 		};
 	} catch (error) {
 		return { ok: false, error: getErrorMessage(error) };
@@ -244,6 +262,10 @@ function buildModelReport(
 	return { selector, model: formatModelString(model), thinking, results, average };
 }
+function formatBenchModelLabel(report: BenchModelReport): string {
+	return formatModelSelectorValue(report.model, report.thinking);
+}
 function formatMs(ms: number): string {
 	return formatDuration(Math.max(0, Math.round(ms)));
 }
@@ -264,7 +286,7 @@ export function formatBenchTable(summary: BenchSummary): string {
 		return b.average.tokensPerSecond - a.average.tokensPerSecond;
 	});
 	const rows = ranked.map(report => ({
-		model: report.model,
+		model: formatBenchModelLabel(report),
 		ttft: report.average ? formatMs(report.average.ttftMs) : "-",
 		tps: report.average ? `${report.average.tokensPerSecond.toFixed(1)}/s` : "-",
 		tokens: report.average ? String(Math.round(report.average.outputTokens)) : "-",
@@ -382,8 +404,9 @@ export async function runBenchCommand(command: BenchCommandArgs, deps: BenchDepe
 		const reports: BenchModelReport[] = [];
 		for (const { selector, model, thinking } of targets) {
 			if (!json) {
-				const resolvedNote = selector === formatModelString(model) ? "" : chalk.dim(` (${selector})`);
-				writeStdout(`${chalk.bold(formatModelString(model))}${resolvedNote}\n`);
+				const resolvedModel = formatModelSelectorValue(formatModelString(model), thinking);
+				const resolvedNote = selector === resolvedModel ? "" : chalk.dim(` (${selector})`);
+				writeStdout(`${chalk.bold(resolvedModel)}${resolvedNote}\n`);
 			}
 			const results: BenchRunResult[] = [];
 			for (let index = 0; index < runs; index++) {

package/src/cli/flag-tables.ts CHANGED

@@ -120,6 +120,14 @@ export const STRING_SETTERS: Record<string, StringSetter> = {
 	"--plan": (result, value) => {
 		result.plan = value;
 	},
+	"--max-time": (result, value, deps) => {
+		const seconds = Number(value);
+		if (Number.isFinite(seconds) && seconds > 0) {
+			result.maxTime = seconds;
+		} else {
+			deps.logger.warn("Invalid seconds passed to --max-time", { value });
+		}
+	},
 	"--api-key": (result, value) => {
 		result.apiKey = value;
 	},