npm - @oh-my-pi/pi-coding-agent - Versions diffs - 12.4.0 → 12.5.0 - Mend

@oh-my-pi/pi-coding-agent 12.4.0 → 12.5.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (47) hide show

package/CHANGELOG.md +51 -0
package/docs/custom-tools.md +21 -6
package/docs/extensions.md +20 -0
package/package.json +12 -12
package/src/cli/setup-cli.ts +62 -2
package/src/commands/setup.ts +1 -1
package/src/config/keybindings.ts +4 -1
package/src/config/settings-schema.ts +58 -4
package/src/config/settings.ts +23 -9
package/src/debug/index.ts +26 -19
package/src/debug/log-formatting.ts +60 -0
package/src/debug/log-viewer.ts +903 -0
package/src/debug/report-bundle.ts +87 -8
package/src/discovery/helpers.ts +131 -137
package/src/extensibility/custom-tools/types.ts +44 -6
package/src/extensibility/extensions/types.ts +60 -0
package/src/extensibility/hooks/types.ts +60 -0
package/src/extensibility/skills.ts +4 -2
package/src/main.ts +7 -1
package/src/modes/components/custom-editor.ts +8 -0
package/src/modes/components/settings-selector.ts +29 -14
package/src/modes/controllers/command-controller.ts +2 -0
package/src/modes/controllers/event-controller.ts +7 -0
package/src/modes/controllers/input-controller.ts +23 -2
package/src/modes/controllers/selector-controller.ts +9 -7
package/src/modes/interactive-mode.ts +84 -1
package/src/modes/rpc/rpc-client.ts +7 -0
package/src/modes/rpc/rpc-mode.ts +8 -0
package/src/modes/rpc/rpc-types.ts +2 -0
package/src/modes/theme/theme.ts +163 -7
package/src/modes/types.ts +1 -0
package/src/patch/hashline.ts +2 -1
package/src/patch/shared.ts +44 -13
package/src/prompts/system/plan-mode-approved.md +5 -0
package/src/prompts/system/subagent-system-prompt.md +1 -0
package/src/prompts/system/system-prompt.md +10 -0
package/src/prompts/tools/todo-write.md +3 -1
package/src/sdk.ts +82 -9
package/src/session/agent-session.ts +137 -29
package/src/stt/downloader.ts +71 -0
package/src/stt/index.ts +3 -0
package/src/stt/recorder.ts +351 -0
package/src/stt/setup.ts +52 -0
package/src/stt/stt-controller.ts +160 -0
package/src/stt/transcribe.py +70 -0
package/src/stt/transcriber.ts +91 -0
package/src/task/executor.ts +10 -2

package/src/stt/transcriber.ts ADDED Viewed

@@ -0,0 +1,91 @@
+import { logger } from "@oh-my-pi/pi-utils";
+import transcribeScript from "./transcribe.py" with { type: "text" };
+/** Optional settings accepted by `transcribe`. */
+export interface TranscribeOptions {
+	/** Whisper model name passed to the Python script; `transcribe` falls back to "base.en". */
+	modelName?: string;
+	/** Language code passed to the Python script; `transcribe` falls back to "en". */
+	language?: string;
+	/** When aborted, the spawned Python process is killed and `transcribe` throws. */
+	signal?: AbortSignal;
+}
+/** Upper bound, in milliseconds, on a single transcription run (two minutes). */
+const TRANSCRIBE_TIMEOUT_MS = 2 * 60 * 1_000;
+/**
+ * Locate a usable Python command.
+ *
+ * Candidates are probed with `Bun.which` in the order `python`, `py`, `python3`.
+ *
+ * @returns The first candidate name that resolves, or `null` when none does.
+ */
+export function resolvePython(): string | null {
+	const candidates = ["python", "py", "python3"];
+	const found = candidates.find(name => Boolean(Bun.which(name)));
+	return found ?? null;
+}
+/**
+ * Transcribe a WAV file using Python openai-whisper.
+ *
+ * Reads the WAV via Python's built-in `wave` module (no ffmpeg needed),
+ * resamples to 16 kHz mono, and passes the numpy array directly to whisper.
+ *
+ * @param audioPath - Path of the WAV file handed to the Python script.
+ * @param options - Optional model name (default "base.en"), language (default "en") and abort signal.
+ * @returns The script's stdout with surrounding whitespace trimmed.
+ * @throws Error when the file is smaller than 100 bytes, no Python command is found, the run
+ *   exceeds `TRANSCRIBE_TIMEOUT_MS`, or the script exits non-zero. Throws the signal's abort
+ *   reason when `options.signal` is aborted before or during the run.
+ */
+export async function transcribe(audioPath: string, options?: TranscribeOptions): Promise<string> {
+	const audioFile = Bun.file(audioPath);
+	if (audioFile.size < 100) {
+		throw new Error(`Audio file is empty or too small (${audioFile.size} bytes). Check microphone.`);
+	}
+	const pythonCmd = resolvePython();
+	if (!pythonCmd) {
+		throw new Error("Python not found. Install Python 3.8+ from https://python.org");
+	}
+	const signal = options?.signal;
+	// Bail out before spawning: no point starting Python only to kill it immediately.
+	signal?.throwIfAborted();
+	const modelName = options?.modelName ?? "base.en";
+	const language = options?.language ?? "en";
+	logger.debug("Transcribing with Python whisper", { pythonCmd, audioPath, modelName, language });
+	const proc = Bun.spawn([pythonCmd, "-c", transcribeScript, audioPath, modelName, language], {
+		stdout: "pipe",
+		stderr: "pipe",
+	});
+	// Start draining both pipes right away. Waiting for exit first can stall the child
+	// if it writes more than the pipe can hold (progress bars, warnings, tracebacks).
+	const stdoutPromise = new Response(proc.stdout).text();
+	const stderrPromise = new Response(proc.stderr).text();
+	// Mark the reads as handled so an early throw below cannot surface an unhandled rejection.
+	stdoutPromise.catch(() => {});
+	stderrPromise.catch(() => {});
+	const onAbort = () => proc.kill();
+	signal?.addEventListener("abort", onAbort, { once: true });
+	let timedOut = false;
+	const killTimer = setTimeout(() => {
+		timedOut = true;
+		logger.error("Python whisper transcription timed out, killing process", { timeoutMs: TRANSCRIBE_TIMEOUT_MS });
+		proc.kill();
+	}, TRANSCRIBE_TIMEOUT_MS);
+	let exitCode: number;
+	try {
+		exitCode = await proc.exited;
+	} finally {
+		// Always release the timer and listener, even if awaiting the exit throws.
+		clearTimeout(killTimer);
+		signal?.removeEventListener("abort", onAbort);
+	}
+	// Abort takes precedence over timeout and exit-code reporting.
+	signal?.throwIfAborted();
+	if (timedOut) {
+		throw new Error(`Transcription timed out after ${Math.round(TRANSCRIBE_TIMEOUT_MS / 1000)}s`);
+	}
+	const [stdout, stderr] = await Promise.all([stdoutPromise, stderrPromise]);
+	if (exitCode !== 0) {
+		logger.error("Python whisper transcription failed", { exitCode, stderr: stderr.trim() });
+		if (stderr.includes("No module named 'whisper'")) {
+			throw new Error("openai-whisper not installed. Run: pip install openai-whisper");
+		}
+		// Show last line of stderr (the actual error, not the full traceback)
+		const lastLine = stderr.trim().split("\n").pop() ?? "";
+		throw new Error(`Transcription failed: ${lastLine}`);
+	}
+	const text = stdout.trim();
+	logger.debug("Transcription complete", { length: text.length });
+	return text;
+}

package/src/task/executor.ts CHANGED Viewed

@@ -887,10 +887,17 @@ export async function runSubprocess(options: ExecutorOptions): Promise<SingleRes
 			activeSession = session;
+			const subagentToolNames = session.getActiveToolNames();
+			const parentOwnedToolNames = new Set(["todo_write"]);
+			const filteredSubagentTools = subagentToolNames.filter(name => !parentOwnedToolNames.has(name));
+			if (filteredSubagentTools.length !== subagentToolNames.length) {
+				await session.setActiveToolsByName(filteredSubagentTools);
+			}
 			session.sessionManager.appendSessionInit({
 				systemPrompt: session.agent.state.systemPrompt,
 				task,
-				tools: session.getAllToolNames(),
+				tools: session.getActiveToolNames(),
 				outputSchema,
 			});
@@ -928,7 +935,8 @@ export async function runSubprocess(options: ExecutorOptions): Promise<SingleRes
 						},
 						getActiveTools: () => session.getActiveToolNames(),
 						getAllTools: () => session.getAllToolNames(),
-						setActiveTools: (toolNames: string[]) => session.setActiveToolsByName(toolNames),
+						setActiveTools: (toolNames: string[]) =>
+							session.setActiveToolsByName(toolNames.filter(name => !parentOwnedToolNames.has(name))),
 						getCommands: () => [],
 						setModel: async model => {
 							const key = await session.modelRegistry.getApiKey(model);