npm - @iinm/plain-agent - Versions diffs - 1.7.15 → 1.7.17 - Mend

@iinm/plain-agent 1.7.15 → 1.7.17

This diff shows the content of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (11) hide show

package/README.md +131 -57
package/package.json +1 -1
package/src/cliFormatter.mjs +45 -2
package/src/cliInteractive.mjs +116 -2
package/src/cliInterruptTransform.mjs +22 -5
package/src/cliMuteTransform.mjs +26 -0
package/src/config.d.ts +2 -0
package/src/config.mjs +3 -0
package/src/main.mjs +3 -1
package/src/mcp.mjs +5 -2
package/src/voiceInput.mjs +671 -0

package/README.md CHANGED Viewed

@@ -4,21 +4,28 @@
 # Plain Agent
-A lightweight CLI-based coding agent.
+A lightweight CLI-based coding agent with zero framework dependencies.
-- **Safety controls** — Configure approval rules and sandboxing for safe execution
-- **Multi-provider** — Supports Anthropic, OpenAI, Gemini, Bedrock, Azure, Vertex AI, and more
-- **Sequential subagent delegation** — Delegate subtasks to specialized subagents with full visibility
-- **MCP support** — Connect to external MCP servers to extend available tools
-- **Claude Code compatible** — Reuse Claude Code plugins, agents, commands, and skills
+## Why Plain Agent?
-## Safety Controls
+- **Multi-provider** — Use Claude, GPT, Gemini, or any OpenAI-compatible model.
+  Switch providers without changing your workflow.
+- **Fine-grained approval rules** — Auto-approve commands by name, arguments,
+  and file paths using regex patterns
+  ([`config.predefined.json`](https://github.com/iinm/plain-agent/blob/main/config/config.predefined.json)).
+- **Path validation** — File paths must stay within the working directory,
+  and git-ignored files (`.env`, etc.) are blocked.
+- **Sandboxed execution** — Run the agent's shell commands inside a Docker
+  container with network access restricted to allowlisted destinations
+  (e.g., `registry.npmjs.org` only for `npm install`).
+- **Extensible** — Define prompts and subagents in Markdown.
+  Connect MCP servers. Reuse Claude Code plugins.
-**Auto-Approval**: Tools with no side effects and no sensitive data access are automatically approved based on patterns defined in [`config.predefined.json#autoApproval`](https://github.com/iinm/plain-agent/blob/main/config/config.predefined.json).
+## Limitations
-**Path Validation**: All file paths in tool inputs are validated to remain within the working directory and under git control.
-⚠️ `write_file` and `patch_file` require explicit path arguments. However, `exec_command` can run arbitrary code where file access cannot be validated. Use a sandbox for stronger isolation.
+- **Sequential subagent execution** — Subagents run one at a time rather than
+  in parallel. The trade-off is full visibility: every step is streamed to
+  your terminal so you can follow exactly what each subagent is doing.
 ## Requirements
@@ -53,49 +60,28 @@ Create the configuration.
     {
       "name": "anthropic",
       "variant": "default",
-      "apiKey": "FIXME"
+      "apiKey": "<ANTHROPIC_API_KEY>"
       // Or
       // "apiKey": { "$env": "ANTHROPIC_API_KEY" }
     },
     {
       "name": "gemini",
       "variant": "default",
-      "apiKey": "FIXME"
+      "apiKey": "<GEMINI_API_KEY>"
     },
     {
       "name": "openai",
       "variant": "default",
-      "apiKey": "FIXME"
-    },
-    {
-      // Requires Azure CLI to get access token
-      "name": "azure",
-      "variant": "openai",
-      "baseURL": "https://<resource>.openai.azure.com/openai",
-      // Optional
-      "azureConfigDir": "/home/xxx/.azure-for-agent"
+      "apiKey": "<OPENAI_API_KEY>"
     },
-    {
-      "name": "bedrock",
-      "variant": "default",
-      "baseURL": "https://bedrock-runtime.<region>.amazonaws.com",
-      "awsProfile": "FIXME"
-    },
-    {
-      // Requires gcloud CLI to get authentication token
-      "name": "vertex-ai",
-      "variant": "default",
-      "baseURL": "https://aiplatform.googleapis.com/v1beta1/projects/<project>/locations/<location>",
-      // Optional
-      "account": "<service_account_email>"
-    }
   ],
   // Optional
   "tools": {
+    // askWeb: Searches the web to answer questions requiring up-to-date information or external sources.
     "askWeb": {
       "provider": "gemini",
-      "apiKey": "FIXME",
+      "apiKey": "<GEMINI_API_KEY>",
       "model": "gemini-3-flash-preview"
       // Optional
       // "baseURL": "<proxy_url>"
@@ -108,9 +94,11 @@ Create the configuration.
       // "account": "<service_account_email>"
     },
+    // askURL: Answers questions based on provided URL content.
+    //         Directly injecting URL content into context is not supported to prevent prompt injection.
     "askURL": {
       "provider": "gemini",
-      "apiKey": "FIXME"
+      "apiKey": "<GEMINI_API_KEY>",
       "model": "gemini-3-flash-preview"
       // Optional
       // "baseURL": "<proxy_url>"
@@ -129,7 +117,40 @@ Create the configuration.
 ```
 <details>
-<summary><b>Other provider examples</b></summary>
+<summary><b>Azure / Bedrock / Vertex AI provider examples</b></summary>
+```js
+{
+  "platforms": [
+    {
+      // Requires Azure CLI to get access token
+      "name": "azure",
+      "variant": "openai",
+      "baseURL": "https://<resource>.openai.azure.com/openai",
+      // Optional
+      "azureConfigDir": "/home/xxx/.azure-for-agent"
+    },
+    {
+      "name": "bedrock",
+      "variant": "default",
+      "baseURL": "https://bedrock-runtime.<region>.amazonaws.com",
+      "awsProfile": "<AWS_PROFILE>"
+    },
+    {
+      // Requires gcloud CLI to get authentication token
+      "name": "vertex-ai",
+      "variant": "default",
+      "baseURL": "https://aiplatform.googleapis.com/v1beta1/projects/<project>/locations/<location>",
+      // Optional
+      "account": "<service_account_email>"
+    }
+  ]
+}
+```
+</details>
+<details>
+<summary><b>OpenAI compatible provider examples</b></summary>
 ```js
 {
@@ -138,19 +159,19 @@ Create the configuration.
       "name": "openai-compatible",
       "variant": "ollama",
       "baseURL": "https://ollama.com",
-      "apiKey": "FIXME"
+      "apiKey": "<API_KEY>"
     },
     {
       "name": "openai-compatible",
       "variant": "huggingface",
       "baseURL": "https://router.huggingface.co",
-      "apiKey": "FIXME"
+      "apiKey": "<HUGGINGFACE_API_KEY>"
     },
     {
       "name": "openai-compatible",
       "variant": "fireworks",
       "baseURL": "https://api.fireworks.ai/inference",
-      "apiKey": "FIXME"
+      "apiKey": "<FIREWORKS_API_KEY>"
     }
   ]
 }
@@ -222,7 +243,7 @@ Create the configuration.
       "name": "bedrock",
       "variant": "jp",
       "baseURL": "https://bedrock-runtime.ap-northeast-1.amazonaws.com",
-      "awsProfile": "FIXME"
+      "awsProfile": "<AWS_PROFILE>"
     }
   ]
 }
@@ -442,7 +463,7 @@ The agent loads configuration files in the following order. Settings in later fi
     // ⚠️ Add this to config.local.json to avoid committing secrets to Git
     "slack": {
       "command": "npx",
-      "args": ["-y", "mcp-remote", "https://mcp.slack.com/mcp", "--header", "Authorization:Bearer FIXME"],
+      "args": ["-y", "mcp-remote", "https://mcp.slack.com/mcp", "--header", "Authorization:Bearer <SLACK_TOKEN>"],
     },
     "notion": {
       "command": "npx",
@@ -459,12 +480,18 @@ The agent loads configuration files in the following order. Settings in later fi
     // ⚠️ Add this to config.local.json to avoid committing secrets to Git
     "google_developer-knowledge": {
       "command": "npx",
-      "args": ["-y", "mcp-remote", "https://developerknowledge.googleapis.com/mcp", "--header", "X-Goog-Api-Key:FIXME"]
+      "args": ["-y", "mcp-remote", "https://developerknowledge.googleapis.com/mcp", "--header", "X-Goog-Api-Key:<GOOGLE_API_KEY>"]
     }
   },
   // Override default notification command
   // "notifyCmd": "/path/to/notification-command"
+  // (Optional) Voice input. See "Voice Input" below.
+  // "voiceInput": {
+  //   "provider": "openai",
+  //   "apiKey": "<OPENAI_API_KEY>"
+  // }
 }
 ```
 </details>
@@ -585,6 +612,53 @@ Example:
 plain install-claude-code-plugins
 ```
+## Voice Input
+Press **Ctrl-O** to start recording, and press it again to stop. Partial
+transcripts are inserted into the prompt as you speak so you can edit
+and send them like regular text.
+### Requirements
+- A recording command on `PATH`: `arecord`, `sox`, or `ffmpeg`.
+- An API key for the chosen provider.
+- Your host must have microphone access. The sandbox does not need to.
+### Providers
+**OpenAI Realtime** (default, recommended):
+```js
+{
+  "voiceInput": {
+    "provider": "openai",
+    "apiKey": "<OPENAI_API_KEY>"
+    // "model": "gpt-4o-transcribe",  // or "gpt-4o-mini-transcribe", "whisper-1"
+    // "language": "ja"               // ISO-639-1 code. Improves accuracy and latency.
+  }
+}
+```
+**Gemini Live** (preview API; model names and pricing may change):
+```js
+{
+  "voiceInput": {
+    "provider": "gemini",
+    "apiKey": "<GEMINI_API_KEY>"
+    // "model": "gemini-3.1-flash-live-preview",
+    // "language": "ja"
+  }
+}
+```
+### Options
+- `toggleKey` — Rebind the toggle. Accepts `"ctrl-<char>"` where `<char>`
+  is a letter (a-z) or one of `[ \ ] ^ _`. Defaults to `"ctrl-o"`.
+- `recorder` — Override recorder auto-detection. Must write raw 16-bit
+  little-endian mono PCM to stdout at 24 kHz (OpenAI) or 16 kHz (Gemini).
 ## Development
 ```sh
@@ -623,9 +697,9 @@ npm publish --access public
 ```sh
 # IAM Identity Center
-identity_center_instance_arn="FIXME" # e.g., arn:aws:sso:::instance/ssoins-xxxxxxxxxxxxxxxx"
-identity_store_id=FIXME
-aws_account_id=FIXME
+identity_center_instance_arn="<IDENTITY_CENTER_INSTANCE_ARN>" # e.g., arn:aws:sso:::instance/ssoins-xxxxxxxxxxxxxxxx
+identity_store_id="<IDENTITY_STORE_ID>"
+aws_account_id="<AWS_ACCOUNT_ID>"
 # Create a permission set
 permission_set_arn=$(aws sso-admin create-permission-set \
@@ -660,10 +734,10 @@ aws sso-admin put-inline-policy-to-permission-set \
   --inline-policy "$policy"
 # Create an SSO user
-sso_user_name=FIXME
-sso_user_email=FIXME
-sso_user_family_name=FIXME
-sso_user_given_name=FIXME
+sso_user_name="<SSO_USER_NAME>"
+sso_user_email="<SSO_USER_EMAIL>"
+sso_user_family_name="<SSO_USER_FAMILY_NAME>"
+sso_user_given_name="<SSO_USER_GIVEN_NAME>"
 user_id=$(aws identitystore create-user \
   --identity-store-id "$identity_store_id" \
@@ -704,8 +778,8 @@ aws bedrock-runtime invoke-model \
 <summary><b>Azure - Microsoft Foundry</b></summary>
 ```sh
-resource_group=FIXME
-account_name=FIXME # resource name
+resource_group="<RESOURCE_GROUP>"
+account_name="<ACCOUNT_NAME>" # resource name
 # Create a service principal
 service_principal=$(az ad sp create-for-rbac --name "CodingAgentServicePrincipal" --skip-assignment)
@@ -737,10 +811,10 @@ az login --service-principal -u "$app_id" -p "$app_secret" --tenant "$tenant_id"
 <summary><b>Google Cloud Vertex AI</b></summary>
 ```sh
-project_id=FIXME
-service_account_name=FIXME
+project_id="<PROJECT_ID>"
+service_account_name="<SERVICE_ACCOUNT_NAME>"
 service_account_email="${service_account_name}@${project_id}.iam.gserviceaccount.com"
-your_account_email=FIXME
+your_account_email="<YOUR_ACCOUNT_EMAIL>"
 # Create a service account
 gcloud iam service-accounts create "$service_account_name" \

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@iinm/plain-agent",
-  "version": "1.7.15",
+  "version": "1.7.17",
   "description": "A lightweight CLI-based coding agent",
   "license": "MIT",
   "type": "module",

package/src/cliFormatter.mjs CHANGED Viewed

@@ -11,6 +11,49 @@
 import { styleText } from "node:util";
 import { createPatch } from "diff";
+/** Length above which a single-line arg forces block-form rendering. */
+const ARG_BLOCK_LENGTH_THRESHOLD = 60;
+/**
+ * Format an args array for display.
+ * Uses compact JSON for short single-line args; switches to a YAML-style
+ * block form when any arg contains newlines or exceeds
+ * {@link ARG_BLOCK_LENGTH_THRESHOLD} characters so that long scripts passed
+ * to `bash -c`, `python -c`, `node -e`, etc. stay readable.
+ * @param {unknown} args
+ * @returns {string}
+ */
+export function formatArgs(args) {
+  if (!Array.isArray(args) || args.length === 0) {
+    return `args: ${JSON.stringify(args ?? [])}`;
+  }
+  const needsBlock = args.some(
+    (a) =>
+      typeof a === "string" &&
+      (a.includes("\n") || a.length > ARG_BLOCK_LENGTH_THRESHOLD),
+  );
+  if (!needsBlock) {
+    return `args: ${JSON.stringify(args)}`;
+  }
+  const lines = ["args:"];
+  for (const arg of args) {
+    if (
+      typeof arg === "string" &&
+      (arg.includes("\n") || arg.length > ARG_BLOCK_LENGTH_THRESHOLD)
+    ) {
+      lines.push("  - |");
+      for (const line of arg.split("\n")) {
+        lines.push(`      ${line}`);
+      }
+    } else {
+      lines.push(`  - ${JSON.stringify(arg)}`);
+    }
+  }
+  return lines.join("\n");
+}
 /**
  * Format tool use for display.
  * @param {MessageContentToolUse} toolUse
@@ -25,7 +68,7 @@ export function formatToolUse(toolUse) {
     return [
       `tool: ${toolName}`,
       `command: ${JSON.stringify(execCommandInput.command)}`,
-      `args: ${JSON.stringify(execCommandInput.args)}`,
+      formatArgs(execCommandInput.args),
     ].join("\n");
   }
@@ -82,7 +125,7 @@ export function formatToolUse(toolUse) {
     return [
       `tool: ${toolName}`,
       `command: ${tmuxCommandInput.command}`,
-      `args: ${JSON.stringify(tmuxCommandInput.args)}`,
+      formatArgs(tmuxCommandInput.args),
     ].join("\n");
   }

package/src/cliInteractive.mjs CHANGED Viewed

@@ -1,6 +1,7 @@
 /**
  * @import { UserEventEmitter, AgentEventEmitter, AgentCommands } from "./agent"
  * @import { ClaudeCodePlugin } from "./claudeCodePlugin.mjs"
+ * @import { VoiceInputConfig, VoiceSession } from "./voiceInput.mjs"
  */
 import readline from "node:readline";
@@ -13,8 +14,10 @@ import {
   printMessage,
 } from "./cliFormatter.mjs";
 import { createInterruptTransform } from "./cliInterruptTransform.mjs";
+import { createMuteTransform } from "./cliMuteTransform.mjs";
 import { createPasteHandler } from "./cliPasteTransform.mjs";
 import { notify } from "./utils/notify.mjs";
+import { parseVoiceToggleKey, startVoiceSession } from "./voiceInput.mjs";
 const HELP_MESSAGE = [
   "Commands:",
@@ -57,6 +60,7 @@ const HELP_MESSAGE = [
  * @property {boolean} sandbox
  * @property {() => Promise<void>} onStop
  * @property {ClaudeCodePlugin[]} [claudeCodePlugins]
+ * @property {VoiceInputConfig} [voiceInput]
  */
 /**
@@ -72,6 +76,7 @@ export function startInteractiveSession({
   sandbox,
   onStop,
   claudeCodePlugins,
+  voiceInput,
 }) {
   /** @type {{ turn: boolean, multiLineBuffer: string[] | null, subagentName: string }} */
   const state = {
@@ -80,6 +85,16 @@ export function startInteractiveSession({
     subagentName: "",
   };
+  /**
+   * Active voice input session, or null when not recording.
+   * @type {{ session: VoiceSession, startCursor: number, transcriptLength: number } | null}
+   */
+  let voice = null;
+  // Parse the voice toggle key once at startup so misconfiguration fails
+  // loudly instead of silently falling back.
+  const voiceToggle = parseVoiceToggleKey(voiceInput?.toggleKey);
   const getCliPrompt = (subagentName = "", flashMessage = "") =>
     [
       "",
@@ -136,7 +151,100 @@ export function startInteractiveSession({
     cli.prompt();
   };
+  const stopVoiceSession = async () => {
+    if (!voice) return;
+    const current = voice;
+    voice = null;
+    await current.session.stop();
+    cli.setPrompt(currentCliPrompt);
+    // @ts-expect-error - internal property
+    cli._refreshLine?.();
+  };
+  const handleVoiceToggle = () => {
+    // Ignore while the agent is working.
+    if (!state.turn) return;
+    if (voice) {
+      stopVoiceSession();
+      return;
+    }
+    if (!voiceInput) {
+      cli.setPrompt(
+        getCliPrompt(
+          state.subagentName,
+          styleText(
+            "yellow",
+            `Voice input not configured. Set \`voiceInput\` in your config to enable ${voiceToggle.label}.`,
+          ),
+        ),
+      );
+      cli.prompt(true);
+      return;
+    }
+    const startCursor = cli.cursor;
+    const session = startVoiceSession({
+      config: voiceInput,
+      callbacks: {
+        onTranscript: (delta) => {
+          if (!voice) return;
+          const insertAt = voice.startCursor + voice.transcriptLength;
+          // Insert delta at the recording's insertion point. User input is
+          // swallowed while recording, so the buffer around `insertAt` is
+          // stable.
+          const before = cli.line.slice(0, insertAt);
+          const after = cli.line.slice(insertAt);
+          // `line` and `cursor` are declared readonly in the Node typings but
+          // are writable at runtime — the existing code already patches
+          // `_refreshLine` in the same way.
+          const mutableCli = /** @type {{ line: string, cursor: number }} */ (
+            /** @type {unknown} */ (cli)
+          );
+          mutableCli.line = before + delta + after;
+          mutableCli.cursor = insertAt + delta.length;
+          voice.transcriptLength += delta.length;
+          // @ts-expect-error - internal property
+          cli._refreshLine?.();
+        },
+        onError: (err) => {
+          voice = null;
+          cli.setPrompt(
+            getCliPrompt(
+              state.subagentName,
+              styleText("red", `Voice input error: ${err.message}`),
+            ),
+          );
+          cli.prompt(true);
+        },
+        onClose: () => {
+          if (!voice) return;
+          voice = null;
+          cli.setPrompt(currentCliPrompt);
+          // @ts-expect-error - internal property
+          cli._refreshLine?.();
+        },
+      },
+    });
+    voice = { session, startCursor, transcriptLength: 0 };
+    cli.setPrompt(
+      getCliPrompt(
+        state.subagentName,
+        styleText(["red", "bold"], `● REC  (${voiceToggle.label} to stop)`),
+      ),
+    );
+    // @ts-expect-error - internal property
+    cli._refreshLine?.();
+  };
   const handleCtrlC = () => {
+    // Stop voice recording first if active.
+    if (voice) {
+      stopVoiceSession();
+      return;
+    }
     // Agent turn: pause auto-approve; do not clear input.
     if (!state.turn) {
       agentCommands.pauseAutoApprove();
@@ -192,14 +300,20 @@ export function startInteractiveSession({
   };
   // Pre-readline pipeline:
-  //   stdin -> interrupt (Ctrl-C / Ctrl-D) -> paste (bracketed paste) -> readline
+  //   stdin -> interrupt (Ctrl-C / Ctrl-D) -> mute (voice recording) -> paste (bracketed paste) -> readline
   const interrupt = createInterruptTransform({
     onCtrlC: handleCtrlC,
     onCtrlD: handleCtrlD,
+    onVoiceToggle: handleVoiceToggle,
+    voiceToggleByte: voiceToggle.byte,
   });
+  // While a voice session is recording, swallow all stdin bytes other than
+  // Ctrl-C / Ctrl-D / the voice toggle key so transcript insertion stays
+  // consistent.
+  const mute = createMuteTransform({ isMuted: () => voice !== null });
   const paste = createPasteHandler();
-  process.stdin.pipe(interrupt).pipe(paste.transform);
+  process.stdin.pipe(interrupt).pipe(mute).pipe(paste.transform);
   // Enable bracketed paste mode
   if (process.stdout.isTTY) {

package/src/cliInterruptTransform.mjs CHANGED Viewed

@@ -1,19 +1,31 @@
 import { Transform } from "node:stream";
 /**
- * Create a Transform that intercepts Ctrl-C (0x03) and Ctrl-D (0x04). When
- * either byte is seen anywhere in a chunk, the corresponding callback is
- * invoked and the entire chunk is dropped so that downstream consumers (e.g.
+ * Create a Transform that intercepts Ctrl-C (0x03), Ctrl-D (0x04), and an
+ * optional "voice toggle" byte (default Ctrl-O, 0x0f). When one of those
+ * bytes is seen anywhere in a chunk, the corresponding callback is invoked
+ * and the entire chunk is dropped so that downstream consumers (e.g.
  * readline) never observe it. All other input flows through unchanged.
  *
- * If both bytes appear in the same chunk, Ctrl-C is handled first.
+ * Priority when multiple handled bytes appear in the same chunk:
+ * Ctrl-C > Ctrl-D > voice toggle.
  *
  * @param {object} handlers
  * @param {() => void} handlers.onCtrlC - Called when Ctrl-C is detected
  * @param {() => void} handlers.onCtrlD - Called when Ctrl-D is detected
+ * @param {() => void} [handlers.onVoiceToggle]
+ *   Called when the voice toggle byte is detected.
+ * @param {number} [handlers.voiceToggleByte]
+ *   Byte value for the voice toggle key. Defaults to 0x0f (Ctrl-O).
  * @returns {Transform}
  */
-export function createInterruptTransform({ onCtrlC, onCtrlD }) {
+export function createInterruptTransform({
+  onCtrlC,
+  onCtrlD,
+  onVoiceToggle,
+  voiceToggleByte = 0x0f,
+}) {
+  const voiceToggleChar = String.fromCharCode(voiceToggleByte);
   return new Transform({
     transform(chunk, _encoding, callback) {
       const data = chunk.toString("utf8");
@@ -27,6 +39,11 @@ export function createInterruptTransform({ onCtrlC, onCtrlD }) {
         callback();
         return;
       }
+      if (onVoiceToggle && data.includes(voiceToggleChar)) {
+        onVoiceToggle();
+        callback();
+        return;
+      }
       this.push(chunk);
       callback();
     },

package/src/cliMuteTransform.mjs ADDED Viewed

@@ -0,0 +1,26 @@
+import { Transform } from "node:stream";
+/**
+ * Create a Transform that swallows all chunks while `isMuted()` returns true,
+ * and passes them through unchanged while it returns false.
+ *
+ * Intended to sit between `createInterruptTransform` and the paste handler so
+ * that callers can fully silence regular stdin input during special modes
+ * (e.g. while a voice input session is recording) without coupling that
+ * concern to the interrupt-detection logic.
+ *
+ * @param {object} options
+ * @param {() => boolean} options.isMuted
+ *   Called for each incoming chunk; when true the chunk is dropped.
+ * @returns {Transform}
+ */
+export function createMuteTransform({ isMuted }) {
+  return new Transform({
+    transform(chunk, _encoding, callback) {
+      if (!isMuted()) {
+        this.push(chunk);
+      }
+      callback();
+    },
+  });
+}

package/src/config.d.ts CHANGED Viewed

@@ -4,6 +4,7 @@ import { AskURLToolOptions } from "./tools/askURL.mjs";
 import { AskWebToolOptions } from "./tools/askWeb.mjs";
 import { ExecCommandSanboxConfig } from "./tools/execCommand";
 import { ClaudeCodePluginRepo } from "./claudeCodePlugin.mjs";
+import { VoiceInputConfig } from "./voiceInput.mjs";
 export type AppConfig = {
   model?: string;
@@ -21,6 +22,7 @@ export type AppConfig = {
   };
   mcpServers?: Record<string, MCPServerConfig>;
   notifyCmd?: string;
+  voiceInput?: VoiceInputConfig;
   claudeCodePlugins?: ClaudeCodePluginRepo[];
 };

package/src/config.mjs CHANGED Viewed

@@ -98,6 +98,9 @@ export async function loadAppConfig(options = {}) {
         ...(merged.claudeCodePlugins ?? []),
         ...(config.claudeCodePlugins ?? []),
       ],
+      voiceInput: config.voiceInput
+        ? { ...(merged.voiceInput ?? {}), ...config.voiceInput }
+        : merged.voiceInput,
     };
   }