npm - palmier - Versions diffs - 0.4.8 → 0.4.9 - Mend

palmier 0.4.8 → 0.4.9

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (12)

package/README.md +3 -68
package/dist/agents/agent-instructions.md +1 -1
package/dist/agents/gemini.js +5 -5
package/dist/commands/run.js +3 -3
package/dist/platform/windows.js +3 -2
package/dist/spawn-command.js +4 -1
package/package.json +1 -1
package/src/agents/agent-instructions.md +1 -1
package/src/agents/gemini.ts +5 -5
package/src/commands/run.ts +3 -3
package/src/platform/windows.ts +3 -2
package/src/spawn-command.ts +4 -1

package/README.md CHANGED Viewed

@@ -85,7 +85,9 @@ palmier sessions revoke-all
 The `init` command:
 - Detects installed agent CLIs (Claude Code, Gemini CLI, Codex CLI, GitHub Copilot) and caches the result
-- Saves host configuration to `~/.config/palmier/host.json`
+- Configures access modes (HTTP port, LAN access)
+- Shows a summary and asks for confirmation before making changes
+- Registers with the Palmier server, saves configuration to `~/.config/palmier/host.json`
 - Installs a background daemon (systemd user service on Linux, Registry Run key on Windows)
 - Auto-enters pair mode to connect your first device
@@ -128,76 +130,9 @@ palmier restart
 - **Tasks** are stored locally as Markdown files in a `tasks/` directory. Each task has a name, prompt, execution plan, and optional schedules (cron schedules or one-time dates).
 - **Plan generation** is automatic — when you create or update a task, the host invokes your chosen agent CLI to generate an execution plan and name.
 - **Schedules** are backed by systemd timers (Linux) or Task Scheduler (Windows). You can enable/disable them without deleting the task, and any task can still be run manually at any time.
-- **Task execution** uses the system scheduler on both platforms — `systemctl --user start` on Linux, `schtasks /run` on Windows. On Windows, tasks run via a VBS wrapper (`wscript.exe`) to avoid visible console windows. The daemon polls every 30 seconds to detect crashed tasks (processes that exited without updating status) and marks them as failed, broadcasting the failure to connected clients.
 - **Command-triggered tasks** — optionally specify a shell command (e.g., `tail -f /var/log/app.log`). Palmier runs the command continuously and invokes the agent for each line of stdout, passing it alongside your prompt. Useful for log monitoring, event-driven automation, and reactive workflows.
-- **Task confirmation** — tasks can optionally require your approval before running. You'll get a push notification (server mode) or a prompt in the PWA to confirm or abort.
-- **Conversational run history** — each run gets its own directory (`tasks/<id>/<timestamp>/`) with a `TASKRUN.md` file containing a conversational thread: assistant messages (agent output), user messages (input responses, permission grants, confirmations), and status entries (started, finished, failed, aborted, stopped). The agent runs inside the run directory, so each run's session files and artifacts are isolated. The PWA displays runs as a chat-like thread with follow-up support.
-- **Follow-up messages** — after a task run completes, users can send follow-up messages from the run detail view. The agent is invoked inline by the serve daemon (no new process spawning), and the response is appended to the same conversation thread.
-- **Real-time updates** — task status changes and result updates are pushed to connected PWA clients via NATS pub/sub (server mode) and/or SSE (local/LAN mode). The run detail view live-updates as the agent produces output. Events are scoped to specific runs.
 - **Agent HTTP endpoints** — the serve daemon exposes localhost-only endpoints (`/notify`, `/request-input`) that agents call to send push notifications and request user input during task execution.
-## NATS Subjects
-| Subject | Direction | Description |
-|---|---|---|
-| `host.<hostId>.rpc.<method>` | Client → Host | RPC request/reply (e.g., `task.list`, `task.create`) |
-| `host-event.<hostId>.<taskId>` | Host → Client | Real-time task events (`running-state`, `result-updated`, `confirm-request`, `permission-request`, `input-request`) |
-| `host.<hostId>.push.send` | Host → Server | Request server to deliver a push notification |
-| `pair.<code>` | Client → Host | OTP pairing request/reply |
-## Project Structure
-```
-src/
-  index.ts            # CLI entrypoint (commander setup)
-  config.ts           # Host configuration (read/write ~/.config/palmier)
-  rpc-handler.ts      # Transport-agnostic RPC handler (with session validation)
-  session-store.ts    # Session token management (~/.config/palmier/sessions.json)
-  nats-client.ts      # NATS connection helper
-  spawn-command.ts    # Shared helper for spawning CLI tools
-  task.ts             # Task file management
-  types.ts            # Shared type definitions
-  pending-requests.ts # In-memory registry for held HTTP connections (confirmation, permission, input)
-  events.ts           # Event broadcasting (NATS pub/sub or HTTP SSE)
-  agents/
-    agent.ts          # AgentTool interface, registry, and agent detection
-    shared-prompt.ts  # Agent instructions loader
-    agent-instructions.md  # System prompt injected into every agent invocation
-    claude.ts         # Claude Code agent implementation
-    gemini.ts         # Gemini CLI agent implementation
-    codex.ts          # Codex CLI agent implementation
-    copilot.ts        # GitHub Copilot agent implementation
-    openclaw.ts       # OpenClaw agent implementation
-  commands/
-    init.ts           # Interactive setup wizard (auto-pair)
-    pair.ts           # OTP code generation and pairing handler
-    sessions.ts       # Session token management CLI (list, revoke, revoke-all)
-    info.ts           # Print host connection info
-    serve.ts          # NATS + HTTP transport startup, crash detection polling
-    restart.ts        # Daemon restart (cross-platform)
-    run.ts            # Single task execution
-  platform/
-    platform.ts       # PlatformService interface
-    index.ts          # Platform factory (Linux vs Windows)
-    linux.ts          # Linux: systemd daemon, timers, systemctl task control
-    windows.ts        # Windows: Registry Run key, Task Scheduler, schtasks-based task control
-  transports/
-    nats-transport.ts # NATS subscription loop (host.<hostId>.rpc.>)
-    http-transport.ts # HTTP server with RPC, SSE, PWA reverse proxy, and internal event endpoints
-```
-## Agent HTTP Endpoints
-The serve daemon exposes localhost-only HTTP endpoints for agents during task execution. The port is baked into the agent's system prompt automatically.
-| Endpoint | Method | Description |
-|---|---|---|
-| `/notify` | POST | Send a push notification (requires server mode) |
-| `/request-input` | POST | Request user input; blocks until a response is provided |
-See [agent-instructions.md](src/agents/agent-instructions.md) for usage examples.
 ## Uninstalling
 To fully remove Palmier from a machine:

package/dist/agents/agent-instructions.md CHANGED Viewed

@@ -24,7 +24,7 @@ If the task fails because a tool was denied or you lack the required permissions
 The following HTTP endpoints are available at http://localhost:{{PORT}} during task execution. Use curl to call them.
-**Requesting user input** — When you need information from the user (credentials, questions, preferences, clarifications, etc.), do not guess, fail, or prompt via stdout. Instead, POST to `/request-input` with:
+**Requesting user input** — When you need information from the user (credentials, answers to questions, preferences, clarifications, etc.), do not guess, fail, or prompt via stdout, even in a non-interactive environment. Instead, POST to `/request-input` with:
 ```json
 {"taskId":"{{TASK_ID}}","descriptions":["question 1","question 2"]}
 ```

package/dist/agents/gemini.js CHANGED Viewed

@@ -5,12 +5,12 @@ export class GeminiAgent {
     getPlanGenerationCommandLine(prompt) {
         return {
             command: "gemini",
-            args: ["--approval-mode", "auto_edit", "--prompt", prompt],
+            args: ["--prompt", prompt],
         };
     }
     getTaskRunCommandLine(task, followupPrompt, extraPermissions) {
-        const fullPrompt = followupPrompt ?? (getAgentInstructions(task.frontmatter.id) + "\n\n" + (task.body || task.frontmatter.user_prompt));
-        const args = ["--allowed-tools", "web_fetch"];
+        const prompt = followupPrompt ?? (getAgentInstructions(task.frontmatter.id) + "\n\n" + (task.body || task.frontmatter.user_prompt));
+        const args = ["--approval-mode", "auto_edit", "--allowed-tools", "web_fetch"];
         const allPerms = [...(task.frontmatter.permissions ?? []), ...(extraPermissions ?? [])];
         if (allPerms.length > 0) {
             for (const p of allPerms) {
@@ -20,8 +20,8 @@ export class GeminiAgent {
         if (followupPrompt) {
             args.push("--resume");
         } // continue mode for followups
-        args.push("--prompt", "-"); // read prompt from stdin
-        return { command: "gemini", args, stdin: fullPrompt };
+        args.push("--prompt", prompt);
+        return { command: "gemini", args };
     }
     async init() {
         try {

package/dist/commands/run.js CHANGED Viewed

@@ -16,7 +16,7 @@ import { publishHostEvent } from "../events.js";
  * The `invokeTask` is the ParsedTask whose prompt is passed to the agent
  * (for command-triggered mode this is the per-line augmented task).
  */
-async function invokeAgentWithContinuation(ctx, invokeTask) {
+async function invokeAgentWithRetries(ctx, invokeTask) {
     // eslint-disable-next-line no-constant-condition
     while (true) {
         const { command, args, stdin } = ctx.agent.getTaskRunCommandLine(invokeTask, undefined, ctx.transientPermissions);
@@ -174,7 +174,7 @@ export async function runCommand(taskId) {
                 time: Date.now(),
                 content: task.body || task.frontmatter.user_prompt,
             });
-            const result = await invokeAgentWithContinuation(ctx, task);
+            const result = await invokeAgentWithRetries(ctx, task);
             const outcome = resolveOutcome(taskDir, result.outcome);
             appendRunMessage(taskDir, runId, { role: "status", time: Date.now(), content: "", type: outcome });
             await publishTaskEvent(nc, config, taskDir, taskId, outcome, taskName, runId);
@@ -252,7 +252,7 @@ async function runCommandTriggeredMode(ctx) {
             frontmatter: { ...ctx.task.frontmatter, user_prompt: perLinePrompt },
             body: "",
         };
-        const result = await invokeAgentWithContinuation(ctx, perLineTask);
+        const result = await invokeAgentWithRetries(ctx, perLineTask);
         if (result.outcome === "finished") {
             invocationsSucceeded++;
         }

package/dist/platform/windows.js CHANGED Viewed

@@ -123,8 +123,9 @@ export class WindowsPlatform {
         // Write a VBS launcher that starts the daemon with no visible console window.
         const vbs = `CreateObject("WScript.Shell").Run """${process.execPath}"" ""${script}"" serve", 0, False`;
         fs.writeFileSync(DAEMON_VBS_FILE, vbs, "utf-8");
-        const wscript = `${process.env.SYSTEMROOT || "C:\\Windows"}\\System32\\wscript.exe`;
-        const child = nodeSpawn(wscript, [DAEMON_VBS_FILE], {
+        // Use `cmd /c start` to break out of the SSH session's job object.
+        // Without this, the daemon is killed when the SSH session disconnects.
+        const child = nodeSpawn("cmd", ["/c", "start", "/b", "wscript.exe", DAEMON_VBS_FILE], {
             detached: true,
             stdio: "ignore",
             windowsHide: true,

package/dist/spawn-command.js CHANGED Viewed

@@ -58,7 +58,10 @@ export function spawnCommand(command, args, opts) {
             if (opts.echoStdout)
                 process.stdout.write(d);
         });
-        child.stderr.on("data", (d) => process.stderr.write(d));
+        child.stderr.on("data", (d) => {
+            chunks.push(d);
+            process.stderr.write(d);
+        });
         let timer;
         if (opts.timeout) {
             timer = setTimeout(() => {

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "palmier",
-  "version": "0.4.8",
+  "version": "0.4.9",
   "description": "Palmier host CLI - provisions, executes tasks, and serves NATS RPC",
   "license": "Apache-2.0",
   "author": "Hongxu Cai",

package/src/agents/agent-instructions.md CHANGED Viewed

@@ -24,7 +24,7 @@ If the task fails because a tool was denied or you lack the required permissions
 The following HTTP endpoints are available at http://localhost:{{PORT}} during task execution. Use curl to call them.
-**Requesting user input** — When you need information from the user (credentials, questions, preferences, clarifications, etc.), do not guess, fail, or prompt via stdout. Instead, POST to `/request-input` with:
+**Requesting user input** — When you need information from the user (credentials, answers to questions, preferences, clarifications, etc.), do not guess, fail, or prompt via stdout, even in a non-interactive environment. Instead, POST to `/request-input` with:
 ```json
 {"taskId":"{{TASK_ID}}","descriptions":["question 1","question 2"]}
 ```

package/src/agents/gemini.ts CHANGED Viewed

@@ -8,13 +8,13 @@ export class GeminiAgent implements AgentTool {
   getPlanGenerationCommandLine(prompt: string): CommandLine {
     return {
       command: "gemini",
-      args: ["--approval-mode", "auto_edit", "--prompt", prompt],
+      args: ["--prompt", prompt],
     };
   }
   getTaskRunCommandLine(task: ParsedTask, followupPrompt?: string, extraPermissions?: RequiredPermission[]): CommandLine {
-    const fullPrompt = followupPrompt ?? (getAgentInstructions(task.frontmatter.id) + "\n\n" + (task.body || task.frontmatter.user_prompt));
-    const args = ["--allowed-tools", "web_fetch"];
+    const prompt = followupPrompt ?? (getAgentInstructions(task.frontmatter.id) + "\n\n" + (task.body || task.frontmatter.user_prompt));
+    const args = ["--approval-mode", "auto_edit", "--allowed-tools", "web_fetch"];
     const allPerms = [...(task.frontmatter.permissions ?? []), ...(extraPermissions ?? [])];
     if (allPerms.length > 0) {
@@ -24,9 +24,9 @@ export class GeminiAgent implements AgentTool {
     }
     if (followupPrompt) {args.push("--resume");} // continue mode for followups
-    args.push("--prompt", "-"); // read prompt from stdin
+    args.push("--prompt", prompt);
-    return { command: "gemini", args, stdin: fullPrompt };
+    return { command: "gemini", args };
   }
   async init(): Promise<boolean> {

package/src/commands/run.ts CHANGED Viewed

@@ -41,7 +41,7 @@ interface InvocationResult {
  * The `invokeTask` is the ParsedTask whose prompt is passed to the agent
  * (for command-triggered mode this is the per-line augmented task).
  */
-async function invokeAgentWithContinuation(
+async function invokeAgentWithRetries(
   ctx: InvocationContext,
   invokeTask: ParsedTask,
 ): Promise<InvocationResult> {
@@ -226,7 +226,7 @@ export async function runCommand(taskId: string): Promise<void> {
         content: task.body || task.frontmatter.user_prompt,
       });
-      const result = await invokeAgentWithContinuation(ctx, task);
+      const result = await invokeAgentWithRetries(ctx, task);
       const outcome = resolveOutcome(taskDir, result.outcome);
       appendRunMessage(taskDir, runId, { role: "status", time: Date.now(), content: "", type: outcome });
       await publishTaskEvent(nc, config, taskDir, taskId, outcome, taskName, runId);
@@ -313,7 +313,7 @@ async function runCommandTriggeredMode(
       body: "",
     };
-    const result = await invokeAgentWithContinuation(ctx, perLineTask);
+    const result = await invokeAgentWithRetries(ctx, perLineTask);
     if (result.outcome === "finished") {
       invocationsSucceeded++;
     } else {

package/src/platform/windows.ts CHANGED Viewed

@@ -147,8 +147,9 @@ export class WindowsPlatform implements PlatformService {
     const vbs = `CreateObject("WScript.Shell").Run """${process.execPath}"" ""${script}"" serve", 0, False`;
     fs.writeFileSync(DAEMON_VBS_FILE, vbs, "utf-8");
-    const wscript = `${process.env.SYSTEMROOT || "C:\\Windows"}\\System32\\wscript.exe`;
-    const child = nodeSpawn(wscript, [DAEMON_VBS_FILE], {
+    // Use `cmd /c start` to break out of the SSH session's job object.
+    // Without this, the daemon is killed when the SSH session disconnects.
+    const child = nodeSpawn("cmd", ["/c", "start", "/b", "wscript.exe", DAEMON_VBS_FILE], {
       detached: true,
       stdio: "ignore",
       windowsHide: true,

package/src/spawn-command.ts CHANGED Viewed

@@ -106,7 +106,10 @@ export function spawnCommand(
       chunks.push(d);
       if (opts.echoStdout) process.stdout.write(d);
     });
-    child.stderr!.on("data", (d: Buffer) => process.stderr.write(d));
+    child.stderr!.on("data", (d: Buffer) => {
+      chunks.push(d);
+      process.stderr.write(d);
+    });
     let timer: ReturnType<typeof setTimeout> | undefined;
     if (opts.timeout) {