@ai-dev-methodologies/rlp-desk 0.14.6 → 0.15.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/package.json CHANGED
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "@ai-dev-methodologies/rlp-desk",
3
- "version": "0.14.6",
3
+ "version": "0.15.1",
4
4
  "description": "Fresh-context iterative loops for Claude Code — autonomous task completion with independent verification",
5
5
  "scripts": {
6
6
  "postinstall": "node scripts/postinstall.js",
@@ -33,6 +33,8 @@ const runtimeSources = [
33
33
  ["docs/rlp-desk/protocol-reference.md", path.join(docsDir, "rlp-desk", "protocol-reference.md")],
34
34
  ["docs/rlp-desk/TODO-verification-next.md", path.join(docsDir, "rlp-desk", "TODO-verification-next.md")],
35
35
  ["docs/rlp-desk/multi-mission-orchestration.md", path.join(docsDir, "rlp-desk", "multi-mission-orchestration.md")],
36
+ // Plan v6 PR-0a: signal protocol documentation (Architect/Critic codex iter 6).
37
+ ["docs/rlp-desk/signal-protocol.md", path.join(docsDir, "rlp-desk", "signal-protocol.md")],
36
38
  ];
37
39
  // v0.14.0: legacy-deletion list cleared. The Node-canonical era (v5.7+)
38
40
  // removed zsh after install; v0.14.0 reverts that — the zsh runner is the
@@ -189,7 +189,7 @@ Tell the user:
189
189
  /rlp-desk run <actual-slug> --debug
190
190
 
191
191
  # Full options reference:
192
- # --mode agent|tmux (default: agent)
192
+ # --mode native|tmux (default: native; legacy `agent` redirects to native)
193
193
  # --worker-model MODEL haiku|sonnet|opus or gpt-5.5:high|spark:high (default: haiku)
194
194
  # --lock-worker-model disable auto model upgrade
195
195
  # --verifier-model MODEL per-US verifier (default: sonnet)
@@ -217,14 +217,14 @@ Tell the user:
217
217
  # ★ Recommended: tmux mode + claude-only (real-time visibility):
218
218
  /rlp-desk run <actual-slug> --mode tmux --debug
219
219
 
220
- # Agent mode:
221
- /rlp-desk run <actual-slug> --debug
220
+ # Native Agent() mode (slash leader, short / interactive campaigns):
221
+ /rlp-desk run <actual-slug> --mode native --debug
222
222
 
223
223
  # Install codex for cost savings + cross-engine blind-spot coverage:
224
224
  npm install -g @openai/codex
225
225
 
226
226
  # Full options reference:
227
- # --mode agent|tmux (default: agent)
227
+ # --mode native|tmux (default: native; legacy `agent` redirects to native)
228
228
  # --worker-model MODEL haiku|sonnet|opus (default: haiku)
229
229
  # --lock-worker-model disable auto model upgrade
230
230
  # --verifier-model MODEL per-US verifier (default: sonnet)
@@ -252,7 +252,7 @@ Tell the user:
252
252
  **YOU are the leader. Do NOT delegate leadership.**
253
253
 
254
254
  Options (parse from `$ARGUMENTS`):
255
- - `--mode agent|tmux` (default: `agent`) — execution mode
255
+ - `--mode native|tmux` (default: `native`) — execution mode. `native` = slash command is the leader, calls `Agent(...)` (claude) and `Bash("codex exec ...")` (codex). `tmux` = slash command spawns the zsh runner via `node run.mjs --mode tmux`. Legacy `--mode agent` typed against the slash command emits a deprecation notice and redirects to `--mode native` (NOT to be confused with `node run.mjs --mode agent`, which is the deprecated Node-leader alpha — see "Direct Node CLI invocation" below).
256
256
  - `--worker-model MODEL` (default: `haiku`) — Worker model. Format: `model` = claude engine, `model:reasoning` = codex engine. Examples: `haiku`, `sonnet`, `opus`, `spark:high`, `gpt-5.5:high`. Parsed by `parse_model_flag()` which auto-splits engine/model/reasoning.
257
257
  - `--lock-worker-model` — disable automatic model upgrade on failure. Worker stays on the specified model regardless of consecutive failures.
258
258
  - `--verifier-model MODEL` (default: `sonnet`) — per-US verification model. Campaign-fixed (no progressive upgrade). Lighter than final verifier.
@@ -284,20 +284,26 @@ Cross-project aggregation: scan `~/.claude/ralph-desk/analytics/` and read each
284
284
 
285
285
  ### Mode Selection
286
286
 
287
- Parse the `--mode` flag. If absent or `agent`, use the Agent() path below. If `tmux`, use the Tmux path.
287
+ Parse the `--mode` flag. Slash command canonical labels:
288
+
289
+ - `--mode native` (default): **Native Agent() path** below. The slash command IS the leader. It calls `Agent(description=…, model=<m>, mode="bypassPermissions", prompt=…)` for claude workers/verifiers and `Bash("codex exec --model <m> --reasoning-effort <r> <prompt>")` for codex workers/verifiers.
290
+ - `--mode tmux`: **zsh runner path** below. The slash command shells out to `node ~/.claude/ralph-desk/node/run.mjs run --mode tmux …` which spawns `run_ralph_desk.zsh` as a subprocess.
288
291
 
289
- > **v0.14.0 stability tiers:**
290
- > - `--mode tmux` is the **stable, production** path. The Node leader (`run.mjs`)
291
- > now routes tmux invocations to `~/.claude/ralph-desk/run_ralph_desk.zsh`
292
- > as a subprocess — that runner has the full safety net (heartbeat,
293
- > copy-mode guard, prompt-stall, no-progress detection, claude model
294
- > upgrade chain). Recommend this for autonomous campaigns.
295
- > - `--mode agent` is **alpha** (Node-native LLM-driven Leader). The runner
296
- > emits a stderr warning when this mode is invoked.
292
+ Legacy `--mode agent` typed against this slash command emits a deprecation notice and redirects to `--mode native`. **Do NOT confuse `/rlp-desk run --mode agent`** (slash command, redirects to Native Agent()) **with** `node run.mjs run --mode agent` (deprecated Node-leader alpha, direct CLI invocation, unrelated code path — see "Direct Node CLI invocation" below).
293
+
294
+ > **Stability tiers:**
295
+ > - `--mode tmux` is the **stable, production** path. The slash command spawns
296
+ > the Node leader, which spawns `run_ralph_desk.zsh` — the zsh runner has the
297
+ > full safety net (heartbeat, copy-mode guard, prompt-stall, no-progress
298
+ > detection, claude model upgrade chain). Recommend this for autonomous
299
+ > campaigns.
300
+ > - `--mode native` is **for short / interactive campaigns**. Native Agent()
301
+ > has no timeout API (platform constraint). Long-running autonomous campaigns
302
+ > SHOULD use `--mode tmux`.
297
303
 
298
304
  #### Tmux Mode (`--mode tmux`)
299
305
 
300
- When `--mode tmux` is specified (v0.14.0+: `run.mjs` accepts the same flags as before but spawns `run_ralph_desk.zsh` as a subprocess and inherits stdio. Flywheel and self-verification flags are not honored under tmux mode — they require `--mode agent`):
306
+ When `--mode tmux` is specified (v0.14.0+: `run.mjs` accepts the same flags as before but spawns `run_ralph_desk.zsh` as a subprocess and inherits stdio. Flywheel and self-verification flags are not honored under tmux mode — they currently require the deprecated Node-leader direct-CLI path `node run.mjs --mode agent` (see "Direct Node CLI invocation" below). Native Agent() port is a post-Node-leader-retirement task):
301
307
 
302
308
  1. **Validate scaffold** — same as Agent() mode: check `.rlp-desk/prompts/<slug>.worker.prompt.md` etc.
303
309
  2. **Check sentinels** — same as Agent() mode.
@@ -331,7 +337,7 @@ node ~/.claude/ralph-desk/node/run.mjs run '<slug>' \
331
337
 
332
338
  **Env-var translation (v5.7 §4.1)**: the slash command historically built `LANE_MODE=strict zsh ...` and `TEST_DENSITY_MODE=strict zsh ...` from CLI flags. The Node leader uses CLI flags instead — translate `--lane-strict` and `--test-density-strict` into the corresponding flags. Direct env-var users (running zsh directly) are unaffected.
333
339
 
334
- 6. **If the Node leader exits with error** — report the error to the user and STOP. Do NOT attempt to work around it. Do NOT create tmux sessions yourself. Do NOT re-launch in a different way. Tell the user what went wrong and suggest `--mode agent` as alternative.
340
+ 6. **If the Node leader exits with error** — report the error to the user and STOP. Do NOT attempt to work around it. Do NOT create tmux sessions yourself. Do NOT re-launch in a different way. Tell the user what went wrong and suggest `--mode native` (slash command Native Agent() path) as alternative.
335
341
  7. **If successful** — tell the user the tmux session has been started. The Node leader takes over as the deterministic Leader. No Agent() calls are made in tmux mode.
336
342
 
337
343
  **IMPORTANT RULES:**
@@ -339,35 +345,36 @@ node ~/.claude/ralph-desk/node/run.mjs run '<slug>' \
339
345
  - MUST launch with `run_in_background: true` so `/rlp-desk` returns control immediately while preserving live tmux visibility.
340
346
  - Run-in-background is used so the shell can keep the command visible and keep the pane layout stable for status checks and completion flow.
341
347
  - Do NOT kill panes after completion. Panes stay alive for inspection. User cleans up with `/rlp-desk clean <slug> --kill-session`.
342
- - v0.14.0: `--with-self-verification`, `--flywheel`, and `--flywheel-guard` are **not honored** under `--mode tmux` — the zsh runner has no SV/flywheel implementation. The Node leader emits a stderr WARNING listing the dropped flags. For SV/flywheel, use `--mode agent` (alpha).
343
- - The slash command always invokes `node ~/.claude/ralph-desk/node/run.mjs run --mode tmux ...`. Do NOT invoke `~/.claude/ralph-desk/run_ralph_desk.zsh` directly — the Node router resolves the runner path, runs legacy detection, and surfaces actionable errors when the runner is missing.
348
+ - v0.14.0: `--with-self-verification`, `--flywheel`, and `--flywheel-guard` are **not honored** under `--mode tmux` — the zsh runner has no SV/flywheel implementation. The Node leader emits a stderr WARNING listing the dropped flags. For SV/flywheel today, use the deprecated Node-leader direct-CLI path `node run.mjs --mode agent` (see "Direct Node CLI invocation" below). The slash command's Native Agent() (`--mode native`) does not yet implement SV/flywheel — port is a post-Node-leader-retirement task.
349
+ - **For `--mode tmux` only**: the slash command invokes `node ~/.claude/ralph-desk/node/run.mjs run --mode tmux ...`. Do NOT invoke `~/.claude/ralph-desk/run_ralph_desk.zsh` directly — the Node router resolves the runner path, runs legacy detection, and surfaces actionable errors when the runner is missing. **For `--mode native`**, the slash command does NOT invoke the Node CLI — it acts as the leader itself; see Native Agent() Mode section below.
344
350
 
345
351
  **tmux UX model (5 items):**
346
352
  - The session returns immediately after launch (`run_in_background: true`) so the command returns control to the parent CLI.
347
353
  - Worker/Verifier panes remain visible to the user during execution.
348
354
  - Users check progress with the **status command**: `/rlp-desk status <slug>`.
349
355
  - On completion, the command returns a completion notification before the loop ends.
350
- - Agent mode remains unchanged, and no tmux-specific behavior is mixed into Agent mode.
351
-
352
- #### Agent Mode (`--mode agent` or default — **alpha**)
353
-
354
- > **v0.14.0:** Agent mode is the alpha LLM-driven path. The Node port shipped
355
- > without zsh-equivalent safety nets (heartbeat, copy-mode guard, prompt-stall
356
- > timeout, no-progress detection, claude model upgrade chain). The runner
357
- > emits a stderr WARNING when agent mode is invoked. For production
358
- > autonomous campaigns, prefer `--mode tmux`.
359
-
360
- **Why Agent mode is structurally immune to Bug 4/5 (mid-execution prompt hang
361
- & A4 premature dispatch):** Worker/Verifier are dispatched as `Agent(...,
362
- mode="bypassPermissions", ...)`. The subagent runs non-interactively under
363
- the platform's bypass — it has no tmux pane, no TUI surface, and cannot
364
- surface a `[y/N]` prompt to the parent Leader. The auto-dismiss /
365
- prompt-stall / no-progress timeouts in `run_ralph_desk.zsh` (v5.7 §4.13.b /
366
- §4.16 / §4.17) are therefore tmux-only by design. **Tradeoff**: because
367
- `Agent()` has no timeout API, agent-mode iterations are not bounded — if
368
- the platform's `bypassPermissions` ever fails to suppress an interactive
369
- prompt at the SDK level, the call hangs indefinitely with no rlp-desk-side
370
- watchdog. Use `--mode tmux` if you need bounded execution time.
356
+ - Native Agent() mode remains unchanged, and no tmux-specific behavior is mixed into it.
357
+
358
+ #### Native Agent() Mode (`--mode native` or default)
359
+
360
+ The slash command IS the leader. Workers/Verifiers are spawned via `Agent(description=…, model=<m>, mode="bypassPermissions", prompt=…)` (claude) or `Bash("codex exec --model <m> --reasoning-effort <r> <prompt>")` (codex).
361
+
362
+ ### Native Agent() Safety Contract
363
+
364
+ This contract MUST be observed in every iteration of the leader loop below. Future PRs deleting any of these guarantees break the slash command's behavior.
365
+
366
+ 1. **Turn-keepalive**: every status report uses `Bash("echo '...'")` to emit messages. NEVER output plain text without an accompanying tool call. Plain text = turn ends = loop stops. (Mitigation for commit `29fd29b` platform constraint, permanent.)
367
+ 2. **no `subagent_type` parameter**: the `Agent(...)` call form is exactly `Agent(description=…, model=<m>, mode="bypassPermissions", prompt=…)`. Do NOT pass `subagent_type`. (Mitigation for commit `920a31c`: `subagent_type="executor"` overrode `bypassPermissions` and surfaced a permission popup; permanent.)
368
+ 3. **`mode="bypassPermissions"` mandatory**: every claude `Agent()` worker/verifier dispatch must include `mode="bypassPermissions"`.
369
+ 4. **Long-running campaigns: prefer `--mode tmux`** for production. Native Agent() has no timeout API (platform constraint) — if `bypassPermissions` fails to suppress an interactive prompt at the SDK level, the call hangs indefinitely with no rlp-desk-side watchdog.
370
+
371
+ **Why Native Agent() is structurally immune to Bug 4/5 (mid-execution prompt hang & A4 premature dispatch)**: Worker/Verifier run non-interactively under the platform's bypass — they have no tmux pane, no TUI surface, and cannot surface a `[y/N]` prompt to the parent Leader. The auto-dismiss / prompt-stall / no-progress timeouts in `run_ralph_desk.zsh` (v5.7 §4.13.b / §4.16 / §4.17) are therefore tmux-only by design.
372
+
373
+ **Tradeoff**: because `Agent()` has no timeout API, Native Agent() iterations are not bounded — if the platform's `bypassPermissions` ever fails to suppress an interactive prompt at the SDK level, the call hangs indefinitely with no rlp-desk-side watchdog. Use `--mode tmux` if you need bounded execution time.
374
+
375
+ #### Direct Node CLI invocation (`node run.mjs run <slug> --mode agent` — deprecated alpha)
376
+
377
+ Direct invocation of `node ~/.claude/ralph-desk/node/run.mjs run <slug> --mode agent` is **the deprecated Node-leader alpha path**. This is unrelated to the slash command's Native Agent() path above — different code, different leader, different lifecycle. The Node leader currently retains SV/flywheel implementations not yet ported to Native Agent(). The Node CLI emits a deprecation banner on this mode and is scheduled for hard-error in the next major release. For production tmux orchestration, use `--mode tmux`. For Claude Code Native Agent() campaigns, use `/rlp-desk run <slug> --mode native` from a Claude Code session.
371
378
 
372
379
  ### Preparation
373
380
  1. Validate scaffold: `.rlp-desk/prompts/<slug>.worker.prompt.md` etc.
@@ -775,13 +782,13 @@ Example:
775
782
  ```
776
783
  /rlp-desk brainstorm <description> Plan before init (interactive)
777
784
  /rlp-desk init <slug> [objective] Create project scaffold
778
- /rlp-desk run <slug> [options] Run loop (agent=LLM leader, tmux=shell leader)
785
+ /rlp-desk run <slug> [options] Run loop (native=Native Agent() leader (slash), tmux=zsh leader (production); legacy `agent` redirects to `native` — direct Node CLI `--mode agent` is deprecated alpha)
779
786
  /rlp-desk status <slug> Show loop status
780
787
  /rlp-desk logs <slug> [N] Show iteration log
781
788
  /rlp-desk clean <slug> [--kill-session] Reset for re-run (--kill-session kills tmux)
782
789
 
783
790
  Run options:
784
- --mode agent|tmux Execution mode (default: agent)
791
+ --mode native|tmux Execution mode (default: native)
785
792
  --worker-model MODEL Worker model: haiku|sonnet|opus or gpt-5.5:high|spark:high (default: haiku)
786
793
  --lock-worker-model Disable auto model upgrade on failure
787
794
  --verifier-model MODEL per-US verifier (default: sonnet)
@@ -799,15 +806,18 @@ Run options:
799
806
 
800
807
  ## Architecture
801
808
 
802
- ### Agent Mode (default: `--mode agent`)
809
+ ### Native Agent() Mode (default: `--mode native`)
803
810
  ```
804
- [This session = LEADER (LLM)]
811
+ [This session = LEADER (LLM, slash command itself)]
805
812
 
806
- Agent()├──▶ [Worker: executor (fresh context)]
813
+ Agent()├──▶ [Worker: claude subagent (fresh context, mode="bypassPermissions")]
807
814
  │ └── reads desk files, implements, updates memory
808
815
 
809
- Agent()└──▶ [Verifier: executor (fresh context)]
810
- └── reads done-claim, runs checks, writes verdict
816
+ Agent()└──▶ [Verifier: claude subagent (fresh context, mode="bypassPermissions")]
817
+ └── reads done-claim, runs checks, writes verdict
818
+
819
+ Bash() ───▶ [Worker/Verifier: codex CLI subprocess]
820
+ └── `codex exec --model <m> --reasoning-effort <r> <prompt>`
811
821
  ```
812
822
 
813
823
  ### Tmux Mode (`--mode tmux`)
package/src/node/run.mjs CHANGED
@@ -48,14 +48,14 @@ function buildHelpText() {
48
48
  'Commands:',
49
49
  ' brainstorm <description> Plan before init (not implemented in the Node rewrite yet)',
50
50
  ' init <slug> [objective] Create project scaffold',
51
- ' run <slug> [options] Run loop (agent=LLM leader, tmux=shell leader)',
51
+ ' run <slug> [options] Run loop (tmux=zsh leader [production], agent=Node leader [deprecated alpha], native=slash-only error)',
52
52
  ' status <slug> Show loop status',
53
53
  ' logs <slug> [N] Show iteration log (not implemented in the Node rewrite yet)',
54
54
  ' clean <slug> [--kill-session] Reset for re-run (not implemented in the Node rewrite yet)',
55
55
  ' resume <slug> Resume loop (not implemented in the Node rewrite yet)',
56
56
  '',
57
57
  'Run Options:',
58
- ' --mode agent|tmux',
58
+ ' --mode tmux|agent|native (CLI: tmux=production, agent=deprecated, native=errors with redirect to slash command)',
59
59
  ' --worker-model MODEL',
60
60
  ' --lock-worker-model',
61
61
  ' --verifier-model MODEL',
@@ -358,10 +358,32 @@ async function runRunCommand(args, deps) {
358
358
  return runTmuxViaZsh(slug, options, deps);
359
359
  }
360
360
 
361
- // v0.14.0: agent mode is the alpha LLM-driven path. The Node port shipped
362
- // without zsh-equivalent safety nets (heartbeat, copy-mode guard,
363
- // prompt-stall timeout, no-progress detection, claude model upgrade chain).
364
- // Surface that explicitly so production users pick --mode tmux instead.
361
+ // P1.b (native-agent-revert plan v7): --mode native is slash-command-only.
362
+ // The Node CLI does not implement Native Agent() — that path lives in
363
+ // src/commands/rlp-desk.md and runs in a Claude Code session. Surface a
364
+ // hard error here so direct CLI invocation does not silently fall through
365
+ // to the deprecated Node-leader path.
366
+ if (options.mode === 'native') {
367
+ write(
368
+ deps.stderr,
369
+ 'ERROR: --mode native is slash-command-only. The Node CLI does not implement it.',
370
+ );
371
+ write(
372
+ deps.stderr,
373
+ 'Use `/rlp-desk run <slug> --mode native` from a Claude Code session,',
374
+ );
375
+ write(
376
+ deps.stderr,
377
+ 'or use `--mode tmux` (production) / `--mode agent` (deprecated alpha) for direct CLI invocation.',
378
+ );
379
+ return 2;
380
+ }
381
+
382
+ // P1.b: --mode agent (Node-leader alpha) is deprecated. The slash command's
383
+ // Native Agent() path (`/rlp-desk run --mode native`) is unrelated — different
384
+ // code, different leader. We keep the Node-leader behavior unchanged for
385
+ // backward compatibility but surface a strong deprecation banner so wrappers
386
+ // can migrate before the next major release hard-errors this mode.
365
387
  if (
366
388
  options.mode === 'agent'
367
389
  && !process.env.RLP_DESK_QUIET_WARNINGS
@@ -369,7 +391,23 @@ async function runRunCommand(args, deps) {
369
391
  ) {
370
392
  write(
371
393
  deps.stderr,
372
- 'WARNING: --mode agent is alpha. For production tmux orchestration, prefer --mode tmux (zsh-backed, stable).',
394
+ 'WARNING: --mode agent (Node-leader alpha) is deprecated.',
395
+ );
396
+ write(
397
+ deps.stderr,
398
+ 'This is the direct Node-CLI alpha path — UNRELATED to the slash command Native Agent() path (`/rlp-desk run --mode native`).',
399
+ );
400
+ write(
401
+ deps.stderr,
402
+ 'For production tmux orchestration, use `--mode tmux`.',
403
+ );
404
+ write(
405
+ deps.stderr,
406
+ 'For Claude Code Native Agent() campaigns, use `/rlp-desk run --mode native` from a Claude Code session.',
407
+ );
408
+ write(
409
+ deps.stderr,
410
+ 'This mode will hard-error in the next major release.',
373
411
  );
374
412
  }
375
413