pi-crew 0.2.2 → 0.2.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (354) hide show
  1. package/AGENTS.md +57 -32
  2. package/CHANGELOG.md +466 -413
  3. package/LICENSE +21 -21
  4. package/NOTICE.md +16 -16
  5. package/README.md +323 -323
  6. package/docs/FEATURE_INTAKE.md +126 -0
  7. package/docs/HARNESS.md +86 -0
  8. package/docs/HARNESS_BACKLOG.md +41 -0
  9. package/docs/TEST_MATRIX.md +49 -0
  10. package/docs/actions-reference.md +595 -595
  11. package/docs/architecture.md +180 -180
  12. package/docs/code-review-2026-05-11.md +592 -0
  13. package/docs/commands-reference.md +347 -347
  14. package/docs/comparison-pi-subagents-vs-pi-crew.md +303 -0
  15. package/docs/decisions/0001-durable-state.md +41 -0
  16. package/docs/decisions/0002-child-process-for-async.md +42 -0
  17. package/docs/decisions/0003-depth-guard.md +36 -0
  18. package/docs/decisions/0004-execfile-over-exec.md +34 -0
  19. package/docs/decisions/0005-no-parameter-properties.md +49 -0
  20. package/docs/decisions/0006-publish-bundled-esm.md +63 -0
  21. package/docs/decisions/0007-active-run-binary-index.md +54 -0
  22. package/docs/decisions/0008-child-pi-warm-pool.md +61 -0
  23. package/docs/decisions/README.md +23 -0
  24. package/docs/followup-plan-2026-05-12.md +463 -0
  25. package/docs/followup-review-2026-05-12.md +297 -0
  26. package/docs/followup-review-round3-2026-05-12.md +342 -0
  27. package/docs/followup-review-round4-2026-05-13.md +107 -0
  28. package/docs/implementation-plan-top3.md +333 -0
  29. package/docs/live-mailbox-runtime.md +36 -36
  30. package/docs/next-upgrade-roadmap.md +808 -808
  31. package/docs/oh-my-pi-research.md +509 -0
  32. package/docs/perf/baseline-2026-05.md +113 -0
  33. package/docs/perf/final-report-2026-05.md +206 -0
  34. package/docs/perf/sprint-1-report.md +71 -0
  35. package/docs/perf/sprint-2-report.md +81 -0
  36. package/docs/perf/sprint-2.5-report.md +53 -0
  37. package/docs/perf/sprint-3-report.md +36 -0
  38. package/docs/perf/sprint-4-report.md +47 -0
  39. package/docs/perf/sprint-5-report.md +51 -0
  40. package/docs/perf/sprint-6-report.md +94 -0
  41. package/docs/perf/sprint-7-report.md +74 -0
  42. package/docs/perf/upgrade-plan-2026-05.md +147 -0
  43. package/docs/pi-subagents3-deep-analysis.md +508 -0
  44. package/docs/product/README.md +31 -0
  45. package/docs/product/platform.md +27 -0
  46. package/docs/product/runtime-safety.md +37 -0
  47. package/docs/product/team-run.md +39 -0
  48. package/docs/product/team-tool.md +37 -0
  49. package/docs/publishing.md +65 -65
  50. package/docs/resource-formats.md +134 -134
  51. package/docs/runtime-analysis-child-vs-live.md +171 -0
  52. package/docs/runtime-flow.md +148 -148
  53. package/docs/runtime-migration-in-process-analysis.md +250 -0
  54. package/docs/stories/README.md +30 -0
  55. package/docs/stories/backlog.md +36 -0
  56. package/docs/templates/decision.md +27 -0
  57. package/docs/templates/story.md +44 -0
  58. package/docs/templates/validation-report.md +32 -0
  59. package/docs/usage.md +238 -238
  60. package/index.ts +7 -6
  61. package/install.mjs +65 -65
  62. package/package.json +107 -99
  63. package/schema.json +222 -222
  64. package/skills/child-pi-spawning/SKILL.md +213 -0
  65. package/skills/context-artifact-hygiene/SKILL.md +32 -0
  66. package/skills/event-log-tracing/SKILL.md +299 -0
  67. package/skills/git-master/SKILL.md +225 -24
  68. package/skills/live-agent-lifecycle/SKILL.md +192 -0
  69. package/skills/mailbox-interactive/SKILL.md +300 -19
  70. package/skills/model-routing-context/SKILL.md +94 -0
  71. package/skills/multi-perspective-review/SKILL.md +88 -0
  72. package/skills/read-only-explorer/SKILL.md +250 -26
  73. package/skills/safe-bash/SKILL.md +307 -21
  74. package/skills/verification-before-done/SKILL.md +11 -2
  75. package/skills/widget-rendering/SKILL.md +258 -0
  76. package/skills/workspace-isolation/SKILL.md +202 -0
  77. package/skills/worktree-isolation/SKILL.md +202 -18
  78. package/src/adapters/claude-adapter.ts +25 -25
  79. package/src/adapters/codex-adapter.ts +21 -21
  80. package/src/adapters/cursor-adapter.ts +17 -17
  81. package/src/adapters/export-util.ts +137 -137
  82. package/src/adapters/index.ts +15 -15
  83. package/src/adapters/registry.ts +18 -18
  84. package/src/adapters/types.ts +23 -23
  85. package/src/agents/agent-config.ts +38 -38
  86. package/src/agents/agent-serializer.ts +38 -38
  87. package/src/agents/discover-agents.ts +121 -118
  88. package/src/config/config.ts +740 -858
  89. package/src/config/defaults.ts +96 -96
  90. package/src/config/drift-detector.ts +211 -211
  91. package/src/config/markers.ts +327 -327
  92. package/src/config/resilient-parser.ts +109 -108
  93. package/src/config/suggestions.ts +74 -74
  94. package/src/config/types.ts +199 -0
  95. package/src/extension/async-notifier.ts +123 -89
  96. package/src/extension/autonomous-policy.ts +169 -169
  97. package/src/extension/cross-extension-rpc.ts +104 -103
  98. package/src/extension/help.ts +47 -47
  99. package/src/extension/import-index.ts +69 -69
  100. package/src/extension/management.ts +395 -382
  101. package/src/extension/notification-router.ts +116 -116
  102. package/src/extension/notification-sink.ts +51 -51
  103. package/src/extension/project-init.ts +168 -168
  104. package/src/extension/register.ts +859 -668
  105. package/src/extension/registration/artifact-cleanup.ts +15 -15
  106. package/src/extension/registration/command-utils.ts +54 -54
  107. package/src/extension/registration/commands.ts +559 -452
  108. package/src/extension/registration/compaction-guard.ts +125 -125
  109. package/src/extension/registration/subagent-helpers.ts +102 -102
  110. package/src/extension/registration/subagent-tools.ts +220 -158
  111. package/src/extension/registration/team-tool.ts +159 -98
  112. package/src/extension/registration/viewers.ts +29 -0
  113. package/src/extension/result-watcher.ts +128 -128
  114. package/src/extension/run-bundle-schema.ts +89 -89
  115. package/src/extension/run-export.ts +73 -73
  116. package/src/extension/run-import.ts +84 -84
  117. package/src/extension/run-index.ts +94 -94
  118. package/src/extension/run-maintenance.ts +142 -142
  119. package/src/extension/session-summary.ts +8 -8
  120. package/src/extension/team-manager-command.ts +96 -95
  121. package/src/extension/team-recommendation.ts +188 -188
  122. package/src/extension/team-tool/api.ts +5 -2
  123. package/src/extension/team-tool/cancel.ts +224 -209
  124. package/src/extension/team-tool/config-patch.ts +36 -36
  125. package/src/extension/team-tool/context.ts +60 -60
  126. package/src/extension/team-tool/doctor.ts +242 -242
  127. package/src/extension/team-tool/handle-settings.ts +421 -195
  128. package/src/extension/team-tool/inspect.ts +41 -41
  129. package/src/extension/team-tool/lifecycle-actions.ts +139 -139
  130. package/src/extension/team-tool/parallel-dispatch.ts +156 -156
  131. package/src/extension/team-tool/plan.ts +19 -19
  132. package/src/extension/team-tool/respond.ts +112 -111
  133. package/src/extension/team-tool/run.ts +246 -228
  134. package/src/extension/team-tool/status.ts +110 -110
  135. package/src/extension/team-tool-types.ts +13 -13
  136. package/src/extension/team-tool.ts +16 -4
  137. package/src/extension/tool-result.ts +16 -16
  138. package/src/extension/validate-resources.ts +77 -77
  139. package/src/hooks/registry.ts +61 -61
  140. package/src/hooks/types.ts +40 -40
  141. package/src/i18n.ts +184 -184
  142. package/src/observability/correlation.ts +35 -35
  143. package/src/observability/event-to-metric.ts +68 -68
  144. package/src/observability/exporters/adapter.ts +30 -30
  145. package/src/observability/exporters/otlp-exporter.ts +106 -92
  146. package/src/observability/exporters/prometheus-exporter.ts +54 -54
  147. package/src/observability/metric-registry.ts +87 -87
  148. package/src/observability/metric-retention.ts +54 -54
  149. package/src/observability/metric-sink.ts +81 -56
  150. package/src/observability/metrics-primitives.ts +167 -167
  151. package/src/prompt/prompt-runtime.ts +72 -72
  152. package/src/runtime/adaptive-plan.ts +338 -0
  153. package/src/runtime/agent-control.ts +169 -169
  154. package/src/runtime/agent-memory.ts +72 -72
  155. package/src/runtime/agent-observability.ts +114 -114
  156. package/src/runtime/async-marker.ts +26 -26
  157. package/src/runtime/async-runner.ts +153 -79
  158. package/src/runtime/attention-events.ts +28 -28
  159. package/src/runtime/auto-resume.ts +100 -100
  160. package/src/runtime/background-runner.ts +122 -88
  161. package/src/runtime/cancellation.ts +61 -61
  162. package/src/runtime/capability-inventory.ts +116 -116
  163. package/src/runtime/child-pi-pool.ts +68 -0
  164. package/src/runtime/child-pi.ts +541 -463
  165. package/src/runtime/code-summary.ts +247 -247
  166. package/src/runtime/compaction-summary.ts +271 -271
  167. package/src/runtime/concurrency.ts +58 -58
  168. package/src/runtime/crash-recovery.ts +317 -301
  169. package/src/runtime/crew-agent-records.ts +379 -281
  170. package/src/runtime/crew-agent-runtime.ts +60 -60
  171. package/src/runtime/cross-extension-rpc.ts +72 -0
  172. package/src/runtime/custom-tools/irc-tool.ts +201 -201
  173. package/src/runtime/custom-tools/submit-result-tool.ts +90 -90
  174. package/src/runtime/deadletter.ts +47 -47
  175. package/src/runtime/delivery-coordinator.ts +176 -176
  176. package/src/runtime/delta-conflict.ts +360 -360
  177. package/src/runtime/diagnostic-export.ts +102 -102
  178. package/src/runtime/direct-run.ts +35 -35
  179. package/src/runtime/effectiveness.ts +82 -81
  180. package/src/runtime/errors/crew-errors.ts +166 -0
  181. package/src/runtime/event-stream-bridge.ts +92 -92
  182. package/src/runtime/foreground-control.ts +82 -82
  183. package/src/runtime/green-contract.ts +46 -46
  184. package/src/runtime/group-join.ts +234 -106
  185. package/src/runtime/heartbeat-watcher.ts +145 -124
  186. package/src/runtime/iteration-hooks.ts +267 -264
  187. package/src/runtime/live-agent-control.ts +88 -88
  188. package/src/runtime/live-agent-manager.ts +377 -179
  189. package/src/runtime/live-control-realtime.ts +36 -36
  190. package/src/runtime/live-session-runtime.ts +676 -599
  191. package/src/runtime/loop-gates.ts +129 -129
  192. package/src/runtime/manifest-cache.ts +263 -263
  193. package/src/runtime/mcp-proxy.ts +113 -113
  194. package/src/runtime/metric-parser.ts +40 -40
  195. package/src/runtime/model-fallback.ts +282 -274
  196. package/src/runtime/model-resolver.ts +118 -0
  197. package/src/runtime/output-validator.ts +187 -187
  198. package/src/runtime/overflow-recovery.ts +175 -175
  199. package/src/runtime/parallel-research.ts +44 -44
  200. package/src/runtime/parallel-utils.ts +156 -156
  201. package/src/runtime/parent-guard.ts +80 -80
  202. package/src/runtime/phase-progress.ts +217 -217
  203. package/src/runtime/pi-args.ts +165 -165
  204. package/src/runtime/pi-json-output.ts +111 -111
  205. package/src/runtime/pi-spawn.ts +167 -167
  206. package/src/runtime/policy-engine.ts +79 -79
  207. package/src/runtime/post-checks.ts +125 -122
  208. package/src/runtime/post-exit-stdio-guard.ts +86 -86
  209. package/src/runtime/process-status.ts +97 -73
  210. package/src/runtime/progress-event-coalescer.ts +43 -43
  211. package/src/runtime/recovery-recipes.ts +74 -74
  212. package/src/runtime/retry-executor.ts +81 -81
  213. package/src/runtime/role-permission.ts +39 -39
  214. package/src/runtime/run-tracker.ts +99 -0
  215. package/src/runtime/runtime-policy.ts +21 -0
  216. package/src/runtime/runtime-resolver.ts +94 -90
  217. package/src/runtime/scheduler.ts +294 -0
  218. package/src/runtime/semaphore.ts +131 -131
  219. package/src/runtime/sensitive-paths.ts +92 -92
  220. package/src/runtime/session-usage.ts +79 -79
  221. package/src/runtime/settings-store.ts +103 -0
  222. package/src/runtime/sidechain-output.ts +29 -29
  223. package/src/runtime/skill-instructions.ts +222 -222
  224. package/src/runtime/stale-reconciler.ts +198 -189
  225. package/src/runtime/streaming-output.ts +47 -0
  226. package/src/runtime/subagent-manager.ts +404 -395
  227. package/src/runtime/subprocess-tool-registry.ts +67 -67
  228. package/src/runtime/task-display.ts +38 -38
  229. package/src/runtime/task-graph-scheduler.ts +122 -122
  230. package/src/runtime/task-graph.ts +207 -207
  231. package/src/runtime/task-output-context.ts +177 -177
  232. package/src/runtime/task-packet.ts +93 -93
  233. package/src/runtime/task-quality.ts +207 -207
  234. package/src/runtime/task-runner/capabilities.ts +78 -78
  235. package/src/runtime/task-runner/live-executor.ts +131 -113
  236. package/src/runtime/task-runner/progress.ts +119 -119
  237. package/src/runtime/task-runner/prompt-builder.ts +139 -139
  238. package/src/runtime/task-runner/prompt-pipeline.ts +64 -64
  239. package/src/runtime/task-runner/result-utils.ts +14 -14
  240. package/src/runtime/task-runner/run-projection.ts +103 -103
  241. package/src/runtime/task-runner/state-helpers.ts +22 -22
  242. package/src/runtime/task-runner.ts +469 -458
  243. package/src/runtime/team-runner.ts +693 -945
  244. package/src/runtime/usage-tracker.ts +71 -0
  245. package/src/runtime/worker-heartbeat.ts +21 -21
  246. package/src/runtime/worker-startup.ts +57 -57
  247. package/src/runtime/workflow-state.ts +187 -187
  248. package/src/runtime/yield-handler.ts +190 -189
  249. package/src/schema/config-schema.ts +172 -168
  250. package/src/schema/team-tool-schema.ts +126 -125
  251. package/src/schema/validation-types.ts +151 -148
  252. package/src/skills/discover-skills.ts +67 -67
  253. package/src/skills/skill-templates.ts +374 -374
  254. package/src/state/active-run-registry.ts +227 -191
  255. package/src/state/artifact-store.ts +130 -129
  256. package/src/state/atomic-write.ts +262 -178
  257. package/src/state/blob-store.ts +116 -116
  258. package/src/state/contracts.ts +111 -111
  259. package/src/state/event-log-rotation.ts +161 -158
  260. package/src/state/event-log.ts +383 -240
  261. package/src/state/event-reconstructor.ts +217 -217
  262. package/src/state/jsonl-writer.ts +82 -82
  263. package/src/state/locks.ts +146 -148
  264. package/src/state/mailbox.ts +446 -405
  265. package/src/state/state-store.ts +364 -351
  266. package/src/state/task-claims.ts +44 -44
  267. package/src/state/types.ts +285 -285
  268. package/src/state/usage.ts +29 -29
  269. package/src/subagents/async-entry.ts +1 -1
  270. package/src/subagents/index.ts +3 -3
  271. package/src/subagents/live/control.ts +1 -1
  272. package/src/subagents/live/manager.ts +1 -1
  273. package/src/subagents/live/realtime.ts +1 -1
  274. package/src/subagents/live/session-runtime.ts +1 -1
  275. package/src/subagents/manager.ts +1 -1
  276. package/src/subagents/spawn.ts +1 -1
  277. package/src/teams/discover-teams.ts +116 -116
  278. package/src/teams/team-config.ts +27 -27
  279. package/src/teams/team-serializer.ts +38 -38
  280. package/src/types/diff.d.ts +18 -18
  281. package/src/ui/agent-management-overlay.ts +144 -144
  282. package/src/ui/crew-widget.ts +487 -370
  283. package/src/ui/dashboard-panes/agents-pane.ts +109 -28
  284. package/src/ui/dashboard-panes/cancellation-pane.ts +42 -42
  285. package/src/ui/dashboard-panes/capability-pane.ts +59 -59
  286. package/src/ui/dashboard-panes/health-pane.ts +30 -30
  287. package/src/ui/dashboard-panes/mailbox-pane.ts +35 -35
  288. package/src/ui/dashboard-panes/progress-pane.ts +30 -30
  289. package/src/ui/dashboard-panes/transcript-pane.ts +10 -10
  290. package/src/ui/heartbeat-aggregator.ts +63 -63
  291. package/src/ui/keybinding-map.ts +97 -94
  292. package/src/ui/live-conversation-overlay.ts +152 -0
  293. package/src/ui/live-run-sidebar.ts +180 -180
  294. package/src/ui/mascot.ts +442 -442
  295. package/src/ui/overlays/agent-picker-overlay.ts +57 -57
  296. package/src/ui/overlays/confirm-overlay.ts +58 -58
  297. package/src/ui/overlays/mailbox-compose-overlay.ts +144 -144
  298. package/src/ui/overlays/mailbox-compose-preview.ts +63 -63
  299. package/src/ui/overlays/mailbox-detail-overlay.ts +122 -122
  300. package/src/ui/pi-ui-compat.ts +57 -57
  301. package/src/ui/powerbar-publisher.ts +221 -197
  302. package/src/ui/render-scheduler.ts +216 -143
  303. package/src/ui/run-action-dispatcher.ts +118 -117
  304. package/src/ui/run-dashboard.ts +526 -464
  305. package/src/ui/run-event-bus.ts +208 -208
  306. package/src/ui/run-snapshot-cache.ts +826 -777
  307. package/src/ui/settings-overlay.ts +721 -0
  308. package/src/ui/snapshot-types.ts +86 -70
  309. package/src/ui/theme-adapter.ts +190 -190
  310. package/src/ui/tool-progress-formatter.ts +89 -0
  311. package/src/ui/transcript-cache.ts +94 -94
  312. package/src/ui/transcript-viewer.ts +335 -335
  313. package/src/utils/conflict-detect.ts +662 -0
  314. package/src/utils/env-filter.ts +30 -0
  315. package/src/utils/file-coalescer.ts +86 -86
  316. package/src/utils/frontmatter.ts +68 -68
  317. package/src/utils/fs-watch.ts +88 -31
  318. package/src/utils/gh-protocol.ts +479 -0
  319. package/src/utils/ids.ts +17 -17
  320. package/src/utils/incremental-reader.ts +104 -104
  321. package/src/utils/internal-error.ts +6 -6
  322. package/src/utils/names.ts +27 -27
  323. package/src/utils/paths.ts +102 -63
  324. package/src/utils/redaction.ts +44 -44
  325. package/src/utils/resolve-shell.ts +34 -0
  326. package/src/utils/safe-paths.ts +47 -47
  327. package/src/utils/scan-cache.ts +136 -136
  328. package/src/utils/sleep.ts +2 -1
  329. package/src/utils/sse-parser.ts +134 -134
  330. package/src/utils/task-name-generator.ts +337 -337
  331. package/src/utils/timings.ts +33 -33
  332. package/src/utils/visual.ts +243 -198
  333. package/src/workflows/discover-workflows.ts +139 -139
  334. package/src/workflows/validate-workflow.ts +40 -40
  335. package/src/workflows/workflow-config.ts +26 -26
  336. package/src/workflows/workflow-serializer.ts +32 -32
  337. package/src/worktree/branch-freshness.ts +45 -45
  338. package/src/worktree/cleanup.ts +75 -72
  339. package/src/worktree/worktree-manager.ts +188 -146
  340. package/teams/default.team.md +12 -12
  341. package/teams/fast-fix.team.md +11 -11
  342. package/teams/implementation.team.md +18 -18
  343. package/teams/parallel-research.team.md +14 -14
  344. package/teams/research.team.md +11 -11
  345. package/teams/review.team.md +12 -12
  346. package/tsconfig.json +19 -19
  347. package/workflows/default.workflow.md +30 -30
  348. package/workflows/fast-fix.workflow.md +23 -23
  349. package/workflows/implementation.workflow.md +43 -43
  350. package/workflows/parallel-research.workflow.md +46 -46
  351. package/workflows/research.workflow.md +22 -22
  352. package/workflows/review.workflow.md +30 -30
  353. package/skills/task-packet/SKILL.md +0 -28
  354. package/skills/verify-evidence/SKILL.md +0 -27
@@ -1,463 +1,541 @@
1
- import { spawn, type ChildProcess, type SpawnOptions } from "node:child_process";
2
- import * as fs from "node:fs";
3
- import * as path from "node:path";
4
- import type { AgentConfig } from "../agents/agent-config.ts";
5
- import type { WorkerExitStatus } from "../state/types.ts";
6
- import { buildPiWorkerArgs, checkCrewDepth, cleanupTempDir } from "./pi-args.ts";
7
- import { getPiSpawnCommand } from "./pi-spawn.ts";
8
- import { DEFAULT_CHILD_PI } from "../config/defaults.ts";
9
- import { logInternalError } from "../utils/internal-error.ts";
10
- import { attachPostExitStdioGuard, trySignalChild } from "./post-exit-stdio-guard.ts";
11
- import { redactJsonLine, SECRET_KEY_PATTERN } from "../utils/redaction.ts";
12
-
13
- const POST_EXIT_STDIO_GUARD_MS = DEFAULT_CHILD_PI.postExitStdioGuardMs;
14
- const FINAL_DRAIN_MS = DEFAULT_CHILD_PI.finalDrainMs;
15
- const HARD_KILL_MS = DEFAULT_CHILD_PI.hardKillMs;
16
- const RESPONSE_TIMEOUT_MS = DEFAULT_CHILD_PI.responseTimeoutMs;
17
- const MAX_CAPTURE_BYTES = DEFAULT_CHILD_PI.maxCaptureBytes;
18
- const MAX_ASSISTANT_TEXT_CHARS = DEFAULT_CHILD_PI.maxAssistantTextChars;
19
- const MAX_TOOL_RESULT_CHARS = DEFAULT_CHILD_PI.maxToolResultChars;
20
- const MAX_TOOL_INPUT_CHARS = DEFAULT_CHILD_PI.maxToolInputChars;
21
- const MAX_COMPACT_CONTENT_CHARS = DEFAULT_CHILD_PI.maxCompactContentChars;
22
- const activeChildProcesses = new Map<number, ChildProcess>();
23
- const childHardKillTimers = new Map<number, NodeJS.Timeout>();
24
-
25
- function appendBoundedTail(current: string, chunk: string, maxBytes = MAX_CAPTURE_BYTES): string {
26
- const combined = current + chunk;
27
- if (Buffer.byteLength(combined, "utf-8") <= maxBytes) return combined;
28
- let tail = combined.slice(Math.max(0, combined.length - maxBytes));
29
- while (Buffer.byteLength(tail, "utf-8") > maxBytes) tail = tail.slice(1024);
30
- return `[pi-crew captured output truncated to last ${Math.round(maxBytes / 1024)} KiB]\n${tail}`;
31
- }
32
-
33
- function clearHardKillTimer(pid: number | undefined): void {
34
- if (!pid) return;
35
- const timer = childHardKillTimers.get(pid);
36
- if (!timer) return;
37
- clearTimeout(timer);
38
- childHardKillTimers.delete(pid);
39
- }
40
-
41
- function killProcessTree(pid: number | undefined, child?: ChildProcess): void {
42
- if (!pid || !Number.isInteger(pid) || pid <= 0) return;
43
- if (child && child.exitCode !== null) return;
44
- try {
45
- if (process.platform === "win32") {
46
- spawn("taskkill", ["/pid", String(pid), "/t", "/f"], { stdio: "ignore", windowsHide: true });
47
- return;
48
- }
49
- try {
50
- process.kill(-pid, "SIGTERM");
51
- } catch (error) {
52
- logInternalError("child-pi.sigterm", error, `pid=${pid}`);
53
- try {
54
- process.kill(pid, "SIGTERM");
55
- } catch (fallbackError) {
56
- logInternalError("child-pi.sigterm-absolute", fallbackError, `pid=${pid}`);
57
- }
58
- }
59
- clearHardKillTimer(pid);
60
- const hardKillTimer = setTimeout(() => {
61
- try {
62
- process.kill(-pid, "SIGKILL");
63
- } catch (error) {
64
- logInternalError("child-pi.sigkill", error, `pid=${pid}`);
65
- try {
66
- process.kill(pid, "SIGKILL");
67
- } catch (fallbackError) {
68
- logInternalError("child-pi.sigkill-absolute", fallbackError, `pid=${pid}`);
69
- }
70
- }
71
- childHardKillTimers.delete(pid);
72
- }, HARD_KILL_MS);
73
- hardKillTimer.unref();
74
- child?.once("exit", () => clearHardKillTimer(pid));
75
- childHardKillTimers.set(pid, hardKillTimer);
76
- } catch (error) {
77
- logInternalError("child-pi.kill-process-tree", error, `pid=${pid}`);
78
- }
79
- }
80
-
81
- export function terminateActiveChildPiProcesses(): number {
82
- const entries = [...activeChildProcesses.entries()];
83
- for (const [pid, child] of entries) killProcessTree(pid, child);
84
- return entries.length;
85
- }
86
-
87
- export interface ChildPiRunInput {
88
- cwd: string;
89
- task: string;
90
- agent: AgentConfig;
91
- model?: string;
92
- skillPaths?: string[];
93
- signal?: AbortSignal;
94
- transcriptPath?: string;
95
- onStdoutLine?: (line: string) => void;
96
- onJsonEvent?: (event: unknown) => void;
97
- onSpawn?: (pid: number) => void;
98
- maxDepth?: number;
99
- finalDrainMs?: number;
100
- hardKillMs?: number;
101
- responseTimeoutMs?: number;
102
- }
103
-
104
- export interface ChildPiRunResult {
105
- exitCode: number | null;
106
- stdout: string;
107
- stderr: string;
108
- error?: string;
109
- exitStatus?: WorkerExitStatus;
110
- }
111
-
112
- export function buildChildPiSpawnOptions(cwd: string, env: NodeJS.ProcessEnv): SpawnOptions {
113
- // Filter out env vars whose keys match secret patterns to avoid leaking credentials to child processes
114
- const filteredEnv: Record<string, string> = {};
115
- for (const [key, value] of Object.entries(env)) {
116
- if (value !== undefined && !SECRET_KEY_PATTERN.test(key)) filteredEnv[key] = value;
117
- }
118
- return {
119
- cwd,
120
- env: { ...filteredEnv, PI_CREW_PARENT_PID: String(process.pid) },
121
- stdio: ["ignore", "pipe", "pipe"],
122
- detached: process.platform !== "win32",
123
- windowsHide: true,
124
- };
125
- }
126
-
127
- function appendTranscript(input: ChildPiRunInput, line: string): void {
128
- if (!input.transcriptPath) return;
129
- fs.mkdirSync(path.dirname(input.transcriptPath), { recursive: true });
130
- fs.appendFileSync(input.transcriptPath, `${redactJsonLine(line)}\n`, "utf-8");
131
- }
132
-
133
- function compactString(value: string, maxChars = MAX_COMPACT_CONTENT_CHARS): string {
134
- if (value.length <= maxChars) return value;
135
- return `${value.slice(0, maxChars)}\n[pi-crew compacted ${value.length - maxChars} chars]`;
136
- }
137
-
138
- function compactValue(value: unknown): unknown {
139
- if (typeof value === "string") return compactString(value);
140
- if (Array.isArray(value)) return value.slice(0, 20).map(compactValue);
141
- const record = asRecord(value);
142
- if (!record) return value;
143
- const compacted: Record<string, unknown> = {};
144
- for (const [key, entry] of Object.entries(record).slice(0, 20)) compacted[key] = compactValue(entry);
145
- return compacted;
146
- }
147
-
148
- function compactContentPart(part: unknown): unknown | undefined {
149
- const record = asRecord(part);
150
- if (!record) return undefined;
151
- if (record.type === "text") return { type: "text", text: typeof record.text === "string" ? compactString(record.text, MAX_ASSISTANT_TEXT_CHARS) : "" };
152
- if (record.type === "toolCall") return { type: "toolCall", name: record.name, input: compactValue(typeof record.input === "string" ? compactString(record.input, MAX_TOOL_INPUT_CHARS) : record.input) };
153
- if (record.type === "toolResult") return { type: "toolResult", name: record.name, content: compactValue(typeof record.content === "string" ? compactString(record.content, MAX_TOOL_RESULT_CHARS) : record.content) };
154
- return undefined;
155
- }
156
-
157
- function compactChildPiEvent(event: unknown): unknown | undefined {
158
- const record = asRecord(event);
159
- if (!record) return undefined;
160
- if (record.type === "message_update") return undefined;
161
- if (record.type === "tool_execution_start" || record.type === "tool_execution_end") {
162
- return { type: record.type, toolName: record.toolName, args: record.args };
163
- }
164
- if (record.type === "tool_result_end" || record.type === "message_end" || record.type === "message") {
165
- const message = asRecord(record.message);
166
- if (message?.role === "user" || message?.role === "system") return undefined;
167
- const content = Array.isArray(message?.content) ? message.content.map(compactContentPart).filter((part) => part !== undefined) : undefined;
168
- return {
169
- type: record.type,
170
- ...(typeof record.text === "string" ? { text: record.text } : {}),
171
- ...(message ? { message: { role: message.role, ...(content ? { content } : {}), usage: message.usage, model: message.model, errorMessage: message.errorMessage, stopReason: message.stopReason } } : {}),
172
- usage: record.usage,
173
- model: record.model,
174
- provider: record.provider,
175
- stopReason: record.stopReason,
176
- };
177
- }
178
- return record.type ? { type: record.type } : undefined;
179
- }
180
-
181
- function displayTextFromCompactEvent(event: unknown): string | undefined {
182
- const record = asRecord(event);
183
- if (!record) return undefined;
184
- if (record.type === "tool_execution_start") {
185
- return typeof record.toolName === "string" ? `tool: ${record.toolName}` : "tool started";
186
- }
187
- if (record.type !== "message" && record.type !== "message_end") return undefined;
188
- const message = asRecord(record.message);
189
- if (message?.role !== undefined && message.role !== "assistant") return undefined;
190
- const content = Array.isArray(message?.content) ? message.content : [];
191
- const text = content.flatMap((part) => {
192
- const item = asRecord(part);
193
- return item?.type === "text" && typeof item.text === "string" ? [item.text] : [];
194
- }).join("\n").trim();
195
- return text || (typeof record.text === "string" ? record.text : undefined);
196
- }
197
-
198
- function compactChildPiLine(line: string): { persistedLine: string; event?: unknown; displayLine?: string; json: boolean } {
199
- try {
200
- const parsed = JSON.parse(line);
201
- const compact = compactChildPiEvent(parsed);
202
- return { json: true, event: compact, persistedLine: compact ? JSON.stringify(compact) : "", displayLine: displayTextFromCompactEvent(compact) };
203
- } catch {
204
- return { json: false, persistedLine: line, displayLine: line };
205
- }
206
- }
207
-
208
- export class ChildPiLineObserver {
209
- private buffer = "";
210
- private readonly input: ChildPiRunInput;
211
-
212
- constructor(input: ChildPiRunInput) {
213
- this.input = input;
214
- }
215
-
216
- observe(text: string): void {
217
- this.buffer += text;
218
- const lines = this.buffer.split(/\r?\n/);
219
- this.buffer = lines.pop() ?? "";
220
- for (const line of lines) this.emitLine(line);
221
- }
222
-
223
- flush(): void {
224
- if (!this.buffer) return;
225
- const line = this.buffer;
226
- this.buffer = "";
227
- this.emitLine(line);
228
- }
229
-
230
- private emitLine(line: string): void {
231
- if (!line.trim()) return;
232
- const compact = compactChildPiLine(line);
233
- if (compact.event !== undefined) {
234
- try {
235
- this.input.onJsonEvent?.(compact.event);
236
- } catch (error) {
237
- logInternalError("child-pi.on-json-event", error, `line=${compact.persistedLine ?? compact.displayLine ?? ""}`);
238
- }
239
- }
240
- if (compact.persistedLine) appendTranscript(this.input, compact.persistedLine);
241
- if (compact.displayLine?.trim()) {
242
- try {
243
- this.input.onStdoutLine?.(compact.displayLine);
244
- } catch (error) {
245
- logInternalError("child-pi.on-stdout-line", error, `line=${compact.displayLine}`);
246
- }
247
- }
248
- }
249
- }
250
-
251
- /** Mock-only path — real code path reuses a single observer. */
252
- function observeStdoutChunk(input: ChildPiRunInput, text: string): void {
253
- const observer = new ChildPiLineObserver(input);
254
- observer.observe(text);
255
- observer.flush();
256
- }
257
-
258
- function asRecord(value: unknown): Record<string, unknown> | undefined {
259
- return value && typeof value === "object" && !Array.isArray(value) ? value as Record<string, unknown> : undefined;
260
- }
261
-
262
- function isFinalAssistantEvent(event: unknown): boolean {
263
- const obj = asRecord(event);
264
- if (!obj || obj.type !== "message_end") return false;
265
- const message = asRecord(obj.message);
266
- const role = message?.role;
267
- if (role !== undefined && role !== "assistant") return false;
268
- const stopReason = typeof message?.stopReason === "string" ? message.stopReason : typeof obj.stopReason === "string" ? obj.stopReason : undefined;
269
- if (stopReason !== undefined && stopReason !== "stop") return false;
270
- const content = Array.isArray(message?.content) ? message.content : [];
271
- return !content.some((part) => asRecord(part)?.type === "toolCall");
272
- }
273
-
274
/**
 * Spawns a child Pi worker for `input.task` and resolves once it has finished.
 *
 * The promise never rejects for process-level failures: spawn errors, response
 * timeouts and cancellations are reported through the returned result
 * (`exitCode`, `error`, `exitStatus`).
 *
 * Supervision performed here:
 * - depth guard: returns exit code 1 without spawning when `checkCrewDepth` blocks;
 * - mock modes: `PI_TEAMS_MOCK_CHILD_PI` short-circuits to canned results;
 * - no-response timer: terminates the child after `responseTimeoutMs` of silence
 *   (`PI_TEAMS_CHILD_RESPONSE_TIMEOUT_MS` overrides the input; `<= 0` disables);
 * - final drain: after a final assistant event the child gets `finalDrainMs` to exit,
 *   then SIGTERM, then SIGKILL after `hardKillMs`; a forced drain still reports exit code 0;
 * - abort: `input.signal` terminates the process tree, including when the signal
 *   was already aborted before the call.
 *
 * @param input Run configuration and observer callbacks.
 * @returns Captured (bounded) stdout/stderr, the exit code and structured exit status.
 */
export async function runChildPi(input: ChildPiRunInput): Promise<ChildPiRunResult> {
	const depth = checkCrewDepth(input.maxDepth);
	if (depth.blocked) return { exitCode: 1, stdout: "", stderr: `pi-crew depth guard blocked child worker: depth ${depth.depth} >= max ${depth.maxDepth}` };
	const mock = process.env.PI_TEAMS_MOCK_CHILD_PI;
	if (mock) {
		if (mock === "success") {
			const stdout = `Mock child Pi success for ${input.agent.name}\n`;
			observeStdoutChunk(input, stdout);
			return { exitCode: 0, stdout, stderr: "" };
		}
		if (mock === "json-success" || mock === "adaptive-plan") {
			const text = mock === "adaptive-plan" && input.task.includes("ADAPTIVE_PLAN_JSON_START")
				? `Adaptive mock plan\nADAPTIVE_PLAN_JSON_START\n${JSON.stringify({ phases: [{ name: "research", tasks: [{ role: "explorer", task: "Explore adaptive target" }, { role: "analyst", task: "Analyze adaptive target" }, { role: "planner", task: "Plan adaptive target" }] }, { name: "build", tasks: [{ role: "executor", task: "Implement adaptive target" }] }, { name: "check", tasks: [{ role: "reviewer", task: "Review adaptive target" }, { role: "test-engineer", task: "Test adaptive target" }, { role: "writer", task: "Summarize adaptive target" }] }] })}\nADAPTIVE_PLAN_JSON_END`
				: `Mock JSON success for ${input.agent.name}`;
			const stdout = `${JSON.stringify({ type: "message", message: { role: "assistant", content: [{ type: "text", text }] } })}\n${JSON.stringify({ type: "message_end", usage: { input: 10, output: 5, cost: 0.001, turns: 1 } })}\n`;
			observeStdoutChunk(input, stdout);
			return { exitCode: 0, stdout, stderr: "" };
		}
		if (mock === "retryable-failure") return { exitCode: 1, stdout: "", stderr: "rate limit: mock failure" };
		return { exitCode: 1, stdout: "", stderr: `mock failure: ${mock}` };
	}
	const built = buildPiWorkerArgs({ task: input.task, agent: input.agent, model: input.model, sessionEnabled: false, maxDepth: input.maxDepth, skillPaths: input.skillPaths });
	const spawnSpec = getPiSpawnCommand(built.args);
	try {
		return await new Promise<ChildPiRunResult>((resolve) => {
			const child = spawn(spawnSpec.command, spawnSpec.args, buildChildPiSpawnOptions(input.cwd, { ...process.env, ...built.env }));
			if (child.pid) {
				activeChildProcesses.set(child.pid, child);
				input.onSpawn?.(child.pid);
			}
			let stdout = "";
			let stderr = "";
			let settled = false;
			let childExited = false;
			let postExitGuardCleanup: (() => void) | undefined;
			let finalDrainTimer: NodeJS.Timeout | undefined;
			let hardKillTimer: NodeJS.Timeout | undefined;
			let noResponseTimer: NodeJS.Timeout | undefined;
			const finalDrainMs = input.finalDrainMs ?? FINAL_DRAIN_MS;
			const hardKillMs = input.hardKillMs ?? HARD_KILL_MS;
			const responseTimeoutEnv = Number.parseInt(process.env.PI_TEAMS_CHILD_RESPONSE_TIMEOUT_MS ?? "", 10);
			const responseTimeoutMs = Number.isFinite(responseTimeoutEnv) && responseTimeoutEnv >= 0 ? responseTimeoutEnv : input.responseTimeoutMs ?? RESPONSE_TIMEOUT_MS;
			let responseTimeoutHit = false;
			let forcedFinalDrain = false;
			let abortRequested = input.signal?.aborted === true;
			let hardKilled = false;
			const cleanupErrors: string[] = [];
			// Streaming decoders keep multi-byte UTF-8 sequences intact when a character
			// is split across two pipe chunks.
			const stdoutDecoder = new TextDecoder("utf-8");
			const stderrDecoder = new TextDecoder("utf-8");

			const restartNoResponseTimer = (): void => {
				if (responseTimeoutMs <= 0) return;
				// The final flush in settle() also reports lines; it must not re-arm
				// a timer that would fire against an already finished child.
				if (settled) return;
				if (noResponseTimer) clearTimeout(noResponseTimer);
				noResponseTimer = setTimeout(() => {
					if (settled || childExited) return;
					responseTimeoutHit = true;
					killProcessTree(child.pid, child);
					try {
						child.kill(process.platform === "win32" ? undefined : "SIGTERM");
					} catch (error) {
						logInternalError("child-pi.response-timeout-term", error, `pid=${child.pid}`);
					}
				}, responseTimeoutMs);
				noResponseTimer.unref();
			};
			const clearNoResponseTimer = (): void => {
				if (noResponseTimer) clearTimeout(noResponseTimer);
				noResponseTimer = undefined;
			};
			restartNoResponseTimer();

			const lineObserver = new ChildPiLineObserver({
				...input,
				onStdoutLine: (line) => {
					restartNoResponseTimer();
					stdout = appendBoundedTail(stdout, `${line}\n`);
					input.onStdoutLine?.(line);
				},
				onJsonEvent: (event) => {
					restartNoResponseTimer();
					input.onJsonEvent?.(event);
					if (!isFinalAssistantEvent(event) || childExited || settled || finalDrainTimer) return;
					// The answer is complete: give the child finalDrainMs to exit on its own,
					// then escalate SIGTERM -> SIGKILL.
					finalDrainTimer = setTimeout(() => {
						if (settled || childExited) return;
						forcedFinalDrain = true;
						try {
							child.kill(process.platform === "win32" ? undefined : "SIGTERM");
						} catch (error) {
							logInternalError("child-pi.final-drain-term", error, `pid=${child.pid}`);
						}
						hardKillTimer = setTimeout(() => {
							if (settled || childExited) return;
							try {
								hardKilled = true;
								child.kill(process.platform === "win32" ? undefined : "SIGKILL");
							} catch (error) {
								logInternalError("child-pi.final-drain-kill", error, `pid=${child.pid}`);
							}
						}, hardKillMs);
						hardKillTimer.unref();
					}, finalDrainMs);
					finalDrainTimer.unref();
				},
			});

			const clearFinalDrainTimers = (): void => {
				if (finalDrainTimer) clearTimeout(finalDrainTimer);
				if (hardKillTimer) clearTimeout(hardKillTimer);
				finalDrainTimer = undefined;
				hardKillTimer = undefined;
			};
			const clearPostExitGuard = (): void => {
				if (postExitGuardCleanup) {
					postExitGuardCleanup();
					postExitGuardCleanup = undefined;
				}
			};

			// Resolves the promise exactly once. stdout/stderr are read only after the
			// decoders and the line observer have been drained, so a trailing line
			// without a newline is part of the returned stdout.
			const settle = (outcome: { exitCode: number | null; error?: string }): void => {
				if (settled) return;
				settled = true;
				const stdoutRest = stdoutDecoder.decode();
				if (stdoutRest) lineObserver.observe(stdoutRest);
				lineObserver.flush();
				const stderrRest = stderrDecoder.decode();
				if (stderrRest) stderr = appendBoundedTail(stderr, stderrRest);
				clearNoResponseTimer();
				clearFinalDrainTimers();
				clearPostExitGuard();
				input.signal?.removeEventListener("abort", abort);
				try {
					cleanupTempDir(built.tempDir);
				} catch (error) {
					cleanupErrors.push(error instanceof Error ? error.message : String(error));
				}
				resolve({
					exitCode: outcome.exitCode,
					stdout,
					stderr,
					...(outcome.error !== undefined ? { error: outcome.error } : {}),
					exitStatus: { exitCode: outcome.exitCode, cancelled: abortRequested, timedOut: responseTimeoutHit, killed: hardKilled, cleanupErrors, finalDrainMs },
				});
			};

			const abort = (): void => {
				abortRequested = true;
				killProcessTree(child.pid, child);
				if (process.platform !== "win32") {
					trySignalChild(child, "SIGTERM");
				}
				try {
					child.kill(process.platform === "win32" ? undefined : "SIGTERM");
				} catch {
					// Ignore kill races.
				}
			};

			child.stdout?.on("data", (chunk: Buffer) => {
				restartNoResponseTimer();
				lineObserver.observe(stdoutDecoder.decode(chunk, { stream: true }));
			});
			child.stderr?.on("data", (chunk: Buffer) => {
				restartNoResponseTimer();
				stderr = appendBoundedTail(stderr, stderrDecoder.decode(chunk, { stream: true }));
			});
			child.on("error", (error) => {
				settle({ exitCode: null, error: error.message });
			});
			child.on("exit", () => {
				if (child.pid) {
					activeChildProcesses.delete(child.pid);
					clearHardKillTimer(child.pid);
				}
				childExited = true;
				clearNoResponseTimer();
				clearFinalDrainTimers();
				if (!postExitGuardCleanup) {
					postExitGuardCleanup = attachPostExitStdioGuard(child, {
						idleMs: POST_EXIT_STDIO_GUARD_MS,
						hardMs: HARD_KILL_MS,
					});
				}
			});
			child.on("close", (exitCode) => {
				if (child.pid) {
					activeChildProcesses.delete(child.pid);
					clearHardKillTimer(child.pid);
				}
				const timeoutError = responseTimeoutHit && !stderr.trim() ? `Child Pi produced no new output for ${responseTimeoutMs}ms; process was terminated as unresponsive.` : undefined;
				// A final assistant event is the child Pi contract for "the worker produced its answer".
				// Some Pi processes can linger during post-final cleanup/stdio shutdown; finalDrain terminates
				// that lingering process so the parent can continue, but it must not turn a completed
				// subagent answer into a failed task. Real pre-final response timeouts still report errors.
				const finalExitCode = forcedFinalDrain && timeoutError === undefined ? 0 : exitCode;
				settle({ exitCode: finalExitCode, ...(timeoutError !== undefined ? { error: timeoutError } : {}) });
			});

			// An AbortSignal that is already aborted never dispatches "abort" again,
			// so terminate immediately instead of waiting for an event that cannot come.
			if (input.signal?.aborted) abort();
			else input.signal?.addEventListener("abort", abort, { once: true });
		});
	} finally {
		cleanupTempDir(built.tempDir);
	}
}
1
+ import { spawn, type ChildProcess, type SpawnOptions } from "node:child_process";
2
+ import * as fs from "node:fs";
3
+ import * as path from "node:path";
4
+ import type { AgentConfig } from "../agents/agent-config.ts";
5
+ import type { WorkerExitStatus } from "../state/types.ts";
6
+ import { buildPiWorkerArgs, checkCrewDepth, cleanupTempDir } from "./pi-args.ts";
7
+ import { getPiSpawnCommand } from "./pi-spawn.ts";
8
+ import { DEFAULT_CHILD_PI } from "../config/defaults.ts";
9
+ import { logInternalError } from "../utils/internal-error.ts";
10
+ import { attachPostExitStdioGuard, trySignalChild } from "./post-exit-stdio-guard.ts";
11
+ import { redactJsonLine, SECRET_KEY_PATTERN } from "../utils/redaction.ts";
12
+ import { sanitizeEnvSecrets } from "../utils/env-filter.ts";
13
+
14
// Supervision tunables, all taken from the shared child-Pi defaults.
const {
	postExitStdioGuardMs: POST_EXIT_STDIO_GUARD_MS,
	finalDrainMs: FINAL_DRAIN_MS,
	hardKillMs: HARD_KILL_MS,
	responseTimeoutMs: RESPONSE_TIMEOUT_MS,
	maxCaptureBytes: MAX_CAPTURE_BYTES,
	maxAssistantTextChars: MAX_ASSISTANT_TEXT_CHARS,
	maxToolResultChars: MAX_TOOL_RESULT_CHARS,
	maxToolInputChars: MAX_TOOL_INPUT_CHARS,
	maxCompactContentChars: MAX_COMPACT_CONTENT_CHARS,
} = DEFAULT_CHILD_PI;

/** Child processes spawned by this module that have not exited yet, keyed by pid. */
const activeChildProcesses = new Map<number, ChildProcess>();
/** Pending SIGKILL escalation timers scheduled by killProcessPid, keyed by pid. */
const childHardKillTimers = new Map<number, NodeJS.Timeout>();
25
+
26
/**
 * Appends `chunk` to `current` while keeping at most the newest `maxBytes`
 * bytes (UTF-8) of captured output.
 *
 * When output has to be dropped, the result is prefixed with a one-line
 * truncation notice. The notice itself does not count against `maxBytes`.
 *
 * @param current Output captured so far (possibly already truncated by this function).
 * @param chunk Newly received text.
 * @param maxBytes Byte budget for the retained tail.
 * @returns The bounded capture, starting on a whole character.
 */
function appendBoundedTail(current: string, chunk: string, maxBytes = MAX_CAPTURE_BYTES): string {
	const notice = `[pi-crew captured output truncated to last ${Math.round(maxBytes / 1024)} KiB]\n`;
	// A previous call may already have truncated: strip its notice so it is neither
	// charged against the byte budget nor duplicated in the middle of the output.
	const alreadyTruncated = current.startsWith(notice);
	const combined = (alreadyTruncated ? current.slice(notice.length) : current) + chunk;
	if (!alreadyTruncated && Buffer.byteLength(combined, "utf-8") <= maxBytes) return combined;

	// Cut on bytes rather than UTF-16 code units so multi-byte text keeps as much
	// of the tail as the budget allows.
	const bytes = Buffer.from(combined, "utf-8");
	let start = Math.max(0, bytes.length - Math.max(0, maxBytes));
	// Skip UTF-8 continuation bytes (10xxxxxx) so the tail never begins mid-character.
	while (start < bytes.length && (bytes.readUInt8(start) & 0xc0) === 0x80) start += 1;
	return `${notice}${bytes.toString("utf-8", start)}`;
}
33
+
34
/**
 * Cancels the pending SIGKILL escalation timer registered for `pid`, if any.
 * A missing/zero pid or a pid without a registered timer is a no-op.
 */
function clearHardKillTimer(pid: number | undefined): void {
	const pending = pid ? childHardKillTimers.get(pid) : undefined;
	if (!pid || !pending) return;
	clearTimeout(pending);
	childHardKillTimers.delete(pid);
}
41
+
42
/** Launches `taskkill /T /F` for `pid`; a failed launch is logged instead of crashing the host. */
function spawnTaskkill(pid: number): void {
	const killer = spawn("taskkill", ["/pid", String(pid), "/t", "/f"], { stdio: "ignore", windowsHide: true });
	// spawn() reports launch failures (e.g. ENOENT) asynchronously through an
	// 'error' event; without a listener that event is thrown as an uncaught exception.
	killer.on("error", (error) => logInternalError("child-pi.taskkill-spawn", error, `pid=${pid}`));
}

/**
 * Terminates the process (tree) identified by `pid`. Never throws.
 *
 * - Windows: runs `taskkill /T /F`, then re-checks after 2s and retries once if
 *   the process still answers a signal-0 probe.
 * - Other platforms: sends SIGTERM to the process group (`-pid`), falling back to
 *   the single pid, and schedules a SIGKILL escalation after `HARD_KILL_MS`. The
 *   escalation timer is tracked in `childHardKillTimers` so it can be cancelled
 *   once the process exits.
 *
 * @param pid Target process id; non-integer or non-positive values are ignored.
 */
export function killProcessPid(pid: number): void {
	if (!Number.isInteger(pid) || pid <= 0) return;
	try {
		if (process.platform === "win32") {
			// taskkill itself can silently fail (PID gone, permission denied, etc.),
			// so verify after 2s and log a warning if the process is still alive.
			spawnTaskkill(pid);
			const verifyTimer = setTimeout(() => {
				try {
					process.kill(pid, 0); // throws when the pid cannot be signalled
					// Still alive — log and retry once.
					logInternalError("child-pi.taskkill-stuck", new Error(`process ${pid} still alive 2s after taskkill /T /F; retrying`), `pid=${pid}`);
					try { spawnTaskkill(pid); } catch { /* best-effort */ }
				} catch {
					// ESRCH: the process is gone. EPERM: it exists but we are not allowed
					// to signal it, so another taskkill would not help either.
				}
			}, 2000);
			verifyTimer.unref();
			return;
		}
		try {
			// Negative pid targets the whole process group.
			process.kill(-pid, "SIGTERM");
		} catch (error) {
			logInternalError("child-pi.sigterm", error, `pid=${pid}`);
			try {
				process.kill(pid, "SIGTERM");
			} catch (fallbackError) {
				logInternalError("child-pi.sigterm-absolute", fallbackError, `pid=${pid}`);
			}
		}
		// Replace any earlier escalation timer for this pid before arming a new one.
		clearHardKillTimer(pid);
		const hardKillTimer = setTimeout(() => {
			try {
				process.kill(-pid, "SIGKILL");
			} catch (error) {
				logInternalError("child-pi.sigkill", error, `pid=${pid}`);
				try {
					process.kill(pid, "SIGKILL");
				} catch (fallbackError) {
					logInternalError("child-pi.sigkill-absolute", fallbackError, `pid=${pid}`);
				}
			}
			childHardKillTimers.delete(pid);
		}, HARD_KILL_MS);
		hardKillTimer.unref();
		childHardKillTimers.set(pid, hardKillTimer);
	} catch (error) {
		logInternalError("child-pi.kill-process-pid", error, `pid=${pid}`);
	}
}
93
+
94
/**
 * Terminates `pid` via killProcessPid unless the given child handle shows the
 * process has already ended.
 *
 * A child that was terminated by a signal reports `exitCode === null` with
 * `signalCode` set, so both fields are checked; otherwise a finished child's pid
 * (which the OS may have reassigned) would be signalled again.
 *
 * @param pid Process id to terminate; missing or invalid values are ignored.
 * @param child Optional handle used to detect an already finished process and to
 *   cancel the SIGKILL escalation timer once the process exits.
 */
function killProcessTree(pid: number | undefined, child?: ChildProcess): void {
	if (!pid || !Number.isInteger(pid) || pid <= 0) return;
	if (child && (child.exitCode !== null || child.signalCode !== null)) return;
	killProcessPid(pid);
	child?.once("exit", () => clearHardKillTimer(pid));
}
100
+
101
/**
 * Requests termination of every child Pi process currently registered in
 * `activeChildProcesses`.
 *
 * @returns How many registered processes were handed to killProcessTree.
 */
export function terminateActiveChildPiProcesses(): number {
	// Work on a snapshot so the count reflects the registry at call time.
	const snapshot = Array.from(activeChildProcesses);
	snapshot.forEach(([pid, child]) => killProcessTree(pid, child));
	return snapshot.length;
}
106
+
107
+
108
/**
 * Structured notification emitted by child-pi at critical process transitions
 * (spawn, spawn failure, response timeout, final drain, hard kill, exit, close).
 */
export interface ChildPiLifecycleEvent {
	/** Which transition happened. */
	type:
		| "spawned"
		| "spawn_error"
		| "response_timeout"
		| "final_drain"
		| "hard_kill"
		| "exit"
		| "close";
	/** Process id of the child, when one was assigned. */
	pid?: number;
	/** Exit code reported with `exit` / `close` events. */
	exitCode?: number | null;
	/** Human-readable failure description for error-type events. */
	error?: string;
	/** ISO-8601 timestamp of when the event was emitted. */
	ts: string;
}
121
+
122
/** Everything runChildPi needs to launch and supervise one child Pi worker. */
export interface ChildPiRunInput {
	/** Working directory the child process is spawned in. */
	cwd: string;
	/** Task text handed to the worker argument builder. */
	task: string;
	/** Agent configuration the worker runs as. */
	agent: AgentConfig;
	/** Optional model forwarded to the worker argument builder. */
	model?: string;
	/** Optional skill paths forwarded to the worker argument builder. */
	skillPaths?: string[];
	/** Aborting this signal terminates the child process tree. */
	signal?: AbortSignal;
	/** When set, every persisted (compacted, redacted) line is appended to this file. */
	transcriptPath?: string;
	/** Receives each non-empty display line derived from the child's stdout. */
	onStdoutLine?: (line: string) => void;
	/** Receives each compacted JSON event parsed from the child's stdout. */
	onJsonEvent?: (event: unknown) => void;
	/** Called with the child's pid once the process has been spawned. */
	onSpawn?: (pid: number) => void;
	/** Structured lifecycle events for durable logging (spawn, crash, timeout, kill, exit). */
	onLifecycleEvent?: (event: ChildPiLifecycleEvent) => void;
	/** Maximum nesting depth, checked by the depth guard before spawning. */
	maxDepth?: number;
	/** Grace period after the final assistant event before SIGTERM; defaults to FINAL_DRAIN_MS. */
	finalDrainMs?: number;
	/** Delay between that SIGTERM and the SIGKILL escalation; defaults to HARD_KILL_MS. */
	hardKillMs?: number;
	/**
	 * Maximum silence before the child is terminated as unresponsive; defaults to
	 * RESPONSE_TIMEOUT_MS. PI_TEAMS_CHILD_RESPONSE_TIMEOUT_MS takes precedence when
	 * it parses to a non-negative integer; a value <= 0 disables the timer.
	 */
	responseTimeoutMs?: number;
}
140
+
141
/** Outcome of one runChildPi invocation. */
export interface ChildPiRunResult {
	/** Process exit code; `null` when no code is available (e.g. the spawn failed). */
	exitCode: number | null;
	/** Bounded tail of the display lines derived from the child's stdout. */
	stdout: string;
	/** Bounded tail of the child's stderr. */
	stderr: string;
	/** Failure description (spawn error or response timeout), when there is one. */
	error?: string;
	/** Structured exit details: cancellation, timeout, hard kill, cleanup errors. */
	exitStatus?: WorkerExitStatus;
}
148
+
149
/**
 * Builds the spawn options for a child Pi process.
 *
 * The environment is passed through `sanitizeEnvSecrets` so variables whose keys
 * match secret patterns are not leaked to the child, and `PI_CREW_PARENT_PID` is
 * set to this process's pid. stdin is ignored; stdout and stderr are piped.
 *
 * @param cwd Working directory for the child.
 * @param env Candidate environment (before secret filtering).
 */
export function buildChildPiSpawnOptions(cwd: string, env: NodeJS.ProcessEnv): SpawnOptions {
	const onWindows = process.platform === "win32";
	const childEnv = { ...sanitizeEnvSecrets(env), PI_CREW_PARENT_PID: String(process.pid) };
	const options: SpawnOptions = {
		cwd,
		env: childEnv,
		stdio: ["ignore", "pipe", "pipe"],
		// Detached everywhere except Windows; killProcessPid signals `-pid` there.
		detached: !onWindows,
		windowsHide: true,
	};
	return options;
}
160
+
161
/**
 * Appends one redacted line to the run transcript, creating the parent
 * directory on demand. Does nothing when no `transcriptPath` is configured.
 *
 * Transcript writing is best-effort: this runs inside the child's stdout
 * handler, where an uncaught filesystem error (disk full, permissions) would
 * otherwise escape as an uncaught exception. Failures are logged instead.
 */
function appendTranscript(input: ChildPiRunInput, line: string): void {
	const target = input.transcriptPath;
	if (!target) return;
	try {
		fs.mkdirSync(path.dirname(target), { recursive: true });
		fs.appendFileSync(target, `${redactJsonLine(line)}\n`, "utf-8");
	} catch (error) {
		logInternalError("child-pi.append-transcript", error, `path=${target}`);
	}
}
166
+
167
/**
 * Caps `value` at `maxChars` characters. When text is cut, a trailing marker
 * line states how many characters were removed.
 */
function compactString(value: string, maxChars = MAX_COMPACT_CONTENT_CHARS): string {
	const overflow = value.length - maxChars;
	if (overflow <= 0) return value;
	const kept = value.slice(0, maxChars);
	return `${kept}\n[pi-crew compacted ${overflow} chars]`;
}
171
+
172
/**
 * Recursively shrinks an arbitrary JSON-like value: strings are capped via
 * compactString, arrays and objects keep only their first 20 entries, and
 * every retained entry is compacted in turn. Other values pass through unchanged.
 */
function compactValue(value: unknown): unknown {
	const maxEntries = 20;
	if (typeof value === "string") return compactString(value);
	if (Array.isArray(value)) return value.slice(0, maxEntries).map(compactValue);
	const record = asRecord(value);
	if (!record) return value;
	return Object.entries(record)
		.slice(0, maxEntries)
		.reduce<Record<string, unknown>>((compacted, [key, entry]) => {
			compacted[key] = compactValue(entry);
			return compacted;
		}, {});
}
181
+
182
/**
 * Produces the compact form of a single message content part.
 * Only `text`, `toolCall` and `toolResult` parts are kept, each with its own
 * size cap; any other part (or a non-object) yields `undefined`.
 */
function compactContentPart(part: unknown): unknown | undefined {
	const record = asRecord(part);
	if (!record) return undefined;
	switch (record.type) {
		case "text": {
			const text = typeof record.text === "string" ? compactString(record.text, MAX_ASSISTANT_TEXT_CHARS) : "";
			return { type: "text", text };
		}
		case "toolCall": {
			const rawInput = typeof record.input === "string" ? compactString(record.input, MAX_TOOL_INPUT_CHARS) : record.input;
			return { type: "toolCall", name: record.name, input: compactValue(rawInput) };
		}
		case "toolResult": {
			const rawContent = typeof record.content === "string" ? compactString(record.content, MAX_TOOL_RESULT_CHARS) : record.content;
			return { type: "toolResult", name: record.name, content: compactValue(rawContent) };
		}
		default:
			return undefined;
	}
}
190
+
191
/**
 * Reduces a raw child Pi JSON event to the fields that are kept.
 *
 * - `message_update` events and user/system messages are dropped (`undefined`).
 * - Tool execution start/end events keep only the tool name and args.
 * - `message`, `message_end` and `tool_result_end` keep a compacted message plus
 *   usage/model/provider/stopReason metadata.
 * - Any other typed event collapses to `{ type }`; untyped input is dropped.
 */
function compactChildPiEvent(event: unknown): unknown | undefined {
	const record = asRecord(event);
	if (!record) return undefined;
	const kind = record.type;
	if (kind === "message_update") return undefined;
	if (kind === "tool_execution_start" || kind === "tool_execution_end") {
		return { type: kind, toolName: record.toolName, args: record.args };
	}
	const isMessageLike = kind === "tool_result_end" || kind === "message_end" || kind === "message";
	if (!isMessageLike) return kind ? { type: kind } : undefined;

	const message = asRecord(record.message);
	if (message?.role === "user" || message?.role === "system") return undefined;
	const content = Array.isArray(message?.content) ? message.content.map(compactContentPart).filter((part) => part !== undefined) : undefined;

	// Properties are added in a fixed order so the serialized line stays stable.
	const compact: Record<string, unknown> = { type: kind };
	if (typeof record.text === "string") compact.text = record.text;
	if (message) {
		compact.message = {
			role: message.role,
			...(content ? { content } : {}),
			usage: message.usage,
			model: message.model,
			errorMessage: message.errorMessage,
			stopReason: message.stopReason,
		};
	}
	compact.usage = record.usage;
	compact.model = record.model;
	compact.provider = record.provider;
	compact.stopReason = record.stopReason;
	return compact;
}
214
+
215
/**
 * Derives the human-readable line for a compacted event, if it has one.
 *
 * Tool starts render as `tool: <name>` (or "tool started"). Assistant
 * `message` / `message_end` events render as their text parts joined by
 * newlines, falling back to the event's own `text` field. Everything else
 * yields `undefined`.
 */
function displayTextFromCompactEvent(event: unknown): string | undefined {
	const record = asRecord(event);
	if (!record) return undefined;
	switch (record.type) {
		case "tool_execution_start":
			return typeof record.toolName === "string" ? `tool: ${record.toolName}` : "tool started";
		case "message":
		case "message_end":
			break;
		default:
			return undefined;
	}

	const message = asRecord(record.message);
	if (message?.role !== undefined && message.role !== "assistant") return undefined;

	const parts = Array.isArray(message?.content) ? message.content : [];
	const texts: string[] = [];
	for (const part of parts) {
		const item = asRecord(part);
		if (item?.type === "text" && typeof item.text === "string") texts.push(item.text);
	}
	const joined = texts.join("\n").trim();
	if (joined) return joined;
	return typeof record.text === "string" ? record.text : undefined;
}
231
+
232
/**
 * Classifies one stdout line from the child and prepares its compact forms.
 *
 * A line that parses to a JSON object is treated as an event: `event` is the
 * compacted event (or `undefined` when it is deliberately dropped),
 * `persistedLine` its serialized form ("" when dropped) and `displayLine` its
 * human-readable text, if any.
 *
 * Anything else is plain text and is persisted and displayed verbatim. That
 * includes lines that merely happen to be valid JSON scalars or arrays (e.g.
 * "42", "true", "[]"): they are ordinary program output, not events, and must
 * not be discarded.
 */
function compactChildPiLine(line: string): { persistedLine: string; event?: unknown; displayLine?: string; json: boolean } {
	try {
		const parsed: unknown = JSON.parse(line);
		if (parsed === null || typeof parsed !== "object" || Array.isArray(parsed)) {
			return { json: false, persistedLine: line, displayLine: line };
		}
		const compact = compactChildPiEvent(parsed);
		return { json: true, event: compact, persistedLine: compact ? JSON.stringify(compact) : "", displayLine: displayTextFromCompactEvent(compact) };
	} catch {
		// Not JSON at all: pass the raw line through.
		return { json: false, persistedLine: line, displayLine: line };
	}
}
241
+
242
/**
 * Splits a stream of stdout text into lines and dispatches each non-blank line:
 * compacted JSON events go to `onJsonEvent`, persisted lines to the transcript,
 * and display text to `onStdoutLine`. Exceptions thrown by either callback are
 * logged and do not interrupt processing.
 */
export class ChildPiLineObserver {
	/** Text received after the last line break, waiting for its terminator. */
	private buffer = "";
	private readonly input: ChildPiRunInput;

	constructor(input: ChildPiRunInput) {
		this.input = input;
	}

	/** Accepts the next chunk of text and emits every line it completes. */
	observe(text: string): void {
		const segments = (this.buffer + text).split(/\r?\n/);
		// The last segment has no terminator yet; keep it for the next chunk.
		this.buffer = segments.pop() ?? "";
		segments.forEach((segment) => this.emitLine(segment));
	}

	/** Emits the buffered remainder as a final line (call when the stream ends). */
	flush(): void {
		const pending = this.buffer;
		if (!pending) return;
		this.buffer = "";
		this.emitLine(pending);
	}

	/** Processes a single complete line; blank lines are ignored. */
	private emitLine(line: string): void {
		if (!line.trim()) return;
		const { event, persistedLine, displayLine } = compactChildPiLine(line);

		if (event !== undefined) {
			try {
				this.input.onJsonEvent?.(event);
			} catch (error) {
				logInternalError("child-pi.on-json-event", error, `line=${persistedLine ?? displayLine ?? ""}`);
			}
		}

		if (persistedLine) appendTranscript(this.input, persistedLine);

		if (!displayLine?.trim()) return;
		try {
			this.input.onStdoutLine?.(displayLine);
		} catch (error) {
			logInternalError("child-pi.on-stdout-line", error, `line=${displayLine}`);
		}
	}
}
284
+
285
/**
 * Runs a complete stdout payload through a throwaway line observer.
 * Mock-only path; the real code path reuses a single observer for the whole
 * child process.
 */
function observeStdoutChunk(input: ChildPiRunInput, text: string): void {
	const oneShot = new ChildPiLineObserver(input);
	oneShot.observe(text);
	// Emit whatever trailing text was not newline-terminated.
	oneShot.flush();
}
291
+
292
/**
 * Narrows an unknown value to a plain key/value record.
 * Returns `undefined` for primitives, `null` and arrays.
 */
function asRecord(value: unknown): Record<string, unknown> | undefined {
	if (value === null || typeof value !== "object") return undefined;
	if (Array.isArray(value)) return undefined;
	return value as Record<string, unknown>;
}
295
+
296
/**
 * Reports whether `event` is a `message_end` that completes the assistant's answer.
 *
 * The event qualifies when its role (if present) is "assistant", its stop reason
 * (read from the message first, then from the event) is absent or "stop", and
 * none of its content parts is a tool call.
 */
function isFinalAssistantEvent(event: unknown): boolean {
	const envelope = asRecord(event);
	if (!envelope || envelope.type !== "message_end") return false;

	const message = asRecord(envelope.message);
	const role = message?.role;
	if (role !== undefined && role !== "assistant") return false;

	let stopReason: string | undefined;
	if (typeof message?.stopReason === "string") stopReason = message.stopReason;
	else if (typeof envelope.stopReason === "string") stopReason = envelope.stopReason;
	if (stopReason !== undefined && stopReason !== "stop") return false;

	const parts = Array.isArray(message?.content) ? message.content : [];
	for (const part of parts) {
		// A pending tool call means the assistant turn is not finished yet.
		if (asRecord(part)?.type === "toolCall") return false;
	}
	return true;
}
307
+
308
/** Produces the canned result for a PI_TEAMS_MOCK_CHILD_PI mode; no process is spawned. */
function runMockChildPi(input: ChildPiRunInput, mock: string): ChildPiRunResult {
	if (mock === "success") {
		const stdout = `Mock child Pi success for ${input.agent.name}\n`;
		observeStdoutChunk(input, stdout);
		return { exitCode: 0, stdout, stderr: "" };
	}
	if (mock === "json-success" || mock === "adaptive-plan") {
		let text = `Mock JSON success for ${input.agent.name}`;
		if (mock === "adaptive-plan" && input.task.includes("ADAPTIVE_PLAN_JSON_START")) {
			const plan = {
				phases: [
					{ name: "research", tasks: [{ role: "explorer", task: "Explore adaptive target" }, { role: "analyst", task: "Analyze adaptive target" }, { role: "planner", task: "Plan adaptive target" }] },
					{ name: "build", tasks: [{ role: "executor", task: "Implement adaptive target" }] },
					{ name: "check", tasks: [{ role: "reviewer", task: "Review adaptive target" }, { role: "test-engineer", task: "Test adaptive target" }, { role: "writer", task: "Summarize adaptive target" }] },
				],
			};
			text = `Adaptive mock plan\nADAPTIVE_PLAN_JSON_START\n${JSON.stringify(plan)}\nADAPTIVE_PLAN_JSON_END`;
		}
		const messageLine = JSON.stringify({ type: "message", message: { role: "assistant", content: [{ type: "text", text }] } });
		const endLine = JSON.stringify({ type: "message_end", usage: { input: 10, output: 5, cost: 0.001, turns: 1 } });
		const stdout = `${messageLine}\n${endLine}\n`;
		observeStdoutChunk(input, stdout);
		return { exitCode: 0, stdout, stderr: "" };
	}
	if (mock === "retryable-failure") return { exitCode: 1, stdout: "", stderr: "rate limit: mock failure" };
	return { exitCode: 1, stdout: "", stderr: `mock failure: ${mock}` };
}

/**
 * Spawns a child Pi worker for `input.task` and resolves once it has finished.
 *
 * The promise never rejects for process-level failures: spawn errors, response
 * timeouts and cancellations are reported through the returned result
 * (`exitCode`, `error`, `exitStatus`) and through `onLifecycleEvent`.
 *
 * Supervision performed here:
 * - depth guard: returns exit code 1 without spawning when `checkCrewDepth` blocks;
 * - mock modes: `PI_TEAMS_MOCK_CHILD_PI` short-circuits to canned results;
 * - no-response timer: terminates the child after `responseTimeoutMs` of silence
 *   (`PI_TEAMS_CHILD_RESPONSE_TIMEOUT_MS` overrides the input; `<= 0` disables);
 * - final drain: after a final assistant event the child gets `finalDrainMs` to exit,
 *   then SIGTERM, then SIGKILL after `hardKillMs`; a forced drain still reports exit code 0;
 * - abort: `input.signal` terminates the process tree and escalates to SIGKILL
 *   after 200ms, including when the signal was already aborted before the call;
 * - backpressure: stdout is paused for 50ms after every 256 KiB received.
 *
 * @param input Run configuration and observer callbacks.
 * @returns Captured (bounded) stdout/stderr, the exit code and structured exit status.
 */
export async function runChildPi(input: ChildPiRunInput): Promise<ChildPiRunResult> {
	const depth = checkCrewDepth(input.maxDepth);
	if (depth.blocked) return { exitCode: 1, stdout: "", stderr: `pi-crew depth guard blocked child worker: depth ${depth.depth} >= max ${depth.maxDepth}` };
	const mock = process.env.PI_TEAMS_MOCK_CHILD_PI;
	if (mock) return runMockChildPi(input, mock);

	const built = buildPiWorkerArgs({ task: input.task, agent: input.agent, model: input.model, sessionEnabled: false, maxDepth: input.maxDepth, skillPaths: input.skillPaths });
	const spawnSpec = getPiSpawnCommand(built.args);

	// Lifecycle callbacks run inside timers and process event handlers; an exception
	// there would be uncaught (or would skip settle()), so it is logged instead.
	const emitLifecycle = (event: Omit<ChildPiLifecycleEvent, "ts">): void => {
		if (!input.onLifecycleEvent) return;
		try {
			input.onLifecycleEvent({ ...event, ts: new Date().toISOString() });
		} catch (error) {
			logInternalError("child-pi.on-lifecycle-event", error, `type=${event.type}`);
		}
	};

	try {
		return await new Promise<ChildPiRunResult>((resolve) => {
			const child = spawn(spawnSpec.command, spawnSpec.args, buildChildPiSpawnOptions(input.cwd, { ...process.env, ...built.env }));
			if (child.pid) {
				activeChildProcesses.set(child.pid, child);
				input.onSpawn?.(child.pid);
				emitLifecycle({ type: "spawned", pid: child.pid });
			} else {
				emitLifecycle({ type: "spawn_error", error: "spawn returned no pid" });
			}
			let stdout = "";
			let stderr = "";
			let settled = false;
			let childExited = false;
			let postExitGuardCleanup: (() => void) | undefined;
			let finalDrainTimer: NodeJS.Timeout | undefined;
			let hardKillTimer: NodeJS.Timeout | undefined;
			let noResponseTimer: NodeJS.Timeout | undefined;
			const finalDrainMs = input.finalDrainMs ?? FINAL_DRAIN_MS;
			const hardKillMs = input.hardKillMs ?? HARD_KILL_MS;
			const responseTimeoutEnv = Number.parseInt(process.env.PI_TEAMS_CHILD_RESPONSE_TIMEOUT_MS ?? "", 10);
			const responseTimeoutMs = Number.isFinite(responseTimeoutEnv) && responseTimeoutEnv >= 0 ? responseTimeoutEnv : input.responseTimeoutMs ?? RESPONSE_TIMEOUT_MS;
			let responseTimeoutHit = false;
			let forcedFinalDrain = false;
			let abortRequested = input.signal?.aborted === true;
			let hardKilled = false;
			const cleanupErrors: string[] = [];
			// Streaming decoders keep multi-byte UTF-8 sequences intact when a character
			// is split across two pipe chunks.
			const stdoutDecoder = new TextDecoder("utf-8");
			const stderrDecoder = new TextDecoder("utf-8");

			const restartNoResponseTimer = (): void => {
				if (responseTimeoutMs <= 0) return;
				// The final flush in settle() also reports lines; it must not re-arm
				// a timer that would fire against an already finished child.
				if (settled) return;
				if (noResponseTimer) clearTimeout(noResponseTimer);
				noResponseTimer = setTimeout(() => {
					if (settled || childExited) return;
					responseTimeoutHit = true;
					emitLifecycle({ type: "response_timeout", pid: child.pid, error: `No output for ${responseTimeoutMs}ms` });
					killProcessTree(child.pid, child);
					try {
						child.kill(process.platform === "win32" ? undefined : "SIGTERM");
					} catch (error) {
						logInternalError("child-pi.response-timeout-term", error, `pid=${child.pid}`);
					}
				}, responseTimeoutMs);
				noResponseTimer.unref();
			};
			const clearNoResponseTimer = (): void => {
				if (noResponseTimer) clearTimeout(noResponseTimer);
				noResponseTimer = undefined;
			};
			restartNoResponseTimer();

			const lineObserver = new ChildPiLineObserver({
				...input,
				onStdoutLine: (line) => {
					restartNoResponseTimer();
					stdout = appendBoundedTail(stdout, `${line}\n`);
					input.onStdoutLine?.(line);
				},
				onJsonEvent: (event) => {
					restartNoResponseTimer();
					input.onJsonEvent?.(event);
					if (!isFinalAssistantEvent(event) || childExited || settled || finalDrainTimer) return;
					// The answer is complete: give the child finalDrainMs to exit on its own,
					// then escalate SIGTERM -> SIGKILL.
					finalDrainTimer = setTimeout(() => {
						if (settled || childExited) return;
						forcedFinalDrain = true;
						emitLifecycle({ type: "final_drain", pid: child.pid });
						try {
							child.kill(process.platform === "win32" ? undefined : "SIGTERM");
						} catch (error) {
							logInternalError("child-pi.final-drain-term", error, `pid=${child.pid}`);
						}
						hardKillTimer = setTimeout(() => {
							if (settled || childExited) return;
							try {
								hardKilled = true;
								emitLifecycle({ type: "hard_kill", pid: child.pid });
								child.kill(process.platform === "win32" ? undefined : "SIGKILL");
							} catch (error) {
								logInternalError("child-pi.final-drain-kill", error, `pid=${child.pid}`);
							}
						}, hardKillMs);
						hardKillTimer.unref();
					}, finalDrainMs);
					finalDrainTimer.unref();
				},
			});

			const clearFinalDrainTimers = (): void => {
				if (finalDrainTimer) clearTimeout(finalDrainTimer);
				if (hardKillTimer) clearTimeout(hardKillTimer);
				finalDrainTimer = undefined;
				hardKillTimer = undefined;
			};
			const clearPostExitGuard = (): void => {
				if (postExitGuardCleanup) {
					postExitGuardCleanup();
					postExitGuardCleanup = undefined;
				}
			};

			// Resolves the promise exactly once. stdout/stderr are read only after the
			// decoders and the line observer have been drained, so a trailing line
			// without a newline is part of the returned stdout.
			const settle = (outcome: { exitCode: number | null; error?: string }): void => {
				if (settled) return;
				settled = true;
				const stdoutRest = stdoutDecoder.decode();
				if (stdoutRest) lineObserver.observe(stdoutRest);
				lineObserver.flush();
				const stderrRest = stderrDecoder.decode();
				if (stderrRest) stderr = appendBoundedTail(stderr, stderrRest);
				clearNoResponseTimer();
				clearFinalDrainTimers();
				clearPostExitGuard();
				input.signal?.removeEventListener("abort", abort);
				try {
					cleanupTempDir(built.tempDir);
				} catch (error) {
					cleanupErrors.push(error instanceof Error ? error.message : String(error));
				}
				resolve({
					exitCode: outcome.exitCode,
					stdout,
					stderr,
					...(outcome.error !== undefined ? { error: outcome.error } : {}),
					exitStatus: { exitCode: outcome.exitCode, cancelled: abortRequested, timedOut: responseTimeoutHit, killed: hardKilled, cleanupErrors, finalDrainMs },
				});
			};

			const abort = (): void => {
				abortRequested = true;
				killProcessTree(child.pid, child);
				if (process.platform !== "win32") {
					trySignalChild(child, "SIGTERM");
				}
				try {
					child.kill(process.platform === "win32" ? undefined : "SIGTERM");
				} catch {
					// Ignore kill races.
				}
				// Fast-escalate to SIGKILL within 200ms on explicit cancel so a
				// user-initiated cancel completes quickly. The finalDrainMs / HARD_KILL_MS
				// paths are for graceful drain, not for cancellation.
				const cancelHardKill = setTimeout(() => {
					if (settled || childExited) return;
					try {
						hardKilled = true;
						emitLifecycle({ type: "hard_kill", pid: child.pid });
						child.kill(process.platform === "win32" ? undefined : "SIGKILL");
					} catch (error) {
						logInternalError("child-pi.cancel-fast-kill", error, `pid=${child.pid}`);
					}
				}, 200);
				cancelHardKill.unref();
			};

			// Soft watermark backpressure: once 256 KiB of stdout has been received
			// since the last release, pause the stream for 50ms so the line observer
			// and other handlers get a chance to drain. Prevents a chatty child from
			// saturating the parent event loop.
			const BACKPRESSURE_HIGH = 256 * 1024;
			let backpressureBytes = 0;
			const releaseBackpressure = (): void => {
				backpressureBytes = 0;
				try { child.stdout?.resume(); } catch { /* ignore */ }
			};
			child.stdout?.on("data", (chunk: Buffer) => {
				restartNoResponseTimer();
				// Count raw bytes; the decoded string length undercounts multi-byte text.
				backpressureBytes += chunk.length;
				lineObserver.observe(stdoutDecoder.decode(chunk, { stream: true }));
				if (backpressureBytes > BACKPRESSURE_HIGH && child.stdout && !child.stdout.isPaused()) {
					try { child.stdout.pause(); } catch { /* ignore */ }
					const timer = setTimeout(releaseBackpressure, 50);
					timer.unref();
				}
			});
			child.stderr?.on("data", (chunk: Buffer) => {
				restartNoResponseTimer();
				stderr = appendBoundedTail(stderr, stderrDecoder.decode(chunk, { stream: true }));
			});
			child.on("error", (error) => {
				emitLifecycle({ type: "spawn_error", pid: child.pid, error: error.message });
				settle({ exitCode: null, error: error.message });
			});
			child.on("exit", (code) => {
				if (child.pid) {
					activeChildProcesses.delete(child.pid);
					clearHardKillTimer(child.pid);
				}
				emitLifecycle({ type: "exit", pid: child.pid, exitCode: code });
				childExited = true;
				clearNoResponseTimer();
				clearFinalDrainTimers();
				if (!postExitGuardCleanup) {
					postExitGuardCleanup = attachPostExitStdioGuard(child, {
						idleMs: POST_EXIT_STDIO_GUARD_MS,
						hardMs: HARD_KILL_MS,
					});
				}
			});
			child.on("close", (exitCode) => {
				if (child.pid) {
					activeChildProcesses.delete(child.pid);
					clearHardKillTimer(child.pid);
				}
				emitLifecycle({ type: "close", pid: child.pid, exitCode });
				const timeoutError = responseTimeoutHit && !stderr.trim() ? `Child Pi produced no new output for ${responseTimeoutMs}ms; process was terminated as unresponsive.` : undefined;
				// A final assistant event is the child Pi contract for "the worker produced its answer".
				// Some Pi processes can linger during post-final cleanup/stdio shutdown; finalDrain terminates
				// that lingering process so the parent can continue, but it must not turn a completed
				// subagent answer into a failed task. Real pre-final response timeouts still report errors.
				const finalExitCode = forcedFinalDrain && timeoutError === undefined ? 0 : exitCode;
				settle({ exitCode: finalExitCode, ...(timeoutError !== undefined ? { error: timeoutError } : {}) });
			});

			// An AbortSignal that is already aborted never dispatches "abort" again,
			// so terminate immediately instead of waiting for an event that cannot come.
			if (input.signal?.aborted) abort();
			else input.signal?.addEventListener("abort", abort, { once: true });
		});
	} finally {
		// cleanupTempDir is already called inside settle(), but guard against
		// the case where settle() was never reached (spawn throws synchronously).
		if (built.tempDir && fs.existsSync(built.tempDir)) {
			cleanupTempDir(built.tempDir);
		}
	}
}