pi-crew 0.1.49 → 0.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (249) hide show
  1. package/CHANGELOG.md +74 -1
  2. package/README.md +176 -781
  3. package/agents/analyst.md +11 -11
  4. package/agents/critic.md +11 -11
  5. package/agents/executor.md +11 -11
  6. package/agents/explorer.md +11 -11
  7. package/agents/planner.md +11 -11
  8. package/agents/reviewer.md +11 -11
  9. package/agents/security-reviewer.md +11 -11
  10. package/agents/test-engineer.md +11 -11
  11. package/agents/verifier.md +70 -11
  12. package/agents/writer.md +11 -11
  13. package/docs/actions-reference.md +595 -0
  14. package/docs/commands-reference.md +347 -0
  15. package/docs/runtime-flow.md +148 -148
  16. package/index.ts +6 -6
  17. package/package.json +99 -99
  18. package/skills/async-worker-recovery/SKILL.md +42 -42
  19. package/skills/context-artifact-hygiene/SKILL.md +52 -52
  20. package/skills/delegation-patterns/SKILL.md +54 -54
  21. package/skills/mailbox-interactive/SKILL.md +40 -40
  22. package/skills/model-routing-context/SKILL.md +39 -39
  23. package/skills/multi-perspective-review/SKILL.md +58 -58
  24. package/skills/observability-reliability/SKILL.md +41 -41
  25. package/skills/orchestration/SKILL.md +157 -157
  26. package/skills/ownership-session-security/SKILL.md +41 -41
  27. package/skills/pi-extension-lifecycle/SKILL.md +39 -39
  28. package/skills/requirements-to-task-packet/SKILL.md +63 -63
  29. package/skills/resource-discovery-config/SKILL.md +41 -41
  30. package/skills/runtime-state-reader/SKILL.md +44 -44
  31. package/skills/secure-agent-orchestration-review/SKILL.md +45 -45
  32. package/skills/state-mutation-locking/SKILL.md +42 -42
  33. package/skills/systematic-debugging/SKILL.md +67 -67
  34. package/skills/ui-render-performance/SKILL.md +39 -39
  35. package/skills/verification-before-done/SKILL.md +57 -57
  36. package/skills/worktree-isolation/SKILL.md +39 -39
  37. package/src/adapters/claude-adapter.ts +25 -0
  38. package/src/adapters/codex-adapter.ts +21 -0
  39. package/src/adapters/cursor-adapter.ts +17 -0
  40. package/src/adapters/export-util.ts +137 -0
  41. package/src/adapters/index.ts +15 -0
  42. package/src/adapters/registry.ts +18 -0
  43. package/src/adapters/types.ts +23 -0
  44. package/src/agents/agent-config.ts +2 -0
  45. package/src/agents/agent-search.ts +98 -98
  46. package/src/agents/discover-agents.ts +2 -1
  47. package/src/config/config.ts +14 -1
  48. package/src/config/defaults.ts +5 -5
  49. package/src/config/drift-detector.ts +211 -0
  50. package/src/config/markers.ts +327 -0
  51. package/src/config/resilient-parser.ts +108 -0
  52. package/src/config/suggestions.ts +74 -0
  53. package/src/extension/cross-extension-rpc.ts +103 -82
  54. package/src/extension/project-init.ts +36 -4
  55. package/src/extension/register.ts +67 -22
  56. package/src/extension/registration/commands.ts +77 -8
  57. package/src/extension/registration/subagent-tools.ts +10 -1
  58. package/src/extension/registration/team-tool.ts +10 -1
  59. package/src/extension/registration/viewers.ts +48 -34
  60. package/src/extension/run-bundle-schema.ts +89 -89
  61. package/src/extension/run-export.ts +26 -12
  62. package/src/extension/run-import.ts +25 -1
  63. package/src/extension/run-index.ts +5 -1
  64. package/src/extension/run-maintenance.ts +142 -68
  65. package/src/extension/team-manager-command.ts +10 -1
  66. package/src/extension/team-tool/context.ts +1 -1
  67. package/src/extension/team-tool/doctor.ts +28 -3
  68. package/src/extension/team-tool/handle-settings.ts +195 -188
  69. package/src/extension/team-tool/inspect.ts +41 -41
  70. package/src/extension/team-tool/intent-policy.ts +42 -42
  71. package/src/extension/team-tool/lifecycle-actions.ts +27 -8
  72. package/src/extension/team-tool/plan.ts +19 -19
  73. package/src/extension/team-tool/run.ts +12 -1
  74. package/src/extension/team-tool.ts +14 -3
  75. package/src/i18n.ts +184 -184
  76. package/src/observability/exporters/otlp-exporter.ts +92 -77
  77. package/src/prompt/prompt-runtime.ts +72 -72
  78. package/src/runtime/agent-memory.ts +72 -72
  79. package/src/runtime/agent-observability.ts +114 -114
  80. package/src/runtime/async-marker.ts +26 -26
  81. package/src/runtime/attention-events.ts +28 -28
  82. package/src/runtime/auto-resume.ts +100 -0
  83. package/src/runtime/background-runner.ts +11 -1
  84. package/src/runtime/cancellation-token.ts +89 -89
  85. package/src/runtime/cancellation.ts +61 -61
  86. package/src/runtime/capability-inventory.ts +116 -116
  87. package/src/runtime/child-pi.ts +7 -2
  88. package/src/runtime/compaction-summary.ts +271 -0
  89. package/src/runtime/completion-guard.ts +190 -190
  90. package/src/runtime/concurrency.ts +3 -1
  91. package/src/runtime/crash-recovery.ts +33 -0
  92. package/src/runtime/delta-conflict.ts +360 -0
  93. package/src/runtime/diagnostic-export.ts +3 -1
  94. package/src/runtime/direct-run.ts +35 -35
  95. package/src/runtime/event-stream-bridge.ts +3 -1
  96. package/src/runtime/foreground-control.ts +82 -82
  97. package/src/runtime/green-contract.ts +46 -46
  98. package/src/runtime/group-join.ts +106 -106
  99. package/src/runtime/heartbeat-gradient.ts +28 -28
  100. package/src/runtime/heartbeat-watcher.ts +124 -124
  101. package/src/runtime/iteration-hooks.ts +262 -0
  102. package/src/runtime/live-agent-control.ts +88 -88
  103. package/src/runtime/live-control-realtime.ts +36 -36
  104. package/src/runtime/live-extension-bridge.ts +150 -150
  105. package/src/runtime/live-irc.ts +92 -92
  106. package/src/runtime/live-session-health.ts +100 -100
  107. package/src/runtime/loop-gates.ts +129 -0
  108. package/src/runtime/metric-parser.ts +40 -0
  109. package/src/runtime/notebook-helpers.ts +90 -90
  110. package/src/runtime/orphan-sentinel.ts +7 -7
  111. package/src/runtime/parallel-research.ts +44 -44
  112. package/src/runtime/phase-progress.ts +217 -0
  113. package/src/runtime/pi-args.ts +38 -2
  114. package/src/runtime/pi-json-output.ts +111 -111
  115. package/src/runtime/pi-spawn.ts +74 -6
  116. package/src/runtime/policy-engine.ts +79 -79
  117. package/src/runtime/post-checks.ts +122 -0
  118. package/src/runtime/process-status.ts +14 -1
  119. package/src/runtime/progress-event-coalescer.ts +43 -43
  120. package/src/runtime/prose-compressor.ts +164 -164
  121. package/src/runtime/recovery-recipes.ts +74 -74
  122. package/src/runtime/result-extractor.ts +121 -121
  123. package/src/runtime/role-permission.ts +39 -39
  124. package/src/runtime/sensitive-paths.ts +3 -3
  125. package/src/runtime/session-resources.ts +25 -25
  126. package/src/runtime/session-snapshot.ts +59 -59
  127. package/src/runtime/session-usage.ts +79 -79
  128. package/src/runtime/sidechain-output.ts +29 -29
  129. package/src/runtime/stream-preview.ts +177 -177
  130. package/src/runtime/supervisor-contact.ts +59 -59
  131. package/src/runtime/task-display.ts +38 -38
  132. package/src/runtime/task-graph.ts +207 -0
  133. package/src/runtime/task-quality.ts +207 -0
  134. package/src/runtime/task-runner/capabilities.ts +78 -78
  135. package/src/runtime/task-runner/live-executor.ts +7 -1
  136. package/src/runtime/task-runner/progress.ts +119 -119
  137. package/src/runtime/task-runner/prompt-builder.ts +1 -1
  138. package/src/runtime/task-runner/prompt-pipeline.ts +64 -64
  139. package/src/runtime/task-runner/result-utils.ts +14 -14
  140. package/src/runtime/task-runner/run-projection.ts +103 -103
  141. package/src/runtime/task-runner/state-helpers.ts +22 -22
  142. package/src/runtime/team-runner.ts +126 -7
  143. package/src/runtime/worker-heartbeat.ts +21 -21
  144. package/src/runtime/worker-startup.ts +57 -57
  145. package/src/runtime/workflow-state.ts +187 -0
  146. package/src/runtime/workspace-tree.ts +298 -298
  147. package/src/schema/config-schema.ts +12 -0
  148. package/src/schema/validation-types.ts +148 -0
  149. package/src/skills/skill-templates.ts +374 -0
  150. package/src/state/active-run-registry.ts +35 -11
  151. package/src/state/atomic-write.ts +33 -26
  152. package/src/state/contracts.ts +1 -0
  153. package/src/state/event-reconstructor.ts +217 -0
  154. package/src/state/locks.ts +2 -11
  155. package/src/state/mailbox.ts +4 -3
  156. package/src/state/state-store.ts +32 -14
  157. package/src/state/task-claims.ts +44 -44
  158. package/src/state/types.ts +9 -0
  159. package/src/state/usage.ts +29 -29
  160. package/src/subagents/async-entry.ts +1 -1
  161. package/src/subagents/index.ts +3 -3
  162. package/src/subagents/live/control.ts +1 -1
  163. package/src/subagents/live/manager.ts +1 -1
  164. package/src/subagents/live/realtime.ts +1 -1
  165. package/src/subagents/live/session-runtime.ts +1 -1
  166. package/src/subagents/manager.ts +1 -1
  167. package/src/subagents/spawn.ts +1 -1
  168. package/src/teams/team-serializer.ts +38 -38
  169. package/src/types/diff.d.ts +18 -18
  170. package/src/ui/crew-footer.ts +101 -101
  171. package/src/ui/crew-select-list.ts +111 -111
  172. package/src/ui/crew-widget.ts +9 -4
  173. package/src/ui/dashboard-panes/cancellation-pane.ts +42 -42
  174. package/src/ui/dashboard-panes/capability-pane.ts +59 -59
  175. package/src/ui/dashboard-panes/mailbox-pane.ts +35 -35
  176. package/src/ui/dashboard-panes/metrics-pane.ts +34 -34
  177. package/src/ui/dashboard-panes/progress-pane.ts +11 -0
  178. package/src/ui/dynamic-border.ts +25 -25
  179. package/src/ui/layout-primitives.ts +106 -106
  180. package/src/ui/loaders.ts +158 -158
  181. package/src/ui/powerbar-publisher.ts +6 -0
  182. package/src/ui/render-coalescer.ts +51 -51
  183. package/src/ui/render-diff.ts +119 -119
  184. package/src/ui/render-scheduler.ts +143 -143
  185. package/src/ui/run-action-dispatcher.ts +10 -1
  186. package/src/ui/spinner.ts +17 -17
  187. package/src/ui/status-colors.ts +58 -58
  188. package/src/ui/syntax-highlight.ts +116 -116
  189. package/src/ui/transcript-entries.ts +258 -258
  190. package/src/utils/completion-dedupe.ts +63 -63
  191. package/src/utils/frontmatter.ts +68 -68
  192. package/src/utils/git.ts +262 -262
  193. package/src/utils/ids.ts +17 -17
  194. package/src/utils/incremental-reader.ts +104 -104
  195. package/src/utils/names.ts +27 -27
  196. package/src/utils/redaction.ts +44 -44
  197. package/src/utils/safe-paths.ts +47 -47
  198. package/src/utils/scan-cache.ts +136 -136
  199. package/src/utils/sleep.ts +40 -26
  200. package/src/utils/task-name-generator.ts +337 -337
  201. package/src/workflows/validate-workflow.ts +40 -40
  202. package/src/worktree/branch-freshness.ts +45 -45
  203. package/src/worktree/worktree-manager.ts +11 -3
  204. package/teams/default.team.md +12 -12
  205. package/teams/fast-fix.team.md +11 -11
  206. package/teams/implementation.team.md +18 -18
  207. package/teams/parallel-research.team.md +14 -14
  208. package/teams/research.team.md +11 -11
  209. package/teams/review.team.md +12 -12
  210. package/workflows/default.workflow.md +30 -29
  211. package/workflows/fast-fix.workflow.md +23 -22
  212. package/workflows/implementation.workflow.md +43 -38
  213. package/workflows/parallel-research.workflow.md +46 -46
  214. package/workflows/research.workflow.md +22 -22
  215. package/workflows/review.workflow.md +30 -30
  216. package/docs/refactor-tasks-phase3.md +0 -394
  217. package/docs/refactor-tasks-phase4.md +0 -564
  218. package/docs/refactor-tasks-phase5.md +0 -402
  219. package/docs/refactor-tasks-phase6.md +0 -662
  220. package/docs/refactor-tasks.md +0 -1484
  221. package/docs/research/AGENT-EXECUTION-ARCHITECTURE.md +0 -261
  222. package/docs/research/AGENT-LIFECYCLE-COMPARISON.md +0 -111
  223. package/docs/research/AUDIT_OH_MY_PI.md +0 -261
  224. package/docs/research/AUDIT_PI_CREW.md +0 -457
  225. package/docs/research/CAVEMAN-DEEP-RESEARCH.md +0 -281
  226. package/docs/research/COMPARISON_OH_MY_PI_VS_PI_CREW.md +0 -264
  227. package/docs/research/DEEP-RESEARCH-PI-POWERBAR.md +0 -343
  228. package/docs/research/DEEP_RESEARCH_SUBAGENT_ARCHITECTURE.md +0 -480
  229. package/docs/research/GAP_CLOSURE_IMPLEMENTATION_PLAN.md +0 -354
  230. package/docs/research/IMPLEMENTATION_PLAN.md +0 -385
  231. package/docs/research/LIVE-SESSION-PRODUCTION-READY-PLAN.md +0 -502
  232. package/docs/research/OH-MY-PI-DEEP-RESEARCH-v14.7.6.md +0 -266
  233. package/docs/research/REMAINING-GAPS-PLAN.md +0 -363
  234. package/docs/research/SESSION-SUMMARY-2026-05-08.md +0 -146
  235. package/docs/research/UI-RESPONSIVENESS-AUDIT.md +0 -173
  236. package/docs/research-awesome-agent-skills-distillation.md +0 -100
  237. package/docs/research-extension-examples.md +0 -297
  238. package/docs/research-extension-system.md +0 -324
  239. package/docs/research-oh-my-pi-distillation.md +0 -369
  240. package/docs/research-optimization-plan.md +0 -548
  241. package/docs/research-phase10-distillation.md +0 -199
  242. package/docs/research-phase11-distillation.md +0 -201
  243. package/docs/research-phase8-operator-experience-plan.md +0 -819
  244. package/docs/research-phase9-observability-reliability-plan.md +0 -1190
  245. package/docs/research-pi-coding-agent.md +0 -357
  246. package/docs/research-source-pi-crew-reference.md +0 -174
  247. package/docs/research-ui-optimization-plan.md +0 -480
  248. package/docs/source-runtime-refactor-map.md +0 -107
  249. package/src/utils/atomic-write.ts +0 -33
@@ -1,92 +1,92 @@
1
- /**
2
- * Phase 7: Inter-agent communication for live-session workers.
3
- *
4
- * Provides IRC-like messaging between live-session workers, adapted from
5
- * oh-my-pi's IrcTool pattern. Uses the existing LiveAgentHandle manager
6
- * for message routing.
7
- *
8
- * Features:
9
- * - DM: Send a message to a specific agent
10
- * - Broadcast: Send a message to all live agents
11
- * - Side-channel: Non-blocking message injection (via pendingFollowUps)
12
- *
13
- * For child-process workers, messages fall back to file-based mailbox.
14
- */
15
-
16
- export type IrcOperation = "send" | "list";
17
-
18
- export interface IrcMessage {
19
- from: string;
20
- to: string;
21
- content: string;
22
- timestamp: string;
23
- /** Whether the sender expects a reply. */
24
- awaitReply?: boolean;
25
- }
26
-
27
- export interface IrcSendMessage {
28
- op: IrcOperation;
29
- /** Target agent ID or "all" for broadcast. */
30
- to: string;
31
- /** Message content. */
32
- message: string;
33
- /** Whether to wait for a reply (default: true for DM, false for broadcast). */
34
- awaitReply?: boolean;
35
- }
36
-
37
- export interface IrcListResult {
38
- peers: Array<{ id: string; name: string; status: string }>;
39
- }
40
-
41
- /**
42
- * Build IRC peer roster for injection into system prompt.
43
- * Lists all currently live agents except the caller.
44
- */
45
- export function renderIrcPeerRoster(selfId: string, peers: Array<{ agentId: string; status: string }>): string {
46
- const visible = peers.filter((p) => p.agentId !== selfId && (p.status === "running" || p.status === "idle"));
47
- if (visible.length === 0) return "- (no other live agents)";
48
- return visible.map((peer) => `- \`${peer.agentId}\` (${peer.status})`).join("\n");
49
- }
50
-
51
- /**
52
- * Build the IRC system prompt section for a live-session worker.
53
- */
54
- export function buildIrcSystemSection(selfId: string, peers: Array<{ agentId: string; status: string }>): string {
55
- const roster = renderIrcPeerRoster(selfId, peers);
56
- return [
57
- "## Inter-Agent Communication",
58
- `Your agent ID: \`${selfId}\``,
59
- "You can send messages to other live agents via the `irc` tool.",
60
- "Available peers:",
61
- roster,
62
- ].join("\n");
63
- }
64
-
65
- /**
66
- * Route an IRC message to the appropriate agent(s).
67
- * Returns the list of agent IDs that received the message.
68
- */
69
- export function routeIrcMessage(
70
- message: IrcSendMessage,
71
- selfId: string,
72
- routing: {
73
- sendDm: (agentId: string, content: string) => void;
74
- broadcast: (content: string, excludeId: string) => string[];
75
- },
76
- ): { deliveredTo: string[]; error?: string } {
77
- if (!message.to || !message.message?.trim()) {
78
- return { deliveredTo: [], error: "Missing 'to' (agent ID or 'all') and 'message' fields." };
79
- }
80
- if (message.to === selfId) {
81
- return { deliveredTo: [], error: "Cannot send a message to yourself." };
82
- }
83
-
84
- if (message.to === "all") {
85
- const recipients = routing.broadcast(message.message, selfId);
86
- return { deliveredTo: recipients };
87
- }
88
-
89
- // DM to specific agent
90
- routing.sendDm(message.to, message.message);
91
- return { deliveredTo: [message.to] };
92
- }
1
+ /**
2
+ * Phase 7: Inter-agent communication for live-session workers.
3
+ *
4
+ * Provides IRC-like messaging between live-session workers, adapted from
5
+ * oh-my-pi's IrcTool pattern. Uses the existing LiveAgentHandle manager
6
+ * for message routing.
7
+ *
8
+ * Features:
9
+ * - DM: Send a message to a specific agent
10
+ * - Broadcast: Send a message to all live agents
11
+ * - Side-channel: Non-blocking message injection (via pendingFollowUps)
12
+ *
13
+ * For child-process workers, messages fall back to file-based mailbox.
14
+ */
15
+
16
+ export type IrcOperation = "send" | "list";
17
+
18
+ export interface IrcMessage {
19
+ from: string;
20
+ to: string;
21
+ content: string;
22
+ timestamp: string;
23
+ /** Whether the sender expects a reply. */
24
+ awaitReply?: boolean;
25
+ }
26
+
27
+ export interface IrcSendMessage {
28
+ op: IrcOperation;
29
+ /** Target agent ID or "all" for broadcast. */
30
+ to: string;
31
+ /** Message content. */
32
+ message: string;
33
+ /** Whether to wait for a reply (default: true for DM, false for broadcast). */
34
+ awaitReply?: boolean;
35
+ }
36
+
37
+ export interface IrcListResult {
38
+ peers: Array<{ id: string; name: string; status: string }>;
39
+ }
40
+
/**
 * Render the roster of peers a live agent can message, as markdown bullets
 * suitable for embedding in a system prompt.
 *
 * A peer is listed only when it is not the caller itself and its status is
 * exactly "running" or "idle". When nothing qualifies a single placeholder
 * bullet is returned instead of an empty string.
 *
 * @param selfId - Agent ID of the caller; always excluded from the roster
 * @param peers - Candidate agents with their current status
 * @returns Newline-separated bullet list, one line per visible peer
 */
export function renderIrcPeerRoster(selfId: string, peers: Array<{ agentId: string; status: string }>): string {
	const bullets: string[] = [];
	for (const { agentId, status } of peers) {
		if (agentId === selfId) continue;
		if (status !== "running" && status !== "idle") continue;
		bullets.push(`- \`${agentId}\` (${status})`);
	}
	return bullets.length > 0 ? bullets.join("\n") : "- (no other live agents)";
}
50
+
/**
 * Assemble the "Inter-Agent Communication" section of a live-session
 * worker's system prompt.
 *
 * The section is five newline-separated parts: a markdown heading, the
 * caller's own agent ID, a pointer to the `irc` tool, an "Available peers:"
 * label, and the roster produced by renderIrcPeerRoster.
 *
 * @param selfId - Agent ID of the worker the prompt is built for
 * @param peers - Candidate agents with their current status
 * @returns The complete prompt section as a single string
 */
export function buildIrcSystemSection(selfId: string, peers: Array<{ agentId: string; status: string }>): string {
	const heading = "## Inter-Agent Communication";
	const identity = `Your agent ID: \`${selfId}\``;
	const usage = "You can send messages to other live agents via the `irc` tool.";
	const peerList = renderIrcPeerRoster(selfId, peers);
	return `${heading}\n${identity}\n${usage}\nAvailable peers:\n${peerList}`;
}
64
+
/**
 * Validate an outgoing IRC message and hand it to the matching routing
 * callback.
 *
 * - A missing target or a blank/whitespace-only body is rejected.
 * - A message addressed to the sender itself is rejected.
 * - The target "all" goes through `routing.broadcast`, whose return value is
 *   reported as the recipient list.
 * - Any other target goes through `routing.sendDm` and is reported as the
 *   sole recipient; `sendDm` returns nothing, so delivery is not confirmed.
 *
 * @param message - The send request (target and body)
 * @param selfId - Agent ID of the sender
 * @param routing - Callbacks that perform the actual delivery
 * @returns Recipient IDs, plus `error` when the request was rejected
 */
export function routeIrcMessage(
	message: IrcSendMessage,
	selfId: string,
	routing: {
		sendDm: (agentId: string, content: string) => void;
		broadcast: (content: string, excludeId: string) => string[];
	},
): { deliveredTo: string[]; error?: string } {
	const { to: target, message: content } = message;

	// The target is tested first so the body is only inspected when a target exists.
	if (!target || !content?.trim()) {
		return { deliveredTo: [], error: "Missing 'to' (agent ID or 'all') and 'message' fields." };
	}
	if (target === selfId) {
		return { deliveredTo: [], error: "Cannot send a message to yourself." };
	}

	if (target !== "all") {
		// Direct message to one specific agent.
		routing.sendDm(target, content);
		return { deliveredTo: [target] };
	}

	return { deliveredTo: routing.broadcast(content, selfId) };
}
@@ -1,100 +1,100 @@
1
- /**
2
- * Phase 8: Monitoring and observability for live-session workers.
3
- *
4
- * Provides health checks, metrics collection, and diagnostics
5
- * for live-session workers running in-process.
6
- */
7
-
8
- export interface LiveSessionHealth {
9
- /** Total number of registered live agents. */
10
- totalAgents: number;
11
- /** Number of agents currently running. */
12
- runningAgents: number;
13
- /** Number of agents in idle state. */
14
- idleAgents: number;
15
- /** Number of agents that have completed. */
16
- completedAgents: number;
17
- /** Number of agents that have failed. */
18
- failedAgents: number;
19
- /** Total tokens consumed across all live sessions. */
20
- totalTokens: number;
21
- /** Timestamp of this health snapshot. */
22
- timestamp: string;
23
- }
24
-
25
- export interface LiveSessionMetrics {
26
- agentId: string;
27
- taskId: string;
28
- status: string;
29
- /** Accumulated usage from session stats. */
30
- usage?: {
31
- input?: number;
32
- output?: number;
33
- cacheRead?: number;
34
- cacheWrite?: number;
35
- cost?: number;
36
- turns?: number;
37
- };
38
- /** Session duration in milliseconds. */
39
- durationMs?: number;
40
- /** Number of IRC messages received. */
41
- ircMessagesReceived?: number;
42
- /** Number of yield reminders sent. */
43
- yieldReminders?: number;
44
- /** Whether yield was called. */
45
- yieldCalled: boolean;
46
- }
47
-
48
- /**
49
- * Collect health snapshot from live agent handles.
50
- */
51
- export function collectLiveSessionHealth(
52
- agents: Array<{ status: string }>,
53
- getUsage: (agentId: string) => { input?: number; output?: number; turns?: number } | undefined,
54
- ): LiveSessionHealth {
55
- let running = 0;
56
- let idle = 0;
57
- let completed = 0;
58
- let failed = 0;
59
- let totalTokens = 0;
60
-
61
- for (const agent of agents) {
62
- switch (agent.status) {
63
- case "running": running++; break;
64
- case "idle": idle++; break;
65
- case "completed": completed++; break;
66
- case "failed": failed++; break;
67
- }
68
- }
69
-
70
- // Sum tokens from usage data
71
- for (const agent of agents) {
72
- const agentAny = agent as Record<string, unknown>;
73
- const agentId = agentAny.agentId as string | undefined;
74
- if (agentId) {
75
- const usage = getUsage(agentId);
76
- if (usage) {
77
- totalTokens += (usage.input ?? 0) + (usage.output ?? 0);
78
- }
79
- }
80
- }
81
-
82
- return {
83
- totalAgents: agents.length,
84
- runningAgents: running,
85
- idleAgents: idle,
86
- completedAgents: completed,
87
- failedAgents: failed,
88
- totalTokens,
89
- timestamp: new Date().toISOString(),
90
- };
91
- }
92
-
93
- /**
94
- * Build a diagnostic summary string for logging.
95
- */
96
- export function formatLiveSessionDiagnostics(health: LiveSessionHealth): string {
97
- return [
98
- `[Live-Session Health] agents=${health.totalAgents} running=${health.runningAgents} idle=${health.idleAgents} completed=${health.completedAgents} failed=${health.failedAgents} tokens=${health.totalTokens}`,
99
- ].join("\n");
100
- }
1
+ /**
2
+ * Phase 8: Monitoring and observability for live-session workers.
3
+ *
4
+ * Provides health checks, metrics collection, and diagnostics
5
+ * for live-session workers running in-process.
6
+ */
7
+
8
+ export interface LiveSessionHealth {
9
+ /** Total number of registered live agents. */
10
+ totalAgents: number;
11
+ /** Number of agents currently running. */
12
+ runningAgents: number;
13
+ /** Number of agents in idle state. */
14
+ idleAgents: number;
15
+ /** Number of agents that have completed. */
16
+ completedAgents: number;
17
+ /** Number of agents that have failed. */
18
+ failedAgents: number;
19
+ /** Total tokens consumed across all live sessions. */
20
+ totalTokens: number;
21
+ /** Timestamp of this health snapshot. */
22
+ timestamp: string;
23
+ }
24
+
25
+ export interface LiveSessionMetrics {
26
+ agentId: string;
27
+ taskId: string;
28
+ status: string;
29
+ /** Accumulated usage from session stats. */
30
+ usage?: {
31
+ input?: number;
32
+ output?: number;
33
+ cacheRead?: number;
34
+ cacheWrite?: number;
35
+ cost?: number;
36
+ turns?: number;
37
+ };
38
+ /** Session duration in milliseconds. */
39
+ durationMs?: number;
40
+ /** Number of IRC messages received. */
41
+ ircMessagesReceived?: number;
42
+ /** Number of yield reminders sent. */
43
+ yieldReminders?: number;
44
+ /** Whether yield was called. */
45
+ yieldCalled: boolean;
46
+ }
47
+
/**
 * Collect a health snapshot from live agent handles.
 *
 * Each agent is counted under its status ("running", "idle", "completed" or
 * "failed"); any other status only contributes to `totalAgents`. Token usage
 * is looked up through `getUsage` for every agent that carries a non-empty
 * string `agentId`, and input + output tokens are summed.
 *
 * @param agents - Live agent handles; an `agentId` property is read when present
 * @param getUsage - Returns accumulated usage for an agent, or undefined if unknown
 * @returns Aggregated counters stamped with the current time (ISO 8601)
 */
export function collectLiveSessionHealth(
	agents: Array<{ status: string }>,
	getUsage: (agentId: string) => { input?: number; output?: number; turns?: number } | undefined,
): LiveSessionHealth {
	let running = 0;
	let idle = 0;
	let completed = 0;
	let failed = 0;
	let totalTokens = 0;

	// A missing or non-finite counter contributes nothing, so one bad usage
	// record cannot turn the whole total into NaN.
	const tokens = (value: number | undefined): number =>
		typeof value === "number" && Number.isFinite(value) ? value : 0;

	for (const agent of agents) {
		switch (agent.status) {
			case "running": running++; break;
			case "idle": idle++; break;
			case "completed": completed++; break;
			case "failed": failed++; break;
		}

		// The declared element type does not include agentId, so it is read as
		// unknown and checked at runtime instead of being asserted to be a string.
		const agentId: unknown = (agent as { status: string; agentId?: unknown }).agentId;
		if (typeof agentId !== "string" || agentId.length === 0) continue;

		const usage = getUsage(agentId);
		if (usage) {
			totalTokens += tokens(usage.input) + tokens(usage.output);
		}
	}

	return {
		totalAgents: agents.length,
		runningAgents: running,
		idleAgents: idle,
		completedAgents: completed,
		failedAgents: failed,
		totalTokens,
		timestamp: new Date().toISOString(),
	};
}
92
+
/**
 * Format a health snapshot as a single log line.
 *
 * The line starts with the "[Live-Session Health]" tag followed by
 * space-separated `key=value` pairs for the agent counters and the token
 * total. The snapshot timestamp is not included.
 *
 * @param health - Snapshot to describe
 * @returns One-line diagnostic summary
 */
export function formatLiveSessionDiagnostics(health: LiveSessionHealth): string {
	const fields = [
		`agents=${health.totalAgents}`,
		`running=${health.runningAgents}`,
		`idle=${health.idleAgents}`,
		`completed=${health.completedAgents}`,
		`failed=${health.failedAgents}`,
		`tokens=${health.totalTokens}`,
	];
	return `[Live-Session Health] ${fields.join(" ")}`;
}
@@ -0,0 +1,129 @@
1
+ /**
2
+ * Dual-gate loop control — determines whether a task should auto-resume
3
+ * based on meaningful progress and turn limits.
4
+ *
5
+ * Gate 1: At least one signal of meaningful progress must be true.
6
+ * Gate 2: The auto-resume turn count must be below the maximum.
7
+ *
8
+ * Distilled from pi-autoresearch's dual-gate loop pattern.
9
+ */
10
+ import * as fs from "node:fs";
11
+ import * as path from "node:path";
12
+ import type { TeamTaskState } from "../state/types.ts";
13
+
14
+ /**
15
+ * Signal indicating what kind of progress a task has made.
16
+ */
17
+ export interface TaskProgressSignal {
18
+ /** Whether the task has edited files or produced non-empty results. */
19
+ editedFiles: boolean;
20
+ /** Whether the task has produced artifacts in the artifacts directory. */
21
+ producedArtifacts: boolean;
22
+ /** Whether the task has run tests (detected via result text). */
23
+ ranTests: boolean;
24
+ }
25
+
26
+ /**
27
+ * Runtime state for auto-resume turn tracking.
28
+ */
29
+ export interface AutoResumeRuntime {
30
+ /** Current number of auto-resume turns taken. */
31
+ autoResumeTurns: number;
32
+ /** Maximum allowed auto-resume turns. */
33
+ maxTurns: number;
34
+ }
35
+
36
+ /** Keywords in result text that indicate tests were run. */
37
+ const TEST_KEYWORDS = [
38
+ "test passed",
39
+ "test failed",
40
+ "tests passed",
41
+ "tests failed",
42
+ "test results",
43
+ "jest",
44
+ "vitest",
45
+ "mocha",
46
+ "pytest",
47
+ "npx test",
48
+ "npm test",
49
+ "cargo test",
50
+ "all tests",
51
+ "test suite",
52
+ "✓",
53
+ "✗",
54
+ "PASS ",
55
+ " FAIL ",
56
+ ] as const;
57
+
/**
 * Determine whether a task should auto-resume based on dual-gate logic.
 *
 * Gate 1 (meaningful progress): at least one of editedFiles, producedArtifacts,
 * or ranTests must be true.
 * Gate 2 (turn limit): autoResumeTurns must be strictly less than maxTurns.
 *
 * Both gates must pass for auto-resume to be allowed. The turn gate fails
 * closed: if either counter is NaN or missing, auto-resume is denied rather
 * than left unbounded.
 *
 * @param runtime - Current auto-resume turn count and its maximum
 * @param taskProgress - Progress signals observed for the task
 * @returns true only when both gates pass
 */
export function shouldAutoResume(runtime: AutoResumeRuntime, taskProgress: TaskProgressSignal): boolean {
	// Gate 2: Turn limit check (check first — cheaper).
	// Written as !(a < b) instead of (a >= b): every comparison against NaN or
	// undefined is false, so the >= form would let a corrupt counter through.
	if (!(runtime.autoResumeTurns < runtime.maxTurns)) {
		return false;
	}

	// Gate 1: Meaningful progress check
	const hasProgress = taskProgress.editedFiles || taskProgress.producedArtifacts || taskProgress.ranTests;
	if (!hasProgress) {
		return false;
	}

	return true;
}
81
+
/**
 * Compute the task progress signal from a task's state and artifacts directory.
 *
 * - editedFiles: true when the task carries a `resultArtifact` descriptor.
 *   The artifact's contents are not inspected.
 * - producedArtifacts: true when the artifacts directory has an entry whose
 *   name (up to its first ".") starts with the sanitised task ID.
 * - ranTests: true when the task's error, terminal evidence or diagnostics
 *   contain one of the TEST_KEYWORDS (case-insensitive substring match).
 *
 * Reading the directory is best-effort: if it is missing or unreadable,
 * producedArtifacts is simply false.
 *
 * @param task - The task state to analyze
 * @param artifactsDir - Path to the artifacts directory; an empty string skips the scan
 * @returns TaskProgressSignal indicating what progress was made
 */
export function computeTaskProgressSignal(task: TeamTaskState, artifactsDir: string): TaskProgressSignal {
	// editedFiles: presence of a result artifact descriptor is the only signal
	// available here.
	const editedFiles = task.resultArtifact !== undefined;

	// producedArtifacts: look for entries that START with the task ID.
	// startsWith (not includes) avoids false positives from short task IDs
	// like "01" matching unrelated entries.
	let producedArtifacts = false;
	const taskPrefix = task.id.replace(/[^a-zA-Z0-9_-]/g, "");
	// An ID with no usable characters sanitises to "", and startsWith("")
	// is true for every entry — so the scan is skipped in that case.
	if (artifactsDir && taskPrefix.length > 0) {
		try {
			// Read directly instead of existsSync + readdirSync: a missing
			// directory lands in the catch below with the same result.
			producedArtifacts = fs.readdirSync(artifactsDir).some((entry) => {
				const baseName = entry.split(".")[0] ?? entry;
				return baseName.startsWith(taskPrefix);
			});
		} catch {
			// Best-effort: a missing or unreadable directory means no evidence.
			producedArtifacts = false;
		}
	}

	// ranTests: search the result-related fields for test keywords.
	// NOTE(review): both sides are lower-cased, so "PASS " is matched as
	// "pass " and also hits text such as "bypass the" — confirm this is intended.
	const lowerText = [
		task.error ?? "",
		task.terminalEvidence ? JSON.stringify(task.terminalEvidence) : "",
		task.diagnostics ? JSON.stringify(task.diagnostics) : "",
	]
		.join(" ")
		.toLowerCase();
	const ranTests = TEST_KEYWORDS.some((keyword) => lowerText.includes(keyword.toLowerCase()));

	return { editedFiles, producedArtifacts, ranTests };
}
@@ -0,0 +1,40 @@
/**
 * Metric names that are denied to prevent prototype pollution.
 */
export const DENIED_METRIC_NAMES: ReadonlySet<string> = new Set([
	"__proto__",
	"constructor",
	"prototype",
]);

/**
 * Matches one complete metric line: the literal `CREW_METRIC`, whitespace,
 * a `\w+` name, `=`, and a value with no whitespace. Anchored at both ends,
 * so leading or trailing whitespace makes the line a non-match.
 */
const METRIC_LINE_RE = /^CREW_METRIC\s+(\w+)=(\S+)$/;

/**
 * Parse CREW_METRIC lines from worker stdout.
 *
 * Lines must match the pattern: `CREW_METRIC name=value`
 * - `name` must be a word character sequence (alphanumeric + underscore)
 * - `value` must parse as a valid finite number
 * - Denied names (__proto__, constructor, prototype) are silently skipped
 * - Both LF and CRLF line endings are accepted
 * - When a name appears more than once, the last value wins
 *
 * @param output - Raw worker stdout text
 * @returns Map of metric name → numeric value
 */
export function parseMetricLines(output: string): Record<string, number> {
	const metrics: Record<string, number> = {};

	// Split on \r?\n: with a plain "\n" split, CRLF output keeps a trailing
	// "\r" on each line and the anchored regex rejects every metric.
	for (const line of output.split(/\r?\n/)) {
		const match = METRIC_LINE_RE.exec(line);
		if (!match) continue;

		const name = match[1];
		const rawValue = match[2];
		if (name === undefined || rawValue === undefined) continue;
		if (DENIED_METRIC_NAMES.has(name)) continue;

		const value = Number(rawValue);
		if (!Number.isFinite(value)) continue;

		metrics[name] = value;
	}

	return metrics;
}