pi-crew 0.1.51 → 0.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (239) hide show
  1. package/CHANGELOG.md +56 -1
  2. package/README.md +176 -781
  3. package/agents/analyst.md +11 -11
  4. package/agents/critic.md +11 -11
  5. package/agents/executor.md +11 -11
  6. package/agents/explorer.md +11 -11
  7. package/agents/planner.md +11 -11
  8. package/agents/reviewer.md +11 -11
  9. package/agents/security-reviewer.md +11 -11
  10. package/agents/test-engineer.md +11 -11
  11. package/agents/verifier.md +70 -11
  12. package/agents/writer.md +11 -11
  13. package/docs/actions-reference.md +595 -0
  14. package/docs/commands-reference.md +347 -0
  15. package/docs/runtime-flow.md +148 -148
  16. package/index.ts +6 -6
  17. package/package.json +99 -99
  18. package/skills/async-worker-recovery/SKILL.md +42 -42
  19. package/skills/context-artifact-hygiene/SKILL.md +52 -52
  20. package/skills/delegation-patterns/SKILL.md +54 -54
  21. package/skills/mailbox-interactive/SKILL.md +40 -40
  22. package/skills/model-routing-context/SKILL.md +39 -39
  23. package/skills/multi-perspective-review/SKILL.md +58 -58
  24. package/skills/observability-reliability/SKILL.md +41 -41
  25. package/skills/orchestration/SKILL.md +157 -157
  26. package/skills/ownership-session-security/SKILL.md +41 -41
  27. package/skills/pi-extension-lifecycle/SKILL.md +39 -39
  28. package/skills/requirements-to-task-packet/SKILL.md +63 -63
  29. package/skills/resource-discovery-config/SKILL.md +41 -41
  30. package/skills/runtime-state-reader/SKILL.md +44 -44
  31. package/skills/secure-agent-orchestration-review/SKILL.md +45 -45
  32. package/skills/state-mutation-locking/SKILL.md +42 -42
  33. package/skills/systematic-debugging/SKILL.md +67 -67
  34. package/skills/ui-render-performance/SKILL.md +39 -39
  35. package/skills/verification-before-done/SKILL.md +57 -57
  36. package/skills/worktree-isolation/SKILL.md +39 -39
  37. package/src/adapters/claude-adapter.ts +25 -0
  38. package/src/adapters/codex-adapter.ts +21 -0
  39. package/src/adapters/cursor-adapter.ts +17 -0
  40. package/src/adapters/export-util.ts +137 -0
  41. package/src/adapters/index.ts +15 -0
  42. package/src/adapters/registry.ts +18 -0
  43. package/src/adapters/types.ts +23 -0
  44. package/src/agents/agent-config.ts +2 -0
  45. package/src/agents/agent-search.ts +98 -98
  46. package/src/agents/discover-agents.ts +2 -1
  47. package/src/config/config.ts +13 -1
  48. package/src/config/drift-detector.ts +211 -0
  49. package/src/config/markers.ts +327 -0
  50. package/src/config/resilient-parser.ts +108 -0
  51. package/src/config/suggestions.ts +74 -0
  52. package/src/extension/cross-extension-rpc.ts +103 -94
  53. package/src/extension/project-init.ts +21 -1
  54. package/src/extension/register.ts +45 -14
  55. package/src/extension/registration/commands.ts +77 -8
  56. package/src/extension/registration/subagent-tools.ts +10 -1
  57. package/src/extension/registration/team-tool.ts +10 -1
  58. package/src/extension/registration/viewers.ts +48 -34
  59. package/src/extension/run-bundle-schema.ts +89 -89
  60. package/src/extension/run-import.ts +25 -1
  61. package/src/extension/run-index.ts +5 -1
  62. package/src/extension/run-maintenance.ts +142 -68
  63. package/src/extension/team-manager-command.ts +10 -1
  64. package/src/extension/team-tool/doctor.ts +28 -3
  65. package/src/extension/team-tool/handle-settings.ts +195 -188
  66. package/src/extension/team-tool/inspect.ts +41 -41
  67. package/src/extension/team-tool/intent-policy.ts +42 -42
  68. package/src/extension/team-tool/lifecycle-actions.ts +27 -8
  69. package/src/extension/team-tool/plan.ts +19 -19
  70. package/src/extension/team-tool/run.ts +12 -1
  71. package/src/extension/team-tool.ts +11 -1
  72. package/src/i18n.ts +184 -184
  73. package/src/observability/exporters/otlp-exporter.ts +92 -77
  74. package/src/prompt/prompt-runtime.ts +72 -72
  75. package/src/runtime/agent-memory.ts +72 -72
  76. package/src/runtime/agent-observability.ts +114 -114
  77. package/src/runtime/async-marker.ts +26 -26
  78. package/src/runtime/attention-events.ts +28 -28
  79. package/src/runtime/auto-resume.ts +100 -0
  80. package/src/runtime/background-runner.ts +11 -1
  81. package/src/runtime/cancellation-token.ts +89 -89
  82. package/src/runtime/cancellation.ts +61 -61
  83. package/src/runtime/capability-inventory.ts +116 -116
  84. package/src/runtime/child-pi.ts +7 -2
  85. package/src/runtime/compaction-summary.ts +271 -0
  86. package/src/runtime/completion-guard.ts +190 -190
  87. package/src/runtime/crash-recovery.ts +33 -0
  88. package/src/runtime/delta-conflict.ts +360 -0
  89. package/src/runtime/direct-run.ts +35 -35
  90. package/src/runtime/foreground-control.ts +82 -82
  91. package/src/runtime/green-contract.ts +46 -46
  92. package/src/runtime/group-join.ts +106 -106
  93. package/src/runtime/heartbeat-gradient.ts +28 -28
  94. package/src/runtime/heartbeat-watcher.ts +124 -124
  95. package/src/runtime/iteration-hooks.ts +262 -0
  96. package/src/runtime/live-agent-control.ts +88 -88
  97. package/src/runtime/live-control-realtime.ts +36 -36
  98. package/src/runtime/live-extension-bridge.ts +150 -150
  99. package/src/runtime/live-irc.ts +92 -92
  100. package/src/runtime/live-session-health.ts +100 -100
  101. package/src/runtime/loop-gates.ts +129 -0
  102. package/src/runtime/metric-parser.ts +40 -0
  103. package/src/runtime/notebook-helpers.ts +90 -90
  104. package/src/runtime/orphan-sentinel.ts +7 -7
  105. package/src/runtime/parallel-research.ts +44 -44
  106. package/src/runtime/phase-progress.ts +217 -0
  107. package/src/runtime/pi-args.ts +38 -11
  108. package/src/runtime/pi-json-output.ts +111 -111
  109. package/src/runtime/pi-spawn.ts +57 -7
  110. package/src/runtime/policy-engine.ts +79 -79
  111. package/src/runtime/post-checks.ts +122 -0
  112. package/src/runtime/progress-event-coalescer.ts +43 -43
  113. package/src/runtime/prose-compressor.ts +164 -164
  114. package/src/runtime/recovery-recipes.ts +74 -74
  115. package/src/runtime/result-extractor.ts +121 -121
  116. package/src/runtime/role-permission.ts +39 -39
  117. package/src/runtime/sensitive-paths.ts +2 -2
  118. package/src/runtime/session-resources.ts +25 -25
  119. package/src/runtime/session-snapshot.ts +59 -59
  120. package/src/runtime/session-usage.ts +79 -79
  121. package/src/runtime/sidechain-output.ts +29 -29
  122. package/src/runtime/stream-preview.ts +177 -177
  123. package/src/runtime/supervisor-contact.ts +59 -59
  124. package/src/runtime/task-display.ts +38 -38
  125. package/src/runtime/task-graph.ts +207 -0
  126. package/src/runtime/task-quality.ts +207 -0
  127. package/src/runtime/task-runner/capabilities.ts +78 -78
  128. package/src/runtime/task-runner/live-executor.ts +7 -1
  129. package/src/runtime/task-runner/progress.ts +119 -119
  130. package/src/runtime/task-runner/prompt-pipeline.ts +64 -64
  131. package/src/runtime/task-runner/result-utils.ts +14 -14
  132. package/src/runtime/task-runner/run-projection.ts +103 -103
  133. package/src/runtime/task-runner/state-helpers.ts +22 -22
  134. package/src/runtime/team-runner.ts +117 -7
  135. package/src/runtime/worker-heartbeat.ts +21 -21
  136. package/src/runtime/worker-startup.ts +57 -57
  137. package/src/runtime/workflow-state.ts +187 -0
  138. package/src/runtime/workspace-tree.ts +298 -298
  139. package/src/schema/config-schema.ts +11 -0
  140. package/src/schema/validation-types.ts +148 -0
  141. package/src/skills/skill-templates.ts +374 -0
  142. package/src/state/active-run-registry.ts +35 -11
  143. package/src/state/atomic-write.ts +33 -26
  144. package/src/state/contracts.ts +1 -0
  145. package/src/state/event-reconstructor.ts +217 -0
  146. package/src/state/locks.ts +2 -13
  147. package/src/state/mailbox.ts +4 -3
  148. package/src/state/state-store.ts +32 -14
  149. package/src/state/task-claims.ts +44 -44
  150. package/src/state/types.ts +9 -0
  151. package/src/state/usage.ts +29 -29
  152. package/src/subagents/async-entry.ts +1 -1
  153. package/src/subagents/index.ts +3 -3
  154. package/src/subagents/live/control.ts +1 -1
  155. package/src/subagents/live/manager.ts +1 -1
  156. package/src/subagents/live/realtime.ts +1 -1
  157. package/src/subagents/live/session-runtime.ts +1 -1
  158. package/src/subagents/manager.ts +1 -1
  159. package/src/subagents/spawn.ts +1 -1
  160. package/src/teams/team-serializer.ts +38 -38
  161. package/src/types/diff.d.ts +18 -18
  162. package/src/ui/crew-footer.ts +101 -101
  163. package/src/ui/crew-select-list.ts +111 -111
  164. package/src/ui/crew-widget.ts +5 -2
  165. package/src/ui/dashboard-panes/cancellation-pane.ts +42 -42
  166. package/src/ui/dashboard-panes/capability-pane.ts +59 -59
  167. package/src/ui/dashboard-panes/mailbox-pane.ts +35 -35
  168. package/src/ui/dashboard-panes/metrics-pane.ts +34 -34
  169. package/src/ui/dashboard-panes/progress-pane.ts +11 -0
  170. package/src/ui/dynamic-border.ts +25 -25
  171. package/src/ui/layout-primitives.ts +106 -106
  172. package/src/ui/loaders.ts +158 -158
  173. package/src/ui/render-coalescer.ts +51 -51
  174. package/src/ui/render-diff.ts +119 -119
  175. package/src/ui/render-scheduler.ts +143 -143
  176. package/src/ui/run-action-dispatcher.ts +10 -1
  177. package/src/ui/spinner.ts +17 -17
  178. package/src/ui/status-colors.ts +58 -58
  179. package/src/ui/syntax-highlight.ts +116 -116
  180. package/src/ui/transcript-entries.ts +258 -258
  181. package/src/utils/completion-dedupe.ts +63 -63
  182. package/src/utils/frontmatter.ts +68 -68
  183. package/src/utils/git.ts +262 -262
  184. package/src/utils/ids.ts +17 -17
  185. package/src/utils/incremental-reader.ts +104 -104
  186. package/src/utils/names.ts +27 -27
  187. package/src/utils/redaction.ts +44 -44
  188. package/src/utils/safe-paths.ts +47 -47
  189. package/src/utils/scan-cache.ts +136 -136
  190. package/src/utils/sleep.ts +40 -26
  191. package/src/utils/task-name-generator.ts +337 -337
  192. package/src/workflows/validate-workflow.ts +40 -40
  193. package/src/worktree/branch-freshness.ts +45 -45
  194. package/teams/default.team.md +12 -12
  195. package/teams/fast-fix.team.md +11 -11
  196. package/teams/implementation.team.md +18 -18
  197. package/teams/parallel-research.team.md +14 -14
  198. package/teams/research.team.md +11 -11
  199. package/teams/review.team.md +12 -12
  200. package/workflows/default.workflow.md +30 -29
  201. package/workflows/fast-fix.workflow.md +23 -22
  202. package/workflows/implementation.workflow.md +43 -43
  203. package/workflows/parallel-research.workflow.md +46 -46
  204. package/workflows/research.workflow.md +22 -22
  205. package/workflows/review.workflow.md +30 -30
  206. package/docs/refactor-tasks-phase3.md +0 -394
  207. package/docs/refactor-tasks-phase4.md +0 -564
  208. package/docs/refactor-tasks-phase5.md +0 -402
  209. package/docs/refactor-tasks-phase6.md +0 -662
  210. package/docs/refactor-tasks.md +0 -1484
  211. package/docs/research/AGENT-EXECUTION-ARCHITECTURE.md +0 -261
  212. package/docs/research/AGENT-LIFECYCLE-COMPARISON.md +0 -111
  213. package/docs/research/AUDIT_OH_MY_PI.md +0 -261
  214. package/docs/research/AUDIT_PI_CREW.md +0 -457
  215. package/docs/research/CAVEMAN-DEEP-RESEARCH.md +0 -281
  216. package/docs/research/COMPARISON_OH_MY_PI_VS_PI_CREW.md +0 -264
  217. package/docs/research/DEEP-RESEARCH-PI-POWERBAR.md +0 -343
  218. package/docs/research/DEEP_RESEARCH_SUBAGENT_ARCHITECTURE.md +0 -480
  219. package/docs/research/GAP_CLOSURE_IMPLEMENTATION_PLAN.md +0 -354
  220. package/docs/research/IMPLEMENTATION_PLAN.md +0 -385
  221. package/docs/research/LIVE-SESSION-PRODUCTION-READY-PLAN.md +0 -502
  222. package/docs/research/OH-MY-PI-DEEP-RESEARCH-v14.7.6.md +0 -266
  223. package/docs/research/REMAINING-GAPS-PLAN.md +0 -363
  224. package/docs/research/SESSION-SUMMARY-2026-05-08.md +0 -146
  225. package/docs/research/UI-RESPONSIVENESS-AUDIT.md +0 -173
  226. package/docs/research-awesome-agent-skills-distillation.md +0 -100
  227. package/docs/research-extension-examples.md +0 -297
  228. package/docs/research-extension-system.md +0 -324
  229. package/docs/research-oh-my-pi-distillation.md +0 -369
  230. package/docs/research-optimization-plan.md +0 -548
  231. package/docs/research-phase10-distillation.md +0 -199
  232. package/docs/research-phase11-distillation.md +0 -201
  233. package/docs/research-phase8-operator-experience-plan.md +0 -819
  234. package/docs/research-phase9-observability-reliability-plan.md +0 -1190
  235. package/docs/research-pi-coding-agent.md +0 -357
  236. package/docs/research-source-pi-crew-reference.md +0 -174
  237. package/docs/research-ui-optimization-plan.md +0 -480
  238. package/docs/source-runtime-refactor-map.md +0 -107
  239. package/src/utils/atomic-write.ts +0 -33
@@ -1,100 +1,100 @@
1
- /**
2
- * Phase 8: Monitoring and observability for live-session workers.
3
- *
4
- * Provides health checks, metrics collection, and diagnostics
5
- * for live-session workers running in-process.
6
- */
7
-
8
- export interface LiveSessionHealth {
9
- /** Total number of registered live agents. */
10
- totalAgents: number;
11
- /** Number of agents currently running. */
12
- runningAgents: number;
13
- /** Number of agents in idle state. */
14
- idleAgents: number;
15
- /** Number of agents that have completed. */
16
- completedAgents: number;
17
- /** Number of agents that have failed. */
18
- failedAgents: number;
19
- /** Total tokens consumed across all live sessions. */
20
- totalTokens: number;
21
- /** Timestamp of this health snapshot. */
22
- timestamp: string;
23
- }
24
-
25
- export interface LiveSessionMetrics {
26
- agentId: string;
27
- taskId: string;
28
- status: string;
29
- /** Accumulated usage from session stats. */
30
- usage?: {
31
- input?: number;
32
- output?: number;
33
- cacheRead?: number;
34
- cacheWrite?: number;
35
- cost?: number;
36
- turns?: number;
37
- };
38
- /** Session duration in milliseconds. */
39
- durationMs?: number;
40
- /** Number of IRC messages received. */
41
- ircMessagesReceived?: number;
42
- /** Number of yield reminders sent. */
43
- yieldReminders?: number;
44
- /** Whether yield was called. */
45
- yieldCalled: boolean;
46
- }
47
-
48
- /**
49
- * Collect health snapshot from live agent handles.
50
- */
51
- export function collectLiveSessionHealth(
52
- agents: Array<{ status: string }>,
53
- getUsage: (agentId: string) => { input?: number; output?: number; turns?: number } | undefined,
54
- ): LiveSessionHealth {
55
- let running = 0;
56
- let idle = 0;
57
- let completed = 0;
58
- let failed = 0;
59
- let totalTokens = 0;
60
-
61
- for (const agent of agents) {
62
- switch (agent.status) {
63
- case "running": running++; break;
64
- case "idle": idle++; break;
65
- case "completed": completed++; break;
66
- case "failed": failed++; break;
67
- }
68
- }
69
-
70
- // Sum tokens from usage data
71
- for (const agent of agents) {
72
- const agentAny = agent as Record<string, unknown>;
73
- const agentId = agentAny.agentId as string | undefined;
74
- if (agentId) {
75
- const usage = getUsage(agentId);
76
- if (usage) {
77
- totalTokens += (usage.input ?? 0) + (usage.output ?? 0);
78
- }
79
- }
80
- }
81
-
82
- return {
83
- totalAgents: agents.length,
84
- runningAgents: running,
85
- idleAgents: idle,
86
- completedAgents: completed,
87
- failedAgents: failed,
88
- totalTokens,
89
- timestamp: new Date().toISOString(),
90
- };
91
- }
92
-
93
- /**
94
- * Build a diagnostic summary string for logging.
95
- */
96
- export function formatLiveSessionDiagnostics(health: LiveSessionHealth): string {
97
- return [
98
- `[Live-Session Health] agents=${health.totalAgents} running=${health.runningAgents} idle=${health.idleAgents} completed=${health.completedAgents} failed=${health.failedAgents} tokens=${health.totalTokens}`,
99
- ].join("\n");
100
- }
1
+ /**
2
+ * Phase 8: Monitoring and observability for live-session workers.
3
+ *
4
+ * Provides health checks, metrics collection, and diagnostics
5
+ * for live-session workers running in-process.
6
+ */
7
+
8
/**
 * Point-in-time aggregate of live agent counts and token usage.
 */
export interface LiveSessionHealth {
  /** How many live agents were included in the snapshot. */
  totalAgents: number;
  /** How many of those agents were running. */
  runningAgents: number;
  /** How many of those agents were idle. */
  idleAgents: number;
  /** How many of those agents had completed. */
  completedAgents: number;
  /** How many of those agents had failed. */
  failedAgents: number;
  /** Tokens consumed across all live sessions in the snapshot. */
  totalTokens: number;
  /** When the snapshot was taken. */
  timestamp: string;
}
24
+
25
/**
 * Per-agent metrics record for a single live session.
 */
export interface LiveSessionMetrics {
  /** Identifier of the live agent these metrics belong to. */
  agentId: string;
  /** Identifier of the task the agent is working on. */
  taskId: string;
  /** Agent status at the time the metrics were captured. */
  status: string;
  /** Usage accumulated from session stats; every counter is optional. */
  usage?: {
    input?: number;
    output?: number;
    cacheRead?: number;
    cacheWrite?: number;
    cost?: number;
    turns?: number;
  };
  /** How long the session has lasted, in milliseconds. */
  durationMs?: number;
  /** Count of IRC messages the session received. */
  ircMessagesReceived?: number;
  /** Count of yield reminders sent to the session. */
  yieldReminders?: number;
  /** True once yield has been called. */
  yieldCalled: boolean;
}
47
+
48
/**
 * Collect a health snapshot from live agent handles.
 *
 * Each agent is counted by its `status` ("running", "idle", "completed",
 * "failed"); any other status only contributes to `totalAgents`.
 * Token usage is summed (input + output) for every agent that exposes a
 * non-empty string `agentId` and for which `getUsage` returns a value.
 *
 * @param agents - Live agent handles; only `status` is required. An optional
 *   `agentId` property is read when present.
 * @param getUsage - Looks up accumulated usage for an agent id, or returns
 *   `undefined` when nothing is known about it.
 * @returns Aggregate counts, the token total and an ISO-8601 timestamp.
 */
export function collectLiveSessionHealth(
  agents: Array<{ status: string }>,
  getUsage: (agentId: string) => { input?: number; output?: number; turns?: number } | undefined,
): LiveSessionHealth {
  let running = 0;
  let idle = 0;
  let completed = 0;
  let failed = 0;
  let totalTokens = 0;

  for (const agent of agents) {
    switch (agent.status) {
      case "running":
        running++;
        break;
      case "idle":
        idle++;
        break;
      case "completed":
        completed++;
        break;
      case "failed":
        failed++;
        break;
      default:
        // Unknown statuses are still counted in totalAgents below.
        break;
    }

    // `agentId` is not part of the declared element type, so read it as
    // unknown and verify it at runtime instead of asserting it is a string.
    const agentId: unknown = (agent as { status: string; agentId?: unknown }).agentId;
    if (typeof agentId !== "string" || agentId.length === 0) continue;

    const usage = getUsage(agentId);
    if (usage) {
      totalTokens += (usage.input ?? 0) + (usage.output ?? 0);
    }
  }

  return {
    totalAgents: agents.length,
    runningAgents: running,
    idleAgents: idle,
    completedAgents: completed,
    failedAgents: failed,
    totalTokens,
    timestamp: new Date().toISOString(),
  };
}
92
+
93
/**
 * Render a health snapshot as a single log-friendly line.
 *
 * @param health - Snapshot to format.
 * @returns `[Live-Session Health]` followed by space-separated `key=value` pairs.
 */
export function formatLiveSessionDiagnostics(health: LiveSessionHealth): string {
  const pairs = [
    `agents=${health.totalAgents}`,
    `running=${health.runningAgents}`,
    `idle=${health.idleAgents}`,
    `completed=${health.completedAgents}`,
    `failed=${health.failedAgents}`,
    `tokens=${health.totalTokens}`,
  ];
  return `[Live-Session Health] ${pairs.join(" ")}`;
}
@@ -0,0 +1,129 @@
1
+ /**
2
+ * Dual-gate loop control — determines whether a task should auto-resume
3
+ * based on meaningful progress and turn limits.
4
+ *
5
+ * Gate 1: At least one signal of meaningful progress must be true.
6
+ * Gate 2: The auto-resume turn count must be below the maximum.
7
+ *
8
+ * Distilled from pi-autoresearch's dual-gate loop pattern.
9
+ */
10
+ import * as fs from "node:fs";
11
+ import * as path from "node:path";
12
+ import type { TeamTaskState } from "../state/types.ts";
13
+
14
/**
 * Evidence of progress observed for a task; each flag is an independent signal.
 */
export interface TaskProgressSignal {
  /** True when the task edited files or produced a result. */
  editedFiles: boolean;
  /** True when the artifacts directory holds output from the task. */
  producedArtifacts: boolean;
  /** True when the task's result text suggests tests were run. */
  ranTests: boolean;
}
25
+
26
/**
 * Turn bookkeeping used to bound auto-resume.
 */
export interface AutoResumeRuntime {
  /** Auto-resume turns taken so far. */
  autoResumeTurns: number;
  /** Upper bound on auto-resume turns. */
  maxTurns: number;
}
35
+
36
/**
 * Substrings whose presence in a task's result text is taken as a sign
 * that tests were run.
 */
const TEST_KEYWORDS = [
  // Outcome phrases
  "test passed",
  "test failed",
  "tests passed",
  "tests failed",
  "test results",
  // Test runners and commands
  "jest",
  "vitest",
  "mocha",
  "pytest",
  "npx test",
  "npm test",
  "cargo test",
  // Summary phrases
  "all tests",
  "test suite",
  // Reporter markers
  "✓",
  "✗",
  "PASS ",
  " FAIL ",
] as const;
57
+
58
/**
 * Decide whether a task may auto-resume. Both gates must pass.
 *
 * - Turn gate: `autoResumeTurns` has not reached `maxTurns`.
 * - Progress gate: at least one of `editedFiles`, `producedArtifacts`
 *   or `ranTests` is set.
 *
 * @param runtime - Turn counters for the task.
 * @param taskProgress - Progress signals observed for the task.
 * @returns `true` only when both gates pass.
 */
export function shouldAutoResume(runtime: AutoResumeRuntime, taskProgress: TaskProgressSignal): boolean {
  // The turn gate is evaluated first because it is the cheaper check.
  const turnBudgetSpent = runtime.autoResumeTurns >= runtime.maxTurns;
  if (turnBudgetSpent) return false;

  return Boolean(taskProgress.editedFiles || taskProgress.producedArtifacts || taskProgress.ranTests);
}
81
+
82
/**
 * Compute the task progress signal from a task's state and artifacts directory.
 *
 * - editedFiles: true when the task carries a result artifact descriptor.
 * - producedArtifacts: true when the artifacts directory has an entry whose
 *   base name (text before the first ".") starts with the sanitized task id.
 * - ranTests: true when the task's error, terminal evidence or diagnostics
 *   contain one of the test keywords (case-insensitive).
 *
 * A missing or unreadable artifacts directory, and a task id that is empty
 * after sanitizing, both yield `producedArtifacts: false`.
 *
 * @param task - The task state to analyze
 * @param artifactsDir - Path to the artifacts directory; empty skips the directory scan
 * @returns TaskProgressSignal indicating what progress was made
 */
export function computeTaskProgressSignal(task: TeamTaskState, artifactsDir: string): TaskProgressSignal {
  // The result artifact descriptor is the only "edited files" evidence read here.
  const editedFiles = task.resultArtifact !== undefined;

  let producedArtifacts = false;
  if (artifactsDir) {
    try {
      const taskPrefix = task.id.replace(/[^a-zA-Z0-9_-]/g, "");
      // An empty prefix would make startsWith("") match every entry, so an
      // unusable id must count as "no artifacts", not "any artifact".
      if (taskPrefix.length > 0) {
        // readdirSync throws when the directory is missing; the catch below
        // handles that, so no separate existence check is needed.
        // NOTE(review): prefix matching lets "task-1" match "task-10.*" —
        // confirm whether artifact names carry a delimiter after the id.
        producedArtifacts = fs.readdirSync(artifactsDir).some((entry) => {
          const baseName = entry.split(".")[0] ?? entry;
          return baseName.startsWith(taskPrefix);
        });
      }
    } catch {
      // Best effort: an unreadable directory counts as "no artifacts".
      producedArtifacts = false;
    }
  }

  // Keywords are matched against everything textual the task recorded.
  const haystack = [
    task.error ?? "",
    task.terminalEvidence ? JSON.stringify(task.terminalEvidence) : "",
    task.diagnostics ? JSON.stringify(task.diagnostics) : "",
  ]
    .join(" ")
    .toLowerCase();
  const ranTests = TEST_KEYWORDS.some((keyword) => haystack.includes(keyword.toLowerCase()));

  return { editedFiles, producedArtifacts, ranTests };
}
@@ -0,0 +1,40 @@
1
/**
 * Metric names that are denied to prevent prototype pollution.
 */
export const DENIED_METRIC_NAMES: ReadonlySet<string> = new Set([
  "__proto__",
  "constructor",
  "prototype",
]);

/**
 * Matches one whole line of the form `CREW_METRIC name=value`.
 * Group 1 is the metric name (`\w+`), group 2 the raw value (`\S+`).
 */
const METRIC_LINE_RE = /^CREW_METRIC\s+(\w+)=(\S+)$/;

/**
 * Parse CREW_METRIC lines from worker stdout.
 *
 * Lines must match the pattern: `CREW_METRIC name=value`
 * - `name` must be a word character sequence (alphanumeric + underscore)
 * - `value` must parse as a valid finite number
 * - Denied names (__proto__, constructor, prototype) are silently skipped
 * - Both LF and CRLF line endings are accepted
 * - When a name appears more than once, the last valid value wins
 *
 * @param output - Raw worker stdout text
 * @returns Map of metric name → numeric value
 */
export function parseMetricLines(output: string): Record<string, number> {
  const metrics: Record<string, number> = {};

  // Split on CRLF as well as LF: a trailing "\r" would otherwise defeat the
  // `$` anchor and silently drop every metric emitted with Windows line endings.
  for (const line of output.split(/\r?\n/)) {
    const match = METRIC_LINE_RE.exec(line);
    if (!match) continue;

    const [, name, rawValue] = match;
    // Both groups are mandatory in the pattern; the guard only narrows the types.
    if (name === undefined || rawValue === undefined) continue;
    if (DENIED_METRIC_NAMES.has(name)) continue;

    const value = Number(rawValue);
    if (!Number.isFinite(value)) continue;

    metrics[name] = value;
  }

  return metrics;
}
@@ -1,90 +1,90 @@
1
- export interface NotebookCell {
2
- index: number;
3
- cellType: "code" | "markdown" | "raw";
4
- source: string;
5
- outputs?: unknown[];
6
- metadata?: Record<string, unknown>;
7
- }
8
-
9
- export interface Notebook {
10
- cells: NotebookCell[];
11
- metadata?: Record<string, unknown>;
12
- nbformat: number;
13
- }
14
-
15
- /** Check if a file path is a notebook */
16
- export function isNotebookPath(filePath: string): boolean {
17
- return filePath.toLowerCase().endsWith(".ipynb");
18
- }
19
-
20
- function normalizeSource(source: unknown): string {
21
- if (typeof source === "string") return source;
22
- if (Array.isArray(source)) return source.join("");
23
- return "";
24
- }
25
-
26
- /** Parse a .ipynb JSON file into a Notebook structure */
27
- export function parseNotebook(content: string): Notebook {
28
- let raw: unknown;
29
- try {
30
- raw = JSON.parse(content);
31
- } catch {
32
- return { cells: [], nbformat: 4 };
33
- }
34
- if (typeof raw !== "object" || raw === null) return { cells: [], nbformat: 4 };
35
- const obj = raw as Record<string, unknown>;
36
- const nbformat = typeof obj.nbformat === "number" ? obj.nbformat : 4;
37
- const rawCells = Array.isArray(obj.cells) ? obj.cells : [];
38
- const cells: NotebookCell[] = rawCells
39
- .map((c: unknown, i: number): NotebookCell | null => {
40
- if (typeof c !== "object" || c === null) return null;
41
- const cell = c as Record<string, unknown>;
42
- const cellType = cell.cell_type;
43
- if (cellType !== "code" && cellType !== "markdown" && cellType !== "raw") return null;
44
- return {
45
- index: i,
46
- cellType,
47
- source: normalizeSource(cell.source),
48
- outputs: Array.isArray(cell.outputs) ? cell.outputs : undefined,
49
- metadata:
50
- cell.metadata && typeof cell.metadata === "object" && !Array.isArray(cell.metadata)
51
- ? (cell.metadata as Record<string, unknown>)
52
- : undefined,
53
- };
54
- })
55
- .filter((c: NotebookCell | null): c is NotebookCell => c !== null);
56
- const metadata =
57
- obj.metadata && typeof obj.metadata === "object" && !Array.isArray(obj.metadata)
58
- ? (obj.metadata as Record<string, unknown>)
59
- : undefined;
60
- return { cells, metadata, nbformat };
61
- }
62
-
63
- /** Get a specific cell by index */
64
- export function getCell(notebook: Notebook, index: number): NotebookCell | undefined {
65
- return notebook.cells.find((c) => c.index === index);
66
- }
67
-
68
- /** Update a cell's source content, returning a new Notebook */
69
- export function updateCell(notebook: Notebook, index: number, source: string): Notebook {
70
- const cells = notebook.cells.map((c) =>
71
- c.index === index ? { ...c, source } : c,
72
- );
73
- return { ...notebook, cells };
74
- }
75
-
76
- /** Serialize a Notebook back to .ipynb JSON string */
77
- export function serializeNotebook(notebook: Notebook): string {
78
- const raw = {
79
- nbformat: notebook.nbformat,
80
- nbformat_minor: 5,
81
- metadata: notebook.metadata ?? {},
82
- cells: notebook.cells.map((c) => ({
83
- cell_type: c.cellType,
84
- source: c.source,
85
- metadata: c.metadata ?? {},
86
- ...(c.cellType === "code" ? { outputs: c.outputs ?? [], execution_count: null } : {}),
87
- })),
88
- };
89
- return JSON.stringify(raw, null, 2) + "\n";
90
- }
1
/** One cell of a notebook. */
export interface NotebookCell {
  /** Numeric identifier used to look the cell up. */
  index: number;
  /** Kind of cell. */
  cellType: "code" | "markdown" | "raw";
  /** Cell text as a single string. */
  source: string;
  /** Outputs attached to the cell, if any. */
  outputs?: unknown[];
  /** Free-form cell metadata, if any. */
  metadata?: Record<string, unknown>;
}
8
+
9
/** In-memory form of a notebook document. */
export interface Notebook {
  /** Cells of the notebook, in order. */
  cells: NotebookCell[];
  /** Free-form notebook-level metadata, if any. */
  metadata?: Record<string, unknown>;
  /** Major notebook format version. */
  nbformat: number;
}
14
+
15
/**
 * Tell whether a path names a notebook file.
 *
 * @param filePath - Path to inspect.
 * @returns `true` when the path ends with `.ipynb`, compared case-insensitively.
 */
export function isNotebookPath(filePath: string): boolean {
  const extension = ".ipynb";
  const lowered = filePath.toLowerCase();
  return lowered.endsWith(extension);
}
19
+
20
/**
 * Coerce a raw cell `source` value to a single string.
 *
 * A string is returned unchanged, an array is joined with no separator,
 * and anything else becomes the empty string.
 */
function normalizeSource(source: unknown): string {
  if (Array.isArray(source)) {
    return source.join("");
  }
  return typeof source === "string" ? source : "";
}
25
+
26
/**
 * Parse the text of a .ipynb file into a Notebook.
 *
 * Invalid JSON or a non-object root yields an empty notebook with
 * `nbformat` 4. Cells that are not objects, or whose `cell_type` is not
 * "code", "markdown" or "raw", are dropped; the remaining cells keep their
 * position in the raw `cells` array as `index`.
 *
 * @param content - Raw file text.
 * @returns The parsed notebook.
 */
export function parseNotebook(content: string): Notebook {
  let parsed: unknown;
  try {
    parsed = JSON.parse(content);
  } catch {
    return { cells: [], nbformat: 4 };
  }
  if (parsed === null || typeof parsed !== "object") {
    return { cells: [], nbformat: 4 };
  }

  // Accept only plain (non-array) objects as metadata; anything else is dropped.
  const asMetadata = (value: unknown): Record<string, unknown> | undefined =>
    value && typeof value === "object" && !Array.isArray(value)
      ? (value as Record<string, unknown>)
      : undefined;

  const root = parsed as Record<string, unknown>;
  const rawCells: unknown[] = Array.isArray(root.cells) ? root.cells : [];

  const cells: NotebookCell[] = [];
  for (let position = 0; position < rawCells.length; position++) {
    const entry = rawCells[position];
    if (entry === null || typeof entry !== "object") continue;

    const rawCell = entry as Record<string, unknown>;
    const cellType = rawCell.cell_type;
    if (cellType !== "code" && cellType !== "markdown" && cellType !== "raw") continue;

    cells.push({
      index: position,
      cellType,
      source: normalizeSource(rawCell.source),
      outputs: Array.isArray(rawCell.outputs) ? rawCell.outputs : undefined,
      metadata: asMetadata(rawCell.metadata),
    });
  }

  const nbformat = typeof root.nbformat === "number" ? root.nbformat : 4;
  return { cells, metadata: asMetadata(root.metadata), nbformat };
}
62
+
63
/**
 * Look up a cell by its `index` field.
 *
 * @param notebook - Notebook to search.
 * @param index - Value to match against each cell's `index`.
 * @returns The first matching cell, or `undefined` when none matches.
 */
export function getCell(notebook: Notebook, index: number): NotebookCell | undefined {
  for (const cell of notebook.cells) {
    if (cell.index === index) {
      return cell;
    }
  }
  return undefined;
}
67
+
68
/**
 * Produce a copy of the notebook in which every cell whose `index` matches
 * has its `source` replaced. The input notebook and its cells are not mutated;
 * cells that do not match are reused as-is.
 *
 * @param notebook - Notebook to copy.
 * @param index - `index` of the cell to update.
 * @param source - Replacement source text.
 * @returns A new Notebook with the updated cell list.
 */
export function updateCell(notebook: Notebook, index: number, source: string): Notebook {
  const cells: NotebookCell[] = [];
  for (const cell of notebook.cells) {
    cells.push(cell.index === index ? { ...cell, source } : cell);
  }
  return { ...notebook, cells };
}
75
+
76
/**
 * Serialize a Notebook to .ipynb JSON text.
 *
 * The output is indented with two spaces and ends with a newline.
 * `nbformat_minor` is always written as 5, missing metadata is written as
 * `{}`, and code cells are written with `outputs` (default `[]`) and
 * `execution_count: null`.
 *
 * @param notebook - Notebook to serialize.
 * @returns The JSON text.
 */
export function serializeNotebook(notebook: Notebook): string {
  const cells = notebook.cells.map((cell) => {
    const common = {
      cell_type: cell.cellType,
      source: cell.source,
      metadata: cell.metadata ?? {},
    };
    if (cell.cellType !== "code") {
      return common;
    }
    // Only code cells carry outputs and an execution count.
    return { ...common, outputs: cell.outputs ?? [], execution_count: null };
  });

  const document = {
    nbformat: notebook.nbformat,
    nbformat_minor: 5,
    metadata: notebook.metadata ?? {},
    cells,
  };
  return `${JSON.stringify(document, null, 2)}\n`;
}
@@ -1,7 +1,7 @@
1
- /**
2
- * Orphan sentinel — DEPRECATED, replaced by parent-guard.ts.
3
- *
4
- * Keeping this file as a no-op placeholder until all references are removed.
5
- * Workers now self-monitor via startParentGuard() instead of relying on
6
- * an external sentinel process.
7
- */
1
+ /**
2
+ * Orphan sentinel — DEPRECATED, replaced by parent-guard.ts.
3
+ *
4
+ * Keeping this file as a no-op placeholder until all references are removed.
5
+ * Workers now self-monitor via startParentGuard() instead of relying on
6
+ * an external sentinel process.
7
+ */
@@ -1,44 +1,44 @@
1
- import * as fs from "node:fs";
2
- import * as path from "node:path";
3
- import type { WorkflowConfig, WorkflowStep } from "../workflows/workflow-config.ts";
4
-
5
- export function sourcePiProjects(cwd: string): string[] {
6
- const sourceDir = path.join(cwd, "Source");
7
- try {
8
- return fs.readdirSync(sourceDir, { withFileTypes: true })
9
- .filter((entry) => entry.isDirectory() && entry.name.startsWith("pi-"))
10
- .map((entry) => `Source/${entry.name}`)
11
- .sort();
12
- } catch {
13
- return [];
14
- }
15
- }
16
-
17
- export function chunkProjects(projects: string[], target = 6): string[][] {
18
- const chunks = Array.from({ length: Math.min(Math.max(1, target), Math.max(1, projects.length)) }, () => [] as string[]);
19
- projects.forEach((project, index) => chunks[index % chunks.length]!.push(project));
20
- return chunks.filter((chunk) => chunk.length > 0);
21
- }
22
-
23
- export function expandParallelResearchWorkflow(workflow: WorkflowConfig, cwd: string): WorkflowConfig {
24
- if (workflow.name !== "parallel-research") return workflow;
25
- const projects = sourcePiProjects(cwd);
26
- if (projects.length === 0) return workflow;
27
- const chunks = chunkProjects(projects, Math.min(8, Math.max(4, Math.ceil(projects.length / 3))));
28
- const exploreSteps: WorkflowStep[] = chunks.map((paths, index) => ({
29
- id: `explore-shard-${index + 1}`,
30
- role: "explorer",
31
- parallelGroup: "explore",
32
- reads: paths,
33
- task: [`Explore this dynamic shard for: {goal}`, "", "Paths:", ...paths.map((item) => `- ${item}`), "", "Focus on purpose, architecture, runtime/UI patterns, package config, docs, and lessons for pi-crew."].join("\n"),
34
- }));
35
- return {
36
- ...workflow,
37
- steps: [
38
- { id: "discover", role: "explorer", parallelGroup: "inventory", task: `Quickly inventory and validate ${projects.length} pi-* projects for: {goal}\n\nProjects:\n${projects.map((item) => `- ${item}`).join("\n")}\n\nDo not block shard work; summarize routing notes only.` },
39
- ...exploreSteps,
40
- { id: "synthesize", role: "analyst", dependsOn: exploreSteps.map((step) => step.id), task: "Synthesize all dynamic shard findings. Identify common patterns, gaps, and concrete recommendations. Use discover output if available, but prioritize completed shard outputs." },
41
- { id: "write", role: "writer", dependsOn: ["synthesize"], output: "research-summary.md", task: "Write a concise final summary with evidence, risks, and actionable next steps." },
42
- ],
43
- };
44
- }
1
+ import * as fs from "node:fs";
2
+ import * as path from "node:path";
3
+ import type { WorkflowConfig, WorkflowStep } from "../workflows/workflow-config.ts";
4
+
5
/**
 * List the `pi-*` project directories located directly under `<cwd>/Source`.
 *
 * Only entries that are directories and whose name starts with `pi-` are
 * reported. Any error raised while reading or processing the directory
 * (for example, `Source` does not exist) results in an empty list.
 *
 * @param cwd - Directory that is expected to contain the `Source` folder.
 * @returns Sorted paths of the form `Source/<name>`, relative to `cwd`.
 */
export function sourcePiProjects(cwd: string): string[] {
  try {
    const found: string[] = [];
    for (const entry of fs.readdirSync(path.join(cwd, "Source"), { withFileTypes: true })) {
      if (!entry.isDirectory()) continue;
      if (!entry.name.startsWith("pi-")) continue;
      found.push(`Source/${entry.name}`);
    }
    found.sort();
    return found;
  } catch {
    // Best-effort discovery: an unreadable or missing folder means "no projects".
    return [];
  }
}
16
+
17
/**
 * Distribute projects round-robin into at most `target` non-empty chunks.
 *
 * The number of chunks is `target` truncated to a whole number, raised to at
 * least 1 and capped at `projects.length`, so no chunk is ever empty. Item
 * `i` lands in chunk `i % chunkCount`, which preserves relative order inside
 * each chunk.
 *
 * @param projects - Items to distribute; the array is not mutated.
 * @param target - Desired number of chunks (default 6). Fractions are
 *   truncated; values below 1 and `NaN` are treated as 1.
 * @returns The chunks in order; an empty array when `projects` is empty.
 */
export function chunkProjects(projects: string[], target = 6): string[][] {
  if (projects.length === 0) return [];
  // NaN propagates through Math.max/Math.min and would yield zero buckets,
  // so it is mapped to the minimum of one chunk explicitly.
  const requested = Number.isNaN(target) ? 1 : Math.max(1, Math.floor(target));
  const chunkCount = Math.min(requested, projects.length);
  const chunks = Array.from({ length: chunkCount }, (): string[] => []);
  projects.forEach((project, index) => {
    // index % chunkCount is always within [0, chunkCount), so the bucket exists.
    chunks[index % chunkCount]!.push(project);
  });
  return chunks;
}
22
+
23
/**
 * Expand the `parallel-research` workflow into dynamically generated steps.
 *
 * Workflows with any other name, or a `cwd` in which `sourcePiProjects`
 * finds nothing, are returned unchanged. Otherwise the returned copy has its
 * `steps` replaced by:
 *   1. `discover`: an inventory step listing every discovered project;
 *   2. `explore-shard-N`: one explorer step per chunk of projects;
 *   3. `synthesize`: depends on every explore shard;
 *   4. `write`: depends on `synthesize` and outputs `research-summary.md`.
 *
 * The shard target is one per three projects, clamped to the range 4–8;
 * `chunkProjects` decides the final count.
 *
 * @param workflow - Workflow configuration to inspect; it is not mutated.
 * @param cwd - Directory passed to `sourcePiProjects` for project discovery.
 * @returns The original workflow, or a copy with the generated `steps`.
 */
export function expandParallelResearchWorkflow(workflow: WorkflowConfig, cwd: string): WorkflowConfig {
  if (workflow.name !== "parallel-research") return workflow;

  const projects = sourcePiProjects(cwd);
  if (projects.length === 0) return workflow;

  const asBullets = (items: string[]): string[] => items.map((item) => `- ${item}`);
  const shardTarget = Math.min(8, Math.max(4, Math.ceil(projects.length / 3)));

  const exploreSteps: WorkflowStep[] = [];
  chunkProjects(projects, shardTarget).forEach((paths, shardIndex) => {
    const taskLines = [
      `Explore this dynamic shard for: {goal}`,
      "",
      "Paths:",
      ...asBullets(paths),
      "",
      "Focus on purpose, architecture, runtime/UI patterns, package config, docs, and lessons for pi-crew.",
    ];
    exploreSteps.push({
      id: `explore-shard-${shardIndex + 1}`,
      role: "explorer",
      parallelGroup: "explore",
      reads: paths,
      task: taskLines.join("\n"),
    });
  });

  const projectList = asBullets(projects).join("\n");
  const discoverStep: WorkflowStep = {
    id: "discover",
    role: "explorer",
    parallelGroup: "inventory",
    task: `Quickly inventory and validate ${projects.length} pi-* projects for: {goal}\n\nProjects:\n${projectList}\n\nDo not block shard work; summarize routing notes only.`,
  };
  const synthesizeStep: WorkflowStep = {
    id: "synthesize",
    role: "analyst",
    dependsOn: exploreSteps.map((step) => step.id),
    task: "Synthesize all dynamic shard findings. Identify common patterns, gaps, and concrete recommendations. Use discover output if available, but prioritize completed shard outputs.",
  };
  const writeStep: WorkflowStep = {
    id: "write",
    role: "writer",
    dependsOn: ["synthesize"],
    output: "research-summary.md",
    task: "Write a concise final summary with evidence, risks, and actionable next steps.",
  };

  return {
    ...workflow,
    steps: [discoverStep, ...exploreSteps, synthesizeStep, writeStep],
  };
}