pi-crew 0.1.46 → 0.1.49

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (253) hide show
  1. package/CHANGELOG.md +97 -0
  2. package/agents/analyst.md +11 -11
  3. package/agents/critic.md +11 -11
  4. package/agents/executor.md +11 -11
  5. package/agents/explorer.md +11 -11
  6. package/agents/planner.md +11 -11
  7. package/agents/reviewer.md +11 -11
  8. package/agents/security-reviewer.md +11 -11
  9. package/agents/test-engineer.md +11 -11
  10. package/agents/verifier.md +11 -11
  11. package/agents/writer.md +11 -11
  12. package/docs/next-upgrade-roadmap.md +117 -42
  13. package/docs/refactor-tasks-phase3.md +394 -394
  14. package/docs/refactor-tasks-phase4.md +564 -564
  15. package/docs/refactor-tasks-phase5.md +402 -402
  16. package/docs/refactor-tasks-phase6.md +662 -662
  17. package/docs/research/AGENT-EXECUTION-ARCHITECTURE.md +261 -0
  18. package/docs/research/AGENT-LIFECYCLE-COMPARISON.md +111 -0
  19. package/docs/research/AUDIT_OH_MY_PI.md +261 -0
  20. package/docs/research/AUDIT_PI_CREW.md +457 -0
  21. package/docs/research/CAVEMAN-DEEP-RESEARCH.md +281 -0
  22. package/docs/research/COMPARISON_OH_MY_PI_VS_PI_CREW.md +264 -0
  23. package/docs/research/DEEP-RESEARCH-PI-POWERBAR.md +343 -0
  24. package/docs/research/DEEP_RESEARCH_SUBAGENT_ARCHITECTURE.md +480 -0
  25. package/docs/research/GAP_CLOSURE_IMPLEMENTATION_PLAN.md +354 -0
  26. package/docs/research/IMPLEMENTATION_PLAN.md +385 -0
  27. package/docs/research/LIVE-SESSION-PRODUCTION-READY-PLAN.md +502 -0
  28. package/docs/research/OH-MY-PI-DEEP-RESEARCH-v14.7.6.md +266 -0
  29. package/docs/research/REMAINING-GAPS-PLAN.md +363 -0
  30. package/docs/research/SESSION-SUMMARY-2026-05-08.md +146 -0
  31. package/docs/research/UI-RESPONSIVENESS-AUDIT.md +173 -0
  32. package/docs/research-awesome-agent-skills-distillation.md +100 -100
  33. package/docs/research-extension-examples.md +297 -297
  34. package/docs/research-extension-system.md +324 -324
  35. package/docs/research-oh-my-pi-distillation.md +56 -9
  36. package/docs/research-optimization-plan.md +548 -548
  37. package/docs/research-phase10-distillation.md +198 -198
  38. package/docs/research-phase11-distillation.md +201 -201
  39. package/docs/research-pi-coding-agent.md +357 -357
  40. package/docs/research-source-pi-crew-reference.md +174 -174
  41. package/docs/runtime-flow.md +148 -148
  42. package/docs/source-runtime-refactor-map.md +107 -107
  43. package/index.ts +6 -6
  44. package/package.json +99 -98
  45. package/schema.json +8 -0
  46. package/skills/async-worker-recovery/SKILL.md +42 -42
  47. package/skills/context-artifact-hygiene/SKILL.md +52 -52
  48. package/skills/delegation-patterns/SKILL.md +54 -54
  49. package/skills/mailbox-interactive/SKILL.md +40 -40
  50. package/skills/model-routing-context/SKILL.md +39 -39
  51. package/skills/multi-perspective-review/SKILL.md +58 -58
  52. package/skills/observability-reliability/SKILL.md +41 -41
  53. package/skills/orchestration/SKILL.md +157 -0
  54. package/skills/ownership-session-security/SKILL.md +41 -41
  55. package/skills/pi-extension-lifecycle/SKILL.md +39 -39
  56. package/skills/requirements-to-task-packet/SKILL.md +63 -63
  57. package/skills/resource-discovery-config/SKILL.md +41 -41
  58. package/skills/runtime-state-reader/SKILL.md +44 -44
  59. package/skills/secure-agent-orchestration-review/SKILL.md +45 -45
  60. package/skills/state-mutation-locking/SKILL.md +42 -42
  61. package/skills/systematic-debugging/SKILL.md +67 -67
  62. package/skills/ui-render-performance/SKILL.md +39 -39
  63. package/skills/verification-before-done/SKILL.md +57 -57
  64. package/skills/worktree-isolation/SKILL.md +39 -39
  65. package/src/agents/agent-config.ts +6 -0
  66. package/src/agents/agent-search.ts +98 -0
  67. package/src/agents/agent-serializer.ts +4 -0
  68. package/src/agents/discover-agents.ts +17 -4
  69. package/src/config/config.ts +24 -0
  70. package/src/config/defaults.ts +11 -0
  71. package/src/extension/autonomous-policy.ts +26 -33
  72. package/src/extension/cross-extension-rpc.ts +82 -82
  73. package/src/extension/help.ts +1 -0
  74. package/src/extension/management.ts +5 -0
  75. package/src/extension/register.ts +58 -13
  76. package/src/extension/registration/commands.ts +33 -1
  77. package/src/extension/registration/compaction-guard.ts +125 -125
  78. package/src/extension/registration/team-tool.ts +6 -4
  79. package/src/extension/run-bundle-schema.ts +89 -89
  80. package/src/extension/run-index.ts +24 -18
  81. package/src/extension/run-maintenance.ts +68 -62
  82. package/src/extension/team-tool/api.ts +23 -2
  83. package/src/extension/team-tool/cancel.ts +86 -11
  84. package/src/extension/team-tool/context.ts +3 -0
  85. package/src/extension/team-tool/handle-settings.ts +188 -188
  86. package/src/extension/team-tool/inspect.ts +41 -41
  87. package/src/extension/team-tool/intent-policy.ts +42 -0
  88. package/src/extension/team-tool/lifecycle-actions.ts +47 -18
  89. package/src/extension/team-tool/parallel-dispatch.ts +156 -0
  90. package/src/extension/team-tool/plan.ts +19 -19
  91. package/src/extension/team-tool/respond.ts +10 -2
  92. package/src/extension/team-tool/run.ts +3 -2
  93. package/src/extension/team-tool/status.ts +1 -1
  94. package/src/extension/team-tool-types.ts +1 -0
  95. package/src/extension/team-tool.ts +13 -3
  96. package/src/hooks/registry.ts +61 -0
  97. package/src/hooks/types.ts +41 -0
  98. package/src/i18n.ts +184 -184
  99. package/src/observability/exporters/otlp-exporter.ts +77 -77
  100. package/src/prompt/prompt-runtime.ts +72 -72
  101. package/src/runtime/agent-control.ts +108 -2
  102. package/src/runtime/agent-memory.ts +72 -72
  103. package/src/runtime/agent-observability.ts +114 -114
  104. package/src/runtime/async-marker.ts +26 -26
  105. package/src/runtime/async-runner.ts +3 -1
  106. package/src/runtime/attention-events.ts +28 -28
  107. package/src/runtime/background-runner.ts +19 -0
  108. package/src/runtime/cancellation-token.ts +89 -0
  109. package/src/runtime/cancellation.ts +61 -51
  110. package/src/runtime/capability-inventory.ts +116 -0
  111. package/src/runtime/child-pi.ts +2 -1
  112. package/src/runtime/code-summary.ts +247 -0
  113. package/src/runtime/completion-guard.ts +190 -190
  114. package/src/runtime/crash-recovery.ts +181 -0
  115. package/src/runtime/crew-agent-records.ts +35 -7
  116. package/src/runtime/crew-agent-runtime.ts +1 -0
  117. package/src/runtime/custom-tools/irc-tool.ts +201 -0
  118. package/src/runtime/custom-tools/submit-result-tool.ts +90 -0
  119. package/src/runtime/delivery-coordinator.ts +3 -1
  120. package/src/runtime/direct-run.ts +35 -35
  121. package/src/runtime/effectiveness.ts +81 -76
  122. package/src/runtime/event-stream-bridge.ts +90 -0
  123. package/src/runtime/foreground-control.ts +82 -82
  124. package/src/runtime/green-contract.ts +46 -46
  125. package/src/runtime/group-join.ts +106 -106
  126. package/src/runtime/heartbeat-gradient.ts +28 -28
  127. package/src/runtime/heartbeat-watcher.ts +124 -124
  128. package/src/runtime/live-agent-control.ts +88 -88
  129. package/src/runtime/live-agent-manager.ts +78 -2
  130. package/src/runtime/live-control-realtime.ts +36 -36
  131. package/src/runtime/live-extension-bridge.ts +150 -0
  132. package/src/runtime/live-irc.ts +92 -0
  133. package/src/runtime/live-session-health.ts +100 -0
  134. package/src/runtime/live-session-runtime.ts +297 -7
  135. package/src/runtime/mcp-proxy.ts +113 -0
  136. package/src/runtime/notebook-helpers.ts +90 -0
  137. package/src/runtime/orphan-sentinel.ts +7 -0
  138. package/src/runtime/output-validator.ts +187 -0
  139. package/src/runtime/parallel-research.ts +44 -44
  140. package/src/runtime/parallel-utils.ts +57 -0
  141. package/src/runtime/parent-guard.ts +80 -0
  142. package/src/runtime/pi-json-output.ts +111 -111
  143. package/src/runtime/policy-engine.ts +79 -79
  144. package/src/runtime/progress-event-coalescer.ts +43 -43
  145. package/src/runtime/prose-compressor.ts +164 -0
  146. package/src/runtime/recovery-recipes.ts +74 -74
  147. package/src/runtime/result-extractor.ts +121 -0
  148. package/src/runtime/role-permission.ts +39 -39
  149. package/src/runtime/runtime-resolver.ts +1 -4
  150. package/src/runtime/semaphore.ts +131 -0
  151. package/src/runtime/sensitive-paths.ts +92 -0
  152. package/src/runtime/session-resources.ts +25 -25
  153. package/src/runtime/session-snapshot.ts +59 -59
  154. package/src/runtime/session-usage.ts +79 -79
  155. package/src/runtime/sidechain-output.ts +29 -29
  156. package/src/runtime/stream-preview.ts +177 -0
  157. package/src/runtime/subagent-manager.ts +3 -2
  158. package/src/runtime/subprocess-tool-registry.ts +67 -0
  159. package/src/runtime/supervisor-contact.ts +59 -59
  160. package/src/runtime/task-display.ts +38 -38
  161. package/src/runtime/task-output-context.ts +59 -9
  162. package/src/runtime/task-runner/capabilities.ts +78 -78
  163. package/src/runtime/task-runner/live-executor.ts +2 -0
  164. package/src/runtime/task-runner/progress.ts +119 -119
  165. package/src/runtime/task-runner/prompt-builder.ts +70 -8
  166. package/src/runtime/task-runner/prompt-pipeline.ts +64 -64
  167. package/src/runtime/task-runner/result-utils.ts +14 -14
  168. package/src/runtime/task-runner/run-projection.ts +104 -0
  169. package/src/runtime/task-runner/state-helpers.ts +22 -22
  170. package/src/runtime/task-runner.ts +75 -4
  171. package/src/runtime/team-runner.ts +60 -8
  172. package/src/runtime/worker-heartbeat.ts +21 -21
  173. package/src/runtime/worker-startup.ts +57 -57
  174. package/src/runtime/workspace-tree.ts +298 -0
  175. package/src/runtime/yield-handler.ts +189 -0
  176. package/src/schema/config-schema.ts +6 -0
  177. package/src/schema/team-tool-schema.ts +11 -1
  178. package/src/skills/discover-skills.ts +67 -0
  179. package/src/state/active-run-registry.ts +4 -2
  180. package/src/state/artifact-store.ts +4 -1
  181. package/src/state/atomic-write.ts +50 -1
  182. package/src/state/blob-store.ts +117 -0
  183. package/src/state/contracts.ts +1 -0
  184. package/src/state/event-log-rotation.ts +158 -0
  185. package/src/state/event-log.ts +52 -2
  186. package/src/state/mailbox.ts +87 -7
  187. package/src/state/state-store.ts +24 -4
  188. package/src/state/task-claims.ts +44 -44
  189. package/src/state/types.ts +20 -0
  190. package/src/state/usage.ts +29 -29
  191. package/src/subagents/async-entry.ts +1 -1
  192. package/src/subagents/index.ts +3 -3
  193. package/src/subagents/live/control.ts +1 -1
  194. package/src/subagents/live/manager.ts +1 -1
  195. package/src/subagents/live/realtime.ts +1 -1
  196. package/src/subagents/live/session-runtime.ts +1 -1
  197. package/src/subagents/manager.ts +1 -1
  198. package/src/subagents/spawn.ts +1 -1
  199. package/src/teams/team-serializer.ts +38 -38
  200. package/src/types/diff.d.ts +18 -18
  201. package/src/ui/agent-management-overlay.ts +144 -0
  202. package/src/ui/crew-footer.ts +101 -101
  203. package/src/ui/crew-select-list.ts +111 -111
  204. package/src/ui/crew-widget.ts +11 -2
  205. package/src/ui/dashboard-panes/cancellation-pane.ts +43 -0
  206. package/src/ui/dashboard-panes/capability-pane.ts +60 -0
  207. package/src/ui/dashboard-panes/mailbox-pane.ts +35 -11
  208. package/src/ui/dashboard-panes/metrics-pane.ts +34 -34
  209. package/src/ui/dynamic-border.ts +25 -25
  210. package/src/ui/layout-primitives.ts +106 -106
  211. package/src/ui/live-run-sidebar.ts +4 -0
  212. package/src/ui/loaders.ts +158 -158
  213. package/src/ui/powerbar-publisher.ts +77 -15
  214. package/src/ui/render-coalescer.ts +51 -0
  215. package/src/ui/render-diff.ts +119 -119
  216. package/src/ui/render-scheduler.ts +143 -143
  217. package/src/ui/run-dashboard.ts +4 -0
  218. package/src/ui/run-event-bus.ts +209 -0
  219. package/src/ui/run-snapshot-cache.ts +68 -16
  220. package/src/ui/snapshot-types.ts +8 -0
  221. package/src/ui/spinner.ts +17 -17
  222. package/src/ui/status-colors.ts +58 -58
  223. package/src/ui/syntax-highlight.ts +116 -116
  224. package/src/ui/transcript-entries.ts +258 -0
  225. package/src/utils/atomic-write.ts +33 -33
  226. package/src/utils/completion-dedupe.ts +63 -63
  227. package/src/utils/frontmatter.ts +68 -68
  228. package/src/utils/git.ts +262 -262
  229. package/src/utils/ids.ts +17 -12
  230. package/src/utils/incremental-reader.ts +104 -0
  231. package/src/utils/names.ts +27 -27
  232. package/src/utils/redaction.ts +44 -44
  233. package/src/utils/safe-paths.ts +47 -47
  234. package/src/utils/scan-cache.ts +137 -0
  235. package/src/utils/sleep.ts +32 -32
  236. package/src/utils/sse-parser.ts +134 -0
  237. package/src/utils/task-name-generator.ts +337 -0
  238. package/src/utils/visual.ts +33 -2
  239. package/src/workflows/validate-workflow.ts +40 -40
  240. package/src/worktree/branch-freshness.ts +45 -45
  241. package/src/worktree/cleanup.ts +2 -1
  242. package/teams/default.team.md +12 -12
  243. package/teams/fast-fix.team.md +11 -11
  244. package/teams/implementation.team.md +18 -18
  245. package/teams/parallel-research.team.md +14 -14
  246. package/teams/research.team.md +11 -11
  247. package/teams/review.team.md +12 -12
  248. package/workflows/default.workflow.md +29 -29
  249. package/workflows/fast-fix.workflow.md +22 -22
  250. package/workflows/implementation.workflow.md +38 -38
  251. package/workflows/parallel-research.workflow.md +46 -46
  252. package/workflows/research.workflow.md +22 -22
  253. package/workflows/review.workflow.md +30 -30
@@ -1,74 +1,74 @@
1
- import type { PolicyDecision, PolicyDecisionReason } from "../state/types.ts";
2
-
3
- export type FailureScenario = "trust_prompt_unresolved" | "prompt_misdelivery" | "stale_branch" | "compile_red_cross_crate" | "mcp_handshake_failure" | "partial_plugin_startup" | "provider_failure" | "task_failed" | "worker_stale" | "green_unsatisfied";
4
- export type RecoveryStep = "accept_trust_prompt" | "redirect_prompt_to_agent" | "rebase_branch" | "clean_build" | "retry_mcp_handshake" | "restart_plugin" | "restart_worker" | "rerun_task" | "collect_verification_evidence" | "escalate_to_human";
5
- export type RecoveryResultState = "planned" | "skipped" | "escalation_required";
6
-
7
- export interface RecoveryRecipe {
8
- scenario: FailureScenario;
9
- steps: RecoveryStep[];
10
- maxAttempts: number;
11
- escalationPolicy: "alert_human" | "log_and_continue" | "abort";
12
- }
13
-
14
- export interface RecoveryLedgerEntry {
15
- scenario: FailureScenario;
16
- taskId?: string;
17
- decisionReason: PolicyDecisionReason;
18
- attempt: number;
19
- state: RecoveryResultState;
20
- steps: RecoveryStep[];
21
- message: string;
22
- createdAt: string;
23
- }
24
-
25
- export interface RecoveryLedger {
26
- entries: RecoveryLedgerEntry[];
27
- }
28
-
29
- export function scenarioForPolicyReason(reason: PolicyDecisionReason): FailureScenario {
30
- switch (reason) {
31
- case "branch_stale": return "stale_branch";
32
- case "worker_stale": return "worker_stale";
33
- case "green_unsatisfied": return "green_unsatisfied";
34
- case "task_failed": return "task_failed";
35
- default: return "provider_failure";
36
- }
37
- }
38
-
39
- export function recipeFor(scenario: FailureScenario): RecoveryRecipe {
40
- switch (scenario) {
41
- case "trust_prompt_unresolved": return { scenario, steps: ["accept_trust_prompt"], maxAttempts: 1, escalationPolicy: "alert_human" };
42
- case "prompt_misdelivery": return { scenario, steps: ["redirect_prompt_to_agent"], maxAttempts: 1, escalationPolicy: "alert_human" };
43
- case "stale_branch": return { scenario, steps: ["rebase_branch", "clean_build"], maxAttempts: 1, escalationPolicy: "alert_human" };
44
- case "compile_red_cross_crate": return { scenario, steps: ["clean_build"], maxAttempts: 1, escalationPolicy: "alert_human" };
45
- case "mcp_handshake_failure": return { scenario, steps: ["retry_mcp_handshake"], maxAttempts: 1, escalationPolicy: "abort" };
46
- case "partial_plugin_startup": return { scenario, steps: ["restart_plugin", "retry_mcp_handshake"], maxAttempts: 1, escalationPolicy: "log_and_continue" };
47
- case "worker_stale": return { scenario, steps: ["restart_worker"], maxAttempts: 1, escalationPolicy: "alert_human" };
48
- case "green_unsatisfied": return { scenario, steps: ["collect_verification_evidence"], maxAttempts: 1, escalationPolicy: "alert_human" };
49
- case "task_failed": return { scenario, steps: ["rerun_task"], maxAttempts: 1, escalationPolicy: "alert_human" };
50
- case "provider_failure": return { scenario, steps: ["restart_worker"], maxAttempts: 1, escalationPolicy: "alert_human" };
51
- }
52
- }
53
-
54
- export function buildRecoveryLedger(decisions: PolicyDecision[], previous: RecoveryLedger = { entries: [] }): RecoveryLedger {
55
- const entries = [...previous.entries];
56
- for (const item of decisions) {
57
- if (!["retry", "escalate", "block"].includes(item.action)) continue;
58
- const scenario = scenarioForPolicyReason(item.reason);
59
- const recipe = recipeFor(scenario);
60
- const priorAttempts = entries.filter((entry) => entry.scenario === scenario && entry.taskId === item.taskId).length;
61
- const attempt = priorAttempts + 1;
62
- entries.push({
63
- scenario,
64
- taskId: item.taskId,
65
- decisionReason: item.reason,
66
- attempt,
67
- state: attempt <= recipe.maxAttempts && item.action !== "block" ? "planned" : "escalation_required",
68
- steps: attempt <= recipe.maxAttempts ? recipe.steps : ["escalate_to_human"],
69
- message: item.message,
70
- createdAt: new Date().toISOString(),
71
- });
72
- }
73
- return { entries };
74
- }
1
+ import type { PolicyDecision, PolicyDecisionReason } from "../state/types.ts";
2
+
3
+ export type FailureScenario = "trust_prompt_unresolved" | "prompt_misdelivery" | "stale_branch" | "compile_red_cross_crate" | "mcp_handshake_failure" | "partial_plugin_startup" | "provider_failure" | "task_failed" | "worker_stale" | "green_unsatisfied";
4
+ export type RecoveryStep = "accept_trust_prompt" | "redirect_prompt_to_agent" | "rebase_branch" | "clean_build" | "retry_mcp_handshake" | "restart_plugin" | "restart_worker" | "rerun_task" | "collect_verification_evidence" | "escalate_to_human";
5
+ export type RecoveryResultState = "planned" | "skipped" | "escalation_required";
6
+
7
+ export interface RecoveryRecipe {
8
+ scenario: FailureScenario;
9
+ steps: RecoveryStep[];
10
+ maxAttempts: number;
11
+ escalationPolicy: "alert_human" | "log_and_continue" | "abort";
12
+ }
13
+
14
+ export interface RecoveryLedgerEntry {
15
+ scenario: FailureScenario;
16
+ taskId?: string;
17
+ decisionReason: PolicyDecisionReason;
18
+ attempt: number;
19
+ state: RecoveryResultState;
20
+ steps: RecoveryStep[];
21
+ message: string;
22
+ createdAt: string;
23
+ }
24
+
25
+ export interface RecoveryLedger {
26
+ entries: RecoveryLedgerEntry[];
27
+ }
28
+
29
+ export function scenarioForPolicyReason(reason: PolicyDecisionReason): FailureScenario {
30
+ switch (reason) {
31
+ case "branch_stale": return "stale_branch";
32
+ case "worker_stale": return "worker_stale";
33
+ case "green_unsatisfied": return "green_unsatisfied";
34
+ case "task_failed": return "task_failed";
35
+ default: return "provider_failure";
36
+ }
37
+ }
38
+
39
+ export function recipeFor(scenario: FailureScenario): RecoveryRecipe {
40
+ switch (scenario) {
41
+ case "trust_prompt_unresolved": return { scenario, steps: ["accept_trust_prompt"], maxAttempts: 1, escalationPolicy: "alert_human" };
42
+ case "prompt_misdelivery": return { scenario, steps: ["redirect_prompt_to_agent"], maxAttempts: 1, escalationPolicy: "alert_human" };
43
+ case "stale_branch": return { scenario, steps: ["rebase_branch", "clean_build"], maxAttempts: 1, escalationPolicy: "alert_human" };
44
+ case "compile_red_cross_crate": return { scenario, steps: ["clean_build"], maxAttempts: 1, escalationPolicy: "alert_human" };
45
+ case "mcp_handshake_failure": return { scenario, steps: ["retry_mcp_handshake"], maxAttempts: 1, escalationPolicy: "abort" };
46
+ case "partial_plugin_startup": return { scenario, steps: ["restart_plugin", "retry_mcp_handshake"], maxAttempts: 1, escalationPolicy: "log_and_continue" };
47
+ case "worker_stale": return { scenario, steps: ["restart_worker"], maxAttempts: 1, escalationPolicy: "alert_human" };
48
+ case "green_unsatisfied": return { scenario, steps: ["collect_verification_evidence"], maxAttempts: 1, escalationPolicy: "alert_human" };
49
+ case "task_failed": return { scenario, steps: ["rerun_task"], maxAttempts: 1, escalationPolicy: "alert_human" };
50
+ case "provider_failure": return { scenario, steps: ["restart_worker"], maxAttempts: 1, escalationPolicy: "alert_human" };
51
+ }
52
+ }
53
+
54
+ export function buildRecoveryLedger(decisions: PolicyDecision[], previous: RecoveryLedger = { entries: [] }): RecoveryLedger {
55
+ const entries = [...previous.entries];
56
+ for (const item of decisions) {
57
+ if (!["retry", "escalate", "block"].includes(item.action)) continue;
58
+ const scenario = scenarioForPolicyReason(item.reason);
59
+ const recipe = recipeFor(scenario);
60
+ const priorAttempts = entries.filter((entry) => entry.scenario === scenario && entry.taskId === item.taskId).length;
61
+ const attempt = priorAttempts + 1;
62
+ entries.push({
63
+ scenario,
64
+ taskId: item.taskId,
65
+ decisionReason: item.reason,
66
+ attempt,
67
+ state: attempt <= recipe.maxAttempts && item.action !== "block" ? "planned" : "escalation_required",
68
+ steps: attempt <= recipe.maxAttempts ? recipe.steps : ["escalate_to_human"],
69
+ message: item.message,
70
+ createdAt: new Date().toISOString(),
71
+ });
72
+ }
73
+ return { entries };
74
+ }
@@ -0,0 +1,121 @@
1
+ /**
2
+ * Structured Result Extractor — attempts to extract structured data from worker output.
3
+ * Tries multiple extraction strategies before falling back to raw text.
4
+ */
5
+ export interface ExtractedResult {
6
+ /** Whether structured data was successfully extracted */
7
+ structured: boolean;
8
+ /** Parsed structured data (if structured=true) */
9
+ data: unknown;
10
+ /** Raw text output (always available) */
11
+ rawText: string;
12
+ /** Error message if extraction was attempted but failed */
13
+ error?: string;
14
+ }
15
+
16
+ /**
17
+ * Extract structured result from raw worker output text.
18
+ * Tries strategies in order: direct JSON, fenced JSON, key-value markers.
19
+ */
20
+ export function extractStructuredResult(raw: string, _schema?: Record<string, unknown>): ExtractedResult {
21
+ const trimmed = raw.trim();
22
+ if (!trimmed) {
23
+ return { structured: false, data: null, rawText: raw };
24
+ }
25
+
26
+ // Strategy 1: Direct JSON parse (entire output is JSON)
27
+ const directResult = tryDirectJson(trimmed);
28
+ if (directResult !== undefined) {
29
+ return { structured: true, data: directResult, rawText: raw };
30
+ }
31
+
32
+ // Strategy 2: Extract from ```json ... ``` fence
33
+ const fencedResult = tryFencedJson(trimmed);
34
+ if (fencedResult !== undefined) {
35
+ return { structured: true, data: fencedResult, rawText: raw };
36
+ }
37
+
38
+ // Strategy 3: Extract from markers like "RESULT:" or "OUTPUT:"
39
+ const markerResult = tryMarkerExtraction(trimmed);
40
+ if (markerResult !== undefined) {
41
+ return { structured: true, data: markerResult, rawText: raw };
42
+ }
43
+
44
+ return { structured: false, data: null, rawText: raw };
45
+ }
46
+
47
+ function tryDirectJson(text: string): unknown | undefined {
48
+ if (!text.startsWith("{") && !text.startsWith("[")) return undefined;
49
+ try {
50
+ return JSON.parse(text);
51
+ } catch {
52
+ return undefined;
53
+ }
54
+ }
55
+
56
+ function tryFencedJson(text: string): unknown | undefined {
57
+ const match = text.match(/```json\s*\n([\s\S]*?)\n\s*```/);
58
+ if (!match?.[1]) return undefined;
59
+ try {
60
+ return JSON.parse(match[1].trim());
61
+ } catch {
62
+ return undefined;
63
+ }
64
+ }
65
+
66
+ function tryMarkerExtraction(text: string): unknown | undefined {
67
+ // Try to find JSON after common markers
68
+ const markers = ["RESULT:", "OUTPUT:", "ANSWER:", "### Result\n", "## Output\n"];
69
+ for (const marker of markers) {
70
+ const idx = text.indexOf(marker);
71
+ if (idx === -1) continue;
72
+ const after = text.slice(idx + marker.length).trim();
73
+ // Try JSON parse on text after marker
74
+ if (after.startsWith("{") || after.startsWith("[")) {
75
+ try {
76
+ return JSON.parse(after);
77
+ } catch {
78
+ // Try to find just the JSON object/array
79
+ const jsonEnd = findMatchingBracket(after);
80
+ if (jsonEnd > 0) {
81
+ try {
82
+ return JSON.parse(after.slice(0, jsonEnd));
83
+ } catch {
84
+ continue;
85
+ }
86
+ }
87
+ }
88
+ }
89
+ }
90
+ return undefined;
91
+ }
92
+
93
+ function findMatchingBracket(text: string): number {
94
+ const openChar = text[0];
95
+ const closeChar = openChar === "{" ? "}" : "]";
96
+ let depth = 0;
97
+ let inString = false;
98
+ let escape = false;
99
+ for (let i = 0; i < text.length; i++) {
100
+ const ch = text[i];
101
+ if (escape) {
102
+ escape = false;
103
+ continue;
104
+ }
105
+ if (ch === "\\") {
106
+ escape = true;
107
+ continue;
108
+ }
109
+ if (ch === '"') {
110
+ inString = !inString;
111
+ continue;
112
+ }
113
+ if (inString) continue;
114
+ if (ch === openChar) depth++;
115
+ if (ch === closeChar) {
116
+ depth--;
117
+ if (depth === 0) return i + 1;
118
+ }
119
+ }
120
+ return -1;
121
+ }
@@ -1,39 +1,39 @@
1
- export type RolePermissionMode = "read_only" | "workspace_write" | "danger_full_access" | "explicit_confirm";
2
-
3
- const READ_ONLY_ROLES = new Set(["explorer", "reviewer", "security-reviewer", "verifier", "analyst", "critic", "planner", "writer"]);
4
- const WRITE_ROLES = new Set(["executor", "test-engineer"]);
5
- const READ_ONLY_COMMANDS = new Set(["cat", "head", "tail", "less", "more", "wc", "ls", "find", "grep", "rg", "awk", "sed", "echo", "printf", "which", "where", "whoami", "pwd", "env", "printenv", "date", "df", "du", "uname", "file", "stat", "diff", "sort", "uniq", "tr", "cut", "paste", "test", "true", "false", "type", "readlink", "realpath", "basename", "dirname", "sha256sum", "md5sum", "xxd", "hexdump", "od", "strings", "tree", "jq", "git", "gh"]);
6
-
7
- export interface PermissionCheckResult {
8
- allowed: boolean;
9
- mode: RolePermissionMode;
10
- reason?: string;
11
- }
12
-
13
- export function permissionForRole(role: string): RolePermissionMode {
14
- if (READ_ONLY_ROLES.has(role)) return "read_only";
15
- if (WRITE_ROLES.has(role)) return "workspace_write";
16
- return "workspace_write";
17
- }
18
-
19
- export function isReadOnlyCommand(command: string): boolean {
20
- const first = command.trim().split(/\s+/)[0]?.split(/[\\/]/).pop() ?? "";
21
- return READ_ONLY_COMMANDS.has(first) && !/\s(-i|--in-place)\b|\s>{1,2}\s|\brm\b|\bmv\b|\bcp\b|\b(?:npm|pnpm|yarn|bun)\s+(install|add|ci|remove)\b|\bgit\s+(commit|push|merge|rebase|reset|checkout|clean)\b/.test(command);
22
- }
23
-
24
- export function checkRolePermission(role: string, command: string): PermissionCheckResult {
25
- const mode = permissionForRole(role);
26
- if (mode === "read_only" && !isReadOnlyCommand(command)) return { allowed: false, mode, reason: `Role '${role}' is read-only and command may modify state.` };
27
- return { allowed: true, mode };
28
- }
29
-
30
- export function currentCrewRole(env: NodeJS.ProcessEnv = process.env): string | undefined {
31
- return env.PI_CREW_ROLE?.trim() || env.PI_TEAMS_ROLE?.trim() || undefined;
32
- }
33
-
34
- export function checkSubagentSpawnPermission(role: string | undefined): PermissionCheckResult {
35
- if (!role) return { allowed: true, mode: "workspace_write" };
36
- const mode = permissionForRole(role);
37
- if (mode === "read_only") return { allowed: false, mode, reason: `Role '${role}' is read-only and cannot spawn additional subagents.` };
38
- return { allowed: true, mode };
39
- }
1
+ export type RolePermissionMode = "read_only" | "workspace_write" | "danger_full_access" | "explicit_confirm";
2
+
3
+ const READ_ONLY_ROLES = new Set(["explorer", "reviewer", "security-reviewer", "verifier", "analyst", "critic", "planner", "writer"]);
4
+ const WRITE_ROLES = new Set(["executor", "test-engineer"]);
5
+ const READ_ONLY_COMMANDS = new Set(["cat", "head", "tail", "less", "more", "wc", "ls", "find", "grep", "rg", "awk", "sed", "echo", "printf", "which", "where", "whoami", "pwd", "env", "printenv", "date", "df", "du", "uname", "file", "stat", "diff", "sort", "uniq", "tr", "cut", "paste", "test", "true", "false", "type", "readlink", "realpath", "basename", "dirname", "sha256sum", "md5sum", "xxd", "hexdump", "od", "strings", "tree", "jq", "git", "gh"]);
6
+
7
+ export interface PermissionCheckResult {
8
+ allowed: boolean;
9
+ mode: RolePermissionMode;
10
+ reason?: string;
11
+ }
12
+
13
+ export function permissionForRole(role: string): RolePermissionMode {
14
+ if (READ_ONLY_ROLES.has(role)) return "read_only";
15
+ if (WRITE_ROLES.has(role)) return "workspace_write";
16
+ return "workspace_write";
17
+ }
18
+
19
+ export function isReadOnlyCommand(command: string): boolean {
20
+ const first = command.trim().split(/\s+/)[0]?.split(/[\\/]/).pop() ?? "";
21
+ return READ_ONLY_COMMANDS.has(first) && !/\s(-i|--in-place)\b|\s>{1,2}\s|\brm\b|\bmv\b|\bcp\b|\b(?:npm|pnpm|yarn|bun)\s+(install|add|ci|remove)\b|\bgit\s+(commit|push|merge|rebase|reset|checkout|clean)\b/.test(command);
22
+ }
23
+
24
+ export function checkRolePermission(role: string, command: string): PermissionCheckResult {
25
+ const mode = permissionForRole(role);
26
+ if (mode === "read_only" && !isReadOnlyCommand(command)) return { allowed: false, mode, reason: `Role '${role}' is read-only and command may modify state.` };
27
+ return { allowed: true, mode };
28
+ }
29
+
30
+ export function currentCrewRole(env: NodeJS.ProcessEnv = process.env): string | undefined {
31
+ return env.PI_CREW_ROLE?.trim() || env.PI_TEAMS_ROLE?.trim() || undefined;
32
+ }
33
+
34
+ export function checkSubagentSpawnPermission(role: string | undefined): PermissionCheckResult {
35
+ if (!role) return { allowed: true, mode: "workspace_write" };
36
+ const mode = permissionForRole(role);
37
+ if (mode === "read_only") return { allowed: false, mode, reason: `Role '${role}' is read-only and cannot spawn additional subagents.` };
38
+ return { allowed: true, mode };
39
+ }
@@ -32,9 +32,6 @@ export function runtimeResolutionState(runtime: CrewRuntimeCapabilities, resolve
32
32
  }
33
33
 
34
34
  export async function isLiveSessionRuntimeAvailable(timeoutMs = 1500, env: NodeJS.ProcessEnv = process.env): Promise<{ available: boolean; reason?: string }> {
35
- if (env.PI_CREW_ENABLE_EXPERIMENTAL_LIVE_SESSION !== "1") {
36
- return { available: false, reason: "Live-session runtime adapter is experimental and disabled. Set PI_CREW_ENABLE_EXPERIMENTAL_LIVE_SESSION=1 to probe SDK support." };
37
- }
38
35
  if (env.PI_CREW_MOCK_LIVE_SESSION === "success") {
39
36
  return { available: true, reason: "Mock live-session runtime is enabled." };
40
37
  }
@@ -74,7 +71,7 @@ export async function resolveCrewRuntime(config: PiTeamsConfig, env: NodeJS.Proc
74
71
  if (requestedMode === "live-session" || (requestedMode === "auto" && config.runtime?.preferLiveSession === true)) {
75
72
  const live = await isLiveSessionRuntimeAvailable(1500, env);
76
73
  if (live.available) return liveCaps(requestedMode);
77
- if (requestedMode === "live-session" && config.runtime?.allowChildProcessFallback === false) return { ...scaffoldCaps(requestedMode), available: false, reason: live.reason };
74
+ if (requestedMode === "live-session" && config.runtime?.allowChildProcessFallback === false) return scaffoldCaps(requestedMode, live.reason, "blocked");
78
75
  return { ...childCaps(requestedMode), fallback: "child-process", reason: live.reason };
79
76
  }
80
77
  return childCaps(requestedMode);
@@ -0,0 +1,131 @@
1
+ /**
2
+ * Phase 6: Semaphore and fail-fast parallel execution.
3
+ *
4
+ * Adapted from oh-my-pi's `parallel.ts` Semaphore class and
5
+ * `mapWithConcurrencyLimit` implementation. Provides:
6
+ * - Explicit acquire/release Semaphore for concurrency control
7
+ * - Fail-fast on first error (via Promise.race)
8
+ * - AbortSignal support for graceful cancellation
9
+ * - Partial results on abort
10
+ */
11
+
12
+ /**
13
+ * Simple counting semaphore for limiting concurrency across independently-scheduled async work.
14
+ */
15
+ export class Semaphore {
16
+ #max: number;
17
+ #current = 0;
18
+ #queue: Array<() => void> = [];
19
+
20
+ constructor(max: number) {
21
+ this.#max = Math.max(1, max);
22
+ }
23
+
24
+ async acquire(): Promise<void> {
25
+ if (this.#current < this.#max) {
26
+ this.#current++;
27
+ return;
28
+ }
29
+ const { promise, resolve } = (() => {
30
+ let res: () => void;
31
+ const p = new Promise<void>((r) => { res = r; });
32
+ return { promise: p, resolve: res! };
33
+ })();
34
+ this.#queue.push(resolve);
35
+ return promise;
36
+ }
37
+
38
+ release(): void {
39
+ const next = this.#queue.shift();
40
+ if (next) {
41
+ next();
42
+ } else if (this.#current > 0) {
43
+ this.#current--;
44
+ }
45
+ // Guard: over-release is a no-op to prevent #current going negative
46
+ }
47
+
48
+ /** Current number of acquired slots. */
49
+ get current(): number {
50
+ return this.#current;
51
+ }
52
+
53
+ /** Number of waiters in the queue. */
54
+ get waiting(): number {
55
+ return this.#queue.length;
56
+ }
57
+ }
58
+
59
+ /**
60
+ * Result of parallel execution with fail-fast support.
61
+ */
62
+ export interface ParallelResult<R> {
63
+ /** Results array — undefined entries indicate tasks that were skipped due to abort. */
64
+ results: (R | undefined)[];
65
+ /** Whether execution was aborted before all tasks completed. */
66
+ aborted: boolean;
67
+ /** The first error that triggered fail-fast, if any. */
68
+ firstError?: unknown;
69
+ }
70
+
71
+ /**
72
+ * Execute items with a concurrency limit, fail-fast, and abort signal support.
73
+ *
74
+ * - On first error: aborts remaining workers and rethrows.
75
+ * - On external abort: returns partial results with `aborted: true`.
76
+ * - Results are returned in the same order as input items.
77
+ *
78
+ * Adapted from oh-my-pi's `mapWithConcurrencyLimit`.
79
+ */
80
+ export async function mapWithFailFast<T, R>(
81
+ items: T[],
82
+ concurrency: number,
83
+ fn: (item: T, index: number, signal: AbortSignal) => Promise<R>,
84
+ signal?: AbortSignal,
85
+ ): Promise<ParallelResult<R>> {
86
+ const limit = Math.max(1, Math.min(concurrency, items.length));
87
+ const results: (R | undefined)[] = new Array(items.length);
88
+ let nextIndex = 0;
89
+
90
+ // Internal abort controller for fail-fast
91
+ const abortController = new AbortController();
92
+ const workerSignal = signal
93
+ ? AbortSignal.any([signal, abortController.signal])
94
+ : abortController.signal;
95
+
96
+ // Promise that rejects on first error — used for fail-fast
97
+ let rejectFirst: (error: unknown) => void;
98
+ const firstErrorPromise = new Promise<never>((_, reject) => {
99
+ rejectFirst = reject;
100
+ });
101
+
102
+ const worker = async (): Promise<void> => {
103
+ while (true) {
104
+ if (workerSignal.aborted) return;
105
+ const index = nextIndex++;
106
+ if (index >= items.length) return;
107
+ try {
108
+ results[index] = await fn(items[index], index, workerSignal);
109
+ } catch (error) {
110
+ if (!workerSignal.aborted) {
111
+ abortController.abort();
112
+ rejectFirst(error);
113
+ throw error;
114
+ }
115
+ }
116
+ }
117
+ };
118
+
119
+ const workers = Array.from({ length: limit }, () => worker());
120
+
121
+ try {
122
+ await Promise.race([Promise.all(workers), firstErrorPromise]);
123
+ } catch (error) {
124
+ if (signal?.aborted) {
125
+ return { results, aborted: true, firstError: error };
126
+ }
127
+ throw error;
128
+ }
129
+
130
+ return { results, aborted: signal?.aborted ?? false };
131
+ }
@@ -0,0 +1,92 @@
1
+ /**
2
+ * Sensitive file detection for worker constraints.
3
+ *
4
+ * Inspired by caveman's compress.py — prevents workers from reading
5
+ * or compressing files that contain secrets, credentials, or PII.
6
+ *
7
+ * Workers should refuse operations on matching paths. This is enforced
8
+ * in the worker prompt and validated here for defense-in-depth.
9
+ */
10
+
11
+ import * as path from "node:path";
12
+
13
+ /** Basenames that almost certainly hold secrets or PII */
14
+ const SENSITIVE_BASENAMES = /\.(?:env|pem|key|p12|pfx|crt|cer|jks|keystore|asc|gpg)(?:\..+)?$/i;
15
+ const SENSITIVE_EXACT = /^(?:\.env|\.netrc|\.npmrc|\.pypirc|credentials|secrets?|passwords?|id_(?:rsa|dsa|ecdsa|ed25519)(?:\.pub)?|authorized_keys|known_hosts)$/i;
16
+
17
+ /** Path components that indicate sensitive directories */
18
+ const SENSITIVE_DIRS = new Set([".ssh", ".aws", ".gnupg", ".kube", ".docker", ".config/gcloud"]);
19
+
20
+ /** Name tokens that suggest sensitive content */
21
+ const SENSITIVE_TOKENS = ["secret", "credential", "password", "passwd", "apikey", "accesskey", "token", "privatekey"];
22
+
23
+ /**
24
+ * Check if a file path looks like it contains sensitive data.
25
+ * Returns true if the path should be refused for worker operations.
26
+ */
27
+ export function isSensitivePath(filePath: string): boolean {
28
+ const resolved = path.resolve(filePath);
29
+ const basename = path.basename(resolved);
30
+ const lower = basename.toLowerCase();
31
+
32
+ // Check exact sensitive filenames
33
+ if (SENSITIVE_EXACT.test(basename)) return true;
34
+
35
+ // Check sensitive extensions
36
+ if (SENSITIVE_BASENAMES.test(basename)) return true;
37
+
38
+ // Check path components
39
+ const parts = resolved.split(/[/\\]/).map((p) => p.toLowerCase());
40
+ for (const dir of SENSITIVE_DIRS) {
41
+ const dirParts = dir.split("/");
42
+ for (let i = 0; i <= parts.length - dirParts.length; i++) {
43
+ const slice = parts.slice(i, i + dirParts.length);
44
+ if (slice.join("/") === dir) return true;
45
+ }
46
+ }
47
+
48
+ // Check name tokens with word-boundary awareness to reduce false positives.
49
+ // Strategy: split filename on separators to get "words", then check if
50
+ // any token matches. For substring matching in the normalized form,
51
+ // we require the token to end at a segment boundary or string end.
52
+ // This matches 'secret', 'secrets' but NOT 'secretary'.
53
+ const words = lower.split(/[_\-\s.]+/).filter(Boolean);
54
+ const normalized = lower.replace(/[_\-\s.]/g, "");
55
+ for (const token of SENSITIVE_TOKENS) {
56
+ // Check individual words — exact match or token is prefix and word is <= token+2 chars
57
+ for (const word of words) {
58
+ if (word === token) return true;
59
+ // 'secrets' starts with 'secret' and is only 1 char longer → match
60
+ // 'secretary' starts with 'secret' but is 4 chars longer → no match
61
+ if (word.startsWith(token) && word.length <= token.length + 2) return true;
62
+ }
63
+ // Check fully-normalized form for compound tokens like 'api-key' → 'apikey'
64
+ // The token must appear as a complete segment (not a partial substring).
65
+ // After the token, the remaining chars must be a complete word (extension).
66
+ const idx = normalized.indexOf(token);
67
+ if (idx !== -1) {
68
+ const after = idx + token.length;
69
+ if (after === normalized.length) return true;
70
+ // Check if remaining chars after token correspond to a known word segment
71
+ const remaining = normalized.slice(after);
72
+ if (words.some((w) => remaining === w || remaining.startsWith(w))) return true;
73
+ }
74
+ }
75
+
76
+ return false;
77
+ }
78
+
79
+ /**
80
+ * Build a worker prompt constraint block listing forbidden paths.
81
+ * This goes into the worker system prompt to prevent accidental reads.
82
+ */
83
+ export function buildSensitivePathConstraint(): string {
84
+ return [
85
+ "## Security Constraints",
86
+ "NEVER read, compress, or include content from:",
87
+ "- Files matching: .env*, *.pem, *.key, *.p12, credentials*, secrets*, passwords*, id_rsa*",
88
+ "- Directories: .ssh/, .aws/, .gnupg/, .kube/, .docker/",
89
+ "- Files with names containing: secret, credential, password, apikey, token, privatekey",
90
+ "If asked to read such a file, refuse and explain the security risk.",
91
+ ].join("\n");
92
+ }
@@ -1,25 +1,25 @@
1
- import type { ExtensionAPI } from "@mariozechner/pi-coding-agent";
2
- import { logInternalError } from "../utils/internal-error.ts";
3
-
4
- /**
5
- * Try to register a cleanup function with Pi's session resource cleanup API (v0.72+).
6
- * Falls back to returning undefined if the API is not available.
7
- *
8
- * The returned function (if defined) can be called to unregister the cleanup.
9
- */
10
- export function tryRegisterSessionCleanup(pi: ExtensionAPI, cleanup: () => void): (() => void) | undefined {
11
- const api = pi as unknown as Record<string, unknown>;
12
- const registerFn = api["registerSessionResourceCleanup"];
13
- if (typeof registerFn === "function") {
14
- try {
15
- const unregister = (registerFn as (fn: () => void) => (() => void) | void)(cleanup);
16
- if (typeof unregister === "function") return unregister;
17
- // API returned void — cleanup is registered but cannot be unregistered
18
- return undefined;
19
- } catch (error) {
20
- logInternalError("session-resources.register", error);
21
- return undefined;
22
- }
23
- }
24
- return undefined;
25
- }
1
+ import type { ExtensionAPI } from "@mariozechner/pi-coding-agent";
2
+ import { logInternalError } from "../utils/internal-error.ts";
3
+
4
+ /**
5
+ * Try to register a cleanup function with Pi's session resource cleanup API (v0.72+).
6
+ * Falls back to returning undefined if the API is not available.
7
+ *
8
+ * The returned function (if defined) can be called to unregister the cleanup.
9
+ */
10
+ export function tryRegisterSessionCleanup(pi: ExtensionAPI, cleanup: () => void): (() => void) | undefined {
11
+ const api = pi as unknown as Record<string, unknown>;
12
+ const registerFn = api["registerSessionResourceCleanup"];
13
+ if (typeof registerFn === "function") {
14
+ try {
15
+ const unregister = (registerFn as (fn: () => void) => (() => void) | void)(cleanup);
16
+ if (typeof unregister === "function") return unregister;
17
+ // API returned void — cleanup is registered but cannot be unregistered
18
+ return undefined;
19
+ } catch (error) {
20
+ logInternalError("session-resources.register", error);
21
+ return undefined;
22
+ }
23
+ }
24
+ return undefined;
25
+ }