pi-crew 0.1.44 → 0.1.45

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (142) hide show
  1. package/CHANGELOG.md +27 -0
  2. package/agents/analyst.md +11 -11
  3. package/agents/critic.md +11 -11
  4. package/agents/executor.md +11 -11
  5. package/agents/explorer.md +11 -11
  6. package/agents/planner.md +11 -11
  7. package/agents/reviewer.md +11 -11
  8. package/agents/security-reviewer.md +11 -11
  9. package/agents/test-engineer.md +11 -11
  10. package/agents/verifier.md +11 -11
  11. package/agents/writer.md +11 -11
  12. package/docs/refactor-tasks-phase3.md +394 -394
  13. package/docs/refactor-tasks-phase4.md +564 -564
  14. package/docs/refactor-tasks-phase5.md +402 -402
  15. package/docs/refactor-tasks-phase6.md +662 -662
  16. package/docs/research-extension-examples.md +297 -297
  17. package/docs/research-extension-system.md +324 -324
  18. package/docs/research-optimization-plan.md +548 -548
  19. package/docs/research-phase10-distillation.md +198 -198
  20. package/docs/research-phase11-distillation.md +201 -201
  21. package/docs/research-pi-coding-agent.md +357 -357
  22. package/docs/research-source-pi-crew-reference.md +174 -174
  23. package/docs/runtime-flow.md +148 -148
  24. package/docs/source-runtime-refactor-map.md +83 -83
  25. package/index.ts +6 -6
  26. package/package.json +1 -1
  27. package/src/agents/agent-serializer.ts +34 -34
  28. package/src/extension/cross-extension-rpc.ts +82 -82
  29. package/src/extension/register.ts +8 -1
  30. package/src/extension/registration/commands.ts +18 -2
  31. package/src/extension/registration/compaction-guard.ts +125 -125
  32. package/src/extension/registration/subagent-tools.ts +148 -148
  33. package/src/extension/registration/team-tool.ts +26 -8
  34. package/src/extension/run-bundle-schema.ts +89 -89
  35. package/src/extension/run-maintenance.ts +43 -43
  36. package/src/extension/team-tool/cancel.ts +105 -102
  37. package/src/extension/team-tool/context.ts +1 -0
  38. package/src/extension/team-tool/handle-settings.ts +188 -188
  39. package/src/extension/team-tool/inspect.ts +41 -41
  40. package/src/extension/team-tool/lifecycle-actions.ts +79 -79
  41. package/src/extension/team-tool/plan.ts +19 -19
  42. package/src/extension/team-tool/respond.ts +83 -66
  43. package/src/extension/team-tool/run.ts +1 -0
  44. package/src/i18n.ts +184 -184
  45. package/src/observability/exporters/otlp-exporter.ts +77 -77
  46. package/src/prompt/prompt-runtime.ts +72 -72
  47. package/src/runtime/agent-control.ts +63 -63
  48. package/src/runtime/agent-memory.ts +72 -72
  49. package/src/runtime/agent-observability.ts +114 -114
  50. package/src/runtime/async-marker.ts +26 -26
  51. package/src/runtime/attention-events.ts +28 -28
  52. package/src/runtime/background-runner.ts +53 -53
  53. package/src/runtime/child-pi.ts +444 -444
  54. package/src/runtime/completion-guard.ts +190 -190
  55. package/src/runtime/crew-agent-records.ts +8 -0
  56. package/src/runtime/delivery-coordinator.ts +153 -142
  57. package/src/runtime/direct-run.ts +35 -35
  58. package/src/runtime/foreground-control.ts +82 -82
  59. package/src/runtime/green-contract.ts +46 -46
  60. package/src/runtime/group-join.ts +106 -106
  61. package/src/runtime/heartbeat-gradient.ts +28 -28
  62. package/src/runtime/heartbeat-watcher.ts +124 -124
  63. package/src/runtime/live-agent-control.ts +87 -87
  64. package/src/runtime/live-agent-manager.ts +85 -85
  65. package/src/runtime/live-control-realtime.ts +36 -36
  66. package/src/runtime/live-session-runtime.ts +305 -305
  67. package/src/runtime/overflow-recovery.ts +175 -156
  68. package/src/runtime/parallel-research.ts +44 -44
  69. package/src/runtime/pi-json-output.ts +111 -111
  70. package/src/runtime/policy-engine.ts +79 -79
  71. package/src/runtime/progress-event-coalescer.ts +43 -43
  72. package/src/runtime/recovery-recipes.ts +74 -74
  73. package/src/runtime/retry-executor.ts +64 -64
  74. package/src/runtime/role-permission.ts +39 -39
  75. package/src/runtime/session-resources.ts +25 -25
  76. package/src/runtime/session-snapshot.ts +59 -59
  77. package/src/runtime/session-usage.ts +79 -79
  78. package/src/runtime/sidechain-output.ts +29 -29
  79. package/src/runtime/stale-reconciler.ts +199 -179
  80. package/src/runtime/supervisor-contact.ts +59 -59
  81. package/src/runtime/task-display.ts +38 -38
  82. package/src/runtime/task-output-context.ts +127 -127
  83. package/src/runtime/task-runner/live-executor.ts +101 -101
  84. package/src/runtime/task-runner/progress.ts +119 -119
  85. package/src/runtime/task-runner/result-utils.ts +14 -14
  86. package/src/runtime/task-runner/state-helpers.ts +22 -22
  87. package/src/runtime/team-runner.ts +13 -4
  88. package/src/runtime/worker-heartbeat.ts +21 -21
  89. package/src/runtime/worker-startup.ts +57 -57
  90. package/src/state/state-store.ts +43 -0
  91. package/src/state/task-claims.ts +44 -44
  92. package/src/state/types.ts +2 -0
  93. package/src/state/usage.ts +29 -29
  94. package/src/subagents/async-entry.ts +1 -1
  95. package/src/subagents/index.ts +3 -3
  96. package/src/subagents/live/control.ts +1 -1
  97. package/src/subagents/live/manager.ts +1 -1
  98. package/src/subagents/live/realtime.ts +1 -1
  99. package/src/subagents/live/session-runtime.ts +1 -1
  100. package/src/subagents/manager.ts +1 -1
  101. package/src/subagents/spawn.ts +1 -1
  102. package/src/teams/team-serializer.ts +38 -38
  103. package/src/types/diff.d.ts +18 -18
  104. package/src/ui/crew-footer.ts +101 -101
  105. package/src/ui/crew-select-list.ts +111 -111
  106. package/src/ui/crew-widget.ts +5 -1
  107. package/src/ui/dashboard-panes/mailbox-pane.ts +2 -1
  108. package/src/ui/dashboard-panes/metrics-pane.ts +34 -34
  109. package/src/ui/dynamic-border.ts +25 -25
  110. package/src/ui/layout-primitives.ts +106 -106
  111. package/src/ui/loaders.ts +158 -158
  112. package/src/ui/powerbar-publisher.ts +1 -1
  113. package/src/ui/render-diff.ts +119 -119
  114. package/src/ui/render-scheduler.ts +143 -143
  115. package/src/ui/run-snapshot-cache.ts +56 -37
  116. package/src/ui/snapshot-types.ts +5 -0
  117. package/src/ui/spinner.ts +17 -17
  118. package/src/ui/status-colors.ts +58 -58
  119. package/src/ui/syntax-highlight.ts +116 -116
  120. package/src/utils/atomic-write.ts +33 -33
  121. package/src/utils/completion-dedupe.ts +63 -63
  122. package/src/utils/frontmatter.ts +68 -68
  123. package/src/utils/git.ts +262 -262
  124. package/src/utils/ids.ts +12 -12
  125. package/src/utils/names.ts +27 -27
  126. package/src/utils/redaction.ts +44 -44
  127. package/src/utils/safe-paths.ts +47 -47
  128. package/src/utils/sleep.ts +32 -32
  129. package/src/workflows/validate-workflow.ts +40 -40
  130. package/src/worktree/branch-freshness.ts +45 -45
  131. package/teams/default.team.md +12 -12
  132. package/teams/fast-fix.team.md +11 -11
  133. package/teams/implementation.team.md +18 -18
  134. package/teams/parallel-research.team.md +14 -14
  135. package/teams/research.team.md +11 -11
  136. package/teams/review.team.md +12 -12
  137. package/workflows/default.workflow.md +29 -29
  138. package/workflows/fast-fix.workflow.md +22 -22
  139. package/workflows/implementation.workflow.md +38 -38
  140. package/workflows/parallel-research.workflow.md +46 -46
  141. package/workflows/research.workflow.md +22 -22
  142. package/workflows/review.workflow.md +30 -30
@@ -1,79 +1,79 @@
1
- import type { CrewLimitsConfig } from "../config/config.ts";
2
- import type { PolicyDecision, PolicyDecisionAction, PolicyDecisionReason, TeamRunManifest, TeamTaskState } from "../state/types.ts";
3
- import { evaluateGreenContract } from "./green-contract.ts";
4
- import { isWorkerHeartbeatStale } from "./worker-heartbeat.ts";
5
-
6
- export interface PolicyEngineInput {
7
- manifest: TeamRunManifest;
8
- tasks: TeamTaskState[];
9
- limits?: CrewLimitsConfig;
10
- now?: Date;
11
- }
12
-
13
- function decision(action: PolicyDecisionAction, reason: PolicyDecisionReason, message: string, taskId?: string): PolicyDecision {
14
- return {
15
- action,
16
- reason,
17
- message,
18
- taskId,
19
- createdAt: new Date().toISOString(),
20
- };
21
- }
22
-
23
- function taskDepth(task: TeamTaskState, tasksById: Map<string, TeamTaskState>): number {
24
- let depth = 0;
25
- let current = task.graph?.parentId;
26
- const seen = new Set<string>();
27
- while (current && !seen.has(current)) {
28
- seen.add(current);
29
- depth += 1;
30
- current = tasksById.get(current)?.graph?.parentId;
31
- }
32
- return depth;
33
- }
34
-
35
- export function evaluateCrewPolicy(input: PolicyEngineInput): PolicyDecision[] {
36
- const decisions: PolicyDecision[] = [];
37
- const maxTasksPerRun = Number.isFinite(input.limits?.maxTasksPerRun) ? input.limits!.maxTasksPerRun : undefined;
38
- if (maxTasksPerRun !== undefined && input.tasks.length > maxTasksPerRun) {
39
- decisions.push(decision("block", "limit_exceeded", `Run has ${input.tasks.length} tasks, exceeding maxTasksPerRun=${maxTasksPerRun}.`));
40
- }
41
- const runningCount = input.tasks.filter((task) => task.status === "running").length;
42
- const maxConcurrentWorkers = Number.isFinite(input.limits?.maxConcurrentWorkers) ? input.limits!.maxConcurrentWorkers : undefined;
43
- if (maxConcurrentWorkers !== undefined && runningCount > maxConcurrentWorkers) {
44
- decisions.push(decision("block", "limit_exceeded", `Run has ${runningCount} running workers, exceeding maxConcurrentWorkers=${maxConcurrentWorkers}.`));
45
- }
46
- const tasksById = new Map(input.tasks.map((task) => [task.id, task]));
47
-
48
- for (const task of input.tasks) {
49
- if (input.limits?.maxChildrenPerTask !== undefined && (task.graph?.children.length ?? 0) > input.limits.maxChildrenPerTask) {
50
- decisions.push(decision("block", "limit_exceeded", `Task has ${task.graph?.children.length ?? 0} children, exceeding maxChildrenPerTask=${input.limits.maxChildrenPerTask}.`, task.id));
51
- }
52
- if (input.limits?.maxTaskDepth !== undefined && taskDepth(task, tasksById) > input.limits.maxTaskDepth) {
53
- decisions.push(decision("block", "limit_exceeded", `Task graph depth exceeds maxTaskDepth=${input.limits.maxTaskDepth}.`, task.id));
54
- }
55
- if (task.status === "failed") {
56
- const retryCount = task.policy?.retryCount ?? 0;
57
- const maxRetries = input.limits?.maxRetriesPerTask ?? 0;
58
- decisions.push(decision(retryCount < maxRetries ? "retry" : "escalate", "task_failed", task.error ? `Task failed: ${task.error}` : "Task failed.", task.id));
59
- }
60
- if ((task.status === "running" || task.status === "queued") && task.heartbeat && task.heartbeat.alive !== false && isWorkerHeartbeatStale(task.heartbeat, input.limits?.heartbeatStaleMs ?? 60_000, input.now)) {
61
- decisions.push(decision("escalate", "worker_stale", "Worker heartbeat is stale.", task.id));
62
- }
63
- if (task.taskPacket?.verification) {
64
- const outcome = evaluateGreenContract(task.taskPacket.verification, task.verification);
65
- if (!outcome.satisfied && task.status === "completed") {
66
- decisions.push(decision("block", "green_unsatisfied", `Green contract unsatisfied: required=${outcome.requiredGreenLevel}, observed=${outcome.observedGreenLevel}.`, task.id));
67
- }
68
- }
69
- }
70
-
71
- if (decisions.length === 0 && input.tasks.length > 0 && input.tasks.every((task) => task.status === "completed")) {
72
- decisions.push(decision("closeout", "run_complete", "All tasks completed and no policy blockers were found."));
73
- }
74
- return decisions;
75
- }
76
-
77
- export function summarizePolicyDecisions(decisions: PolicyDecision[]): string[] {
78
- return decisions.map((item) => `- ${item.action} (${item.reason})${item.taskId ? ` ${item.taskId}` : ""}: ${item.message}`);
79
- }
1
+ import type { CrewLimitsConfig } from "../config/config.ts";
2
+ import type { PolicyDecision, PolicyDecisionAction, PolicyDecisionReason, TeamRunManifest, TeamTaskState } from "../state/types.ts";
3
+ import { evaluateGreenContract } from "./green-contract.ts";
4
+ import { isWorkerHeartbeatStale } from "./worker-heartbeat.ts";
5
+
6
+ export interface PolicyEngineInput {
7
+ manifest: TeamRunManifest;
8
+ tasks: TeamTaskState[];
9
+ limits?: CrewLimitsConfig;
10
+ now?: Date;
11
+ }
12
+
13
+ function decision(action: PolicyDecisionAction, reason: PolicyDecisionReason, message: string, taskId?: string): PolicyDecision {
14
+ return {
15
+ action,
16
+ reason,
17
+ message,
18
+ taskId,
19
+ createdAt: new Date().toISOString(),
20
+ };
21
+ }
22
+
23
+ function taskDepth(task: TeamTaskState, tasksById: Map<string, TeamTaskState>): number {
24
+ let depth = 0;
25
+ let current = task.graph?.parentId;
26
+ const seen = new Set<string>();
27
+ while (current && !seen.has(current)) {
28
+ seen.add(current);
29
+ depth += 1;
30
+ current = tasksById.get(current)?.graph?.parentId;
31
+ }
32
+ return depth;
33
+ }
34
+
35
+ export function evaluateCrewPolicy(input: PolicyEngineInput): PolicyDecision[] {
36
+ const decisions: PolicyDecision[] = [];
37
+ const maxTasksPerRun = Number.isFinite(input.limits?.maxTasksPerRun) ? input.limits!.maxTasksPerRun : undefined;
38
+ if (maxTasksPerRun !== undefined && input.tasks.length > maxTasksPerRun) {
39
+ decisions.push(decision("block", "limit_exceeded", `Run has ${input.tasks.length} tasks, exceeding maxTasksPerRun=${maxTasksPerRun}.`));
40
+ }
41
+ const runningCount = input.tasks.filter((task) => task.status === "running").length;
42
+ const maxConcurrentWorkers = Number.isFinite(input.limits?.maxConcurrentWorkers) ? input.limits!.maxConcurrentWorkers : undefined;
43
+ if (maxConcurrentWorkers !== undefined && runningCount > maxConcurrentWorkers) {
44
+ decisions.push(decision("block", "limit_exceeded", `Run has ${runningCount} running workers, exceeding maxConcurrentWorkers=${maxConcurrentWorkers}.`));
45
+ }
46
+ const tasksById = new Map(input.tasks.map((task) => [task.id, task]));
47
+
48
+ for (const task of input.tasks) {
49
+ if (input.limits?.maxChildrenPerTask !== undefined && (task.graph?.children.length ?? 0) > input.limits.maxChildrenPerTask) {
50
+ decisions.push(decision("block", "limit_exceeded", `Task has ${task.graph?.children.length ?? 0} children, exceeding maxChildrenPerTask=${input.limits.maxChildrenPerTask}.`, task.id));
51
+ }
52
+ if (input.limits?.maxTaskDepth !== undefined && taskDepth(task, tasksById) > input.limits.maxTaskDepth) {
53
+ decisions.push(decision("block", "limit_exceeded", `Task graph depth exceeds maxTaskDepth=${input.limits.maxTaskDepth}.`, task.id));
54
+ }
55
+ if (task.status === "failed") {
56
+ const retryCount = task.policy?.retryCount ?? 0;
57
+ const maxRetries = input.limits?.maxRetriesPerTask ?? 0;
58
+ decisions.push(decision(retryCount < maxRetries ? "retry" : "escalate", "task_failed", task.error ? `Task failed: ${task.error}` : "Task failed.", task.id));
59
+ }
60
+ if ((task.status === "running" || task.status === "queued") && task.heartbeat && task.heartbeat.alive !== false && isWorkerHeartbeatStale(task.heartbeat, input.limits?.heartbeatStaleMs ?? 60_000, input.now)) {
61
+ decisions.push(decision("escalate", "worker_stale", "Worker heartbeat is stale.", task.id));
62
+ }
63
+ if (task.taskPacket?.verification) {
64
+ const outcome = evaluateGreenContract(task.taskPacket.verification, task.verification);
65
+ if (!outcome.satisfied && task.status === "completed") {
66
+ decisions.push(decision("block", "green_unsatisfied", `Green contract unsatisfied: required=${outcome.requiredGreenLevel}, observed=${outcome.observedGreenLevel}.`, task.id));
67
+ }
68
+ }
69
+ }
70
+
71
+ if (decisions.length === 0 && input.tasks.length > 0 && input.tasks.every((task) => task.status === "completed")) {
72
+ decisions.push(decision("closeout", "run_complete", "All tasks completed and no policy blockers were found."));
73
+ }
74
+ return decisions;
75
+ }
76
+
77
+ export function summarizePolicyDecisions(decisions: PolicyDecision[]): string[] {
78
+ return decisions.map((item) => `- ${item.action} (${item.reason})${item.taskId ? ` ${item.taskId}` : ""}: ${item.message}`);
79
+ }
@@ -1,43 +1,43 @@
1
- export interface ProgressEventSummary {
2
- eventType: string;
3
- currentTool?: string;
4
- toolCount?: number;
5
- tokens?: number;
6
- turns?: number;
7
- activityState?: string;
8
- lastActivityAt?: string;
9
- }
10
-
11
- export interface ProgressEventCoalesceDecision {
12
- shouldAppend: boolean;
13
- reason: string;
14
- }
15
-
16
- export interface ProgressEventCoalesceInput {
17
- previous?: ProgressEventSummary;
18
- next: ProgressEventSummary;
19
- nowMs: number;
20
- lastAppendMs?: number;
21
- minIntervalMs: number;
22
- force?: boolean;
23
- tokenThreshold?: number;
24
- }
25
-
26
- const DEFAULT_TOKEN_THRESHOLD = 256;
27
-
28
- function numericIncrease(previous: number | undefined, next: number | undefined): number {
29
- return next !== undefined && previous !== undefined ? next - previous : next !== undefined ? next : 0;
30
- }
31
-
32
- export function shouldAppendProgressEventUpdate(input: ProgressEventCoalesceInput): ProgressEventCoalesceDecision {
33
- if (input.force) return { shouldAppend: true, reason: "force" };
34
- if (!input.previous) return { shouldAppend: true, reason: "first" };
35
- if (input.previous.activityState !== input.next.activityState) return { shouldAppend: true, reason: "activity_changed" };
36
- if (input.previous.currentTool !== input.next.currentTool) return { shouldAppend: true, reason: "tool_changed" };
37
- if (numericIncrease(input.previous.toolCount, input.next.toolCount) > 0) return { shouldAppend: true, reason: "tool_count_increased" };
38
- if (numericIncrease(input.previous.turns, input.next.turns) > 0) return { shouldAppend: true, reason: "turns_increased" };
39
- const tokenIncrease = numericIncrease(input.previous.tokens, input.next.tokens);
40
- if (tokenIncrease >= (input.tokenThreshold ?? DEFAULT_TOKEN_THRESHOLD)) return { shouldAppend: true, reason: "tokens_increased" };
41
- if (input.lastAppendMs === undefined || input.nowMs - input.lastAppendMs >= input.minIntervalMs) return { shouldAppend: true, reason: "interval" };
42
- return { shouldAppend: false, reason: "coalesced" };
43
- }
1
+ export interface ProgressEventSummary {
2
+ eventType: string;
3
+ currentTool?: string;
4
+ toolCount?: number;
5
+ tokens?: number;
6
+ turns?: number;
7
+ activityState?: string;
8
+ lastActivityAt?: string;
9
+ }
10
+
11
+ export interface ProgressEventCoalesceDecision {
12
+ shouldAppend: boolean;
13
+ reason: string;
14
+ }
15
+
16
+ export interface ProgressEventCoalesceInput {
17
+ previous?: ProgressEventSummary;
18
+ next: ProgressEventSummary;
19
+ nowMs: number;
20
+ lastAppendMs?: number;
21
+ minIntervalMs: number;
22
+ force?: boolean;
23
+ tokenThreshold?: number;
24
+ }
25
+
26
+ const DEFAULT_TOKEN_THRESHOLD = 256;
27
+
28
+ function numericIncrease(previous: number | undefined, next: number | undefined): number {
29
+ return next !== undefined && previous !== undefined ? next - previous : next !== undefined ? next : 0;
30
+ }
31
+
32
+ export function shouldAppendProgressEventUpdate(input: ProgressEventCoalesceInput): ProgressEventCoalesceDecision {
33
+ if (input.force) return { shouldAppend: true, reason: "force" };
34
+ if (!input.previous) return { shouldAppend: true, reason: "first" };
35
+ if (input.previous.activityState !== input.next.activityState) return { shouldAppend: true, reason: "activity_changed" };
36
+ if (input.previous.currentTool !== input.next.currentTool) return { shouldAppend: true, reason: "tool_changed" };
37
+ if (numericIncrease(input.previous.toolCount, input.next.toolCount) > 0) return { shouldAppend: true, reason: "tool_count_increased" };
38
+ if (numericIncrease(input.previous.turns, input.next.turns) > 0) return { shouldAppend: true, reason: "turns_increased" };
39
+ const tokenIncrease = numericIncrease(input.previous.tokens, input.next.tokens);
40
+ if (tokenIncrease >= (input.tokenThreshold ?? DEFAULT_TOKEN_THRESHOLD)) return { shouldAppend: true, reason: "tokens_increased" };
41
+ if (input.lastAppendMs === undefined || input.nowMs - input.lastAppendMs >= input.minIntervalMs) return { shouldAppend: true, reason: "interval" };
42
+ return { shouldAppend: false, reason: "coalesced" };
43
+ }
@@ -1,74 +1,74 @@
1
- import type { PolicyDecision, PolicyDecisionReason } from "../state/types.ts";
2
-
3
- export type FailureScenario = "trust_prompt_unresolved" | "prompt_misdelivery" | "stale_branch" | "compile_red_cross_crate" | "mcp_handshake_failure" | "partial_plugin_startup" | "provider_failure" | "task_failed" | "worker_stale" | "green_unsatisfied";
4
- export type RecoveryStep = "accept_trust_prompt" | "redirect_prompt_to_agent" | "rebase_branch" | "clean_build" | "retry_mcp_handshake" | "restart_plugin" | "restart_worker" | "rerun_task" | "collect_verification_evidence" | "escalate_to_human";
5
- export type RecoveryResultState = "planned" | "skipped" | "escalation_required";
6
-
7
- export interface RecoveryRecipe {
8
- scenario: FailureScenario;
9
- steps: RecoveryStep[];
10
- maxAttempts: number;
11
- escalationPolicy: "alert_human" | "log_and_continue" | "abort";
12
- }
13
-
14
- export interface RecoveryLedgerEntry {
15
- scenario: FailureScenario;
16
- taskId?: string;
17
- decisionReason: PolicyDecisionReason;
18
- attempt: number;
19
- state: RecoveryResultState;
20
- steps: RecoveryStep[];
21
- message: string;
22
- createdAt: string;
23
- }
24
-
25
- export interface RecoveryLedger {
26
- entries: RecoveryLedgerEntry[];
27
- }
28
-
29
- export function scenarioForPolicyReason(reason: PolicyDecisionReason): FailureScenario {
30
- switch (reason) {
31
- case "branch_stale": return "stale_branch";
32
- case "worker_stale": return "worker_stale";
33
- case "green_unsatisfied": return "green_unsatisfied";
34
- case "task_failed": return "task_failed";
35
- default: return "provider_failure";
36
- }
37
- }
38
-
39
- export function recipeFor(scenario: FailureScenario): RecoveryRecipe {
40
- switch (scenario) {
41
- case "trust_prompt_unresolved": return { scenario, steps: ["accept_trust_prompt"], maxAttempts: 1, escalationPolicy: "alert_human" };
42
- case "prompt_misdelivery": return { scenario, steps: ["redirect_prompt_to_agent"], maxAttempts: 1, escalationPolicy: "alert_human" };
43
- case "stale_branch": return { scenario, steps: ["rebase_branch", "clean_build"], maxAttempts: 1, escalationPolicy: "alert_human" };
44
- case "compile_red_cross_crate": return { scenario, steps: ["clean_build"], maxAttempts: 1, escalationPolicy: "alert_human" };
45
- case "mcp_handshake_failure": return { scenario, steps: ["retry_mcp_handshake"], maxAttempts: 1, escalationPolicy: "abort" };
46
- case "partial_plugin_startup": return { scenario, steps: ["restart_plugin", "retry_mcp_handshake"], maxAttempts: 1, escalationPolicy: "log_and_continue" };
47
- case "worker_stale": return { scenario, steps: ["restart_worker"], maxAttempts: 1, escalationPolicy: "alert_human" };
48
- case "green_unsatisfied": return { scenario, steps: ["collect_verification_evidence"], maxAttempts: 1, escalationPolicy: "alert_human" };
49
- case "task_failed": return { scenario, steps: ["rerun_task"], maxAttempts: 1, escalationPolicy: "alert_human" };
50
- case "provider_failure": return { scenario, steps: ["restart_worker"], maxAttempts: 1, escalationPolicy: "alert_human" };
51
- }
52
- }
53
-
54
- export function buildRecoveryLedger(decisions: PolicyDecision[], previous: RecoveryLedger = { entries: [] }): RecoveryLedger {
55
- const entries = [...previous.entries];
56
- for (const item of decisions) {
57
- if (!["retry", "escalate", "block"].includes(item.action)) continue;
58
- const scenario = scenarioForPolicyReason(item.reason);
59
- const recipe = recipeFor(scenario);
60
- const priorAttempts = entries.filter((entry) => entry.scenario === scenario && entry.taskId === item.taskId).length;
61
- const attempt = priorAttempts + 1;
62
- entries.push({
63
- scenario,
64
- taskId: item.taskId,
65
- decisionReason: item.reason,
66
- attempt,
67
- state: attempt <= recipe.maxAttempts && item.action !== "block" ? "planned" : "escalation_required",
68
- steps: attempt <= recipe.maxAttempts ? recipe.steps : ["escalate_to_human"],
69
- message: item.message,
70
- createdAt: new Date().toISOString(),
71
- });
72
- }
73
- return { entries };
74
- }
1
+ import type { PolicyDecision, PolicyDecisionReason } from "../state/types.ts";
2
+
3
+ export type FailureScenario = "trust_prompt_unresolved" | "prompt_misdelivery" | "stale_branch" | "compile_red_cross_crate" | "mcp_handshake_failure" | "partial_plugin_startup" | "provider_failure" | "task_failed" | "worker_stale" | "green_unsatisfied";
4
+ export type RecoveryStep = "accept_trust_prompt" | "redirect_prompt_to_agent" | "rebase_branch" | "clean_build" | "retry_mcp_handshake" | "restart_plugin" | "restart_worker" | "rerun_task" | "collect_verification_evidence" | "escalate_to_human";
5
+ export type RecoveryResultState = "planned" | "skipped" | "escalation_required";
6
+
7
+ export interface RecoveryRecipe {
8
+ scenario: FailureScenario;
9
+ steps: RecoveryStep[];
10
+ maxAttempts: number;
11
+ escalationPolicy: "alert_human" | "log_and_continue" | "abort";
12
+ }
13
+
14
+ export interface RecoveryLedgerEntry {
15
+ scenario: FailureScenario;
16
+ taskId?: string;
17
+ decisionReason: PolicyDecisionReason;
18
+ attempt: number;
19
+ state: RecoveryResultState;
20
+ steps: RecoveryStep[];
21
+ message: string;
22
+ createdAt: string;
23
+ }
24
+
25
+ export interface RecoveryLedger {
26
+ entries: RecoveryLedgerEntry[];
27
+ }
28
+
29
+ export function scenarioForPolicyReason(reason: PolicyDecisionReason): FailureScenario {
30
+ switch (reason) {
31
+ case "branch_stale": return "stale_branch";
32
+ case "worker_stale": return "worker_stale";
33
+ case "green_unsatisfied": return "green_unsatisfied";
34
+ case "task_failed": return "task_failed";
35
+ default: return "provider_failure";
36
+ }
37
+ }
38
+
39
+ export function recipeFor(scenario: FailureScenario): RecoveryRecipe {
40
+ switch (scenario) {
41
+ case "trust_prompt_unresolved": return { scenario, steps: ["accept_trust_prompt"], maxAttempts: 1, escalationPolicy: "alert_human" };
42
+ case "prompt_misdelivery": return { scenario, steps: ["redirect_prompt_to_agent"], maxAttempts: 1, escalationPolicy: "alert_human" };
43
+ case "stale_branch": return { scenario, steps: ["rebase_branch", "clean_build"], maxAttempts: 1, escalationPolicy: "alert_human" };
44
+ case "compile_red_cross_crate": return { scenario, steps: ["clean_build"], maxAttempts: 1, escalationPolicy: "alert_human" };
45
+ case "mcp_handshake_failure": return { scenario, steps: ["retry_mcp_handshake"], maxAttempts: 1, escalationPolicy: "abort" };
46
+ case "partial_plugin_startup": return { scenario, steps: ["restart_plugin", "retry_mcp_handshake"], maxAttempts: 1, escalationPolicy: "log_and_continue" };
47
+ case "worker_stale": return { scenario, steps: ["restart_worker"], maxAttempts: 1, escalationPolicy: "alert_human" };
48
+ case "green_unsatisfied": return { scenario, steps: ["collect_verification_evidence"], maxAttempts: 1, escalationPolicy: "alert_human" };
49
+ case "task_failed": return { scenario, steps: ["rerun_task"], maxAttempts: 1, escalationPolicy: "alert_human" };
50
+ case "provider_failure": return { scenario, steps: ["restart_worker"], maxAttempts: 1, escalationPolicy: "alert_human" };
51
+ }
52
+ }
53
+
54
+ export function buildRecoveryLedger(decisions: PolicyDecision[], previous: RecoveryLedger = { entries: [] }): RecoveryLedger {
55
+ const entries = [...previous.entries];
56
+ for (const item of decisions) {
57
+ if (!["retry", "escalate", "block"].includes(item.action)) continue;
58
+ const scenario = scenarioForPolicyReason(item.reason);
59
+ const recipe = recipeFor(scenario);
60
+ const priorAttempts = entries.filter((entry) => entry.scenario === scenario && entry.taskId === item.taskId).length;
61
+ const attempt = priorAttempts + 1;
62
+ entries.push({
63
+ scenario,
64
+ taskId: item.taskId,
65
+ decisionReason: item.reason,
66
+ attempt,
67
+ state: attempt <= recipe.maxAttempts && item.action !== "block" ? "planned" : "escalation_required",
68
+ steps: attempt <= recipe.maxAttempts ? recipe.steps : ["escalate_to_human"],
69
+ message: item.message,
70
+ createdAt: new Date().toISOString(),
71
+ });
72
+ }
73
+ return { entries };
74
+ }
@@ -1,64 +1,64 @@
1
- import { sleep } from "../utils/sleep.ts";
2
-
3
- export interface RetryPolicy {
4
- maxAttempts: number;
5
- backoffMs: number;
6
- jitterRatio: number;
7
- exponentialFactor: number;
8
- retryableErrors?: string[];
9
- }
10
-
11
- export interface RetryHooks {
12
- onAttemptFailed?: (attempt: number, error: Error, nextDelayMs: number) => void;
13
- onRetryGivenUp?: (attempts: number, error: Error) => void;
14
- signal?: AbortSignal;
15
- }
16
-
17
- export const DEFAULT_RETRY_POLICY: RetryPolicy = { maxAttempts: 3, backoffMs: 1000, jitterRatio: 0.3, exponentialFactor: 2 };
18
-
19
- function asError(error: unknown): Error {
20
- return error instanceof Error ? error : new Error(String(error));
21
- }
22
-
23
- function globToRegex(pattern: string): RegExp {
24
- const escaped = pattern.replace(/[.+^${}()|[\]\\]/g, "\\$&").replace(/\*/g, ".*");
25
- return new RegExp(`^${escaped}$`, "i");
26
- }
27
-
28
- function isRetryable(error: Error, policy: RetryPolicy): boolean {
29
- const patterns = policy.retryableErrors ?? [];
30
- if (!patterns.length) return true;
31
- return patterns.some((pattern) => globToRegex(pattern).test(error.message));
32
- }
33
-
34
- export function calculateRetryDelay(attempt: number, policy: RetryPolicy = DEFAULT_RETRY_POLICY, random = Math.random): number {
35
- const base = policy.backoffMs * Math.pow(policy.exponentialFactor, Math.max(0, attempt - 1));
36
- const jitter = (random() * 2 - 1) * policy.jitterRatio * base;
37
- return Math.max(0, base + jitter);
38
- }
39
-
40
- export async function executeWithRetry<T>(fn: (attempt: number) => Promise<T>, policy: RetryPolicy = DEFAULT_RETRY_POLICY, hooks: RetryHooks = {}): Promise<T> {
41
- const normalized: RetryPolicy = { ...DEFAULT_RETRY_POLICY, ...policy, maxAttempts: Math.max(1, policy.maxAttempts ?? DEFAULT_RETRY_POLICY.maxAttempts) };
42
- let lastError: Error | undefined;
43
- for (let attempt = 1; attempt <= normalized.maxAttempts; attempt += 1) {
44
- if (hooks.signal?.aborted) throw new Error("Retry aborted.");
45
- try {
46
- return await fn(attempt);
47
- } catch (error) {
48
- lastError = asError(error);
49
- // Never retry if aborted — sleep() would immediately reject on every attempt.
50
- if (hooks.signal?.aborted) {
51
- hooks.onRetryGivenUp?.(attempt, lastError);
52
- throw lastError;
53
- }
54
- if (attempt >= normalized.maxAttempts || !isRetryable(lastError, normalized)) {
55
- hooks.onRetryGivenUp?.(attempt, lastError);
56
- throw lastError;
57
- }
58
- const delay = calculateRetryDelay(attempt, normalized);
59
- hooks.onAttemptFailed?.(attempt, lastError, delay);
60
- await sleep(delay, hooks.signal);
61
- }
62
- }
63
- throw lastError ?? new Error("Retry failed without error.");
64
- }
1
+ import { sleep } from "../utils/sleep.ts";
2
+
3
+ export interface RetryPolicy {
4
+ maxAttempts: number;
5
+ backoffMs: number;
6
+ jitterRatio: number;
7
+ exponentialFactor: number;
8
+ retryableErrors?: string[];
9
+ }
10
+
11
+ export interface RetryHooks {
12
+ onAttemptFailed?: (attempt: number, error: Error, nextDelayMs: number) => void;
13
+ onRetryGivenUp?: (attempts: number, error: Error) => void;
14
+ signal?: AbortSignal;
15
+ }
16
+
17
+ export const DEFAULT_RETRY_POLICY: RetryPolicy = { maxAttempts: 3, backoffMs: 1000, jitterRatio: 0.3, exponentialFactor: 2 };
18
+
19
+ function asError(error: unknown): Error {
20
+ return error instanceof Error ? error : new Error(String(error));
21
+ }
22
+
23
+ function globToRegex(pattern: string): RegExp {
24
+ const escaped = pattern.replace(/[.+^${}()|[\]\\]/g, "\\$&").replace(/\*/g, ".*");
25
+ return new RegExp(`^${escaped}$`, "i");
26
+ }
27
+
28
+ function isRetryable(error: Error, policy: RetryPolicy): boolean {
29
+ const patterns = policy.retryableErrors ?? [];
30
+ if (!patterns.length) return true;
31
+ return patterns.some((pattern) => globToRegex(pattern).test(error.message));
32
+ }
33
+
34
+ export function calculateRetryDelay(attempt: number, policy: RetryPolicy = DEFAULT_RETRY_POLICY, random = Math.random): number {
35
+ const base = policy.backoffMs * Math.pow(policy.exponentialFactor, Math.max(0, attempt - 1));
36
+ const jitter = (random() * 2 - 1) * policy.jitterRatio * base;
37
+ return Math.max(0, base + jitter);
38
+ }
39
+
40
+ export async function executeWithRetry<T>(fn: (attempt: number) => Promise<T>, policy: RetryPolicy = DEFAULT_RETRY_POLICY, hooks: RetryHooks = {}): Promise<T> {
41
+ const normalized: RetryPolicy = { ...DEFAULT_RETRY_POLICY, ...policy, maxAttempts: Math.max(1, policy.maxAttempts ?? DEFAULT_RETRY_POLICY.maxAttempts) };
42
+ let lastError: Error | undefined;
43
+ for (let attempt = 1; attempt <= normalized.maxAttempts; attempt += 1) {
44
+ if (hooks.signal?.aborted) throw new Error("Retry aborted.");
45
+ try {
46
+ return await fn(attempt);
47
+ } catch (error) {
48
+ lastError = asError(error);
49
+ // Never retry if aborted — sleep() would immediately reject on every attempt.
50
+ if (hooks.signal?.aborted) {
51
+ hooks.onRetryGivenUp?.(attempt, lastError);
52
+ throw lastError;
53
+ }
54
+ if (attempt >= normalized.maxAttempts || !isRetryable(lastError, normalized)) {
55
+ hooks.onRetryGivenUp?.(attempt, lastError);
56
+ throw lastError;
57
+ }
58
+ const delay = calculateRetryDelay(attempt, normalized);
59
+ hooks.onAttemptFailed?.(attempt, lastError, delay);
60
+ await sleep(delay, hooks.signal);
61
+ }
62
+ }
63
+ throw lastError ?? new Error("Retry failed without error.");
64
+ }
@@ -1,39 +1,39 @@
1
- export type RolePermissionMode = "read_only" | "workspace_write" | "danger_full_access" | "explicit_confirm";
2
-
3
- const READ_ONLY_ROLES = new Set(["explorer", "reviewer", "security-reviewer", "verifier", "analyst", "critic", "planner", "writer"]);
4
- const WRITE_ROLES = new Set(["executor", "test-engineer"]);
5
- const READ_ONLY_COMMANDS = new Set(["cat", "head", "tail", "less", "more", "wc", "ls", "find", "grep", "rg", "awk", "sed", "echo", "printf", "which", "where", "whoami", "pwd", "env", "printenv", "date", "df", "du", "uname", "file", "stat", "diff", "sort", "uniq", "tr", "cut", "paste", "test", "true", "false", "type", "readlink", "realpath", "basename", "dirname", "sha256sum", "md5sum", "xxd", "hexdump", "od", "strings", "tree", "jq", "git", "gh"]);
6
-
7
- export interface PermissionCheckResult {
8
- allowed: boolean;
9
- mode: RolePermissionMode;
10
- reason?: string;
11
- }
12
-
13
- export function permissionForRole(role: string): RolePermissionMode {
14
- if (READ_ONLY_ROLES.has(role)) return "read_only";
15
- if (WRITE_ROLES.has(role)) return "workspace_write";
16
- return "workspace_write";
17
- }
18
-
19
- export function isReadOnlyCommand(command: string): boolean {
20
- const first = command.trim().split(/\s+/)[0]?.split(/[\\/]/).pop() ?? "";
21
- return READ_ONLY_COMMANDS.has(first) && !/\s(-i|--in-place)\b|\s>{1,2}\s|\brm\b|\bmv\b|\bcp\b|\b(?:npm|pnpm|yarn|bun)\s+(install|add|ci|remove)\b|\bgit\s+(commit|push|merge|rebase|reset|checkout|clean)\b/.test(command);
22
- }
23
-
24
- export function checkRolePermission(role: string, command: string): PermissionCheckResult {
25
- const mode = permissionForRole(role);
26
- if (mode === "read_only" && !isReadOnlyCommand(command)) return { allowed: false, mode, reason: `Role '${role}' is read-only and command may modify state.` };
27
- return { allowed: true, mode };
28
- }
29
-
30
- export function currentCrewRole(env: NodeJS.ProcessEnv = process.env): string | undefined {
31
- return env.PI_CREW_ROLE?.trim() || env.PI_TEAMS_ROLE?.trim() || undefined;
32
- }
33
-
34
- export function checkSubagentSpawnPermission(role: string | undefined): PermissionCheckResult {
35
- if (!role) return { allowed: true, mode: "workspace_write" };
36
- const mode = permissionForRole(role);
37
- if (mode === "read_only") return { allowed: false, mode, reason: `Role '${role}' is read-only and cannot spawn additional subagents.` };
38
- return { allowed: true, mode };
39
- }
1
+ export type RolePermissionMode = "read_only" | "workspace_write" | "danger_full_access" | "explicit_confirm";
2
+
3
+ const READ_ONLY_ROLES = new Set(["explorer", "reviewer", "security-reviewer", "verifier", "analyst", "critic", "planner", "writer"]);
4
+ const WRITE_ROLES = new Set(["executor", "test-engineer"]);
5
+ const READ_ONLY_COMMANDS = new Set(["cat", "head", "tail", "less", "more", "wc", "ls", "find", "grep", "rg", "awk", "sed", "echo", "printf", "which", "where", "whoami", "pwd", "env", "printenv", "date", "df", "du", "uname", "file", "stat", "diff", "sort", "uniq", "tr", "cut", "paste", "test", "true", "false", "type", "readlink", "realpath", "basename", "dirname", "sha256sum", "md5sum", "xxd", "hexdump", "od", "strings", "tree", "jq", "git", "gh"]);
6
+
7
+ export interface PermissionCheckResult {
8
+ allowed: boolean;
9
+ mode: RolePermissionMode;
10
+ reason?: string;
11
+ }
12
+
13
+ export function permissionForRole(role: string): RolePermissionMode {
14
+ if (READ_ONLY_ROLES.has(role)) return "read_only";
15
+ if (WRITE_ROLES.has(role)) return "workspace_write";
16
+ return "workspace_write";
17
+ }
18
+
19
+ export function isReadOnlyCommand(command: string): boolean {
20
+ const first = command.trim().split(/\s+/)[0]?.split(/[\\/]/).pop() ?? "";
21
+ return READ_ONLY_COMMANDS.has(first) && !/\s(-i|--in-place)\b|\s>{1,2}\s|\brm\b|\bmv\b|\bcp\b|\b(?:npm|pnpm|yarn|bun)\s+(install|add|ci|remove)\b|\bgit\s+(commit|push|merge|rebase|reset|checkout|clean)\b/.test(command);
22
+ }
23
+
24
+ export function checkRolePermission(role: string, command: string): PermissionCheckResult {
25
+ const mode = permissionForRole(role);
26
+ if (mode === "read_only" && !isReadOnlyCommand(command)) return { allowed: false, mode, reason: `Role '${role}' is read-only and command may modify state.` };
27
+ return { allowed: true, mode };
28
+ }
29
+
30
+ export function currentCrewRole(env: NodeJS.ProcessEnv = process.env): string | undefined {
31
+ return env.PI_CREW_ROLE?.trim() || env.PI_TEAMS_ROLE?.trim() || undefined;
32
+ }
33
+
34
+ export function checkSubagentSpawnPermission(role: string | undefined): PermissionCheckResult {
35
+ if (!role) return { allowed: true, mode: "workspace_write" };
36
+ const mode = permissionForRole(role);
37
+ if (mode === "read_only") return { allowed: false, mode, reason: `Role '${role}' is read-only and cannot spawn additional subagents.` };
38
+ return { allowed: true, mode };
39
+ }