pi-crew 0.1.37 → 0.1.39

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (162) hide show
  1. package/AGENTS.md +1 -1
  2. package/CHANGELOG.md +27 -0
  3. package/README.md +5 -0
  4. package/agents/analyst.md +11 -11
  5. package/agents/critic.md +11 -11
  6. package/agents/executor.md +11 -11
  7. package/agents/explorer.md +11 -11
  8. package/agents/planner.md +11 -11
  9. package/agents/reviewer.md +11 -11
  10. package/agents/security-reviewer.md +11 -11
  11. package/agents/test-engineer.md +11 -11
  12. package/agents/verifier.md +11 -11
  13. package/agents/writer.md +11 -11
  14. package/docs/refactor-tasks-phase3.md +394 -394
  15. package/docs/refactor-tasks-phase4.md +564 -564
  16. package/docs/refactor-tasks-phase5.md +402 -402
  17. package/docs/refactor-tasks-phase6.md +662 -662
  18. package/docs/research-extension-examples.md +297 -297
  19. package/docs/research-extension-system.md +324 -324
  20. package/docs/research-optimization-plan.md +548 -548
  21. package/docs/research-pi-coding-agent.md +357 -357
  22. package/docs/research-source-pi-crew-reference.md +174 -174
  23. package/docs/resource-formats.md +10 -8
  24. package/docs/runtime-flow.md +148 -148
  25. package/docs/source-runtime-refactor-map.md +83 -83
  26. package/docs/usage.md +6 -0
  27. package/index.ts +6 -6
  28. package/package.json +3 -3
  29. package/schema.json +2 -2
  30. package/src/agents/agent-serializer.ts +34 -34
  31. package/src/config/config.ts +8 -4
  32. package/src/extension/cross-extension-rpc.ts +82 -82
  33. package/src/extension/import-index.ts +18 -2
  34. package/src/extension/register.ts +11 -1
  35. package/src/extension/registration/compaction-guard.ts +125 -125
  36. package/src/extension/registration/subagent-helpers.ts +30 -6
  37. package/src/extension/registration/subagent-tools.ts +8 -3
  38. package/src/extension/result-watcher.ts +98 -98
  39. package/src/extension/run-import.ts +12 -2
  40. package/src/extension/run-index.ts +12 -2
  41. package/src/extension/run-maintenance.ts +24 -24
  42. package/src/extension/team-tool/api.ts +54 -14
  43. package/src/extension/team-tool/cancel.ts +31 -31
  44. package/src/extension/team-tool/doctor.ts +179 -179
  45. package/src/extension/team-tool/inspect.ts +41 -41
  46. package/src/extension/team-tool/lifecycle-actions.ts +79 -79
  47. package/src/extension/team-tool/plan.ts +19 -19
  48. package/src/extension/team-tool/status.ts +73 -73
  49. package/src/observability/correlation.ts +35 -35
  50. package/src/observability/event-to-metric.ts +54 -54
  51. package/src/observability/exporters/adapter.ts +24 -24
  52. package/src/observability/exporters/otlp-exporter.ts +65 -65
  53. package/src/observability/exporters/prometheus-exporter.ts +47 -47
  54. package/src/observability/metric-registry.ts +72 -72
  55. package/src/observability/metric-retention.ts +46 -46
  56. package/src/observability/metric-sink.ts +51 -51
  57. package/src/observability/metrics-primitives.ts +166 -166
  58. package/src/prompt/prompt-runtime.ts +68 -68
  59. package/src/runtime/agent-control.ts +64 -64
  60. package/src/runtime/agent-memory.ts +72 -72
  61. package/src/runtime/agent-observability.ts +114 -113
  62. package/src/runtime/async-marker.ts +26 -26
  63. package/src/runtime/background-runner.ts +53 -53
  64. package/src/runtime/crash-recovery.ts +56 -56
  65. package/src/runtime/crew-agent-records.ts +54 -9
  66. package/src/runtime/crew-agent-runtime.ts +58 -58
  67. package/src/runtime/deadletter.ts +36 -36
  68. package/src/runtime/direct-run.ts +35 -35
  69. package/src/runtime/foreground-control.ts +82 -82
  70. package/src/runtime/green-contract.ts +46 -46
  71. package/src/runtime/group-join.ts +88 -88
  72. package/src/runtime/heartbeat-gradient.ts +28 -28
  73. package/src/runtime/heartbeat-watcher.ts +80 -80
  74. package/src/runtime/live-agent-control.ts +87 -78
  75. package/src/runtime/live-agent-manager.ts +85 -85
  76. package/src/runtime/live-control-realtime.ts +36 -36
  77. package/src/runtime/live-session-runtime.ts +299 -299
  78. package/src/runtime/manifest-cache.ts +248 -212
  79. package/src/runtime/model-fallback.ts +261 -261
  80. package/src/runtime/parallel-research.ts +44 -44
  81. package/src/runtime/parallel-utils.ts +99 -99
  82. package/src/runtime/pi-json-output.ts +111 -111
  83. package/src/runtime/policy-engine.ts +78 -78
  84. package/src/runtime/post-exit-stdio-guard.ts +86 -86
  85. package/src/runtime/process-status.ts +56 -56
  86. package/src/runtime/progress-event-coalescer.ts +43 -43
  87. package/src/runtime/recovery-recipes.ts +74 -74
  88. package/src/runtime/retry-executor.ts +59 -59
  89. package/src/runtime/role-permission.ts +39 -39
  90. package/src/runtime/session-usage.ts +79 -79
  91. package/src/runtime/sidechain-output.ts +28 -28
  92. package/src/runtime/subagent-manager.ts +80 -12
  93. package/src/runtime/task-display.ts +38 -38
  94. package/src/runtime/task-output-context.ts +127 -106
  95. package/src/runtime/task-runner/live-executor.ts +98 -98
  96. package/src/runtime/task-runner/progress.ts +111 -111
  97. package/src/runtime/task-runner/result-utils.ts +14 -14
  98. package/src/runtime/task-runner/state-helpers.ts +22 -22
  99. package/src/runtime/team-runner.ts +1 -1
  100. package/src/runtime/worker-heartbeat.ts +21 -21
  101. package/src/runtime/worker-startup.ts +57 -57
  102. package/src/schema/config-schema.ts +21 -21
  103. package/src/schema/team-tool-schema.ts +100 -100
  104. package/src/state/artifact-store.ts +122 -108
  105. package/src/state/contracts.ts +105 -105
  106. package/src/state/jsonl-writer.ts +77 -77
  107. package/src/state/mailbox.ts +67 -22
  108. package/src/state/state-store.ts +36 -5
  109. package/src/state/task-claims.ts +42 -42
  110. package/src/state/usage.ts +29 -29
  111. package/src/subagents/async-entry.ts +1 -1
  112. package/src/subagents/index.ts +3 -3
  113. package/src/subagents/live/control.ts +1 -1
  114. package/src/subagents/live/manager.ts +1 -1
  115. package/src/subagents/live/realtime.ts +1 -1
  116. package/src/subagents/live/session-runtime.ts +1 -1
  117. package/src/subagents/manager.ts +1 -1
  118. package/src/subagents/spawn.ts +1 -1
  119. package/src/teams/discover-teams.ts +27 -5
  120. package/src/teams/team-serializer.ts +38 -36
  121. package/src/types/diff.d.ts +18 -18
  122. package/src/ui/crew-footer.ts +101 -101
  123. package/src/ui/crew-select-list.ts +111 -111
  124. package/src/ui/dashboard-panes/metrics-pane.ts +34 -34
  125. package/src/ui/dynamic-border.ts +25 -25
  126. package/src/ui/layout-primitives.ts +106 -106
  127. package/src/ui/loaders.ts +158 -158
  128. package/src/ui/mascot.ts +441 -441
  129. package/src/ui/render-diff.ts +119 -119
  130. package/src/ui/run-dashboard.ts +5 -2
  131. package/src/ui/run-snapshot-cache.ts +19 -8
  132. package/src/ui/spinner.ts +17 -17
  133. package/src/ui/status-colors.ts +54 -54
  134. package/src/ui/syntax-highlight.ts +116 -116
  135. package/src/ui/transcript-viewer.ts +15 -1
  136. package/src/utils/completion-dedupe.ts +63 -63
  137. package/src/utils/file-coalescer.ts +84 -84
  138. package/src/utils/frontmatter.ts +36 -36
  139. package/src/utils/fs-watch.ts +31 -31
  140. package/src/utils/git.ts +262 -262
  141. package/src/utils/ids.ts +12 -12
  142. package/src/utils/names.ts +26 -26
  143. package/src/utils/paths.ts +3 -2
  144. package/src/utils/safe-paths.ts +34 -0
  145. package/src/utils/sleep.ts +32 -32
  146. package/src/utils/timings.ts +31 -31
  147. package/src/utils/visual.ts +159 -159
  148. package/src/workflows/discover-workflows.ts +30 -3
  149. package/src/workflows/validate-workflow.ts +40 -40
  150. package/src/worktree/branch-freshness.ts +45 -45
  151. package/teams/default.team.md +12 -12
  152. package/teams/fast-fix.team.md +11 -11
  153. package/teams/implementation.team.md +18 -18
  154. package/teams/parallel-research.team.md +14 -14
  155. package/teams/research.team.md +11 -11
  156. package/teams/review.team.md +12 -12
  157. package/workflows/default.workflow.md +29 -29
  158. package/workflows/fast-fix.workflow.md +22 -22
  159. package/workflows/implementation.workflow.md +38 -38
  160. package/workflows/parallel-research.workflow.md +46 -46
  161. package/workflows/research.workflow.md +22 -22
  162. package/workflows/review.workflow.md +30 -30
@@ -1,46 +1,46 @@
1
- import type { GreenLevel, VerificationContract, VerificationEvidence } from "../state/types.ts";
2
-
3
- const GREEN_ORDER: Record<GreenLevel, number> = {
4
- none: 0,
5
- targeted: 1,
6
- package: 2,
7
- workspace: 3,
8
- merge_ready: 4,
9
- };
10
-
11
- export interface GreenContractOutcome {
12
- requiredGreenLevel: GreenLevel;
13
- observedGreenLevel: GreenLevel;
14
- satisfied: boolean;
15
- }
16
-
17
- export function greenLevelSatisfies(observed: GreenLevel, required: GreenLevel): boolean {
18
- return GREEN_ORDER[observed] >= GREEN_ORDER[required];
19
- }
20
-
21
- export function evaluateGreenContract(contract: VerificationContract, evidence?: VerificationEvidence): GreenContractOutcome {
22
- const observedGreenLevel = evidence?.observedGreenLevel ?? "none";
23
- return {
24
- requiredGreenLevel: contract.requiredGreenLevel,
25
- observedGreenLevel,
26
- satisfied: greenLevelSatisfies(observedGreenLevel, contract.requiredGreenLevel),
27
- };
28
- }
29
-
30
- export function inferGreenLevelFromTask(success: boolean, contract: VerificationContract): GreenLevel {
31
- if (!success) return "none";
32
- if (contract.requiredGreenLevel === "none") return "none";
33
- return contract.allowManualEvidence ? contract.requiredGreenLevel : "targeted";
34
- }
35
-
36
- export function createVerificationEvidence(contract: VerificationContract, success: boolean, notes: string): VerificationEvidence {
37
- const observedGreenLevel = inferGreenLevelFromTask(success, contract);
38
- const outcome = evaluateGreenContract(contract, { requiredGreenLevel: contract.requiredGreenLevel, observedGreenLevel, satisfied: false, commands: [], notes });
39
- return {
40
- requiredGreenLevel: contract.requiredGreenLevel,
41
- observedGreenLevel,
42
- satisfied: outcome.satisfied,
43
- commands: contract.commands.map((cmd) => ({ cmd, status: "not_run" as const })),
44
- notes,
45
- };
46
- }
1
+ import type { GreenLevel, VerificationContract, VerificationEvidence } from "../state/types.ts";
2
+
3
+ const GREEN_ORDER: Record<GreenLevel, number> = {
4
+ none: 0,
5
+ targeted: 1,
6
+ package: 2,
7
+ workspace: 3,
8
+ merge_ready: 4,
9
+ };
10
+
11
+ export interface GreenContractOutcome {
12
+ requiredGreenLevel: GreenLevel;
13
+ observedGreenLevel: GreenLevel;
14
+ satisfied: boolean;
15
+ }
16
+
17
+ export function greenLevelSatisfies(observed: GreenLevel, required: GreenLevel): boolean {
18
+ return GREEN_ORDER[observed] >= GREEN_ORDER[required];
19
+ }
20
+
21
+ export function evaluateGreenContract(contract: VerificationContract, evidence?: VerificationEvidence): GreenContractOutcome {
22
+ const observedGreenLevel = evidence?.observedGreenLevel ?? "none";
23
+ return {
24
+ requiredGreenLevel: contract.requiredGreenLevel,
25
+ observedGreenLevel,
26
+ satisfied: greenLevelSatisfies(observedGreenLevel, contract.requiredGreenLevel),
27
+ };
28
+ }
29
+
30
+ export function inferGreenLevelFromTask(success: boolean, contract: VerificationContract): GreenLevel {
31
+ if (!success) return "none";
32
+ if (contract.requiredGreenLevel === "none") return "none";
33
+ return contract.allowManualEvidence ? contract.requiredGreenLevel : "targeted";
34
+ }
35
+
36
+ export function createVerificationEvidence(contract: VerificationContract, success: boolean, notes: string): VerificationEvidence {
37
+ const observedGreenLevel = inferGreenLevelFromTask(success, contract);
38
+ const outcome = evaluateGreenContract(contract, { requiredGreenLevel: contract.requiredGreenLevel, observedGreenLevel, satisfied: false, commands: [], notes });
39
+ return {
40
+ requiredGreenLevel: contract.requiredGreenLevel,
41
+ observedGreenLevel,
42
+ satisfied: outcome.satisfied,
43
+ commands: contract.commands.map((cmd) => ({ cmd, status: "not_run" as const })),
44
+ notes,
45
+ };
46
+ }
@@ -1,88 +1,88 @@
1
- import type { CrewRuntimeConfig } from "../config/config.ts";
2
- import { writeArtifact } from "../state/artifact-store.ts";
3
- import { appendEvent } from "../state/event-log.ts";
4
- import { appendMailboxMessage } from "../state/mailbox.ts";
5
- import type { ArtifactDescriptor, TeamRunManifest, TeamTaskState } from "../state/types.ts";
6
- import { aggregateTaskOutputs } from "./task-output-context.ts";
7
-
8
- export type CrewGroupJoinMode = "off" | "group" | "smart";
9
-
10
- export interface CrewGroupJoinDelivery {
11
- batchId: string;
12
- mode: CrewGroupJoinMode;
13
- partial: boolean;
14
- taskIds: string[];
15
- completed: string[];
16
- failed: string[];
17
- skipped: string[];
18
- remaining: string[];
19
- artifact?: ArtifactDescriptor;
20
- messageId?: string;
21
- }
22
-
23
- export function resolveGroupJoinMode(runtime?: CrewRuntimeConfig): CrewGroupJoinMode {
24
- return runtime?.groupJoin ?? "smart";
25
- }
26
-
27
- export function shouldGroupJoin(mode: CrewGroupJoinMode, batch: TeamTaskState[]): boolean {
28
- if (mode === "off") return false;
29
- if (mode === "group") return batch.length > 0;
30
- return batch.length > 1;
31
- }
32
-
33
- function batchIdFor(runId: string, taskIds: string[]): string {
34
- return `${runId}_${taskIds.join("+").replace(/[^a-zA-Z0-9_+-]/g, "_")}`;
35
- }
36
-
37
- function statusList(tasks: TeamTaskState[], status: TeamTaskState["status"]): string[] {
38
- return tasks.filter((task) => task.status === status).map((task) => task.id);
39
- }
40
-
41
- export function deliverGroupJoin(input: {
42
- manifest: TeamRunManifest;
43
- mode: CrewGroupJoinMode;
44
- batch: TeamTaskState[];
45
- allTasks: TeamTaskState[];
46
- partial?: boolean;
47
- }): CrewGroupJoinDelivery | undefined {
48
- if (!shouldGroupJoin(input.mode, input.batch)) return undefined;
49
- const taskIds = input.batch.map((task) => task.id);
50
- const latest = taskIds.map((id) => input.allTasks.find((task) => task.id === id)).filter((task): task is TeamTaskState => Boolean(task));
51
- const completed = statusList(latest, "completed");
52
- const failed = statusList(latest, "failed");
53
- const skipped = statusList(latest, "skipped");
54
- const remaining = latest.filter((task) => task.status === "queued" || task.status === "running").map((task) => task.id);
55
- const partial = input.partial ?? remaining.length > 0;
56
- const batchId = batchIdFor(input.manifest.runId, taskIds);
57
- const summary = aggregateTaskOutputs(latest);
58
- const delivery: CrewGroupJoinDelivery = { batchId, mode: input.mode, partial, taskIds, completed, failed, skipped, remaining };
59
- const content = `${JSON.stringify({ ...delivery, createdAt: new Date().toISOString() }, null, 2)}\n`;
60
- const artifact = writeArtifact(input.manifest.artifactsRoot, {
61
- kind: "metadata",
62
- relativePath: `metadata/group-joins/${batchId}.json`,
63
- producer: "group-join",
64
- content,
65
- });
66
- const mailbox = appendMailboxMessage(input.manifest, {
67
- direction: "outbox",
68
- from: "group-join",
69
- to: "leader",
70
- body: [
71
- `Group join ${partial ? "partial" : "completed"}: ${taskIds.join(", ")}`,
72
- `Completed: ${completed.join(", ") || "none"}`,
73
- `Failed: ${failed.join(", ") || "none"}`,
74
- `Skipped: ${skipped.join(", ") || "none"}`,
75
- `Remaining: ${remaining.join(", ") || "none"}`,
76
- "",
77
- summary,
78
- ].join("\n"),
79
- status: "delivered",
80
- });
81
- appendEvent(input.manifest.eventsPath, {
82
- type: partial ? "agent.group_join.partial" : "agent.group_join.completed",
83
- runId: input.manifest.runId,
84
- message: `Group join ${partial ? "partial" : "completed"} for ${taskIds.length} task(s).`,
85
- data: { ...delivery, artifactPath: artifact.path, messageId: mailbox.id },
86
- });
87
- return { ...delivery, artifact, messageId: mailbox.id };
88
- }
1
+ import type { CrewRuntimeConfig } from "../config/config.ts";
2
+ import { writeArtifact } from "../state/artifact-store.ts";
3
+ import { appendEvent } from "../state/event-log.ts";
4
+ import { appendMailboxMessage } from "../state/mailbox.ts";
5
+ import type { ArtifactDescriptor, TeamRunManifest, TeamTaskState } from "../state/types.ts";
6
+ import { aggregateTaskOutputs } from "./task-output-context.ts";
7
+
8
+ export type CrewGroupJoinMode = "off" | "group" | "smart";
9
+
10
+ export interface CrewGroupJoinDelivery {
11
+ batchId: string;
12
+ mode: CrewGroupJoinMode;
13
+ partial: boolean;
14
+ taskIds: string[];
15
+ completed: string[];
16
+ failed: string[];
17
+ skipped: string[];
18
+ remaining: string[];
19
+ artifact?: ArtifactDescriptor;
20
+ messageId?: string;
21
+ }
22
+
23
+ export function resolveGroupJoinMode(runtime?: CrewRuntimeConfig): CrewGroupJoinMode {
24
+ return runtime?.groupJoin ?? "smart";
25
+ }
26
+
27
+ export function shouldGroupJoin(mode: CrewGroupJoinMode, batch: TeamTaskState[]): boolean {
28
+ if (mode === "off") return false;
29
+ if (mode === "group") return batch.length > 0;
30
+ return batch.length > 1;
31
+ }
32
+
33
+ function batchIdFor(runId: string, taskIds: string[]): string {
34
+ return `${runId}_${taskIds.join("+").replace(/[^a-zA-Z0-9_+-]/g, "_")}`;
35
+ }
36
+
37
+ function statusList(tasks: TeamTaskState[], status: TeamTaskState["status"]): string[] {
38
+ return tasks.filter((task) => task.status === status).map((task) => task.id);
39
+ }
40
+
41
+ export function deliverGroupJoin(input: {
42
+ manifest: TeamRunManifest;
43
+ mode: CrewGroupJoinMode;
44
+ batch: TeamTaskState[];
45
+ allTasks: TeamTaskState[];
46
+ partial?: boolean;
47
+ }): CrewGroupJoinDelivery | undefined {
48
+ if (!shouldGroupJoin(input.mode, input.batch)) return undefined;
49
+ const taskIds = input.batch.map((task) => task.id);
50
+ const latest = taskIds.map((id) => input.allTasks.find((task) => task.id === id)).filter((task): task is TeamTaskState => Boolean(task));
51
+ const completed = statusList(latest, "completed");
52
+ const failed = statusList(latest, "failed");
53
+ const skipped = statusList(latest, "skipped");
54
+ const remaining = latest.filter((task) => task.status === "queued" || task.status === "running").map((task) => task.id);
55
+ const partial = input.partial ?? remaining.length > 0;
56
+ const batchId = batchIdFor(input.manifest.runId, taskIds);
57
+ const summary = aggregateTaskOutputs(latest, input.manifest);
58
+ const delivery: CrewGroupJoinDelivery = { batchId, mode: input.mode, partial, taskIds, completed, failed, skipped, remaining };
59
+ const content = `${JSON.stringify({ ...delivery, createdAt: new Date().toISOString() }, null, 2)}\n`;
60
+ const artifact = writeArtifact(input.manifest.artifactsRoot, {
61
+ kind: "metadata",
62
+ relativePath: `metadata/group-joins/${batchId}.json`,
63
+ producer: "group-join",
64
+ content,
65
+ });
66
+ const mailbox = appendMailboxMessage(input.manifest, {
67
+ direction: "outbox",
68
+ from: "group-join",
69
+ to: "leader",
70
+ body: [
71
+ `Group join ${partial ? "partial" : "completed"}: ${taskIds.join(", ")}`,
72
+ `Completed: ${completed.join(", ") || "none"}`,
73
+ `Failed: ${failed.join(", ") || "none"}`,
74
+ `Skipped: ${skipped.join(", ") || "none"}`,
75
+ `Remaining: ${remaining.join(", ") || "none"}`,
76
+ "",
77
+ summary,
78
+ ].join("\n"),
79
+ status: "delivered",
80
+ });
81
+ appendEvent(input.manifest.eventsPath, {
82
+ type: partial ? "agent.group_join.partial" : "agent.group_join.completed",
83
+ runId: input.manifest.runId,
84
+ message: `Group join ${partial ? "partial" : "completed"} for ${taskIds.length} task(s).`,
85
+ data: { ...delivery, artifactPath: artifact.path, messageId: mailbox.id },
86
+ });
87
+ return { ...delivery, artifact, messageId: mailbox.id };
88
+ }
@@ -1,28 +1,28 @@
1
- import type { WorkerHeartbeatState } from "./worker-heartbeat.ts";
2
-
3
- export type HeartbeatLevel = "healthy" | "warn" | "stale" | "dead";
4
-
5
- export interface GradientThresholds {
6
- warnMs: number;
7
- staleMs: number;
8
- deadMs: number;
9
- }
10
-
11
- export const DEFAULT_GRADIENT_THRESHOLDS: GradientThresholds = { warnMs: 30_000, staleMs: 60_000, deadMs: 300_000 };
12
-
13
- export function heartbeatAgeMs(heartbeat: WorkerHeartbeatState | undefined, now = Date.now()): number {
14
- if (!heartbeat) return Number.POSITIVE_INFINITY;
15
- const lastSeen = Date.parse(heartbeat.lastSeenAt);
16
- return Number.isFinite(lastSeen) ? Math.max(0, now - lastSeen) : Number.POSITIVE_INFINITY;
17
- }
18
-
19
- export function classifyHeartbeat(heartbeat: WorkerHeartbeatState | undefined, thresholds: GradientThresholds = DEFAULT_GRADIENT_THRESHOLDS, now = Date.now()): HeartbeatLevel {
20
- if (!heartbeat) return "dead";
21
- if (heartbeat.alive === false) return "dead";
22
- const elapsed = heartbeatAgeMs(heartbeat, now);
23
- if (!Number.isFinite(elapsed)) return "dead";
24
- if (elapsed > thresholds.deadMs) return "dead";
25
- if (elapsed > thresholds.staleMs) return "stale";
26
- if (elapsed > thresholds.warnMs) return "warn";
27
- return "healthy";
28
- }
1
+ import type { WorkerHeartbeatState } from "./worker-heartbeat.ts";
2
+
3
+ export type HeartbeatLevel = "healthy" | "warn" | "stale" | "dead";
4
+
5
+ export interface GradientThresholds {
6
+ warnMs: number;
7
+ staleMs: number;
8
+ deadMs: number;
9
+ }
10
+
11
+ export const DEFAULT_GRADIENT_THRESHOLDS: GradientThresholds = { warnMs: 30_000, staleMs: 60_000, deadMs: 300_000 };
12
+
13
+ export function heartbeatAgeMs(heartbeat: WorkerHeartbeatState | undefined, now = Date.now()): number {
14
+ if (!heartbeat) return Number.POSITIVE_INFINITY;
15
+ const lastSeen = Date.parse(heartbeat.lastSeenAt);
16
+ return Number.isFinite(lastSeen) ? Math.max(0, now - lastSeen) : Number.POSITIVE_INFINITY;
17
+ }
18
+
19
+ export function classifyHeartbeat(heartbeat: WorkerHeartbeatState | undefined, thresholds: GradientThresholds = DEFAULT_GRADIENT_THRESHOLDS, now = Date.now()): HeartbeatLevel {
20
+ if (!heartbeat) return "dead";
21
+ if (heartbeat.alive === false) return "dead";
22
+ const elapsed = heartbeatAgeMs(heartbeat, now);
23
+ if (!Number.isFinite(elapsed)) return "dead";
24
+ if (elapsed > thresholds.deadMs) return "dead";
25
+ if (elapsed > thresholds.staleMs) return "stale";
26
+ if (elapsed > thresholds.warnMs) return "warn";
27
+ return "healthy";
28
+ }
@@ -1,80 +1,80 @@
1
- import type { NotificationDescriptor } from "../extension/notification-router.ts";
2
- import type { MetricRegistry } from "../observability/metric-registry.ts";
3
- import { appendEvent } from "../state/event-log.ts";
4
- import { loadRunManifestById } from "../state/state-store.ts";
5
- import type { TeamRunManifest } from "../state/types.ts";
6
- import type { ManifestCache } from "./manifest-cache.ts";
7
- import { classifyHeartbeat, DEFAULT_GRADIENT_THRESHOLDS, heartbeatAgeMs, type GradientThresholds, type HeartbeatLevel } from "./heartbeat-gradient.ts";
8
-
9
- export interface HeartbeatWatcherRouter {
10
- enqueue(notification: NotificationDescriptor): boolean;
11
- }
12
-
13
- export interface HeartbeatWatcherOptions {
14
- cwd: string;
15
- pollIntervalMs?: number;
16
- thresholds?: GradientThresholds;
17
- manifestCache: ManifestCache;
18
- registry: MetricRegistry;
19
- router: HeartbeatWatcherRouter;
20
- deadletterTickThreshold?: number;
21
- onDead?: (runId: string, taskId: string, elapsed: number) => void;
22
- onDeadletterTrigger?: (manifest: TeamRunManifest, taskId: string) => void;
23
- }
24
-
25
- export class HeartbeatWatcher {
26
- private timer?: ReturnType<typeof setInterval>;
27
- private lastLevel = new Map<string, HeartbeatLevel>();
28
- private consecutiveDead = new Map<string, number>();
29
- private readonly opts: HeartbeatWatcherOptions;
30
-
31
- constructor(opts: HeartbeatWatcherOptions) {
32
- this.opts = opts;
33
- }
34
-
35
- start(): void {
36
- this.dispose();
37
- this.timer = setInterval(() => this.tick(), this.opts.pollIntervalMs ?? 5000);
38
- this.timer.unref?.();
39
- }
40
-
41
- tick(now = Date.now()): void {
42
- const thresholds = this.opts.thresholds ?? DEFAULT_GRADIENT_THRESHOLDS;
43
- const tickThreshold = this.opts.deadletterTickThreshold ?? 3;
44
- for (const run of this.opts.manifestCache.list(50)) {
45
- if (run.status !== "running") continue;
46
- const loaded = loadRunManifestById(this.opts.cwd, run.runId);
47
- if (!loaded) continue;
48
- for (const task of loaded.tasks) {
49
- if (task.status !== "running") continue;
50
- const key = `${run.runId}:${task.id}`;
51
- const elapsed = heartbeatAgeMs(task.heartbeat, now);
52
- const level = classifyHeartbeat(task.heartbeat, thresholds, now);
53
- this.opts.registry.gauge("crew.heartbeat.staleness_ms", "Heartbeat elapsed since last seen, milliseconds").set({ runId: run.runId, taskId: task.id }, Number.isFinite(elapsed) ? elapsed : thresholds.deadMs);
54
- this.opts.registry.counter("crew.heartbeat.level_total", "Heartbeat classifications by level").inc({ runId: run.runId, level });
55
- const previous = this.lastLevel.get(key);
56
- this.lastLevel.set(key, level);
57
- if (level === "dead" && previous !== "dead") {
58
- this.opts.registry.counter("crew.heartbeat.dead_total", "Dead heartbeat detections").inc({ runId: run.runId });
59
- appendEvent(loaded.manifest.eventsPath, { type: "crew.task.heartbeat_dead", runId: run.runId, taskId: task.id, message: `Task ${task.id} heartbeat dead.`, data: { elapsedMs: Number.isFinite(elapsed) ? elapsed : undefined } });
60
- this.opts.router.enqueue({ id: `dead_${run.runId}_${task.id}`, severity: "warning", source: "heartbeat-watcher", runId: run.runId, title: `Task ${task.id} heartbeat dead`, body: "Background watcher detected a stuck worker." });
61
- this.opts.onDead?.(run.runId, task.id, Number.isFinite(elapsed) ? elapsed : thresholds.deadMs);
62
- }
63
- if (level === "dead") {
64
- const count = (this.consecutiveDead.get(key) ?? 0) + 1;
65
- this.consecutiveDead.set(key, count);
66
- if (count === tickThreshold) this.opts.onDeadletterTrigger?.(loaded.manifest, task.id);
67
- } else {
68
- this.consecutiveDead.delete(key);
69
- }
70
- }
71
- }
72
- }
73
-
74
- dispose(): void {
75
- if (this.timer) clearInterval(this.timer);
76
- this.timer = undefined;
77
- this.lastLevel.clear();
78
- this.consecutiveDead.clear();
79
- }
80
- }
1
+ import type { NotificationDescriptor } from "../extension/notification-router.ts";
2
+ import type { MetricRegistry } from "../observability/metric-registry.ts";
3
+ import { appendEvent } from "../state/event-log.ts";
4
+ import { loadRunManifestById } from "../state/state-store.ts";
5
+ import type { TeamRunManifest } from "../state/types.ts";
6
+ import type { ManifestCache } from "./manifest-cache.ts";
7
+ import { classifyHeartbeat, DEFAULT_GRADIENT_THRESHOLDS, heartbeatAgeMs, type GradientThresholds, type HeartbeatLevel } from "./heartbeat-gradient.ts";
8
+
9
+ export interface HeartbeatWatcherRouter {
10
+ enqueue(notification: NotificationDescriptor): boolean;
11
+ }
12
+
13
+ export interface HeartbeatWatcherOptions {
14
+ cwd: string;
15
+ pollIntervalMs?: number;
16
+ thresholds?: GradientThresholds;
17
+ manifestCache: ManifestCache;
18
+ registry: MetricRegistry;
19
+ router: HeartbeatWatcherRouter;
20
+ deadletterTickThreshold?: number;
21
+ onDead?: (runId: string, taskId: string, elapsed: number) => void;
22
+ onDeadletterTrigger?: (manifest: TeamRunManifest, taskId: string) => void;
23
+ }
24
+
25
+ export class HeartbeatWatcher {
26
+ private timer?: ReturnType<typeof setInterval>;
27
+ private lastLevel = new Map<string, HeartbeatLevel>();
28
+ private consecutiveDead = new Map<string, number>();
29
+ private readonly opts: HeartbeatWatcherOptions;
30
+
31
+ constructor(opts: HeartbeatWatcherOptions) {
32
+ this.opts = opts;
33
+ }
34
+
35
+ start(): void {
36
+ this.dispose();
37
+ this.timer = setInterval(() => this.tick(), this.opts.pollIntervalMs ?? 5000);
38
+ this.timer.unref?.();
39
+ }
40
+
41
+ tick(now = Date.now()): void {
42
+ const thresholds = this.opts.thresholds ?? DEFAULT_GRADIENT_THRESHOLDS;
43
+ const tickThreshold = this.opts.deadletterTickThreshold ?? 3;
44
+ for (const run of this.opts.manifestCache.list(50)) {
45
+ if (run.status !== "running") continue;
46
+ const loaded = loadRunManifestById(this.opts.cwd, run.runId);
47
+ if (!loaded) continue;
48
+ for (const task of loaded.tasks) {
49
+ if (task.status !== "running") continue;
50
+ const key = `${run.runId}:${task.id}`;
51
+ const elapsed = heartbeatAgeMs(task.heartbeat, now);
52
+ const level = classifyHeartbeat(task.heartbeat, thresholds, now);
53
+ this.opts.registry.gauge("crew.heartbeat.staleness_ms", "Heartbeat elapsed since last seen, milliseconds").set({ runId: run.runId, taskId: task.id }, Number.isFinite(elapsed) ? elapsed : thresholds.deadMs);
54
+ this.opts.registry.counter("crew.heartbeat.level_total", "Heartbeat classifications by level").inc({ runId: run.runId, level });
55
+ const previous = this.lastLevel.get(key);
56
+ this.lastLevel.set(key, level);
57
+ if (level === "dead" && previous !== "dead") {
58
+ this.opts.registry.counter("crew.heartbeat.dead_total", "Dead heartbeat detections").inc({ runId: run.runId });
59
+ appendEvent(loaded.manifest.eventsPath, { type: "crew.task.heartbeat_dead", runId: run.runId, taskId: task.id, message: `Task ${task.id} heartbeat dead.`, data: { elapsedMs: Number.isFinite(elapsed) ? elapsed : undefined } });
60
+ this.opts.router.enqueue({ id: `dead_${run.runId}_${task.id}`, severity: "warning", source: "heartbeat-watcher", runId: run.runId, title: `Task ${task.id} heartbeat dead`, body: "Background watcher detected a stuck worker." });
61
+ this.opts.onDead?.(run.runId, task.id, Number.isFinite(elapsed) ? elapsed : thresholds.deadMs);
62
+ }
63
+ if (level === "dead") {
64
+ const count = (this.consecutiveDead.get(key) ?? 0) + 1;
65
+ this.consecutiveDead.set(key, count);
66
+ if (count === tickThreshold) this.opts.onDeadletterTrigger?.(loaded.manifest, task.id);
67
+ } else {
68
+ this.consecutiveDead.delete(key);
69
+ }
70
+ }
71
+ }
72
+ }
73
+
74
+ dispose(): void {
75
+ if (this.timer) clearInterval(this.timer);
76
+ this.timer = undefined;
77
+ this.lastLevel.clear();
78
+ this.consecutiveDead.clear();
79
+ }
80
+ }