pi-crew 0.1.37 → 0.1.39
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/AGENTS.md +1 -1
- package/CHANGELOG.md +27 -0
- package/README.md +5 -0
- package/agents/analyst.md +11 -11
- package/agents/critic.md +11 -11
- package/agents/executor.md +11 -11
- package/agents/explorer.md +11 -11
- package/agents/planner.md +11 -11
- package/agents/reviewer.md +11 -11
- package/agents/security-reviewer.md +11 -11
- package/agents/test-engineer.md +11 -11
- package/agents/verifier.md +11 -11
- package/agents/writer.md +11 -11
- package/docs/refactor-tasks-phase3.md +394 -394
- package/docs/refactor-tasks-phase4.md +564 -564
- package/docs/refactor-tasks-phase5.md +402 -402
- package/docs/refactor-tasks-phase6.md +662 -662
- package/docs/research-extension-examples.md +297 -297
- package/docs/research-extension-system.md +324 -324
- package/docs/research-optimization-plan.md +548 -548
- package/docs/research-pi-coding-agent.md +357 -357
- package/docs/research-source-pi-crew-reference.md +174 -174
- package/docs/resource-formats.md +10 -8
- package/docs/runtime-flow.md +148 -148
- package/docs/source-runtime-refactor-map.md +83 -83
- package/docs/usage.md +6 -0
- package/index.ts +6 -6
- package/package.json +3 -3
- package/schema.json +2 -2
- package/src/agents/agent-serializer.ts +34 -34
- package/src/config/config.ts +8 -4
- package/src/extension/cross-extension-rpc.ts +82 -82
- package/src/extension/import-index.ts +18 -2
- package/src/extension/register.ts +11 -1
- package/src/extension/registration/compaction-guard.ts +125 -125
- package/src/extension/registration/subagent-helpers.ts +30 -6
- package/src/extension/registration/subagent-tools.ts +8 -3
- package/src/extension/result-watcher.ts +98 -98
- package/src/extension/run-import.ts +12 -2
- package/src/extension/run-index.ts +12 -2
- package/src/extension/run-maintenance.ts +24 -24
- package/src/extension/team-tool/api.ts +54 -14
- package/src/extension/team-tool/cancel.ts +31 -31
- package/src/extension/team-tool/doctor.ts +179 -179
- package/src/extension/team-tool/inspect.ts +41 -41
- package/src/extension/team-tool/lifecycle-actions.ts +79 -79
- package/src/extension/team-tool/plan.ts +19 -19
- package/src/extension/team-tool/status.ts +73 -73
- package/src/observability/correlation.ts +35 -35
- package/src/observability/event-to-metric.ts +54 -54
- package/src/observability/exporters/adapter.ts +24 -24
- package/src/observability/exporters/otlp-exporter.ts +65 -65
- package/src/observability/exporters/prometheus-exporter.ts +47 -47
- package/src/observability/metric-registry.ts +72 -72
- package/src/observability/metric-retention.ts +46 -46
- package/src/observability/metric-sink.ts +51 -51
- package/src/observability/metrics-primitives.ts +166 -166
- package/src/prompt/prompt-runtime.ts +68 -68
- package/src/runtime/agent-control.ts +64 -64
- package/src/runtime/agent-memory.ts +72 -72
- package/src/runtime/agent-observability.ts +114 -113
- package/src/runtime/async-marker.ts +26 -26
- package/src/runtime/background-runner.ts +53 -53
- package/src/runtime/crash-recovery.ts +56 -56
- package/src/runtime/crew-agent-records.ts +54 -9
- package/src/runtime/crew-agent-runtime.ts +58 -58
- package/src/runtime/deadletter.ts +36 -36
- package/src/runtime/direct-run.ts +35 -35
- package/src/runtime/foreground-control.ts +82 -82
- package/src/runtime/green-contract.ts +46 -46
- package/src/runtime/group-join.ts +88 -88
- package/src/runtime/heartbeat-gradient.ts +28 -28
- package/src/runtime/heartbeat-watcher.ts +80 -80
- package/src/runtime/live-agent-control.ts +87 -78
- package/src/runtime/live-agent-manager.ts +85 -85
- package/src/runtime/live-control-realtime.ts +36 -36
- package/src/runtime/live-session-runtime.ts +299 -299
- package/src/runtime/manifest-cache.ts +248 -212
- package/src/runtime/model-fallback.ts +261 -261
- package/src/runtime/parallel-research.ts +44 -44
- package/src/runtime/parallel-utils.ts +99 -99
- package/src/runtime/pi-json-output.ts +111 -111
- package/src/runtime/policy-engine.ts +78 -78
- package/src/runtime/post-exit-stdio-guard.ts +86 -86
- package/src/runtime/process-status.ts +56 -56
- package/src/runtime/progress-event-coalescer.ts +43 -43
- package/src/runtime/recovery-recipes.ts +74 -74
- package/src/runtime/retry-executor.ts +59 -59
- package/src/runtime/role-permission.ts +39 -39
- package/src/runtime/session-usage.ts +79 -79
- package/src/runtime/sidechain-output.ts +28 -28
- package/src/runtime/subagent-manager.ts +80 -12
- package/src/runtime/task-display.ts +38 -38
- package/src/runtime/task-output-context.ts +127 -106
- package/src/runtime/task-runner/live-executor.ts +98 -98
- package/src/runtime/task-runner/progress.ts +111 -111
- package/src/runtime/task-runner/result-utils.ts +14 -14
- package/src/runtime/task-runner/state-helpers.ts +22 -22
- package/src/runtime/team-runner.ts +1 -1
- package/src/runtime/worker-heartbeat.ts +21 -21
- package/src/runtime/worker-startup.ts +57 -57
- package/src/schema/config-schema.ts +21 -21
- package/src/schema/team-tool-schema.ts +100 -100
- package/src/state/artifact-store.ts +122 -108
- package/src/state/contracts.ts +105 -105
- package/src/state/jsonl-writer.ts +77 -77
- package/src/state/mailbox.ts +67 -22
- package/src/state/state-store.ts +36 -5
- package/src/state/task-claims.ts +42 -42
- package/src/state/usage.ts +29 -29
- package/src/subagents/async-entry.ts +1 -1
- package/src/subagents/index.ts +3 -3
- package/src/subagents/live/control.ts +1 -1
- package/src/subagents/live/manager.ts +1 -1
- package/src/subagents/live/realtime.ts +1 -1
- package/src/subagents/live/session-runtime.ts +1 -1
- package/src/subagents/manager.ts +1 -1
- package/src/subagents/spawn.ts +1 -1
- package/src/teams/discover-teams.ts +27 -5
- package/src/teams/team-serializer.ts +38 -36
- package/src/types/diff.d.ts +18 -18
- package/src/ui/crew-footer.ts +101 -101
- package/src/ui/crew-select-list.ts +111 -111
- package/src/ui/dashboard-panes/metrics-pane.ts +34 -34
- package/src/ui/dynamic-border.ts +25 -25
- package/src/ui/layout-primitives.ts +106 -106
- package/src/ui/loaders.ts +158 -158
- package/src/ui/mascot.ts +441 -441
- package/src/ui/render-diff.ts +119 -119
- package/src/ui/run-dashboard.ts +5 -2
- package/src/ui/run-snapshot-cache.ts +19 -8
- package/src/ui/spinner.ts +17 -17
- package/src/ui/status-colors.ts +54 -54
- package/src/ui/syntax-highlight.ts +116 -116
- package/src/ui/transcript-viewer.ts +15 -1
- package/src/utils/completion-dedupe.ts +63 -63
- package/src/utils/file-coalescer.ts +84 -84
- package/src/utils/frontmatter.ts +36 -36
- package/src/utils/fs-watch.ts +31 -31
- package/src/utils/git.ts +262 -262
- package/src/utils/ids.ts +12 -12
- package/src/utils/names.ts +26 -26
- package/src/utils/paths.ts +3 -2
- package/src/utils/safe-paths.ts +34 -0
- package/src/utils/sleep.ts +32 -32
- package/src/utils/timings.ts +31 -31
- package/src/utils/visual.ts +159 -159
- package/src/workflows/discover-workflows.ts +30 -3
- package/src/workflows/validate-workflow.ts +40 -40
- package/src/worktree/branch-freshness.ts +45 -45
- package/teams/default.team.md +12 -12
- package/teams/fast-fix.team.md +11 -11
- package/teams/implementation.team.md +18 -18
- package/teams/parallel-research.team.md +14 -14
- package/teams/research.team.md +11 -11
- package/teams/review.team.md +12 -12
- package/workflows/default.workflow.md +29 -29
- package/workflows/fast-fix.workflow.md +22 -22
- package/workflows/implementation.workflow.md +38 -38
- package/workflows/parallel-research.workflow.md +46 -46
- package/workflows/research.workflow.md +22 -22
- package/workflows/review.workflow.md +30 -30
|
@@ -1,46 +1,46 @@
|
|
|
1
|
-
import type { GreenLevel, VerificationContract, VerificationEvidence } from "../state/types.ts";
|
|
2
|
-
|
|
3
|
-
const GREEN_ORDER: Record<GreenLevel, number> = {
|
|
4
|
-
none: 0,
|
|
5
|
-
targeted: 1,
|
|
6
|
-
package: 2,
|
|
7
|
-
workspace: 3,
|
|
8
|
-
merge_ready: 4,
|
|
9
|
-
};
|
|
10
|
-
|
|
11
|
-
export interface GreenContractOutcome {
|
|
12
|
-
requiredGreenLevel: GreenLevel;
|
|
13
|
-
observedGreenLevel: GreenLevel;
|
|
14
|
-
satisfied: boolean;
|
|
15
|
-
}
|
|
16
|
-
|
|
17
|
-
export function greenLevelSatisfies(observed: GreenLevel, required: GreenLevel): boolean {
|
|
18
|
-
return GREEN_ORDER[observed] >= GREEN_ORDER[required];
|
|
19
|
-
}
|
|
20
|
-
|
|
21
|
-
export function evaluateGreenContract(contract: VerificationContract, evidence?: VerificationEvidence): GreenContractOutcome {
|
|
22
|
-
const observedGreenLevel = evidence?.observedGreenLevel ?? "none";
|
|
23
|
-
return {
|
|
24
|
-
requiredGreenLevel: contract.requiredGreenLevel,
|
|
25
|
-
observedGreenLevel,
|
|
26
|
-
satisfied: greenLevelSatisfies(observedGreenLevel, contract.requiredGreenLevel),
|
|
27
|
-
};
|
|
28
|
-
}
|
|
29
|
-
|
|
30
|
-
export function inferGreenLevelFromTask(success: boolean, contract: VerificationContract): GreenLevel {
|
|
31
|
-
if (!success) return "none";
|
|
32
|
-
if (contract.requiredGreenLevel === "none") return "none";
|
|
33
|
-
return contract.allowManualEvidence ? contract.requiredGreenLevel : "targeted";
|
|
34
|
-
}
|
|
35
|
-
|
|
36
|
-
export function createVerificationEvidence(contract: VerificationContract, success: boolean, notes: string): VerificationEvidence {
|
|
37
|
-
const observedGreenLevel = inferGreenLevelFromTask(success, contract);
|
|
38
|
-
const outcome = evaluateGreenContract(contract, { requiredGreenLevel: contract.requiredGreenLevel, observedGreenLevel, satisfied: false, commands: [], notes });
|
|
39
|
-
return {
|
|
40
|
-
requiredGreenLevel: contract.requiredGreenLevel,
|
|
41
|
-
observedGreenLevel,
|
|
42
|
-
satisfied: outcome.satisfied,
|
|
43
|
-
commands: contract.commands.map((cmd) => ({ cmd, status: "not_run" as const })),
|
|
44
|
-
notes,
|
|
45
|
-
};
|
|
46
|
-
}
|
|
1
|
+
import type { GreenLevel, VerificationContract, VerificationEvidence } from "../state/types.ts";
|
|
2
|
+
|
|
3
|
+
const GREEN_ORDER: Record<GreenLevel, number> = {
|
|
4
|
+
none: 0,
|
|
5
|
+
targeted: 1,
|
|
6
|
+
package: 2,
|
|
7
|
+
workspace: 3,
|
|
8
|
+
merge_ready: 4,
|
|
9
|
+
};
|
|
10
|
+
|
|
11
|
+
export interface GreenContractOutcome {
|
|
12
|
+
requiredGreenLevel: GreenLevel;
|
|
13
|
+
observedGreenLevel: GreenLevel;
|
|
14
|
+
satisfied: boolean;
|
|
15
|
+
}
|
|
16
|
+
|
|
17
|
+
export function greenLevelSatisfies(observed: GreenLevel, required: GreenLevel): boolean {
|
|
18
|
+
return GREEN_ORDER[observed] >= GREEN_ORDER[required];
|
|
19
|
+
}
|
|
20
|
+
|
|
21
|
+
export function evaluateGreenContract(contract: VerificationContract, evidence?: VerificationEvidence): GreenContractOutcome {
|
|
22
|
+
const observedGreenLevel = evidence?.observedGreenLevel ?? "none";
|
|
23
|
+
return {
|
|
24
|
+
requiredGreenLevel: contract.requiredGreenLevel,
|
|
25
|
+
observedGreenLevel,
|
|
26
|
+
satisfied: greenLevelSatisfies(observedGreenLevel, contract.requiredGreenLevel),
|
|
27
|
+
};
|
|
28
|
+
}
|
|
29
|
+
|
|
30
|
+
export function inferGreenLevelFromTask(success: boolean, contract: VerificationContract): GreenLevel {
|
|
31
|
+
if (!success) return "none";
|
|
32
|
+
if (contract.requiredGreenLevel === "none") return "none";
|
|
33
|
+
return contract.allowManualEvidence ? contract.requiredGreenLevel : "targeted";
|
|
34
|
+
}
|
|
35
|
+
|
|
36
|
+
export function createVerificationEvidence(contract: VerificationContract, success: boolean, notes: string): VerificationEvidence {
|
|
37
|
+
const observedGreenLevel = inferGreenLevelFromTask(success, contract);
|
|
38
|
+
const outcome = evaluateGreenContract(contract, { requiredGreenLevel: contract.requiredGreenLevel, observedGreenLevel, satisfied: false, commands: [], notes });
|
|
39
|
+
return {
|
|
40
|
+
requiredGreenLevel: contract.requiredGreenLevel,
|
|
41
|
+
observedGreenLevel,
|
|
42
|
+
satisfied: outcome.satisfied,
|
|
43
|
+
commands: contract.commands.map((cmd) => ({ cmd, status: "not_run" as const })),
|
|
44
|
+
notes,
|
|
45
|
+
};
|
|
46
|
+
}
|
|
@@ -1,88 +1,88 @@
|
|
|
1
|
-
import type { CrewRuntimeConfig } from "../config/config.ts";
|
|
2
|
-
import { writeArtifact } from "../state/artifact-store.ts";
|
|
3
|
-
import { appendEvent } from "../state/event-log.ts";
|
|
4
|
-
import { appendMailboxMessage } from "../state/mailbox.ts";
|
|
5
|
-
import type { ArtifactDescriptor, TeamRunManifest, TeamTaskState } from "../state/types.ts";
|
|
6
|
-
import { aggregateTaskOutputs } from "./task-output-context.ts";
|
|
7
|
-
|
|
8
|
-
export type CrewGroupJoinMode = "off" | "group" | "smart";
|
|
9
|
-
|
|
10
|
-
export interface CrewGroupJoinDelivery {
|
|
11
|
-
batchId: string;
|
|
12
|
-
mode: CrewGroupJoinMode;
|
|
13
|
-
partial: boolean;
|
|
14
|
-
taskIds: string[];
|
|
15
|
-
completed: string[];
|
|
16
|
-
failed: string[];
|
|
17
|
-
skipped: string[];
|
|
18
|
-
remaining: string[];
|
|
19
|
-
artifact?: ArtifactDescriptor;
|
|
20
|
-
messageId?: string;
|
|
21
|
-
}
|
|
22
|
-
|
|
23
|
-
export function resolveGroupJoinMode(runtime?: CrewRuntimeConfig): CrewGroupJoinMode {
|
|
24
|
-
return runtime?.groupJoin ?? "smart";
|
|
25
|
-
}
|
|
26
|
-
|
|
27
|
-
export function shouldGroupJoin(mode: CrewGroupJoinMode, batch: TeamTaskState[]): boolean {
|
|
28
|
-
if (mode === "off") return false;
|
|
29
|
-
if (mode === "group") return batch.length > 0;
|
|
30
|
-
return batch.length > 1;
|
|
31
|
-
}
|
|
32
|
-
|
|
33
|
-
function batchIdFor(runId: string, taskIds: string[]): string {
|
|
34
|
-
return `${runId}_${taskIds.join("+").replace(/[^a-zA-Z0-9_+-]/g, "_")}`;
|
|
35
|
-
}
|
|
36
|
-
|
|
37
|
-
function statusList(tasks: TeamTaskState[], status: TeamTaskState["status"]): string[] {
|
|
38
|
-
return tasks.filter((task) => task.status === status).map((task) => task.id);
|
|
39
|
-
}
|
|
40
|
-
|
|
41
|
-
export function deliverGroupJoin(input: {
|
|
42
|
-
manifest: TeamRunManifest;
|
|
43
|
-
mode: CrewGroupJoinMode;
|
|
44
|
-
batch: TeamTaskState[];
|
|
45
|
-
allTasks: TeamTaskState[];
|
|
46
|
-
partial?: boolean;
|
|
47
|
-
}): CrewGroupJoinDelivery | undefined {
|
|
48
|
-
if (!shouldGroupJoin(input.mode, input.batch)) return undefined;
|
|
49
|
-
const taskIds = input.batch.map((task) => task.id);
|
|
50
|
-
const latest = taskIds.map((id) => input.allTasks.find((task) => task.id === id)).filter((task): task is TeamTaskState => Boolean(task));
|
|
51
|
-
const completed = statusList(latest, "completed");
|
|
52
|
-
const failed = statusList(latest, "failed");
|
|
53
|
-
const skipped = statusList(latest, "skipped");
|
|
54
|
-
const remaining = latest.filter((task) => task.status === "queued" || task.status === "running").map((task) => task.id);
|
|
55
|
-
const partial = input.partial ?? remaining.length > 0;
|
|
56
|
-
const batchId = batchIdFor(input.manifest.runId, taskIds);
|
|
57
|
-
const summary = aggregateTaskOutputs(latest);
|
|
58
|
-
const delivery: CrewGroupJoinDelivery = { batchId, mode: input.mode, partial, taskIds, completed, failed, skipped, remaining };
|
|
59
|
-
const content = `${JSON.stringify({ ...delivery, createdAt: new Date().toISOString() }, null, 2)}\n`;
|
|
60
|
-
const artifact = writeArtifact(input.manifest.artifactsRoot, {
|
|
61
|
-
kind: "metadata",
|
|
62
|
-
relativePath: `metadata/group-joins/${batchId}.json`,
|
|
63
|
-
producer: "group-join",
|
|
64
|
-
content,
|
|
65
|
-
});
|
|
66
|
-
const mailbox = appendMailboxMessage(input.manifest, {
|
|
67
|
-
direction: "outbox",
|
|
68
|
-
from: "group-join",
|
|
69
|
-
to: "leader",
|
|
70
|
-
body: [
|
|
71
|
-
`Group join ${partial ? "partial" : "completed"}: ${taskIds.join(", ")}`,
|
|
72
|
-
`Completed: ${completed.join(", ") || "none"}`,
|
|
73
|
-
`Failed: ${failed.join(", ") || "none"}`,
|
|
74
|
-
`Skipped: ${skipped.join(", ") || "none"}`,
|
|
75
|
-
`Remaining: ${remaining.join(", ") || "none"}`,
|
|
76
|
-
"",
|
|
77
|
-
summary,
|
|
78
|
-
].join("\n"),
|
|
79
|
-
status: "delivered",
|
|
80
|
-
});
|
|
81
|
-
appendEvent(input.manifest.eventsPath, {
|
|
82
|
-
type: partial ? "agent.group_join.partial" : "agent.group_join.completed",
|
|
83
|
-
runId: input.manifest.runId,
|
|
84
|
-
message: `Group join ${partial ? "partial" : "completed"} for ${taskIds.length} task(s).`,
|
|
85
|
-
data: { ...delivery, artifactPath: artifact.path, messageId: mailbox.id },
|
|
86
|
-
});
|
|
87
|
-
return { ...delivery, artifact, messageId: mailbox.id };
|
|
88
|
-
}
|
|
1
|
+
import type { CrewRuntimeConfig } from "../config/config.ts";
|
|
2
|
+
import { writeArtifact } from "../state/artifact-store.ts";
|
|
3
|
+
import { appendEvent } from "../state/event-log.ts";
|
|
4
|
+
import { appendMailboxMessage } from "../state/mailbox.ts";
|
|
5
|
+
import type { ArtifactDescriptor, TeamRunManifest, TeamTaskState } from "../state/types.ts";
|
|
6
|
+
import { aggregateTaskOutputs } from "./task-output-context.ts";
|
|
7
|
+
|
|
8
|
+
export type CrewGroupJoinMode = "off" | "group" | "smart";
|
|
9
|
+
|
|
10
|
+
export interface CrewGroupJoinDelivery {
|
|
11
|
+
batchId: string;
|
|
12
|
+
mode: CrewGroupJoinMode;
|
|
13
|
+
partial: boolean;
|
|
14
|
+
taskIds: string[];
|
|
15
|
+
completed: string[];
|
|
16
|
+
failed: string[];
|
|
17
|
+
skipped: string[];
|
|
18
|
+
remaining: string[];
|
|
19
|
+
artifact?: ArtifactDescriptor;
|
|
20
|
+
messageId?: string;
|
|
21
|
+
}
|
|
22
|
+
|
|
23
|
+
export function resolveGroupJoinMode(runtime?: CrewRuntimeConfig): CrewGroupJoinMode {
|
|
24
|
+
return runtime?.groupJoin ?? "smart";
|
|
25
|
+
}
|
|
26
|
+
|
|
27
|
+
export function shouldGroupJoin(mode: CrewGroupJoinMode, batch: TeamTaskState[]): boolean {
|
|
28
|
+
if (mode === "off") return false;
|
|
29
|
+
if (mode === "group") return batch.length > 0;
|
|
30
|
+
return batch.length > 1;
|
|
31
|
+
}
|
|
32
|
+
|
|
33
|
+
function batchIdFor(runId: string, taskIds: string[]): string {
|
|
34
|
+
return `${runId}_${taskIds.join("+").replace(/[^a-zA-Z0-9_+-]/g, "_")}`;
|
|
35
|
+
}
|
|
36
|
+
|
|
37
|
+
function statusList(tasks: TeamTaskState[], status: TeamTaskState["status"]): string[] {
|
|
38
|
+
return tasks.filter((task) => task.status === status).map((task) => task.id);
|
|
39
|
+
}
|
|
40
|
+
|
|
41
|
+
export function deliverGroupJoin(input: {
|
|
42
|
+
manifest: TeamRunManifest;
|
|
43
|
+
mode: CrewGroupJoinMode;
|
|
44
|
+
batch: TeamTaskState[];
|
|
45
|
+
allTasks: TeamTaskState[];
|
|
46
|
+
partial?: boolean;
|
|
47
|
+
}): CrewGroupJoinDelivery | undefined {
|
|
48
|
+
if (!shouldGroupJoin(input.mode, input.batch)) return undefined;
|
|
49
|
+
const taskIds = input.batch.map((task) => task.id);
|
|
50
|
+
const latest = taskIds.map((id) => input.allTasks.find((task) => task.id === id)).filter((task): task is TeamTaskState => Boolean(task));
|
|
51
|
+
const completed = statusList(latest, "completed");
|
|
52
|
+
const failed = statusList(latest, "failed");
|
|
53
|
+
const skipped = statusList(latest, "skipped");
|
|
54
|
+
const remaining = latest.filter((task) => task.status === "queued" || task.status === "running").map((task) => task.id);
|
|
55
|
+
const partial = input.partial ?? remaining.length > 0;
|
|
56
|
+
const batchId = batchIdFor(input.manifest.runId, taskIds);
|
|
57
|
+
const summary = aggregateTaskOutputs(latest, input.manifest);
|
|
58
|
+
const delivery: CrewGroupJoinDelivery = { batchId, mode: input.mode, partial, taskIds, completed, failed, skipped, remaining };
|
|
59
|
+
const content = `${JSON.stringify({ ...delivery, createdAt: new Date().toISOString() }, null, 2)}\n`;
|
|
60
|
+
const artifact = writeArtifact(input.manifest.artifactsRoot, {
|
|
61
|
+
kind: "metadata",
|
|
62
|
+
relativePath: `metadata/group-joins/${batchId}.json`,
|
|
63
|
+
producer: "group-join",
|
|
64
|
+
content,
|
|
65
|
+
});
|
|
66
|
+
const mailbox = appendMailboxMessage(input.manifest, {
|
|
67
|
+
direction: "outbox",
|
|
68
|
+
from: "group-join",
|
|
69
|
+
to: "leader",
|
|
70
|
+
body: [
|
|
71
|
+
`Group join ${partial ? "partial" : "completed"}: ${taskIds.join(", ")}`,
|
|
72
|
+
`Completed: ${completed.join(", ") || "none"}`,
|
|
73
|
+
`Failed: ${failed.join(", ") || "none"}`,
|
|
74
|
+
`Skipped: ${skipped.join(", ") || "none"}`,
|
|
75
|
+
`Remaining: ${remaining.join(", ") || "none"}`,
|
|
76
|
+
"",
|
|
77
|
+
summary,
|
|
78
|
+
].join("\n"),
|
|
79
|
+
status: "delivered",
|
|
80
|
+
});
|
|
81
|
+
appendEvent(input.manifest.eventsPath, {
|
|
82
|
+
type: partial ? "agent.group_join.partial" : "agent.group_join.completed",
|
|
83
|
+
runId: input.manifest.runId,
|
|
84
|
+
message: `Group join ${partial ? "partial" : "completed"} for ${taskIds.length} task(s).`,
|
|
85
|
+
data: { ...delivery, artifactPath: artifact.path, messageId: mailbox.id },
|
|
86
|
+
});
|
|
87
|
+
return { ...delivery, artifact, messageId: mailbox.id };
|
|
88
|
+
}
|
|
@@ -1,28 +1,28 @@
|
|
|
1
|
-
import type { WorkerHeartbeatState } from "./worker-heartbeat.ts";
|
|
2
|
-
|
|
3
|
-
export type HeartbeatLevel = "healthy" | "warn" | "stale" | "dead";
|
|
4
|
-
|
|
5
|
-
export interface GradientThresholds {
|
|
6
|
-
warnMs: number;
|
|
7
|
-
staleMs: number;
|
|
8
|
-
deadMs: number;
|
|
9
|
-
}
|
|
10
|
-
|
|
11
|
-
export const DEFAULT_GRADIENT_THRESHOLDS: GradientThresholds = { warnMs: 30_000, staleMs: 60_000, deadMs: 300_000 };
|
|
12
|
-
|
|
13
|
-
export function heartbeatAgeMs(heartbeat: WorkerHeartbeatState | undefined, now = Date.now()): number {
|
|
14
|
-
if (!heartbeat) return Number.POSITIVE_INFINITY;
|
|
15
|
-
const lastSeen = Date.parse(heartbeat.lastSeenAt);
|
|
16
|
-
return Number.isFinite(lastSeen) ? Math.max(0, now - lastSeen) : Number.POSITIVE_INFINITY;
|
|
17
|
-
}
|
|
18
|
-
|
|
19
|
-
export function classifyHeartbeat(heartbeat: WorkerHeartbeatState | undefined, thresholds: GradientThresholds = DEFAULT_GRADIENT_THRESHOLDS, now = Date.now()): HeartbeatLevel {
|
|
20
|
-
if (!heartbeat) return "dead";
|
|
21
|
-
if (heartbeat.alive === false) return "dead";
|
|
22
|
-
const elapsed = heartbeatAgeMs(heartbeat, now);
|
|
23
|
-
if (!Number.isFinite(elapsed)) return "dead";
|
|
24
|
-
if (elapsed > thresholds.deadMs) return "dead";
|
|
25
|
-
if (elapsed > thresholds.staleMs) return "stale";
|
|
26
|
-
if (elapsed > thresholds.warnMs) return "warn";
|
|
27
|
-
return "healthy";
|
|
28
|
-
}
|
|
1
|
+
import type { WorkerHeartbeatState } from "./worker-heartbeat.ts";
|
|
2
|
+
|
|
3
|
+
export type HeartbeatLevel = "healthy" | "warn" | "stale" | "dead";
|
|
4
|
+
|
|
5
|
+
export interface GradientThresholds {
|
|
6
|
+
warnMs: number;
|
|
7
|
+
staleMs: number;
|
|
8
|
+
deadMs: number;
|
|
9
|
+
}
|
|
10
|
+
|
|
11
|
+
export const DEFAULT_GRADIENT_THRESHOLDS: GradientThresholds = { warnMs: 30_000, staleMs: 60_000, deadMs: 300_000 };
|
|
12
|
+
|
|
13
|
+
export function heartbeatAgeMs(heartbeat: WorkerHeartbeatState | undefined, now = Date.now()): number {
|
|
14
|
+
if (!heartbeat) return Number.POSITIVE_INFINITY;
|
|
15
|
+
const lastSeen = Date.parse(heartbeat.lastSeenAt);
|
|
16
|
+
return Number.isFinite(lastSeen) ? Math.max(0, now - lastSeen) : Number.POSITIVE_INFINITY;
|
|
17
|
+
}
|
|
18
|
+
|
|
19
|
+
export function classifyHeartbeat(heartbeat: WorkerHeartbeatState | undefined, thresholds: GradientThresholds = DEFAULT_GRADIENT_THRESHOLDS, now = Date.now()): HeartbeatLevel {
|
|
20
|
+
if (!heartbeat) return "dead";
|
|
21
|
+
if (heartbeat.alive === false) return "dead";
|
|
22
|
+
const elapsed = heartbeatAgeMs(heartbeat, now);
|
|
23
|
+
if (!Number.isFinite(elapsed)) return "dead";
|
|
24
|
+
if (elapsed > thresholds.deadMs) return "dead";
|
|
25
|
+
if (elapsed > thresholds.staleMs) return "stale";
|
|
26
|
+
if (elapsed > thresholds.warnMs) return "warn";
|
|
27
|
+
return "healthy";
|
|
28
|
+
}
|
|
@@ -1,80 +1,80 @@
|
|
|
1
|
-
import type { NotificationDescriptor } from "../extension/notification-router.ts";
|
|
2
|
-
import type { MetricRegistry } from "../observability/metric-registry.ts";
|
|
3
|
-
import { appendEvent } from "../state/event-log.ts";
|
|
4
|
-
import { loadRunManifestById } from "../state/state-store.ts";
|
|
5
|
-
import type { TeamRunManifest } from "../state/types.ts";
|
|
6
|
-
import type { ManifestCache } from "./manifest-cache.ts";
|
|
7
|
-
import { classifyHeartbeat, DEFAULT_GRADIENT_THRESHOLDS, heartbeatAgeMs, type GradientThresholds, type HeartbeatLevel } from "./heartbeat-gradient.ts";
|
|
8
|
-
|
|
9
|
-
export interface HeartbeatWatcherRouter {
|
|
10
|
-
enqueue(notification: NotificationDescriptor): boolean;
|
|
11
|
-
}
|
|
12
|
-
|
|
13
|
-
export interface HeartbeatWatcherOptions {
|
|
14
|
-
cwd: string;
|
|
15
|
-
pollIntervalMs?: number;
|
|
16
|
-
thresholds?: GradientThresholds;
|
|
17
|
-
manifestCache: ManifestCache;
|
|
18
|
-
registry: MetricRegistry;
|
|
19
|
-
router: HeartbeatWatcherRouter;
|
|
20
|
-
deadletterTickThreshold?: number;
|
|
21
|
-
onDead?: (runId: string, taskId: string, elapsed: number) => void;
|
|
22
|
-
onDeadletterTrigger?: (manifest: TeamRunManifest, taskId: string) => void;
|
|
23
|
-
}
|
|
24
|
-
|
|
25
|
-
export class HeartbeatWatcher {
|
|
26
|
-
private timer?: ReturnType<typeof setInterval>;
|
|
27
|
-
private lastLevel = new Map<string, HeartbeatLevel>();
|
|
28
|
-
private consecutiveDead = new Map<string, number>();
|
|
29
|
-
private readonly opts: HeartbeatWatcherOptions;
|
|
30
|
-
|
|
31
|
-
constructor(opts: HeartbeatWatcherOptions) {
|
|
32
|
-
this.opts = opts;
|
|
33
|
-
}
|
|
34
|
-
|
|
35
|
-
start(): void {
|
|
36
|
-
this.dispose();
|
|
37
|
-
this.timer = setInterval(() => this.tick(), this.opts.pollIntervalMs ?? 5000);
|
|
38
|
-
this.timer.unref?.();
|
|
39
|
-
}
|
|
40
|
-
|
|
41
|
-
tick(now = Date.now()): void {
|
|
42
|
-
const thresholds = this.opts.thresholds ?? DEFAULT_GRADIENT_THRESHOLDS;
|
|
43
|
-
const tickThreshold = this.opts.deadletterTickThreshold ?? 3;
|
|
44
|
-
for (const run of this.opts.manifestCache.list(50)) {
|
|
45
|
-
if (run.status !== "running") continue;
|
|
46
|
-
const loaded = loadRunManifestById(this.opts.cwd, run.runId);
|
|
47
|
-
if (!loaded) continue;
|
|
48
|
-
for (const task of loaded.tasks) {
|
|
49
|
-
if (task.status !== "running") continue;
|
|
50
|
-
const key = `${run.runId}:${task.id}`;
|
|
51
|
-
const elapsed = heartbeatAgeMs(task.heartbeat, now);
|
|
52
|
-
const level = classifyHeartbeat(task.heartbeat, thresholds, now);
|
|
53
|
-
this.opts.registry.gauge("crew.heartbeat.staleness_ms", "Heartbeat elapsed since last seen, milliseconds").set({ runId: run.runId, taskId: task.id }, Number.isFinite(elapsed) ? elapsed : thresholds.deadMs);
|
|
54
|
-
this.opts.registry.counter("crew.heartbeat.level_total", "Heartbeat classifications by level").inc({ runId: run.runId, level });
|
|
55
|
-
const previous = this.lastLevel.get(key);
|
|
56
|
-
this.lastLevel.set(key, level);
|
|
57
|
-
if (level === "dead" && previous !== "dead") {
|
|
58
|
-
this.opts.registry.counter("crew.heartbeat.dead_total", "Dead heartbeat detections").inc({ runId: run.runId });
|
|
59
|
-
appendEvent(loaded.manifest.eventsPath, { type: "crew.task.heartbeat_dead", runId: run.runId, taskId: task.id, message: `Task ${task.id} heartbeat dead.`, data: { elapsedMs: Number.isFinite(elapsed) ? elapsed : undefined } });
|
|
60
|
-
this.opts.router.enqueue({ id: `dead_${run.runId}_${task.id}`, severity: "warning", source: "heartbeat-watcher", runId: run.runId, title: `Task ${task.id} heartbeat dead`, body: "Background watcher detected a stuck worker." });
|
|
61
|
-
this.opts.onDead?.(run.runId, task.id, Number.isFinite(elapsed) ? elapsed : thresholds.deadMs);
|
|
62
|
-
}
|
|
63
|
-
if (level === "dead") {
|
|
64
|
-
const count = (this.consecutiveDead.get(key) ?? 0) + 1;
|
|
65
|
-
this.consecutiveDead.set(key, count);
|
|
66
|
-
if (count === tickThreshold) this.opts.onDeadletterTrigger?.(loaded.manifest, task.id);
|
|
67
|
-
} else {
|
|
68
|
-
this.consecutiveDead.delete(key);
|
|
69
|
-
}
|
|
70
|
-
}
|
|
71
|
-
}
|
|
72
|
-
}
|
|
73
|
-
|
|
74
|
-
dispose(): void {
|
|
75
|
-
if (this.timer) clearInterval(this.timer);
|
|
76
|
-
this.timer = undefined;
|
|
77
|
-
this.lastLevel.clear();
|
|
78
|
-
this.consecutiveDead.clear();
|
|
79
|
-
}
|
|
80
|
-
}
|
|
1
|
+
import type { NotificationDescriptor } from "../extension/notification-router.ts";
|
|
2
|
+
import type { MetricRegistry } from "../observability/metric-registry.ts";
|
|
3
|
+
import { appendEvent } from "../state/event-log.ts";
|
|
4
|
+
import { loadRunManifestById } from "../state/state-store.ts";
|
|
5
|
+
import type { TeamRunManifest } from "../state/types.ts";
|
|
6
|
+
import type { ManifestCache } from "./manifest-cache.ts";
|
|
7
|
+
import { classifyHeartbeat, DEFAULT_GRADIENT_THRESHOLDS, heartbeatAgeMs, type GradientThresholds, type HeartbeatLevel } from "./heartbeat-gradient.ts";
|
|
8
|
+
|
|
9
|
+
export interface HeartbeatWatcherRouter {
|
|
10
|
+
enqueue(notification: NotificationDescriptor): boolean;
|
|
11
|
+
}
|
|
12
|
+
|
|
13
|
+
export interface HeartbeatWatcherOptions {
|
|
14
|
+
cwd: string;
|
|
15
|
+
pollIntervalMs?: number;
|
|
16
|
+
thresholds?: GradientThresholds;
|
|
17
|
+
manifestCache: ManifestCache;
|
|
18
|
+
registry: MetricRegistry;
|
|
19
|
+
router: HeartbeatWatcherRouter;
|
|
20
|
+
deadletterTickThreshold?: number;
|
|
21
|
+
onDead?: (runId: string, taskId: string, elapsed: number) => void;
|
|
22
|
+
onDeadletterTrigger?: (manifest: TeamRunManifest, taskId: string) => void;
|
|
23
|
+
}
|
|
24
|
+
|
|
25
|
+
export class HeartbeatWatcher {
|
|
26
|
+
private timer?: ReturnType<typeof setInterval>;
|
|
27
|
+
private lastLevel = new Map<string, HeartbeatLevel>();
|
|
28
|
+
private consecutiveDead = new Map<string, number>();
|
|
29
|
+
private readonly opts: HeartbeatWatcherOptions;
|
|
30
|
+
|
|
31
|
+
constructor(opts: HeartbeatWatcherOptions) {
|
|
32
|
+
this.opts = opts;
|
|
33
|
+
}
|
|
34
|
+
|
|
35
|
+
start(): void {
|
|
36
|
+
this.dispose();
|
|
37
|
+
this.timer = setInterval(() => this.tick(), this.opts.pollIntervalMs ?? 5000);
|
|
38
|
+
this.timer.unref?.();
|
|
39
|
+
}
|
|
40
|
+
|
|
41
|
+
tick(now = Date.now()): void {
|
|
42
|
+
const thresholds = this.opts.thresholds ?? DEFAULT_GRADIENT_THRESHOLDS;
|
|
43
|
+
const tickThreshold = this.opts.deadletterTickThreshold ?? 3;
|
|
44
|
+
for (const run of this.opts.manifestCache.list(50)) {
|
|
45
|
+
if (run.status !== "running") continue;
|
|
46
|
+
const loaded = loadRunManifestById(this.opts.cwd, run.runId);
|
|
47
|
+
if (!loaded) continue;
|
|
48
|
+
for (const task of loaded.tasks) {
|
|
49
|
+
if (task.status !== "running") continue;
|
|
50
|
+
const key = `${run.runId}:${task.id}`;
|
|
51
|
+
const elapsed = heartbeatAgeMs(task.heartbeat, now);
|
|
52
|
+
const level = classifyHeartbeat(task.heartbeat, thresholds, now);
|
|
53
|
+
this.opts.registry.gauge("crew.heartbeat.staleness_ms", "Heartbeat elapsed since last seen, milliseconds").set({ runId: run.runId, taskId: task.id }, Number.isFinite(elapsed) ? elapsed : thresholds.deadMs);
|
|
54
|
+
this.opts.registry.counter("crew.heartbeat.level_total", "Heartbeat classifications by level").inc({ runId: run.runId, level });
|
|
55
|
+
const previous = this.lastLevel.get(key);
|
|
56
|
+
this.lastLevel.set(key, level);
|
|
57
|
+
if (level === "dead" && previous !== "dead") {
|
|
58
|
+
this.opts.registry.counter("crew.heartbeat.dead_total", "Dead heartbeat detections").inc({ runId: run.runId });
|
|
59
|
+
appendEvent(loaded.manifest.eventsPath, { type: "crew.task.heartbeat_dead", runId: run.runId, taskId: task.id, message: `Task ${task.id} heartbeat dead.`, data: { elapsedMs: Number.isFinite(elapsed) ? elapsed : undefined } });
|
|
60
|
+
this.opts.router.enqueue({ id: `dead_${run.runId}_${task.id}`, severity: "warning", source: "heartbeat-watcher", runId: run.runId, title: `Task ${task.id} heartbeat dead`, body: "Background watcher detected a stuck worker." });
|
|
61
|
+
this.opts.onDead?.(run.runId, task.id, Number.isFinite(elapsed) ? elapsed : thresholds.deadMs);
|
|
62
|
+
}
|
|
63
|
+
if (level === "dead") {
|
|
64
|
+
const count = (this.consecutiveDead.get(key) ?? 0) + 1;
|
|
65
|
+
this.consecutiveDead.set(key, count);
|
|
66
|
+
if (count === tickThreshold) this.opts.onDeadletterTrigger?.(loaded.manifest, task.id);
|
|
67
|
+
} else {
|
|
68
|
+
this.consecutiveDead.delete(key);
|
|
69
|
+
}
|
|
70
|
+
}
|
|
71
|
+
}
|
|
72
|
+
}
|
|
73
|
+
|
|
74
|
+
dispose(): void {
|
|
75
|
+
if (this.timer) clearInterval(this.timer);
|
|
76
|
+
this.timer = undefined;
|
|
77
|
+
this.lastLevel.clear();
|
|
78
|
+
this.consecutiveDead.clear();
|
|
79
|
+
}
|
|
80
|
+
}
|