pi-crew 0.2.3 → 0.2.5
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/AGENTS.md +57 -32
- package/CHANGELOG.md +466 -448
- package/LICENSE +21 -21
- package/NOTICE.md +16 -16
- package/README.md +323 -323
- package/docs/FEATURE_INTAKE.md +126 -0
- package/docs/HARNESS.md +86 -0
- package/docs/HARNESS_BACKLOG.md +41 -0
- package/docs/TEST_MATRIX.md +49 -0
- package/docs/actions-reference.md +595 -595
- package/docs/architecture.md +180 -180
- package/docs/code-review-2026-05-11.md +592 -592
- package/docs/commands-reference.md +347 -347
- package/docs/comparison-pi-subagents-vs-pi-crew.md +303 -0
- package/docs/decisions/0001-durable-state.md +41 -0
- package/docs/decisions/0002-child-process-for-async.md +42 -0
- package/docs/decisions/0003-depth-guard.md +36 -0
- package/docs/decisions/0004-execfile-over-exec.md +34 -0
- package/docs/decisions/0005-no-parameter-properties.md +49 -0
- package/docs/decisions/0006-publish-bundled-esm.md +63 -0
- package/docs/decisions/0007-active-run-binary-index.md +54 -0
- package/docs/decisions/0008-child-pi-warm-pool.md +61 -0
- package/docs/decisions/README.md +23 -0
- package/docs/followup-review-round4-2026-05-13.md +107 -0
- package/docs/implementation-plan-top3.md +333 -0
- package/docs/live-mailbox-runtime.md +36 -36
- package/docs/next-upgrade-roadmap.md +808 -808
- package/docs/oh-my-pi-research.md +509 -0
- package/docs/perf/baseline-2026-05.md +113 -0
- package/docs/perf/final-report-2026-05.md +206 -0
- package/docs/perf/sprint-1-report.md +71 -0
- package/docs/perf/sprint-2-report.md +81 -0
- package/docs/perf/sprint-2.5-report.md +53 -0
- package/docs/perf/sprint-3-report.md +36 -0
- package/docs/perf/sprint-4-report.md +47 -0
- package/docs/perf/sprint-5-report.md +51 -0
- package/docs/perf/sprint-6-report.md +94 -0
- package/docs/perf/sprint-7-report.md +74 -0
- package/docs/perf/upgrade-plan-2026-05.md +147 -0
- package/docs/pi-subagents3-deep-analysis.md +508 -0
- package/docs/product/README.md +31 -0
- package/docs/product/platform.md +27 -0
- package/docs/product/runtime-safety.md +37 -0
- package/docs/product/team-run.md +39 -0
- package/docs/product/team-tool.md +37 -0
- package/docs/publishing.md +65 -65
- package/docs/resource-formats.md +134 -134
- package/docs/runtime-analysis-child-vs-live.md +171 -0
- package/docs/runtime-flow.md +148 -148
- package/docs/runtime-migration-in-process-analysis.md +250 -0
- package/docs/stories/README.md +30 -0
- package/docs/stories/backlog.md +36 -0
- package/docs/templates/decision.md +27 -0
- package/docs/templates/story.md +44 -0
- package/docs/templates/validation-report.md +32 -0
- package/docs/usage.md +238 -238
- package/index.ts +7 -6
- package/install.mjs +65 -65
- package/package.json +107 -100
- package/schema.json +222 -222
- package/skills/child-pi-spawning/SKILL.md +213 -0
- package/skills/context-artifact-hygiene/SKILL.md +32 -0
- package/skills/event-log-tracing/SKILL.md +299 -0
- package/skills/git-master/SKILL.md +225 -24
- package/skills/live-agent-lifecycle/SKILL.md +192 -0
- package/skills/mailbox-interactive/SKILL.md +300 -19
- package/skills/model-routing-context/SKILL.md +94 -0
- package/skills/multi-perspective-review/SKILL.md +88 -0
- package/skills/read-only-explorer/SKILL.md +250 -26
- package/skills/safe-bash/SKILL.md +307 -21
- package/skills/verification-before-done/SKILL.md +11 -2
- package/skills/widget-rendering/SKILL.md +258 -0
- package/skills/workspace-isolation/SKILL.md +202 -0
- package/skills/worktree-isolation/SKILL.md +202 -18
- package/src/adapters/claude-adapter.ts +25 -25
- package/src/adapters/codex-adapter.ts +21 -21
- package/src/adapters/cursor-adapter.ts +17 -17
- package/src/adapters/export-util.ts +137 -137
- package/src/adapters/index.ts +15 -15
- package/src/adapters/registry.ts +18 -18
- package/src/adapters/types.ts +23 -23
- package/src/agents/agent-config.ts +38 -38
- package/src/agents/agent-serializer.ts +38 -38
- package/src/agents/discover-agents.ts +121 -118
- package/src/config/config.ts +740 -858
- package/src/config/defaults.ts +96 -96
- package/src/config/drift-detector.ts +211 -211
- package/src/config/markers.ts +327 -327
- package/src/config/resilient-parser.ts +109 -108
- package/src/config/suggestions.ts +74 -74
- package/src/config/types.ts +199 -0
- package/src/extension/async-notifier.ts +123 -89
- package/src/extension/autonomous-policy.ts +169 -169
- package/src/extension/cross-extension-rpc.ts +104 -104
- package/src/extension/help.ts +47 -47
- package/src/extension/import-index.ts +69 -69
- package/src/extension/management.ts +395 -382
- package/src/extension/notification-router.ts +116 -116
- package/src/extension/notification-sink.ts +51 -51
- package/src/extension/project-init.ts +168 -168
- package/src/extension/register.ts +859 -668
- package/src/extension/registration/artifact-cleanup.ts +15 -15
- package/src/extension/registration/command-utils.ts +54 -54
- package/src/extension/registration/commands.ts +559 -452
- package/src/extension/registration/compaction-guard.ts +125 -125
- package/src/extension/registration/subagent-helpers.ts +102 -102
- package/src/extension/registration/subagent-tools.ts +220 -159
- package/src/extension/registration/team-tool.ts +159 -99
- package/src/extension/registration/viewers.ts +29 -0
- package/src/extension/result-watcher.ts +128 -128
- package/src/extension/run-bundle-schema.ts +89 -89
- package/src/extension/run-export.ts +73 -73
- package/src/extension/run-import.ts +84 -84
- package/src/extension/run-index.ts +94 -94
- package/src/extension/run-maintenance.ts +142 -142
- package/src/extension/session-summary.ts +8 -8
- package/src/extension/team-manager-command.ts +96 -96
- package/src/extension/team-recommendation.ts +188 -188
- package/src/extension/team-tool/api.ts +5 -2
- package/src/extension/team-tool/cancel.ts +224 -209
- package/src/extension/team-tool/config-patch.ts +36 -36
- package/src/extension/team-tool/context.ts +60 -60
- package/src/extension/team-tool/doctor.ts +242 -242
- package/src/extension/team-tool/handle-settings.ts +421 -195
- package/src/extension/team-tool/inspect.ts +41 -41
- package/src/extension/team-tool/lifecycle-actions.ts +139 -139
- package/src/extension/team-tool/parallel-dispatch.ts +156 -156
- package/src/extension/team-tool/plan.ts +19 -19
- package/src/extension/team-tool/respond.ts +112 -111
- package/src/extension/team-tool/run.ts +246 -229
- package/src/extension/team-tool/status.ts +110 -110
- package/src/extension/team-tool-types.ts +13 -13
- package/src/extension/team-tool.ts +344 -344
- package/src/extension/tool-result.ts +16 -16
- package/src/extension/validate-resources.ts +77 -77
- package/src/hooks/registry.ts +61 -61
- package/src/hooks/types.ts +40 -40
- package/src/i18n.ts +184 -184
- package/src/observability/correlation.ts +35 -35
- package/src/observability/event-to-metric.ts +68 -68
- package/src/observability/exporters/adapter.ts +30 -30
- package/src/observability/exporters/otlp-exporter.ts +106 -92
- package/src/observability/exporters/prometheus-exporter.ts +54 -54
- package/src/observability/metric-registry.ts +87 -87
- package/src/observability/metric-retention.ts +54 -54
- package/src/observability/metric-sink.ts +81 -56
- package/src/observability/metrics-primitives.ts +167 -167
- package/src/prompt/prompt-runtime.ts +72 -72
- package/src/runtime/adaptive-plan.ts +338 -0
- package/src/runtime/agent-control.ts +169 -169
- package/src/runtime/agent-memory.ts +72 -72
- package/src/runtime/agent-observability.ts +114 -114
- package/src/runtime/async-marker.ts +26 -26
- package/src/runtime/async-runner.ts +153 -153
- package/src/runtime/attention-events.ts +28 -28
- package/src/runtime/auto-resume.ts +100 -100
- package/src/runtime/background-runner.ts +122 -89
- package/src/runtime/cancellation.ts +61 -61
- package/src/runtime/capability-inventory.ts +116 -116
- package/src/runtime/child-pi-pool.ts +68 -0
- package/src/runtime/child-pi.ts +541 -461
- package/src/runtime/code-summary.ts +247 -247
- package/src/runtime/compaction-summary.ts +271 -271
- package/src/runtime/concurrency.ts +58 -58
- package/src/runtime/crash-recovery.ts +317 -301
- package/src/runtime/crew-agent-records.ts +379 -281
- package/src/runtime/crew-agent-runtime.ts +60 -60
- package/src/runtime/cross-extension-rpc.ts +72 -0
- package/src/runtime/custom-tools/irc-tool.ts +201 -201
- package/src/runtime/custom-tools/submit-result-tool.ts +90 -90
- package/src/runtime/deadletter.ts +47 -47
- package/src/runtime/delivery-coordinator.ts +176 -176
- package/src/runtime/delta-conflict.ts +360 -360
- package/src/runtime/diagnostic-export.ts +102 -102
- package/src/runtime/direct-run.ts +35 -35
- package/src/runtime/effectiveness.ts +82 -81
- package/src/runtime/errors/crew-errors.ts +166 -0
- package/src/runtime/event-stream-bridge.ts +92 -92
- package/src/runtime/foreground-control.ts +82 -82
- package/src/runtime/green-contract.ts +46 -46
- package/src/runtime/group-join.ts +234 -106
- package/src/runtime/heartbeat-watcher.ts +145 -124
- package/src/runtime/iteration-hooks.ts +267 -267
- package/src/runtime/live-agent-control.ts +88 -88
- package/src/runtime/live-agent-manager.ts +377 -179
- package/src/runtime/live-control-realtime.ts +36 -36
- package/src/runtime/live-session-runtime.ts +676 -600
- package/src/runtime/loop-gates.ts +129 -129
- package/src/runtime/manifest-cache.ts +263 -263
- package/src/runtime/mcp-proxy.ts +113 -113
- package/src/runtime/metric-parser.ts +40 -40
- package/src/runtime/model-fallback.ts +282 -274
- package/src/runtime/model-resolver.ts +118 -0
- package/src/runtime/output-validator.ts +187 -187
- package/src/runtime/overflow-recovery.ts +175 -175
- package/src/runtime/parallel-research.ts +44 -44
- package/src/runtime/parallel-utils.ts +156 -156
- package/src/runtime/parent-guard.ts +80 -80
- package/src/runtime/phase-progress.ts +217 -217
- package/src/runtime/pi-args.ts +165 -165
- package/src/runtime/pi-json-output.ts +111 -111
- package/src/runtime/pi-spawn.ts +167 -167
- package/src/runtime/policy-engine.ts +79 -79
- package/src/runtime/post-checks.ts +125 -125
- package/src/runtime/post-exit-stdio-guard.ts +86 -86
- package/src/runtime/process-status.ts +97 -73
- package/src/runtime/progress-event-coalescer.ts +43 -43
- package/src/runtime/recovery-recipes.ts +74 -74
- package/src/runtime/retry-executor.ts +81 -81
- package/src/runtime/role-permission.ts +39 -39
- package/src/runtime/run-tracker.ts +99 -0
- package/src/runtime/runtime-policy.ts +21 -0
- package/src/runtime/runtime-resolver.ts +94 -91
- package/src/runtime/scheduler.ts +294 -0
- package/src/runtime/semaphore.ts +131 -131
- package/src/runtime/sensitive-paths.ts +92 -92
- package/src/runtime/session-usage.ts +79 -79
- package/src/runtime/settings-store.ts +103 -0
- package/src/runtime/sidechain-output.ts +29 -29
- package/src/runtime/skill-instructions.ts +222 -222
- package/src/runtime/stale-reconciler.ts +198 -189
- package/src/runtime/streaming-output.ts +47 -0
- package/src/runtime/subagent-manager.ts +404 -400
- package/src/runtime/subprocess-tool-registry.ts +67 -67
- package/src/runtime/task-display.ts +38 -38
- package/src/runtime/task-graph-scheduler.ts +122 -122
- package/src/runtime/task-graph.ts +207 -207
- package/src/runtime/task-output-context.ts +177 -177
- package/src/runtime/task-packet.ts +93 -93
- package/src/runtime/task-quality.ts +207 -207
- package/src/runtime/task-runner/capabilities.ts +78 -78
- package/src/runtime/task-runner/live-executor.ts +131 -113
- package/src/runtime/task-runner/progress.ts +119 -119
- package/src/runtime/task-runner/prompt-builder.ts +139 -139
- package/src/runtime/task-runner/prompt-pipeline.ts +64 -64
- package/src/runtime/task-runner/result-utils.ts +14 -14
- package/src/runtime/task-runner/run-projection.ts +103 -103
- package/src/runtime/task-runner/state-helpers.ts +22 -22
- package/src/runtime/task-runner.ts +469 -459
- package/src/runtime/team-runner.ts +693 -945
- package/src/runtime/usage-tracker.ts +71 -0
- package/src/runtime/worker-heartbeat.ts +21 -21
- package/src/runtime/worker-startup.ts +57 -57
- package/src/runtime/workflow-state.ts +187 -187
- package/src/runtime/yield-handler.ts +190 -190
- package/src/schema/config-schema.ts +172 -168
- package/src/schema/team-tool-schema.ts +126 -126
- package/src/schema/validation-types.ts +151 -148
- package/src/skills/discover-skills.ts +67 -67
- package/src/skills/skill-templates.ts +374 -374
- package/src/state/active-run-registry.ts +227 -191
- package/src/state/artifact-store.ts +130 -129
- package/src/state/atomic-write.ts +262 -195
- package/src/state/blob-store.ts +116 -116
- package/src/state/contracts.ts +111 -111
- package/src/state/event-log-rotation.ts +161 -158
- package/src/state/event-log.ts +383 -303
- package/src/state/event-reconstructor.ts +217 -217
- package/src/state/jsonl-writer.ts +82 -82
- package/src/state/locks.ts +146 -146
- package/src/state/mailbox.ts +446 -405
- package/src/state/state-store.ts +364 -351
- package/src/state/task-claims.ts +44 -44
- package/src/state/types.ts +285 -285
- package/src/state/usage.ts +29 -29
- package/src/subagents/async-entry.ts +1 -1
- package/src/subagents/index.ts +3 -3
- package/src/subagents/live/control.ts +1 -1
- package/src/subagents/live/manager.ts +1 -1
- package/src/subagents/live/realtime.ts +1 -1
- package/src/subagents/live/session-runtime.ts +1 -1
- package/src/subagents/manager.ts +1 -1
- package/src/subagents/spawn.ts +1 -1
- package/src/teams/discover-teams.ts +116 -116
- package/src/teams/team-config.ts +27 -27
- package/src/teams/team-serializer.ts +38 -38
- package/src/types/diff.d.ts +18 -18
- package/src/ui/agent-management-overlay.ts +144 -144
- package/src/ui/crew-widget.ts +487 -370
- package/src/ui/dashboard-panes/agents-pane.ts +109 -28
- package/src/ui/dashboard-panes/cancellation-pane.ts +42 -42
- package/src/ui/dashboard-panes/capability-pane.ts +59 -59
- package/src/ui/dashboard-panes/health-pane.ts +30 -30
- package/src/ui/dashboard-panes/mailbox-pane.ts +35 -35
- package/src/ui/dashboard-panes/progress-pane.ts +30 -30
- package/src/ui/dashboard-panes/transcript-pane.ts +10 -10
- package/src/ui/heartbeat-aggregator.ts +63 -63
- package/src/ui/keybinding-map.ts +97 -94
- package/src/ui/live-conversation-overlay.ts +152 -0
- package/src/ui/live-run-sidebar.ts +180 -180
- package/src/ui/mascot.ts +442 -442
- package/src/ui/overlays/agent-picker-overlay.ts +57 -57
- package/src/ui/overlays/confirm-overlay.ts +58 -58
- package/src/ui/overlays/mailbox-compose-overlay.ts +144 -144
- package/src/ui/overlays/mailbox-compose-preview.ts +63 -63
- package/src/ui/overlays/mailbox-detail-overlay.ts +122 -122
- package/src/ui/pi-ui-compat.ts +57 -57
- package/src/ui/powerbar-publisher.ts +221 -197
- package/src/ui/render-scheduler.ts +216 -143
- package/src/ui/run-action-dispatcher.ts +118 -118
- package/src/ui/run-dashboard.ts +526 -464
- package/src/ui/run-event-bus.ts +208 -208
- package/src/ui/run-snapshot-cache.ts +826 -777
- package/src/ui/settings-overlay.ts +721 -0
- package/src/ui/snapshot-types.ts +86 -70
- package/src/ui/theme-adapter.ts +190 -190
- package/src/ui/tool-progress-formatter.ts +89 -0
- package/src/ui/transcript-cache.ts +94 -94
- package/src/ui/transcript-viewer.ts +335 -335
- package/src/utils/conflict-detect.ts +662 -0
- package/src/utils/file-coalescer.ts +86 -86
- package/src/utils/frontmatter.ts +68 -68
- package/src/utils/fs-watch.ts +88 -31
- package/src/utils/gh-protocol.ts +479 -0
- package/src/utils/ids.ts +17 -17
- package/src/utils/incremental-reader.ts +104 -104
- package/src/utils/internal-error.ts +6 -6
- package/src/utils/names.ts +27 -27
- package/src/utils/paths.ts +102 -63
- package/src/utils/redaction.ts +44 -44
- package/src/utils/safe-paths.ts +47 -47
- package/src/utils/scan-cache.ts +136 -136
- package/src/utils/sse-parser.ts +134 -134
- package/src/utils/task-name-generator.ts +337 -337
- package/src/utils/timings.ts +33 -33
- package/src/utils/visual.ts +243 -198
- package/src/workflows/discover-workflows.ts +139 -139
- package/src/workflows/validate-workflow.ts +40 -40
- package/src/workflows/workflow-config.ts +26 -26
- package/src/workflows/workflow-serializer.ts +32 -32
- package/src/worktree/branch-freshness.ts +45 -45
- package/src/worktree/cleanup.ts +75 -75
- package/src/worktree/worktree-manager.ts +188 -188
- package/teams/default.team.md +12 -12
- package/teams/fast-fix.team.md +11 -11
- package/teams/implementation.team.md +18 -18
- package/teams/parallel-research.team.md +14 -14
- package/teams/research.team.md +11 -11
- package/teams/review.team.md +12 -12
- package/tsconfig.json +19 -19
- package/workflows/default.workflow.md +30 -30
- package/workflows/fast-fix.workflow.md +23 -23
- package/workflows/implementation.workflow.md +43 -43
- package/workflows/parallel-research.workflow.md +46 -46
- package/workflows/research.workflow.md +22 -22
- package/workflows/review.workflow.md +30 -30
- package/skills/task-packet/SKILL.md +0 -28
- package/skills/verify-evidence/SKILL.md +0 -27
|
@@ -1,600 +1,676 @@
|
|
|
1
|
-
import * as fs from "node:fs";
|
|
2
|
-
import * as path from "node:path";
|
|
3
|
-
import type { AgentConfig } from "../agents/agent-config.ts";
|
|
4
|
-
import type { CrewRuntimeConfig } from "../config/config.ts";
|
|
5
|
-
import type { TeamRunManifest, TeamTaskState, UsageState } from "../state/types.ts";
|
|
6
|
-
import {
|
|
7
|
-
import {
|
|
8
|
-
import {
|
|
9
|
-
import {
|
|
10
|
-
import {
|
|
11
|
-
import type
|
|
12
|
-
import {
|
|
13
|
-
import {
|
|
14
|
-
import {
|
|
15
|
-
import {
|
|
16
|
-
import {
|
|
17
|
-
import {
|
|
18
|
-
import {
|
|
19
|
-
import {
|
|
20
|
-
import {
|
|
21
|
-
import {
|
|
22
|
-
|
|
23
|
-
|
|
24
|
-
import {
|
|
25
|
-
|
|
26
|
-
|
|
27
|
-
import {
|
|
28
|
-
|
|
29
|
-
|
|
30
|
-
|
|
31
|
-
|
|
32
|
-
|
|
33
|
-
|
|
34
|
-
|
|
35
|
-
|
|
36
|
-
|
|
37
|
-
|
|
38
|
-
|
|
39
|
-
|
|
40
|
-
|
|
41
|
-
|
|
42
|
-
|
|
43
|
-
|
|
44
|
-
|
|
45
|
-
|
|
46
|
-
|
|
47
|
-
|
|
48
|
-
|
|
49
|
-
|
|
50
|
-
|
|
51
|
-
|
|
52
|
-
|
|
53
|
-
|
|
54
|
-
|
|
55
|
-
|
|
56
|
-
|
|
57
|
-
|
|
58
|
-
|
|
59
|
-
|
|
60
|
-
|
|
61
|
-
|
|
62
|
-
|
|
63
|
-
|
|
64
|
-
|
|
65
|
-
}
|
|
66
|
-
|
|
67
|
-
export interface
|
|
68
|
-
available:
|
|
69
|
-
reason: string;
|
|
70
|
-
}
|
|
71
|
-
|
|
72
|
-
|
|
73
|
-
|
|
74
|
-
|
|
75
|
-
|
|
76
|
-
|
|
77
|
-
|
|
78
|
-
}
|
|
79
|
-
|
|
80
|
-
|
|
81
|
-
|
|
82
|
-
|
|
83
|
-
|
|
84
|
-
|
|
85
|
-
|
|
86
|
-
|
|
87
|
-
|
|
88
|
-
|
|
89
|
-
|
|
90
|
-
|
|
91
|
-
|
|
92
|
-
|
|
93
|
-
|
|
94
|
-
|
|
95
|
-
|
|
96
|
-
}
|
|
97
|
-
|
|
98
|
-
function
|
|
99
|
-
|
|
100
|
-
}
|
|
101
|
-
|
|
102
|
-
|
|
103
|
-
|
|
104
|
-
|
|
105
|
-
return
|
|
106
|
-
|
|
107
|
-
|
|
108
|
-
|
|
109
|
-
|
|
110
|
-
|
|
111
|
-
|
|
112
|
-
|
|
113
|
-
|
|
114
|
-
|
|
115
|
-
|
|
116
|
-
|
|
117
|
-
|
|
118
|
-
|
|
119
|
-
|
|
120
|
-
|
|
121
|
-
|
|
122
|
-
|
|
123
|
-
|
|
124
|
-
|
|
125
|
-
|
|
126
|
-
const
|
|
127
|
-
if (
|
|
128
|
-
|
|
129
|
-
|
|
130
|
-
|
|
131
|
-
|
|
132
|
-
|
|
133
|
-
|
|
134
|
-
|
|
135
|
-
|
|
136
|
-
|
|
137
|
-
|
|
138
|
-
|
|
139
|
-
|
|
140
|
-
|
|
141
|
-
|
|
142
|
-
|
|
143
|
-
|
|
144
|
-
|
|
145
|
-
|
|
146
|
-
|
|
147
|
-
|
|
148
|
-
|
|
149
|
-
|
|
150
|
-
|
|
151
|
-
|
|
152
|
-
|
|
153
|
-
|
|
154
|
-
|
|
155
|
-
|
|
156
|
-
|
|
157
|
-
|
|
158
|
-
|
|
159
|
-
|
|
160
|
-
|
|
161
|
-
|
|
162
|
-
|
|
163
|
-
|
|
164
|
-
|
|
165
|
-
|
|
166
|
-
|
|
167
|
-
|
|
168
|
-
|
|
169
|
-
|
|
170
|
-
|
|
171
|
-
|
|
172
|
-
|
|
173
|
-
|
|
174
|
-
|
|
175
|
-
|
|
176
|
-
|
|
177
|
-
|
|
178
|
-
|
|
179
|
-
|
|
180
|
-
"
|
|
181
|
-
|
|
182
|
-
|
|
183
|
-
"
|
|
184
|
-
"
|
|
185
|
-
"
|
|
186
|
-
"
|
|
187
|
-
|
|
188
|
-
|
|
189
|
-
|
|
190
|
-
|
|
191
|
-
|
|
192
|
-
|
|
193
|
-
"
|
|
194
|
-
|
|
195
|
-
|
|
196
|
-
|
|
197
|
-
|
|
198
|
-
|
|
199
|
-
|
|
200
|
-
"
|
|
201
|
-
"
|
|
202
|
-
"
|
|
203
|
-
"
|
|
204
|
-
].join("\n");
|
|
205
|
-
if (role === "
|
|
206
|
-
"## Output Contract",
|
|
207
|
-
"<path>:<line
|
|
208
|
-
"
|
|
209
|
-
"
|
|
210
|
-
|
|
211
|
-
|
|
212
|
-
|
|
213
|
-
"
|
|
214
|
-
"
|
|
215
|
-
"
|
|
216
|
-
"
|
|
217
|
-
].join("\n");
|
|
218
|
-
if (role === "
|
|
219
|
-
|
|
220
|
-
|
|
221
|
-
|
|
222
|
-
|
|
223
|
-
|
|
224
|
-
|
|
225
|
-
|
|
226
|
-
|
|
227
|
-
|
|
228
|
-
|
|
229
|
-
|
|
230
|
-
|
|
231
|
-
|
|
232
|
-
|
|
233
|
-
|
|
234
|
-
|
|
235
|
-
|
|
236
|
-
|
|
237
|
-
|
|
238
|
-
|
|
239
|
-
|
|
240
|
-
|
|
241
|
-
|
|
242
|
-
|
|
243
|
-
|
|
244
|
-
|
|
245
|
-
|
|
246
|
-
|
|
247
|
-
|
|
248
|
-
|
|
249
|
-
|
|
250
|
-
|
|
251
|
-
"",
|
|
252
|
-
|
|
253
|
-
|
|
254
|
-
|
|
255
|
-
|
|
256
|
-
input.
|
|
257
|
-
|
|
258
|
-
|
|
259
|
-
|
|
260
|
-
|
|
261
|
-
|
|
262
|
-
|
|
263
|
-
|
|
264
|
-
|
|
265
|
-
|
|
266
|
-
|
|
267
|
-
|
|
268
|
-
|
|
269
|
-
|
|
270
|
-
const
|
|
271
|
-
|
|
272
|
-
|
|
273
|
-
|
|
274
|
-
|
|
275
|
-
|
|
276
|
-
const
|
|
277
|
-
|
|
278
|
-
|
|
279
|
-
|
|
280
|
-
|
|
281
|
-
|
|
282
|
-
const
|
|
283
|
-
|
|
284
|
-
return
|
|
285
|
-
}
|
|
286
|
-
|
|
287
|
-
|
|
288
|
-
const
|
|
289
|
-
|
|
290
|
-
|
|
291
|
-
|
|
292
|
-
|
|
293
|
-
|
|
294
|
-
|
|
295
|
-
|
|
296
|
-
|
|
297
|
-
|
|
298
|
-
|
|
299
|
-
|
|
300
|
-
|
|
301
|
-
|
|
302
|
-
|
|
303
|
-
|
|
304
|
-
|
|
305
|
-
|
|
306
|
-
|
|
307
|
-
|
|
308
|
-
}
|
|
309
|
-
|
|
310
|
-
|
|
311
|
-
|
|
312
|
-
const
|
|
313
|
-
|
|
314
|
-
|
|
315
|
-
|
|
316
|
-
let
|
|
317
|
-
let
|
|
318
|
-
|
|
319
|
-
|
|
320
|
-
|
|
321
|
-
|
|
322
|
-
|
|
323
|
-
|
|
324
|
-
|
|
325
|
-
|
|
326
|
-
|
|
327
|
-
|
|
328
|
-
|
|
329
|
-
|
|
330
|
-
|
|
331
|
-
|
|
332
|
-
|
|
333
|
-
|
|
334
|
-
|
|
335
|
-
|
|
336
|
-
|
|
337
|
-
|
|
338
|
-
|
|
339
|
-
|
|
340
|
-
|
|
341
|
-
|
|
342
|
-
|
|
343
|
-
|
|
344
|
-
|
|
345
|
-
|
|
346
|
-
|
|
347
|
-
|
|
348
|
-
|
|
349
|
-
|
|
350
|
-
|
|
351
|
-
|
|
352
|
-
|
|
353
|
-
|
|
354
|
-
|
|
355
|
-
|
|
356
|
-
|
|
357
|
-
|
|
358
|
-
|
|
359
|
-
|
|
360
|
-
|
|
361
|
-
|
|
362
|
-
|
|
363
|
-
|
|
364
|
-
|
|
365
|
-
|
|
366
|
-
|
|
367
|
-
|
|
368
|
-
|
|
369
|
-
|
|
370
|
-
|
|
371
|
-
|
|
372
|
-
|
|
373
|
-
//
|
|
374
|
-
const
|
|
375
|
-
|
|
376
|
-
|
|
377
|
-
|
|
378
|
-
|
|
379
|
-
|
|
380
|
-
|
|
381
|
-
|
|
382
|
-
|
|
383
|
-
|
|
384
|
-
|
|
385
|
-
|
|
386
|
-
}
|
|
387
|
-
|
|
388
|
-
|
|
389
|
-
|
|
390
|
-
|
|
391
|
-
|
|
392
|
-
|
|
393
|
-
|
|
394
|
-
|
|
395
|
-
|
|
396
|
-
|
|
397
|
-
|
|
398
|
-
|
|
399
|
-
|
|
400
|
-
|
|
401
|
-
|
|
402
|
-
|
|
403
|
-
|
|
404
|
-
|
|
405
|
-
})
|
|
406
|
-
|
|
407
|
-
|
|
408
|
-
|
|
409
|
-
}
|
|
410
|
-
|
|
411
|
-
|
|
412
|
-
|
|
413
|
-
|
|
414
|
-
|
|
415
|
-
|
|
416
|
-
if
|
|
417
|
-
|
|
418
|
-
|
|
419
|
-
|
|
420
|
-
|
|
421
|
-
|
|
422
|
-
|
|
423
|
-
|
|
424
|
-
|
|
425
|
-
|
|
426
|
-
|
|
427
|
-
|
|
428
|
-
|
|
429
|
-
|
|
430
|
-
|
|
431
|
-
|
|
432
|
-
|
|
433
|
-
|
|
434
|
-
|
|
435
|
-
|
|
436
|
-
|
|
437
|
-
|
|
438
|
-
|
|
439
|
-
|
|
440
|
-
|
|
441
|
-
|
|
442
|
-
|
|
443
|
-
|
|
444
|
-
|
|
445
|
-
|
|
446
|
-
|
|
447
|
-
|
|
448
|
-
|
|
449
|
-
|
|
450
|
-
|
|
451
|
-
|
|
452
|
-
|
|
453
|
-
|
|
454
|
-
|
|
455
|
-
|
|
456
|
-
|
|
457
|
-
|
|
458
|
-
|
|
459
|
-
|
|
460
|
-
|
|
461
|
-
|
|
462
|
-
|
|
463
|
-
|
|
464
|
-
|
|
465
|
-
|
|
466
|
-
|
|
467
|
-
|
|
468
|
-
|
|
469
|
-
|
|
470
|
-
|
|
471
|
-
|
|
472
|
-
|
|
473
|
-
|
|
474
|
-
|
|
475
|
-
|
|
476
|
-
|
|
477
|
-
|
|
478
|
-
|
|
479
|
-
|
|
480
|
-
|
|
481
|
-
|
|
482
|
-
|
|
483
|
-
|
|
484
|
-
|
|
485
|
-
|
|
486
|
-
|
|
487
|
-
|
|
488
|
-
}
|
|
489
|
-
|
|
490
|
-
|
|
491
|
-
|
|
492
|
-
|
|
493
|
-
|
|
494
|
-
|
|
495
|
-
|
|
496
|
-
|
|
497
|
-
|
|
498
|
-
|
|
499
|
-
const
|
|
500
|
-
|
|
501
|
-
|
|
502
|
-
|
|
503
|
-
|
|
504
|
-
|
|
505
|
-
|
|
506
|
-
|
|
507
|
-
|
|
508
|
-
|
|
509
|
-
|
|
510
|
-
|
|
511
|
-
|
|
512
|
-
|
|
513
|
-
|
|
514
|
-
|
|
515
|
-
|
|
516
|
-
|
|
517
|
-
|
|
518
|
-
|
|
519
|
-
|
|
520
|
-
|
|
521
|
-
|
|
522
|
-
|
|
523
|
-
|
|
524
|
-
|
|
525
|
-
|
|
526
|
-
|
|
527
|
-
|
|
528
|
-
|
|
529
|
-
|
|
530
|
-
|
|
531
|
-
|
|
532
|
-
|
|
533
|
-
|
|
534
|
-
|
|
535
|
-
|
|
536
|
-
|
|
537
|
-
|
|
538
|
-
|
|
539
|
-
|
|
540
|
-
|
|
541
|
-
|
|
542
|
-
|
|
543
|
-
|
|
544
|
-
|
|
545
|
-
|
|
546
|
-
|
|
547
|
-
|
|
548
|
-
|
|
549
|
-
|
|
550
|
-
|
|
551
|
-
|
|
552
|
-
|
|
553
|
-
|
|
554
|
-
|
|
555
|
-
|
|
556
|
-
|
|
557
|
-
|
|
558
|
-
|
|
559
|
-
|
|
560
|
-
|
|
561
|
-
|
|
562
|
-
|
|
563
|
-
|
|
564
|
-
|
|
565
|
-
|
|
566
|
-
|
|
567
|
-
|
|
568
|
-
|
|
569
|
-
|
|
570
|
-
|
|
571
|
-
|
|
572
|
-
|
|
573
|
-
|
|
574
|
-
|
|
575
|
-
|
|
576
|
-
|
|
577
|
-
|
|
578
|
-
|
|
579
|
-
|
|
580
|
-
|
|
581
|
-
|
|
582
|
-
|
|
583
|
-
|
|
584
|
-
|
|
585
|
-
|
|
586
|
-
|
|
587
|
-
|
|
588
|
-
|
|
589
|
-
|
|
590
|
-
|
|
591
|
-
|
|
592
|
-
if
|
|
593
|
-
|
|
594
|
-
|
|
595
|
-
|
|
596
|
-
|
|
597
|
-
|
|
598
|
-
|
|
599
|
-
|
|
600
|
-
|
|
1
|
+
import * as fs from "node:fs";
|
|
2
|
+
import * as path from "node:path";
|
|
3
|
+
import type { AgentConfig } from "../agents/agent-config.ts";
|
|
4
|
+
import type { CrewRuntimeConfig } from "../config/config.ts";
|
|
5
|
+
import type { TeamRunManifest, TeamTaskState, UsageState } from "../state/types.ts";
|
|
6
|
+
import { appendEvent } from "../state/event-log.ts";
|
|
7
|
+
import { buildMemoryBlock } from "./agent-memory.ts";
|
|
8
|
+
import { trackTaskUsage } from "./usage-tracker.ts";
|
|
9
|
+
import { createStreamingOutput, type StreamingOutputHandle } from "./streaming-output.ts";
|
|
10
|
+
import { registerLiveAgent, disposeLiveAgentSession, terminateLiveAgent, updateLiveAgentStatus, trackLiveAgentToolStart, trackLiveAgentToolEnd, trackLiveAgentTurnEnd, trackLiveAgentResponseText, markLiveAgentCompleted } from "./live-agent-manager.ts";
|
|
11
|
+
import { applyLiveAgentControlRequest, applyLiveAgentControlRequests, type LiveAgentControlCursor } from "./live-agent-control.ts";
|
|
12
|
+
import { subscribeLiveControlRealtime } from "./live-control-realtime.ts";
|
|
13
|
+
import { eventToSidechainType, sidechainOutputPath, writeSidechainEntry } from "./sidechain-output.ts";
|
|
14
|
+
import type { WorkflowStep } from "../workflows/workflow-config.ts";
|
|
15
|
+
import { isLiveSessionRuntimeAvailable } from "./runtime-resolver.ts";
|
|
16
|
+
import { redactSecrets } from "../utils/redaction.ts";
|
|
17
|
+
import { buildConfiguredModelRouting } from "./model-fallback.ts";
|
|
18
|
+
import { DEFAULT_LIVE_SESSION } from "../config/defaults.ts";
|
|
19
|
+
import { buildYieldReminder, hasYieldInOutput, isYieldEvent, extractYieldResult, validateYieldData, DEFAULT_YIELD_CONFIG, type YieldResult } from "./yield-handler.ts";
|
|
20
|
+
import { buildMcpProxyFromSession } from "./mcp-proxy.ts";
|
|
21
|
+
import { createSubmitResultTool } from "./custom-tools/submit-result-tool.ts";
|
|
22
|
+
import { createIrcTool } from "./custom-tools/irc-tool.ts";
|
|
23
|
+
import { buildExtensionBridge } from "./live-extension-bridge.ts";
|
|
24
|
+
import { logInternalError } from "../utils/internal-error.ts";
|
|
25
|
+
// prose-compressor imported for custom tool descriptions below;
|
|
26
|
+
// tool description compression for SDK-managed tools awaits SDK support.
|
|
27
|
+
import { compressToolDescription } from "./prose-compressor.ts";
|
|
28
|
+
import { buildSensitivePathConstraint } from "./sensitive-paths.ts";
|
|
29
|
+
import { collectLiveSessionHealth, formatLiveSessionDiagnostics, type LiveSessionHealth } from "./live-session-health.ts";
|
|
30
|
+
import { listLiveAgents } from "./live-agent-manager.ts";
|
|
31
|
+
|
|
32
|
+
export interface LiveSessionSpawnInput {
|
|
33
|
+
manifest: TeamRunManifest;
|
|
34
|
+
task: TeamTaskState;
|
|
35
|
+
step: WorkflowStep;
|
|
36
|
+
agent: AgentConfig;
|
|
37
|
+
prompt: string;
|
|
38
|
+
signal?: AbortSignal;
|
|
39
|
+
transcriptPath?: string;
|
|
40
|
+
onEvent?: (event: unknown) => void;
|
|
41
|
+
onOutput?: (text: string) => void;
|
|
42
|
+
runtimeConfig?: CrewRuntimeConfig;
|
|
43
|
+
parentContext?: string;
|
|
44
|
+
parentModel?: unknown;
|
|
45
|
+
modelRegistry?: unknown;
|
|
46
|
+
modelOverride?: string;
|
|
47
|
+
teamRoleModel?: string;
|
|
48
|
+
isCurrent?: () => boolean;
|
|
49
|
+
/** Workspace where this run was initiated — used for session-scoped live-agent visibility. */
|
|
50
|
+
workspaceId: string;
|
|
51
|
+
/** Phase 2: Output schema for validating yield data. */
|
|
52
|
+
outputSchema?: unknown;
|
|
53
|
+
}
|
|
54
|
+
|
|
55
|
+
export interface LiveSessionRunResult {
|
|
56
|
+
available: true;
|
|
57
|
+
exitCode: number | null;
|
|
58
|
+
stdout: string;
|
|
59
|
+
stderr: string;
|
|
60
|
+
jsonEvents: number;
|
|
61
|
+
usage?: UsageState;
|
|
62
|
+
error?: string;
|
|
63
|
+
/** Phase 1: Extracted yield result from submit_result tool call. */
|
|
64
|
+
yieldResult?: YieldResult;
|
|
65
|
+
}
|
|
66
|
+
|
|
67
|
+
export interface LiveSessionUnavailableResult {
|
|
68
|
+
available: false;
|
|
69
|
+
reason: string;
|
|
70
|
+
}
|
|
71
|
+
|
|
72
|
+
export interface LiveSessionPlannedResult {
|
|
73
|
+
available: true;
|
|
74
|
+
reason: string;
|
|
75
|
+
}
|
|
76
|
+
|
|
77
|
+
type LiveSessionModule = Record<string, unknown> & {
|
|
78
|
+
createAgentSession?: (options?: Record<string, unknown>) => Promise<{ session: LiveSessionLike; modelFallbackMessage?: string }>;
|
|
79
|
+
DefaultResourceLoader?: new (options: Record<string, unknown>) => { reload?: () => Promise<void> };
|
|
80
|
+
SessionManager?: { inMemory?: (cwd?: string) => unknown; create?: (cwd?: string, sessionDir?: string) => unknown };
|
|
81
|
+
SettingsManager?: { create?: (cwd?: string, agentDir?: string) => unknown };
|
|
82
|
+
getAgentDir?: () => string;
|
|
83
|
+
};
|
|
84
|
+
|
|
85
|
+
type LiveSessionLike = {
|
|
86
|
+
subscribe?: (listener: (event: unknown) => void) => (() => void);
|
|
87
|
+
prompt?: (text: string, options?: Record<string, unknown>) => Promise<void>;
|
|
88
|
+
steer?: (text: string) => Promise<void>;
|
|
89
|
+
abort?: () => Promise<void> | void;
|
|
90
|
+
dispose?: () => void;
|
|
91
|
+
getStats?: () => unknown;
|
|
92
|
+
stats?: unknown;
|
|
93
|
+
bindExtensions?: (bindings?: Record<string, unknown>) => Promise<void>;
|
|
94
|
+
getActiveToolNames?: () => string[];
|
|
95
|
+
setActiveToolsByName?: (names: string[]) => void;
|
|
96
|
+
};
|
|
97
|
+
|
|
98
|
+
function appendTranscript(filePath: string | undefined, event: unknown): void {
|
|
99
|
+
if (!filePath) return;
|
|
100
|
+
fs.mkdirSync(path.dirname(filePath), { recursive: true });
|
|
101
|
+
fs.appendFileSync(filePath, `${JSON.stringify(redactSecrets(event))}\n`, "utf-8");
|
|
102
|
+
}
|
|
103
|
+
|
|
104
|
+
function asRecord(value: unknown): Record<string, unknown> | undefined {
|
|
105
|
+
return value && typeof value === "object" && !Array.isArray(value) ? value as Record<string, unknown> : undefined;
|
|
106
|
+
}
|
|
107
|
+
|
|
108
|
+
function textFromContent(content: unknown): string[] {
|
|
109
|
+
if (typeof content === "string") return [content];
|
|
110
|
+
if (!Array.isArray(content)) return [];
|
|
111
|
+
return content.flatMap((part) => {
|
|
112
|
+
const obj = asRecord(part);
|
|
113
|
+
if (!obj) return [];
|
|
114
|
+
if (obj.type === "text" && typeof obj.text === "string") return [obj.text];
|
|
115
|
+
if (typeof obj.content === "string") return [obj.content];
|
|
116
|
+
return [];
|
|
117
|
+
});
|
|
118
|
+
}
|
|
119
|
+
|
|
120
|
+
function eventText(event: unknown): string[] {
|
|
121
|
+
const obj = asRecord(event);
|
|
122
|
+
if (!obj) return [];
|
|
123
|
+
const text: string[] = [];
|
|
124
|
+
if (typeof obj.text === "string") text.push(obj.text);
|
|
125
|
+
text.push(...textFromContent(obj.content));
|
|
126
|
+
const message = asRecord(obj.message);
|
|
127
|
+
if (message) text.push(...textFromContent(message.content));
|
|
128
|
+
return text.filter((entry) => entry.trim());
|
|
129
|
+
}
|
|
130
|
+
|
|
131
|
+
function finalAssistantText(event: unknown): string[] {
|
|
132
|
+
const obj = asRecord(event);
|
|
133
|
+
if (!obj || obj.type !== "message_end") return [];
|
|
134
|
+
const message = asRecord(obj.message);
|
|
135
|
+
if (message?.role !== "assistant") return [];
|
|
136
|
+
return textFromContent(message.content);
|
|
137
|
+
}
|
|
138
|
+
|
|
139
|
+
function numberField(obj: Record<string, unknown> | undefined, keys: string[]): number | undefined {
|
|
140
|
+
if (!obj) return undefined;
|
|
141
|
+
for (const key of keys) {
|
|
142
|
+
const value = obj[key];
|
|
143
|
+
if (typeof value === "number" && Number.isFinite(value)) return value;
|
|
144
|
+
}
|
|
145
|
+
return undefined;
|
|
146
|
+
}
|
|
147
|
+
|
|
148
|
+
function modelFromRegistry(modelRegistry: unknown, modelId: string | undefined): unknown {
|
|
149
|
+
if (!modelId || !modelId.includes("/")) return undefined;
|
|
150
|
+
const registry = asRecord(modelRegistry);
|
|
151
|
+
const find = registry?.find;
|
|
152
|
+
if (typeof find !== "function") return undefined;
|
|
153
|
+
const [provider, ...modelParts] = modelId.split("/");
|
|
154
|
+
const id = modelParts.join("/");
|
|
155
|
+
try {
|
|
156
|
+
return find.call(modelRegistry, provider, id);
|
|
157
|
+
} catch {
|
|
158
|
+
return undefined;
|
|
159
|
+
}
|
|
160
|
+
}
|
|
161
|
+
|
|
162
|
+
/** Communication intensity by role (caveman-inspired token optimization) */
|
|
163
|
+
const ROLE_INTENSITY: Record<string, "lite" | "full" | "ultra"> = {
|
|
164
|
+
explorer: "ultra",
|
|
165
|
+
analyst: "full",
|
|
166
|
+
planner: "full",
|
|
167
|
+
critic: "full",
|
|
168
|
+
executor: "full",
|
|
169
|
+
reviewer: "full",
|
|
170
|
+
"security-reviewer": "full",
|
|
171
|
+
"test-engineer": "full",
|
|
172
|
+
verifier: "full",
|
|
173
|
+
writer: "lite",
|
|
174
|
+
};
|
|
175
|
+
|
|
176
|
+
function buildCommunicationStyle(role: string): string {
|
|
177
|
+
const intensity = ROLE_INTENSITY[role] ?? "full";
|
|
178
|
+
if (intensity === "lite") return "## Communication\nProfessional concise. No filler/hedging. Full sentences OK.";
|
|
179
|
+
if (intensity === "ultra") return [
|
|
180
|
+
"## Communication (ultra-compressed)",
|
|
181
|
+
"Drop: articles, filler, hedging, pleasantries. Fragments OK.",
|
|
182
|
+
"Pattern: [thing] [action] [reason].",
|
|
183
|
+
"Code/paths/symbols: exact, never abbreviated. Errors quoted exact.",
|
|
184
|
+
"Abbreviate prose words: DB/auth/config/req/res/fn/impl.",
|
|
185
|
+
"Arrows for causality: X → Y. One word when one word enough.",
|
|
186
|
+
"Security/destructive: write normal English. Resume compressed after.",
|
|
187
|
+
].join("\n");
|
|
188
|
+
return [
|
|
189
|
+
"## Communication (compressed)",
|
|
190
|
+
"Drop: articles (a/an/the), filler (just/really/basically/actually/simply), hedging, pleasantries.",
|
|
191
|
+
"Short synonyms. Fragments OK. Pattern: [thing] [action] [reason]. [next step].",
|
|
192
|
+
"Code/paths/symbols: exact. Errors quoted exact.",
|
|
193
|
+
"Security/destructive: write normal English. Resume compressed after.",
|
|
194
|
+
].join("\n");
|
|
195
|
+
}
|
|
196
|
+
|
|
197
|
+
function buildOutputContract(role: string): string {
|
|
198
|
+
if (role === "explorer") return [
|
|
199
|
+
"## Output Contract",
|
|
200
|
+
"<path>:<line> — `<symbol>` — <≤6 word note>",
|
|
201
|
+
"Group: Defs: / Refs: / Callers: / Tests: / Sites:",
|
|
202
|
+
"Zero hits → \"No match.\"",
|
|
203
|
+
"Last line → totals: N defs, M refs.",
|
|
204
|
+
].join("\n");
|
|
205
|
+
if (role === "executor") return [
|
|
206
|
+
"## Output Contract",
|
|
207
|
+
"<path>:<line-range> — <change ≤10 words>.",
|
|
208
|
+
"verified: <re-read OK | mismatch @ path:line>.",
|
|
209
|
+
"Refusal tokens: too-big. / needs-confirm. / ambiguous. / regressed.",
|
|
210
|
+
].join("\n");
|
|
211
|
+
if (role === "reviewer" || role === "security-reviewer") return [
|
|
212
|
+
"## Output Contract",
|
|
213
|
+
"<path>:<line>: <emoji> <severity>: <problem>. <fix>.",
|
|
214
|
+
"Severity: 🔴 bug, 🟡 risk, 🔵 nit, ❓ question.",
|
|
215
|
+
"Zero findings → \"No issues.\"",
|
|
216
|
+
"Sorted: file order → ascending line numbers.",
|
|
217
|
+
].join("\n");
|
|
218
|
+
if (role === "verifier") return [
|
|
219
|
+
"## Output Contract",
|
|
220
|
+
"PASS: <what verified> — <evidence ≤20 words>.",
|
|
221
|
+
"FAIL: <what failed> — <reason>. <expected vs actual>.",
|
|
222
|
+
"Evidence: file paths, test output, or diffs.",
|
|
223
|
+
].join("\n");
|
|
224
|
+
if (role === "writer") return "## Output Contract\nWrite clear documentation. Full sentences. No compression.";
|
|
225
|
+
return ""; // planner, critic, analyst, test-engineer: no strict format
|
|
226
|
+
}
|
|
227
|
+
|
|
228
|
+
/**
|
|
229
|
+
* Phase 3 (caveman): Compress tool descriptions in a live session to reduce
|
|
230
|
+
* input token cost per tool call. MCP tools often have verbose descriptions
|
|
231
|
+
* (e.g. "This tool allows you to search for files in the filesystem..." → "Search files in filesystem.").
|
|
232
|
+
* Compresses only description text, never modifies tool names or parameters.
|
|
233
|
+
*/
|
|
234
|
+
function compressSessionToolDescriptions(session: LiveSessionLike): void {
|
|
235
|
+
if (typeof session.getActiveToolNames !== "function") return;
|
|
236
|
+
// The Pi SDK doesn't expose a setDescription API, but we can attempt
|
|
237
|
+
// to compress via setActiveToolsByName if the session supports it.
|
|
238
|
+
// For now, this is a no-op that documents the intent for future SDK support.
|
|
239
|
+
// When Pi SDK adds tool description mutation, this function will compress.
|
|
240
|
+
// Side benefit: the import of compressToolDescription ensures the module
|
|
241
|
+
// is loaded and tree-shakeable, so adding the actual logic later is trivial.
|
|
242
|
+
}
|
|
243
|
+
|
|
244
|
+
function liveSystemPrompt(input: LiveSessionSpawnInput): string {
|
|
245
|
+
const memory = input.agent.memory ? buildMemoryBlock(input.agent.name, input.agent.memory, input.task.cwd, Boolean(input.agent.tools?.some((tool) => tool === "write" || tool === "edit"))) : "";
|
|
246
|
+
const role = input.task.role;
|
|
247
|
+
const styleBlock = buildCommunicationStyle(role);
|
|
248
|
+
const contractBlock = buildOutputContract(role);
|
|
249
|
+
const sensitiveConstraint = buildSensitivePathConstraint();
|
|
250
|
+
return [
|
|
251
|
+
"# pi-crew Live Subagent",
|
|
252
|
+
`Run ID: ${input.manifest.runId}`,
|
|
253
|
+
`Task ID: ${input.task.id}`,
|
|
254
|
+
`Role: ${role}`,
|
|
255
|
+
`Agent: ${input.agent.name}`,
|
|
256
|
+
`Working directory: ${input.task.cwd}`,
|
|
257
|
+
"",
|
|
258
|
+
styleBlock,
|
|
259
|
+
contractBlock,
|
|
260
|
+
sensitiveConstraint,
|
|
261
|
+
"",
|
|
262
|
+
input.agent.systemPrompt || "Follow the user task exactly and report verification evidence.",
|
|
263
|
+
memory ? `\n${memory}` : "",
|
|
264
|
+
].filter(Boolean).join("\n");
|
|
265
|
+
}
|
|
266
|
+
|
|
267
|
+
function filterActiveTools(session: LiveSessionLike, agent: AgentConfig): void {
|
|
268
|
+
if (typeof session.getActiveToolNames !== "function" || typeof session.setActiveToolsByName !== "function") return;
|
|
269
|
+
const recursiveTools = new Set(["team", "Team", "Agent", "get_subagent_result", "steer_subagent"]);
|
|
270
|
+
const allowed = agent.tools?.length ? new Set(agent.tools) : undefined;
|
|
271
|
+
const active = session.getActiveToolNames().filter((name) => !recursiveTools.has(name) && (!allowed || allowed.has(name)));
|
|
272
|
+
session.setActiveToolsByName(active);
|
|
273
|
+
}
|
|
274
|
+
|
|
275
|
+
function usageFromStats(stats: unknown): UsageState | undefined {
|
|
276
|
+
const obj = asRecord(stats);
|
|
277
|
+
if (!obj) return undefined;
|
|
278
|
+
const input = numberField(obj, ["input", "inputTokens", "input_tokens"]);
|
|
279
|
+
const output = numberField(obj, ["output", "outputTokens", "output_tokens"]);
|
|
280
|
+
const cacheRead = numberField(obj, ["cacheRead", "cache_read"]);
|
|
281
|
+
const cacheWrite = numberField(obj, ["cacheWrite", "cache_write"]);
|
|
282
|
+
const cost = numberField(obj, ["cost"]);
|
|
283
|
+
const turns = numberField(obj, ["turns", "turnCount", "turn_count"]);
|
|
284
|
+
return [input, output, cacheRead, cacheWrite, cost, turns].some((value) => value !== undefined) ? { input, output, cacheRead, cacheWrite, cost, turns } : undefined;
|
|
285
|
+
}
|
|
286
|
+
|
|
287
|
+
async function promptWithTimeout(session: LiveSessionLike, text: string, timeoutMs: number, label: string): Promise<boolean> {
|
|
288
|
+
const promptPromise = session.prompt?.(text, { source: "api", expandPromptTemplates: false });
|
|
289
|
+
if (!promptPromise) return false;
|
|
290
|
+
let timer: ReturnType<typeof setTimeout> | undefined;
|
|
291
|
+
try {
|
|
292
|
+
await Promise.race([
|
|
293
|
+
promptPromise,
|
|
294
|
+
new Promise<void>((_, reject) => {
|
|
295
|
+
timer = setTimeout(() => reject(new Error(`${label} timed out after ${timeoutMs}ms`)), timeoutMs);
|
|
296
|
+
timer.unref?.();
|
|
297
|
+
}),
|
|
298
|
+
]);
|
|
299
|
+
return true;
|
|
300
|
+
} finally {
|
|
301
|
+
if (timer) clearTimeout(timer);
|
|
302
|
+
}
|
|
303
|
+
}
|
|
304
|
+
|
|
305
|
+
export async function probeLiveSessionRuntime(): Promise<LiveSessionUnavailableResult | LiveSessionPlannedResult> {
|
|
306
|
+
const availability = await isLiveSessionRuntimeAvailable();
|
|
307
|
+
if (!availability.available) return { available: false, reason: availability.reason ?? "Live-session runtime is unavailable." };
|
|
308
|
+
return { available: true, reason: "Live-session SDK exports are available. pi-crew can run in-process live agents when runtime.mode=live-session." };
|
|
309
|
+
}
|
|
310
|
+
|
|
311
|
+
export async function runLiveSessionTask(input: LiveSessionSpawnInput): Promise<LiveSessionRunResult> {
|
|
312
|
+
const isCurrent = input.isCurrent ?? (() => true);
|
|
313
|
+
let streamOut: StreamingOutputHandle | undefined;
|
|
314
|
+
|
|
315
|
+
// G1: Capture yield result from custom tool callback
|
|
316
|
+
let customToolYieldResult: YieldResult | undefined;
|
|
317
|
+
let customToolYieldResolved = false;
|
|
318
|
+
if (process.env.PI_CREW_MOCK_LIVE_SESSION === "success") {
|
|
319
|
+
const agentId = `${input.manifest.runId}:${input.task.id}`;
|
|
320
|
+
const inherited = input.runtimeConfig?.inheritContext === true && input.parentContext ? ` with inherited context: ${input.parentContext}` : "";
|
|
321
|
+
const event = { type: "message_end", message: { role: "assistant", content: [{ type: "text", text: `Mock live-session success for ${input.agent.name}${inherited}` }] } };
|
|
322
|
+
const mockSession = { steer: async () => {}, prompt: async () => {}, abort: async () => {} };
|
|
323
|
+
registerLiveAgent({ agentId, runId: input.manifest.runId, taskId: input.task.id, role: input.task.role, agent: input.agent?.name ?? "mock", description: "mock", session: mockSession, status: "running", workspaceId: input.workspaceId }, appendEvent, input.manifest.eventsPath);
|
|
324
|
+
appendTranscript(input.transcriptPath, event);
|
|
325
|
+
const sidechainPath = sidechainOutputPath(input.manifest.stateRoot, input.task.id);
|
|
326
|
+
writeSidechainEntry(sidechainPath, { agentId, type: "user", message: { role: "user", content: input.prompt }, cwd: input.task.cwd });
|
|
327
|
+
writeSidechainEntry(sidechainPath, { agentId, type: "message", message: event, cwd: input.task.cwd });
|
|
328
|
+
if (isCurrent()) input.onEvent?.(event);
|
|
329
|
+
const stdout = `Mock live-session success for ${input.agent.name}${inherited}`;
|
|
330
|
+
if (isCurrent()) input.onOutput?.(stdout);
|
|
331
|
+
updateLiveAgentStatus(agentId, "completed");
|
|
332
|
+
markLiveAgentCompleted(agentId);
|
|
333
|
+
return { available: true, exitCode: 0, stdout, stderr: "", jsonEvents: 1 };
|
|
334
|
+
}
|
|
335
|
+
const availability = await isLiveSessionRuntimeAvailable();
|
|
336
|
+
if (!availability.available) return { available: true, exitCode: 1, stdout: "", stderr: availability.reason ?? "Live-session runtime unavailable.", jsonEvents: 0, error: availability.reason };
|
|
337
|
+
// LAZY: optional peer dependency — only loaded when live-session runtime is chosen.
|
|
338
|
+
const mod = await import("@mariozechner/pi-coding-agent") as LiveSessionModule;
|
|
339
|
+
if (typeof mod.createAgentSession !== "function") return { available: true, exitCode: 1, stdout: "", stderr: "createAgentSession export is unavailable.", jsonEvents: 0, error: "createAgentSession export is unavailable." };
|
|
340
|
+
let session: LiveSessionLike | undefined;
|
|
341
|
+
let unsubscribe: (() => void) | undefined;
|
|
342
|
+
let unsubscribeControlRealtime: (() => void) | undefined;
|
|
343
|
+
let controlTimer: ReturnType<typeof setInterval> | undefined;
|
|
344
|
+
let stdout = "";
|
|
345
|
+
let jsonEvents = 0;
|
|
346
|
+
const collectedJsonEvents: Record<string, unknown>[] = [];
|
|
347
|
+
const maxCollectedJsonEvents = 1000;
|
|
348
|
+
let yieldResult: YieldResult | undefined;
|
|
349
|
+
|
|
350
|
+
const agentId = `${input.manifest.runId}:${input.task.id}`;
|
|
351
|
+
|
|
352
|
+
try {
|
|
353
|
+
const agentDir = typeof mod.getAgentDir === "function" ? mod.getAgentDir() : undefined;
|
|
354
|
+
let resourceLoader: unknown;
|
|
355
|
+
if (mod.DefaultResourceLoader && agentDir) {
|
|
356
|
+
resourceLoader = new mod.DefaultResourceLoader({
|
|
357
|
+
cwd: input.task.cwd,
|
|
358
|
+
agentDir,
|
|
359
|
+
noPromptTemplates: true,
|
|
360
|
+
noThemes: true,
|
|
361
|
+
noContextFiles: input.runtimeConfig?.inheritContext !== true,
|
|
362
|
+
systemPromptOverride: () => liveSystemPrompt(input),
|
|
363
|
+
appendSystemPromptOverride: () => [],
|
|
364
|
+
});
|
|
365
|
+
await (resourceLoader as { reload?: () => Promise<void> }).reload?.();
|
|
366
|
+
}
|
|
367
|
+
const modelRouting = buildConfiguredModelRouting({ overrideModel: input.modelOverride, stepModel: input.step.model, teamRoleModel: input.teamRoleModel, agentModel: input.agent.model, fallbackModels: input.agent.fallbackModels, parentModel: input.parentModel, modelRegistry: input.modelRegistry, cwd: input.manifest.cwd });
|
|
368
|
+
const resolvedModel = modelFromRegistry(input.modelRegistry, modelRouting.candidates[0] ?? modelRouting.requested) ?? input.parentModel;
|
|
369
|
+
// Phase 4: MCP proxy — will be determined after session creation
|
|
370
|
+
// (we check parent's MCP tools and share connections when available)
|
|
371
|
+
const mcpProxy = buildMcpProxyFromSession([], { shareMcp: true });
|
|
372
|
+
|
|
373
|
+
// G1: Build custom tools (submit_result + irc)
|
|
374
|
+
const submitResultTool = createSubmitResultTool((result) => {
|
|
375
|
+
customToolYieldResult = result;
|
|
376
|
+
customToolYieldResolved = true;
|
|
377
|
+
});
|
|
378
|
+
const ircTool = createIrcTool(agentId);
|
|
379
|
+
const customTools = [submitResultTool, ircTool];
|
|
380
|
+
|
|
381
|
+
const sessionCreateStart = Date.now();
|
|
382
|
+
const created = await mod.createAgentSession({
|
|
383
|
+
cwd: input.task.cwd,
|
|
384
|
+
...(agentDir ? { agentDir } : {}),
|
|
385
|
+
...(resourceLoader ? { resourceLoader } : {}),
|
|
386
|
+
...(mod.SessionManager?.inMemory ? { sessionManager: mod.SessionManager.inMemory(input.task.cwd) } : {}),
|
|
387
|
+
...(mod.SettingsManager?.create && agentDir ? { settingsManager: mod.SettingsManager.create(input.task.cwd, agentDir) } : {}),
|
|
388
|
+
...(input.modelRegistry ? { modelRegistry: input.modelRegistry } : {}),
|
|
389
|
+
...(resolvedModel ? { model: resolvedModel } : {}),
|
|
390
|
+
...(input.agent.thinking ? { thinkingLevel: input.agent.thinking } : {}),
|
|
391
|
+
...(mcpProxy.enableMcp ? {} : { enableMCP: false }),
|
|
392
|
+
customTools,
|
|
393
|
+
});
|
|
394
|
+
session = created.session;
|
|
395
|
+
appendEvent(input.manifest.eventsPath, { type: "live-session.session_created", runId: input.manifest.runId, taskId: input.task.id, data: { elapsedMs: Date.now() - sessionCreateStart, modelFallbackMessage: created.modelFallbackMessage } });
|
|
396
|
+
filterActiveTools(session, input.agent);
|
|
397
|
+
|
|
398
|
+
// Diagnostic: log before bindExtensions so we can identify extension-loading hangs
|
|
399
|
+
const bindExtensionsStart = Date.now();
|
|
400
|
+
try {
|
|
401
|
+
await Promise.race([
|
|
402
|
+
session.bindExtensions?.({}) ?? Promise.resolve(),
|
|
403
|
+
new Promise<void>((_, reject) => setTimeout(() => reject(new Error("bindExtensions timed out after 30s")), 30_000)),
|
|
404
|
+
]);
|
|
405
|
+
} catch (bindError) {
|
|
406
|
+
const msg = bindError instanceof Error ? bindError.message : String(bindError);
|
|
407
|
+
appendEvent(input.manifest.eventsPath, { type: "live-session.bind_extensions_error", runId: input.manifest.runId, taskId: input.task.id, data: { elapsedMs: Date.now() - bindExtensionsStart, error: msg } });
|
|
408
|
+
// Continue without extensions — they should not block the session
|
|
409
|
+
}
|
|
410
|
+
|
|
411
|
+
// Phase 3 (caveman): Compress tool descriptions to reduce input token cost
|
|
412
|
+
compressSessionToolDescriptions(session);
|
|
413
|
+
|
|
414
|
+
// Phase 5: Initialize extension runner bridge if available
|
|
415
|
+
// The bridge provides extension-like APIs (sendMessage, setActiveTools, etc.)
|
|
416
|
+
// to the extension runner if the session exposes one.
|
|
417
|
+
const extensionBridge = buildExtensionBridge(session as never);
|
|
418
|
+
if (extensionBridge) {
|
|
419
|
+
const extRunner = (session as Record<string, unknown>).extensionRunner;
|
|
420
|
+
if (extRunner && typeof (extRunner as Record<string, unknown>).initialize === "function") {
|
|
421
|
+
try {
|
|
422
|
+
(extRunner as { initialize: (apis: unknown, host: unknown) => void }).initialize(extensionBridge.apis, extensionBridge.host);
|
|
423
|
+
if (typeof (extRunner as Record<string, unknown>).emit === "function") {
|
|
424
|
+
await (extRunner as { emit: (event: unknown) => Promise<void> }).emit({ type: "session_start" });
|
|
425
|
+
}
|
|
426
|
+
} catch {
|
|
427
|
+
// Extension runner initialization failure should not block the session
|
|
428
|
+
}
|
|
429
|
+
}
|
|
430
|
+
}
|
|
431
|
+
|
|
432
|
+
registerLiveAgent({ agentId, runId: input.manifest.runId, taskId: input.task.id, role: input.task.role, agent: input.agent?.name ?? "unknown", description: input.task.adaptive?.task ?? input.step?.task ?? "", modelName: (resolvedModel as { name?: string })?.name, session, status: "running", workspaceId: input.workspaceId }, appendEvent, input.manifest.eventsPath);
|
|
433
|
+
streamOut = createStreamingOutput(input.manifest, input.task.id);
|
|
434
|
+
let controlCursor: LiveAgentControlCursor = { offset: 0 };
|
|
435
|
+
const seenControlRequestIds = new Set<string>();
|
|
436
|
+
let controlBusy = false;
|
|
437
|
+
const pollControl = async () => {
|
|
438
|
+
if (!isCurrent() || controlBusy || !session) return;
|
|
439
|
+
controlBusy = true;
|
|
440
|
+
try {
|
|
441
|
+
controlCursor = await applyLiveAgentControlRequests({ manifest: input.manifest, taskId: input.task.id, agentId, session, cursor: controlCursor, seenRequestIds: seenControlRequestIds });
|
|
442
|
+
} finally {
|
|
443
|
+
controlBusy = false;
|
|
444
|
+
}
|
|
445
|
+
};
|
|
446
|
+
unsubscribeControlRealtime = subscribeLiveControlRealtime((request) => {
|
|
447
|
+
if (!isCurrent() || request.runId !== input.manifest.runId || request.taskId !== input.task.id || !session) return;
|
|
448
|
+
void applyLiveAgentControlRequest({ request, taskId: input.task.id, agentId, session, seenRequestIds: seenControlRequestIds });
|
|
449
|
+
});
|
|
450
|
+
await pollControl();
|
|
451
|
+
controlTimer = setInterval(() => {
|
|
452
|
+
if (isCurrent()) void pollControl();
|
|
453
|
+
}, 500);
|
|
454
|
+
let turnCount = 0;
|
|
455
|
+
let softLimitReached = false;
|
|
456
|
+
const maxTurns = input.runtimeConfig?.maxTurns;
|
|
457
|
+
const graceTurns = input.runtimeConfig?.graceTurns ?? 5;
|
|
458
|
+
const sidechainPath = sidechainOutputPath(input.manifest.stateRoot, input.task.id);
|
|
459
|
+
writeSidechainEntry(sidechainPath, { agentId, type: "user", message: { role: "user", content: input.prompt }, cwd: input.task.cwd });
|
|
460
|
+
if (typeof session.subscribe === "function") {
|
|
461
|
+
unsubscribe = session.subscribe((event) => {
|
|
462
|
+
if (!isCurrent()) return;
|
|
463
|
+
jsonEvents += 1;
|
|
464
|
+
appendTranscript(input.transcriptPath, event);
|
|
465
|
+
const sidechainType = eventToSidechainType(event);
|
|
466
|
+
if (sidechainType) writeSidechainEntry(sidechainPath, { agentId, type: sidechainType, message: event, cwd: input.task.cwd });
|
|
467
|
+
const obj = asRecord(event);
|
|
468
|
+
if (obj?.type === "turn_end") {
|
|
469
|
+
turnCount += 1;
|
|
470
|
+
trackLiveAgentTurnEnd(agentId);
|
|
471
|
+
if (maxTurns !== undefined && !softLimitReached && turnCount >= maxTurns) {
|
|
472
|
+
softLimitReached = true;
|
|
473
|
+
void session?.steer?.("You have reached your turn limit. Wrap up immediately — provide your final answer now.");
|
|
474
|
+
} else if (maxTurns !== undefined && softLimitReached && turnCount >= maxTurns + graceTurns) {
|
|
475
|
+
void session?.abort?.();
|
|
476
|
+
}
|
|
477
|
+
}
|
|
478
|
+
// Accumulate lifetime usage that survives compaction
|
|
479
|
+
if (obj?.type === "message_end" && (obj as any).message?.role === "assistant") {
|
|
480
|
+
const u = (obj as any).message?.usage;
|
|
481
|
+
if (u) {
|
|
482
|
+
trackTaskUsage(input.task.id, {
|
|
483
|
+
input: typeof u.input === "number" ? u.input : 0,
|
|
484
|
+
output: typeof u.output === "number" ? u.output : 0,
|
|
485
|
+
cacheWrite: typeof u.cacheWrite === "number" ? u.cacheWrite : 0,
|
|
486
|
+
});
|
|
487
|
+
}
|
|
488
|
+
}
|
|
489
|
+
input.onEvent?.(event);
|
|
490
|
+
const text = [...eventText(event), ...finalAssistantText(event)].join("\n");
|
|
491
|
+
if (text.trim()) {
|
|
492
|
+
stdout += `${text}\n`;
|
|
493
|
+
streamOut?.write(text + "\n");
|
|
494
|
+
trackLiveAgentResponseText(agentId, text);
|
|
495
|
+
input.onOutput?.(text);
|
|
496
|
+
}
|
|
497
|
+
// G2: Track tool start/end for activity display
|
|
498
|
+
if (obj?.type === "tool_use" || obj?.type === "tool_execution_start") {
|
|
499
|
+
const toolName = (obj as any).tool?.name ?? (obj as any).toolName ?? (obj as any).name ?? "unknown";
|
|
500
|
+
trackLiveAgentToolStart(agentId, toolName);
|
|
501
|
+
}
|
|
502
|
+
if (obj?.type === "tool_result" || obj?.type === "tool_execution_end") {
|
|
503
|
+
const toolName = (obj as any).tool?.name ?? (obj as any).toolName ?? (obj as any).name ?? "unknown";
|
|
504
|
+
trackLiveAgentToolEnd(agentId, toolName);
|
|
505
|
+
}
|
|
506
|
+
// Phase 1: collect events for yield detection
|
|
507
|
+
if (event && typeof event === "object" && !Array.isArray(event)) {
|
|
508
|
+
collectedJsonEvents.push(event as Record<string, unknown>);
|
|
509
|
+
if (collectedJsonEvents.length > maxCollectedJsonEvents) collectedJsonEvents.splice(0, collectedJsonEvents.length - maxCollectedJsonEvents);
|
|
510
|
+
}
|
|
511
|
+
});
|
|
512
|
+
}
|
|
513
|
+
if (input.signal) {
|
|
514
|
+
if (input.signal.aborted) await session.abort?.();
|
|
515
|
+
else input.signal.addEventListener("abort", () => { void session?.abort?.(); }, { once: true });
|
|
516
|
+
}
|
|
517
|
+
const effectivePrompt = input.runtimeConfig?.inheritContext === true && input.parentContext ? `${input.parentContext}\n\n---\n# Live Subagent Task\n${input.prompt}` : input.prompt;
|
|
518
|
+
|
|
519
|
+
// Diagnostic: log prompt size and timing
|
|
520
|
+
const promptStart = Date.now();
|
|
521
|
+
appendEvent(input.manifest.eventsPath, { type: "live-session.prompt_start", runId: input.manifest.runId, taskId: input.task.id, data: { promptLength: effectivePrompt.length, agent: input.agent.name, role: input.task.role } });
|
|
522
|
+
|
|
523
|
+
// Phase 3: Wrap session.prompt with timeout for graceful cancellation
|
|
524
|
+
const sessionTimeoutMs = DEFAULT_LIVE_SESSION.responseTimeoutMs;
|
|
525
|
+
try {
|
|
526
|
+
await promptWithTimeout(session, effectivePrompt, sessionTimeoutMs, "Live-session");
|
|
527
|
+
} catch (promptError) {
|
|
528
|
+
const msg = promptError instanceof Error ? promptError.message : String(promptError);
|
|
529
|
+
appendEvent(input.manifest.eventsPath, { type: "live-session.prompt_error", runId: input.manifest.runId, taskId: input.task.id, data: { elapsedMs: Date.now() - promptStart, error: msg } });
|
|
530
|
+
if (msg.includes("timed out")) {
|
|
531
|
+
await session.abort?.();
|
|
532
|
+
updateLiveAgentStatus(agentId, "failed");
|
|
533
|
+
return { available: true, exitCode: 1, stdout: stdout.trim(), stderr: msg, jsonEvents, error: msg };
|
|
534
|
+
}
|
|
535
|
+
throw promptError;
|
|
536
|
+
}
|
|
537
|
+
appendEvent(input.manifest.eventsPath, { type: "live-session.prompt_done", runId: input.manifest.runId, taskId: input.task.id, data: { elapsedMs: Date.now() - promptStart, jsonEvents, outputLength: stdout.length } });
|
|
538
|
+
|
|
539
|
+
// --- Phase 1: Yield enforcement loop ---
|
|
540
|
+
// After the initial prompt completes, check if the worker called submit_result.
|
|
541
|
+
// Priority: 1) custom tool callback (G1), 2) JSON event detection (legacy).
|
|
542
|
+
const yieldConfig = input.runtimeConfig?.yield ?? { enabled: DEFAULT_YIELD_CONFIG.enabled };
|
|
543
|
+
const yieldEnabled = yieldConfig.enabled !== false;
|
|
544
|
+
if (yieldEnabled && session) {
|
|
545
|
+
// Check custom tool callback first (G1)
|
|
546
|
+
if (customToolYieldResolved && customToolYieldResult) {
|
|
547
|
+
yieldResult = customToolYieldResult;
|
|
548
|
+
} else {
|
|
549
|
+
// Legacy: detect from JSON events
|
|
550
|
+
const alreadyYielded = hasYieldInOutput(collectedJsonEvents);
|
|
551
|
+
if (alreadyYielded) {
|
|
552
|
+
const yieldEvent = collectedJsonEvents.find((e) => isYieldEvent(e));
|
|
553
|
+
if (yieldEvent) yieldResult = extractYieldResult(yieldEvent);
|
|
554
|
+
}
|
|
555
|
+
}
|
|
556
|
+
// Phase 2: Validate yield data against output schema if provided
|
|
557
|
+
let schemaFailures = 0;
|
|
558
|
+
const maxSchemaFailures = 2;
|
|
559
|
+
if (yieldResult && input.outputSchema) {
|
|
560
|
+
const validation = await validateYieldData(yieldResult.structuredData, input.outputSchema);
|
|
561
|
+
if (!validation.valid) {
|
|
562
|
+
schemaFailures++;
|
|
563
|
+
yieldResult = undefined;
|
|
564
|
+
customToolYieldResolved = false;
|
|
565
|
+
const schemaReminder = `Your submit_result data did not match the required schema: ${validation.error}. Please fix and call submit_result again with valid data.`;
|
|
566
|
+
try {
|
|
567
|
+
await promptWithTimeout(session, schemaReminder, Math.min(sessionTimeoutMs, DEFAULT_LIVE_SESSION.idleWaitTimeoutMs), "Live-session schema reminder");
|
|
568
|
+
} catch {
|
|
569
|
+
/* ignore */
|
|
570
|
+
}
|
|
571
|
+
await new Promise((resolve) => setTimeout(resolve, DEFAULT_LIVE_SESSION.yieldPollIntervalMs));
|
|
572
|
+
// Check again after schema reminder
|
|
573
|
+
if (customToolYieldResolved && customToolYieldResult) {
|
|
574
|
+
yieldResult = customToolYieldResult;
|
|
575
|
+
} else {
|
|
576
|
+
const newEvents = collectedJsonEvents.slice(-10);
|
|
577
|
+
if (hasYieldInOutput(newEvents)) {
|
|
578
|
+
const yieldEvent = newEvents.find((e) => isYieldEvent(e));
|
|
579
|
+
if (yieldEvent) {
|
|
580
|
+
const candidate = extractYieldResult(yieldEvent);
|
|
581
|
+
if (candidate && input.outputSchema) {
|
|
582
|
+
const revalidation = await validateYieldData(candidate.structuredData, input.outputSchema);
|
|
583
|
+
if (revalidation.valid || schemaFailures >= maxSchemaFailures) {
|
|
584
|
+
yieldResult = candidate;
|
|
585
|
+
}
|
|
586
|
+
}
|
|
587
|
+
}
|
|
588
|
+
}
|
|
589
|
+
}
|
|
590
|
+
}
|
|
591
|
+
}
|
|
592
|
+
// Reminder loop — only if yield not yet received
|
|
593
|
+
const maxReminders = yieldConfig.maxReminders ?? DEFAULT_LIVE_SESSION.maxYieldRetries;
|
|
594
|
+
let retryCount = 0;
|
|
595
|
+
while (!customToolYieldResolved && !yieldResult && retryCount < maxReminders && !input.signal?.aborted) {
|
|
596
|
+
retryCount++;
|
|
597
|
+
const reminder = buildYieldReminder(retryCount, maxReminders, yieldConfig.reminderPrompt);
|
|
598
|
+
const prevTools = typeof session.getActiveToolNames === "function" ? session.getActiveToolNames() : [];
|
|
599
|
+
try {
|
|
600
|
+
// G6: Constrain tool set to submit_result before sending reminder
|
|
601
|
+
if (typeof session.setActiveToolsByName === "function" && prevTools.length > 0) {
|
|
602
|
+
session.setActiveToolsByName(["submit_result"]);
|
|
603
|
+
}
|
|
604
|
+
await promptWithTimeout(session, reminder, Math.min(sessionTimeoutMs, DEFAULT_LIVE_SESSION.idleWaitTimeoutMs), "Live-session yield reminder");
|
|
605
|
+
} catch {
|
|
606
|
+
break;
|
|
607
|
+
} finally {
|
|
608
|
+
// Restore previous tools even if reminder prompt times out/throws.
|
|
609
|
+
if (typeof session.setActiveToolsByName === "function" && prevTools.length > 0) {
|
|
610
|
+
session.setActiveToolsByName(prevTools);
|
|
611
|
+
}
|
|
612
|
+
}
|
|
613
|
+
const pollInterval = DEFAULT_LIVE_SESSION.yieldPollIntervalMs;
|
|
614
|
+
await new Promise((resolve) => setTimeout(resolve, pollInterval));
|
|
615
|
+
// Check custom tool callback
|
|
616
|
+
if (customToolYieldResolved && customToolYieldResult) {
|
|
617
|
+
yieldResult = customToolYieldResult;
|
|
618
|
+
break;
|
|
619
|
+
}
|
|
620
|
+
// Legacy: check JSON events
|
|
621
|
+
if (hasYieldInOutput(collectedJsonEvents.slice(-10))) {
|
|
622
|
+
const yieldEvent = collectedJsonEvents.slice(-10).find((e) => isYieldEvent(e));
|
|
623
|
+
if (yieldEvent) yieldResult = extractYieldResult(yieldEvent);
|
|
624
|
+
break;
|
|
625
|
+
}
|
|
626
|
+
}
|
|
627
|
+
if (!customToolYieldResolved && !yieldResult && !input.signal?.aborted && retryCount >= maxReminders) {
|
|
628
|
+
input.onEvent?.({ type: "task.attention", runId: input.manifest.runId, taskId: input.task.id, message: "Live-session worker completed without calling submit_result tool.", data: { activityState: "needs_attention", reason: "no_yield", attempts: retryCount } });
|
|
629
|
+
}
|
|
630
|
+
}
|
|
631
|
+
|
|
632
|
+
const usage = usageFromStats(typeof session.getStats === "function" ? session.getStats() : session.stats);
|
|
633
|
+
updateLiveAgentStatus(agentId, "completed");
|
|
634
|
+
markLiveAgentCompleted(agentId);
|
|
635
|
+
return { available: true, exitCode: 0, stdout: stdout.trim(), stderr: created.modelFallbackMessage ?? "", jsonEvents, usage, yieldResult };
|
|
636
|
+
} catch (error) {
|
|
637
|
+
const message = error instanceof Error ? error.message : String(error);
|
|
638
|
+
|
|
639
|
+
// Phase 8: Log diagnostics on failure
|
|
640
|
+
try {
|
|
641
|
+
const agents = listLiveAgents();
|
|
642
|
+
const health = collectLiveSessionHealth(agents, () => undefined);
|
|
643
|
+
const diagnostics = formatLiveSessionDiagnostics(health);
|
|
644
|
+
input.onEvent?.({ type: "live-session.diagnostics", data: diagnostics });
|
|
645
|
+
} catch (diagError) {
|
|
646
|
+
logInternalError("live-session.diagnostics", diagError);
|
|
647
|
+
}
|
|
648
|
+
|
|
649
|
+
updateLiveAgentStatus(`${input.manifest.runId}:${input.task.id}`, "failed");
|
|
650
|
+
return { available: true, exitCode: 1, stdout: stdout.trim(), stderr: message, jsonEvents, error: message };
|
|
651
|
+
} finally {
|
|
652
|
+
// H6: Unsubscribe listeners FIRST before clearing timer to prevent race
|
|
653
|
+
unsubscribe?.();
|
|
654
|
+
unsubscribeControlRealtime?.();
|
|
655
|
+
if (controlTimer) clearInterval(controlTimer);
|
|
656
|
+
streamOut?.close();
|
|
657
|
+
if (input.signal?.aborted) {
|
|
658
|
+
await terminateLiveAgent(agentId, "cancelled", appendEvent, input.manifest.eventsPath);
|
|
659
|
+
} else {
|
|
660
|
+
// Dispose the session to free resources, but keep the handle in the registry
|
|
661
|
+
// for resume/follow-up. Removing the handle entirely breaks steer/followUp/resume.
|
|
662
|
+
disposeLiveAgentSession(agentId);
|
|
663
|
+
}
|
|
664
|
+
|
|
665
|
+
// Phase 8: Emit final health snapshot
|
|
666
|
+
try {
|
|
667
|
+
const agents = listLiveAgents();
|
|
668
|
+
if (agents.length > 0) {
|
|
669
|
+
const health = collectLiveSessionHealth(agents, () => undefined);
|
|
670
|
+
input.onEvent?.({ type: "live-session.health", data: health });
|
|
671
|
+
}
|
|
672
|
+
} catch (healthError) {
|
|
673
|
+
logInternalError("live-session.health-snapshot", healthError);
|
|
674
|
+
}
|
|
675
|
+
}
|
|
676
|
+
}
|