pi-crew 0.2.3 → 0.2.5
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/AGENTS.md +57 -32
- package/CHANGELOG.md +466 -448
- package/LICENSE +21 -21
- package/NOTICE.md +16 -16
- package/README.md +323 -323
- package/docs/FEATURE_INTAKE.md +126 -0
- package/docs/HARNESS.md +86 -0
- package/docs/HARNESS_BACKLOG.md +41 -0
- package/docs/TEST_MATRIX.md +49 -0
- package/docs/actions-reference.md +595 -595
- package/docs/architecture.md +180 -180
- package/docs/code-review-2026-05-11.md +592 -592
- package/docs/commands-reference.md +347 -347
- package/docs/comparison-pi-subagents-vs-pi-crew.md +303 -0
- package/docs/decisions/0001-durable-state.md +41 -0
- package/docs/decisions/0002-child-process-for-async.md +42 -0
- package/docs/decisions/0003-depth-guard.md +36 -0
- package/docs/decisions/0004-execfile-over-exec.md +34 -0
- package/docs/decisions/0005-no-parameter-properties.md +49 -0
- package/docs/decisions/0006-publish-bundled-esm.md +63 -0
- package/docs/decisions/0007-active-run-binary-index.md +54 -0
- package/docs/decisions/0008-child-pi-warm-pool.md +61 -0
- package/docs/decisions/README.md +23 -0
- package/docs/followup-review-round4-2026-05-13.md +107 -0
- package/docs/implementation-plan-top3.md +333 -0
- package/docs/live-mailbox-runtime.md +36 -36
- package/docs/next-upgrade-roadmap.md +808 -808
- package/docs/oh-my-pi-research.md +509 -0
- package/docs/perf/baseline-2026-05.md +113 -0
- package/docs/perf/final-report-2026-05.md +206 -0
- package/docs/perf/sprint-1-report.md +71 -0
- package/docs/perf/sprint-2-report.md +81 -0
- package/docs/perf/sprint-2.5-report.md +53 -0
- package/docs/perf/sprint-3-report.md +36 -0
- package/docs/perf/sprint-4-report.md +47 -0
- package/docs/perf/sprint-5-report.md +51 -0
- package/docs/perf/sprint-6-report.md +94 -0
- package/docs/perf/sprint-7-report.md +74 -0
- package/docs/perf/upgrade-plan-2026-05.md +147 -0
- package/docs/pi-subagents3-deep-analysis.md +508 -0
- package/docs/product/README.md +31 -0
- package/docs/product/platform.md +27 -0
- package/docs/product/runtime-safety.md +37 -0
- package/docs/product/team-run.md +39 -0
- package/docs/product/team-tool.md +37 -0
- package/docs/publishing.md +65 -65
- package/docs/resource-formats.md +134 -134
- package/docs/runtime-analysis-child-vs-live.md +171 -0
- package/docs/runtime-flow.md +148 -148
- package/docs/runtime-migration-in-process-analysis.md +250 -0
- package/docs/stories/README.md +30 -0
- package/docs/stories/backlog.md +36 -0
- package/docs/templates/decision.md +27 -0
- package/docs/templates/story.md +44 -0
- package/docs/templates/validation-report.md +32 -0
- package/docs/usage.md +238 -238
- package/index.ts +7 -6
- package/install.mjs +65 -65
- package/package.json +107 -100
- package/schema.json +222 -222
- package/skills/child-pi-spawning/SKILL.md +213 -0
- package/skills/context-artifact-hygiene/SKILL.md +32 -0
- package/skills/event-log-tracing/SKILL.md +299 -0
- package/skills/git-master/SKILL.md +225 -24
- package/skills/live-agent-lifecycle/SKILL.md +192 -0
- package/skills/mailbox-interactive/SKILL.md +300 -19
- package/skills/model-routing-context/SKILL.md +94 -0
- package/skills/multi-perspective-review/SKILL.md +88 -0
- package/skills/read-only-explorer/SKILL.md +250 -26
- package/skills/safe-bash/SKILL.md +307 -21
- package/skills/verification-before-done/SKILL.md +11 -2
- package/skills/widget-rendering/SKILL.md +258 -0
- package/skills/workspace-isolation/SKILL.md +202 -0
- package/skills/worktree-isolation/SKILL.md +202 -18
- package/src/adapters/claude-adapter.ts +25 -25
- package/src/adapters/codex-adapter.ts +21 -21
- package/src/adapters/cursor-adapter.ts +17 -17
- package/src/adapters/export-util.ts +137 -137
- package/src/adapters/index.ts +15 -15
- package/src/adapters/registry.ts +18 -18
- package/src/adapters/types.ts +23 -23
- package/src/agents/agent-config.ts +38 -38
- package/src/agents/agent-serializer.ts +38 -38
- package/src/agents/discover-agents.ts +121 -118
- package/src/config/config.ts +740 -858
- package/src/config/defaults.ts +96 -96
- package/src/config/drift-detector.ts +211 -211
- package/src/config/markers.ts +327 -327
- package/src/config/resilient-parser.ts +109 -108
- package/src/config/suggestions.ts +74 -74
- package/src/config/types.ts +199 -0
- package/src/extension/async-notifier.ts +123 -89
- package/src/extension/autonomous-policy.ts +169 -169
- package/src/extension/cross-extension-rpc.ts +104 -104
- package/src/extension/help.ts +47 -47
- package/src/extension/import-index.ts +69 -69
- package/src/extension/management.ts +395 -382
- package/src/extension/notification-router.ts +116 -116
- package/src/extension/notification-sink.ts +51 -51
- package/src/extension/project-init.ts +168 -168
- package/src/extension/register.ts +859 -668
- package/src/extension/registration/artifact-cleanup.ts +15 -15
- package/src/extension/registration/command-utils.ts +54 -54
- package/src/extension/registration/commands.ts +559 -452
- package/src/extension/registration/compaction-guard.ts +125 -125
- package/src/extension/registration/subagent-helpers.ts +102 -102
- package/src/extension/registration/subagent-tools.ts +220 -159
- package/src/extension/registration/team-tool.ts +159 -99
- package/src/extension/registration/viewers.ts +29 -0
- package/src/extension/result-watcher.ts +128 -128
- package/src/extension/run-bundle-schema.ts +89 -89
- package/src/extension/run-export.ts +73 -73
- package/src/extension/run-import.ts +84 -84
- package/src/extension/run-index.ts +94 -94
- package/src/extension/run-maintenance.ts +142 -142
- package/src/extension/session-summary.ts +8 -8
- package/src/extension/team-manager-command.ts +96 -96
- package/src/extension/team-recommendation.ts +188 -188
- package/src/extension/team-tool/api.ts +5 -2
- package/src/extension/team-tool/cancel.ts +224 -209
- package/src/extension/team-tool/config-patch.ts +36 -36
- package/src/extension/team-tool/context.ts +60 -60
- package/src/extension/team-tool/doctor.ts +242 -242
- package/src/extension/team-tool/handle-settings.ts +421 -195
- package/src/extension/team-tool/inspect.ts +41 -41
- package/src/extension/team-tool/lifecycle-actions.ts +139 -139
- package/src/extension/team-tool/parallel-dispatch.ts +156 -156
- package/src/extension/team-tool/plan.ts +19 -19
- package/src/extension/team-tool/respond.ts +112 -111
- package/src/extension/team-tool/run.ts +246 -229
- package/src/extension/team-tool/status.ts +110 -110
- package/src/extension/team-tool-types.ts +13 -13
- package/src/extension/team-tool.ts +344 -344
- package/src/extension/tool-result.ts +16 -16
- package/src/extension/validate-resources.ts +77 -77
- package/src/hooks/registry.ts +61 -61
- package/src/hooks/types.ts +40 -40
- package/src/i18n.ts +184 -184
- package/src/observability/correlation.ts +35 -35
- package/src/observability/event-to-metric.ts +68 -68
- package/src/observability/exporters/adapter.ts +30 -30
- package/src/observability/exporters/otlp-exporter.ts +106 -92
- package/src/observability/exporters/prometheus-exporter.ts +54 -54
- package/src/observability/metric-registry.ts +87 -87
- package/src/observability/metric-retention.ts +54 -54
- package/src/observability/metric-sink.ts +81 -56
- package/src/observability/metrics-primitives.ts +167 -167
- package/src/prompt/prompt-runtime.ts +72 -72
- package/src/runtime/adaptive-plan.ts +338 -0
- package/src/runtime/agent-control.ts +169 -169
- package/src/runtime/agent-memory.ts +72 -72
- package/src/runtime/agent-observability.ts +114 -114
- package/src/runtime/async-marker.ts +26 -26
- package/src/runtime/async-runner.ts +153 -153
- package/src/runtime/attention-events.ts +28 -28
- package/src/runtime/auto-resume.ts +100 -100
- package/src/runtime/background-runner.ts +122 -89
- package/src/runtime/cancellation.ts +61 -61
- package/src/runtime/capability-inventory.ts +116 -116
- package/src/runtime/child-pi-pool.ts +68 -0
- package/src/runtime/child-pi.ts +541 -461
- package/src/runtime/code-summary.ts +247 -247
- package/src/runtime/compaction-summary.ts +271 -271
- package/src/runtime/concurrency.ts +58 -58
- package/src/runtime/crash-recovery.ts +317 -301
- package/src/runtime/crew-agent-records.ts +379 -281
- package/src/runtime/crew-agent-runtime.ts +60 -60
- package/src/runtime/cross-extension-rpc.ts +72 -0
- package/src/runtime/custom-tools/irc-tool.ts +201 -201
- package/src/runtime/custom-tools/submit-result-tool.ts +90 -90
- package/src/runtime/deadletter.ts +47 -47
- package/src/runtime/delivery-coordinator.ts +176 -176
- package/src/runtime/delta-conflict.ts +360 -360
- package/src/runtime/diagnostic-export.ts +102 -102
- package/src/runtime/direct-run.ts +35 -35
- package/src/runtime/effectiveness.ts +82 -81
- package/src/runtime/errors/crew-errors.ts +166 -0
- package/src/runtime/event-stream-bridge.ts +92 -92
- package/src/runtime/foreground-control.ts +82 -82
- package/src/runtime/green-contract.ts +46 -46
- package/src/runtime/group-join.ts +234 -106
- package/src/runtime/heartbeat-watcher.ts +145 -124
- package/src/runtime/iteration-hooks.ts +267 -267
- package/src/runtime/live-agent-control.ts +88 -88
- package/src/runtime/live-agent-manager.ts +377 -179
- package/src/runtime/live-control-realtime.ts +36 -36
- package/src/runtime/live-session-runtime.ts +676 -600
- package/src/runtime/loop-gates.ts +129 -129
- package/src/runtime/manifest-cache.ts +263 -263
- package/src/runtime/mcp-proxy.ts +113 -113
- package/src/runtime/metric-parser.ts +40 -40
- package/src/runtime/model-fallback.ts +282 -274
- package/src/runtime/model-resolver.ts +118 -0
- package/src/runtime/output-validator.ts +187 -187
- package/src/runtime/overflow-recovery.ts +175 -175
- package/src/runtime/parallel-research.ts +44 -44
- package/src/runtime/parallel-utils.ts +156 -156
- package/src/runtime/parent-guard.ts +80 -80
- package/src/runtime/phase-progress.ts +217 -217
- package/src/runtime/pi-args.ts +165 -165
- package/src/runtime/pi-json-output.ts +111 -111
- package/src/runtime/pi-spawn.ts +167 -167
- package/src/runtime/policy-engine.ts +79 -79
- package/src/runtime/post-checks.ts +125 -125
- package/src/runtime/post-exit-stdio-guard.ts +86 -86
- package/src/runtime/process-status.ts +97 -73
- package/src/runtime/progress-event-coalescer.ts +43 -43
- package/src/runtime/recovery-recipes.ts +74 -74
- package/src/runtime/retry-executor.ts +81 -81
- package/src/runtime/role-permission.ts +39 -39
- package/src/runtime/run-tracker.ts +99 -0
- package/src/runtime/runtime-policy.ts +21 -0
- package/src/runtime/runtime-resolver.ts +94 -91
- package/src/runtime/scheduler.ts +294 -0
- package/src/runtime/semaphore.ts +131 -131
- package/src/runtime/sensitive-paths.ts +92 -92
- package/src/runtime/session-usage.ts +79 -79
- package/src/runtime/settings-store.ts +103 -0
- package/src/runtime/sidechain-output.ts +29 -29
- package/src/runtime/skill-instructions.ts +222 -222
- package/src/runtime/stale-reconciler.ts +198 -189
- package/src/runtime/streaming-output.ts +47 -0
- package/src/runtime/subagent-manager.ts +404 -400
- package/src/runtime/subprocess-tool-registry.ts +67 -67
- package/src/runtime/task-display.ts +38 -38
- package/src/runtime/task-graph-scheduler.ts +122 -122
- package/src/runtime/task-graph.ts +207 -207
- package/src/runtime/task-output-context.ts +177 -177
- package/src/runtime/task-packet.ts +93 -93
- package/src/runtime/task-quality.ts +207 -207
- package/src/runtime/task-runner/capabilities.ts +78 -78
- package/src/runtime/task-runner/live-executor.ts +131 -113
- package/src/runtime/task-runner/progress.ts +119 -119
- package/src/runtime/task-runner/prompt-builder.ts +139 -139
- package/src/runtime/task-runner/prompt-pipeline.ts +64 -64
- package/src/runtime/task-runner/result-utils.ts +14 -14
- package/src/runtime/task-runner/run-projection.ts +103 -103
- package/src/runtime/task-runner/state-helpers.ts +22 -22
- package/src/runtime/task-runner.ts +469 -459
- package/src/runtime/team-runner.ts +693 -945
- package/src/runtime/usage-tracker.ts +71 -0
- package/src/runtime/worker-heartbeat.ts +21 -21
- package/src/runtime/worker-startup.ts +57 -57
- package/src/runtime/workflow-state.ts +187 -187
- package/src/runtime/yield-handler.ts +190 -190
- package/src/schema/config-schema.ts +172 -168
- package/src/schema/team-tool-schema.ts +126 -126
- package/src/schema/validation-types.ts +151 -148
- package/src/skills/discover-skills.ts +67 -67
- package/src/skills/skill-templates.ts +374 -374
- package/src/state/active-run-registry.ts +227 -191
- package/src/state/artifact-store.ts +130 -129
- package/src/state/atomic-write.ts +262 -195
- package/src/state/blob-store.ts +116 -116
- package/src/state/contracts.ts +111 -111
- package/src/state/event-log-rotation.ts +161 -158
- package/src/state/event-log.ts +383 -303
- package/src/state/event-reconstructor.ts +217 -217
- package/src/state/jsonl-writer.ts +82 -82
- package/src/state/locks.ts +146 -146
- package/src/state/mailbox.ts +446 -405
- package/src/state/state-store.ts +364 -351
- package/src/state/task-claims.ts +44 -44
- package/src/state/types.ts +285 -285
- package/src/state/usage.ts +29 -29
- package/src/subagents/async-entry.ts +1 -1
- package/src/subagents/index.ts +3 -3
- package/src/subagents/live/control.ts +1 -1
- package/src/subagents/live/manager.ts +1 -1
- package/src/subagents/live/realtime.ts +1 -1
- package/src/subagents/live/session-runtime.ts +1 -1
- package/src/subagents/manager.ts +1 -1
- package/src/subagents/spawn.ts +1 -1
- package/src/teams/discover-teams.ts +116 -116
- package/src/teams/team-config.ts +27 -27
- package/src/teams/team-serializer.ts +38 -38
- package/src/types/diff.d.ts +18 -18
- package/src/ui/agent-management-overlay.ts +144 -144
- package/src/ui/crew-widget.ts +487 -370
- package/src/ui/dashboard-panes/agents-pane.ts +109 -28
- package/src/ui/dashboard-panes/cancellation-pane.ts +42 -42
- package/src/ui/dashboard-panes/capability-pane.ts +59 -59
- package/src/ui/dashboard-panes/health-pane.ts +30 -30
- package/src/ui/dashboard-panes/mailbox-pane.ts +35 -35
- package/src/ui/dashboard-panes/progress-pane.ts +30 -30
- package/src/ui/dashboard-panes/transcript-pane.ts +10 -10
- package/src/ui/heartbeat-aggregator.ts +63 -63
- package/src/ui/keybinding-map.ts +97 -94
- package/src/ui/live-conversation-overlay.ts +152 -0
- package/src/ui/live-run-sidebar.ts +180 -180
- package/src/ui/mascot.ts +442 -442
- package/src/ui/overlays/agent-picker-overlay.ts +57 -57
- package/src/ui/overlays/confirm-overlay.ts +58 -58
- package/src/ui/overlays/mailbox-compose-overlay.ts +144 -144
- package/src/ui/overlays/mailbox-compose-preview.ts +63 -63
- package/src/ui/overlays/mailbox-detail-overlay.ts +122 -122
- package/src/ui/pi-ui-compat.ts +57 -57
- package/src/ui/powerbar-publisher.ts +221 -197
- package/src/ui/render-scheduler.ts +216 -143
- package/src/ui/run-action-dispatcher.ts +118 -118
- package/src/ui/run-dashboard.ts +526 -464
- package/src/ui/run-event-bus.ts +208 -208
- package/src/ui/run-snapshot-cache.ts +826 -777
- package/src/ui/settings-overlay.ts +721 -0
- package/src/ui/snapshot-types.ts +86 -70
- package/src/ui/theme-adapter.ts +190 -190
- package/src/ui/tool-progress-formatter.ts +89 -0
- package/src/ui/transcript-cache.ts +94 -94
- package/src/ui/transcript-viewer.ts +335 -335
- package/src/utils/conflict-detect.ts +662 -0
- package/src/utils/file-coalescer.ts +86 -86
- package/src/utils/frontmatter.ts +68 -68
- package/src/utils/fs-watch.ts +88 -31
- package/src/utils/gh-protocol.ts +479 -0
- package/src/utils/ids.ts +17 -17
- package/src/utils/incremental-reader.ts +104 -104
- package/src/utils/internal-error.ts +6 -6
- package/src/utils/names.ts +27 -27
- package/src/utils/paths.ts +102 -63
- package/src/utils/redaction.ts +44 -44
- package/src/utils/safe-paths.ts +47 -47
- package/src/utils/scan-cache.ts +136 -136
- package/src/utils/sse-parser.ts +134 -134
- package/src/utils/task-name-generator.ts +337 -337
- package/src/utils/timings.ts +33 -33
- package/src/utils/visual.ts +243 -198
- package/src/workflows/discover-workflows.ts +139 -139
- package/src/workflows/validate-workflow.ts +40 -40
- package/src/workflows/workflow-config.ts +26 -26
- package/src/workflows/workflow-serializer.ts +32 -32
- package/src/worktree/branch-freshness.ts +45 -45
- package/src/worktree/cleanup.ts +75 -75
- package/src/worktree/worktree-manager.ts +188 -188
- package/teams/default.team.md +12 -12
- package/teams/fast-fix.team.md +11 -11
- package/teams/implementation.team.md +18 -18
- package/teams/parallel-research.team.md +14 -14
- package/teams/research.team.md +11 -11
- package/teams/review.team.md +12 -12
- package/tsconfig.json +19 -19
- package/workflows/default.workflow.md +30 -30
- package/workflows/fast-fix.workflow.md +23 -23
- package/workflows/implementation.workflow.md +43 -43
- package/workflows/parallel-research.workflow.md +46 -46
- package/workflows/research.workflow.md +22 -22
- package/workflows/review.workflow.md +30 -30
- package/skills/task-packet/SKILL.md +0 -28
- package/skills/verify-evidence/SKILL.md +0 -27
|
@@ -0,0 +1,118 @@
|
|
|
1
|
+
/**
 * One model as listed by a registry.
 *
 * `resolveModel` matches a user query against all three fields and refers to
 * a model as "provider/id".
 */
export interface ModelEntry {
  /** Model identifier; the part after the slash in "provider/id". */
  id: string;
  /** Display name; searched as a substring by the fuzzy matcher. */
  name: string;
  /** Provider name; the part before the slash in "provider/id". */
  provider: string;
}
|
|
6
|
+
|
|
7
|
+
/**
 * Minimal registry surface that `resolveModel` relies on.
 *
 * The `any` types are kept on purpose: the concrete model type is owned by
 * the host registry and is not declared in this module.
 */
export interface ModelRegistry {
  /**
   * Look up a model by provider and model id.
   * `resolveModel` treats a falsy result as "not found".
   */
  find(provider: string, modelId: string): any;
  /** Every model the registry knows about. */
  getAll(): any[];
  /**
   * Optional narrower list. When the registry provides this method,
   * `resolveModel` uses its result instead of `getAll()`.
   */
  getAvailable?(): any[];
}
|
|
12
|
+
|
|
13
|
+
/**
 * Resolve a user-supplied model string to a model instance from the registry.
 *
 * Candidates come from `registry.getAvailable()` when the registry provides
 * it, otherwise from `registry.getAll()`. Matching is case-insensitive and
 * ignores leading/trailing whitespace in `input`.
 *
 * Resolution order:
 * 1. Exact "provider/modelId" match against the candidate list.
 * 2. Fuzzy match; the highest score wins and ties go to the earliest candidate:
 *    - 100: query equals the id or "provider/id"
 *    - 60–90: query is a substring of the id or of "provider/id"
 *    - 40–60: query is a substring of the display name
 *    - 20: every token of the query (split on whitespace, "-" and "/")
 *      appears in the id, the name or the provider
 *
 * Blank input never matches.
 *
 * @param input - Model query, e.g. "provider/modelId", a bare id, or a fragment.
 * @param registry - Source of the candidate list and of the returned instance.
 * @returns Whatever `registry.find` returns for the matched entry, or an error
 *   message string listing the candidates when nothing matches.
 */
export function resolveModel(input: string, registry: ModelRegistry): any | string {
  const all = (registry.getAvailable?.() ?? registry.getAll()) as ModelEntry[];
  const trimmed = input.trim();
  const query = trimmed.toLowerCase();

  // An empty query is a substring of every id, so without this guard blank
  // input would silently resolve to the first candidate.
  if (query.length > 0) {
    // Exact match
    const slashIdx = trimmed.indexOf("/");
    if (slashIdx !== -1 && all.some((m) => `${m.provider}/${m.id}`.toLowerCase() === query)) {
      // The registry is queried with the caller's casing; if it rejects that,
      // the fuzzy pass below retries with the candidate's own casing.
      const found = registry.find(trimmed.slice(0, slashIdx), trimmed.slice(slashIdx + 1));
      if (found) return found;
    }

    // Fuzzy match
    // Empty tokens (from leading/trailing separators) are dropped because an
    // empty string is contained in everything.
    const tokens = query.split(/[\s\-/]+/).filter((part) => part.length > 0);
    let bestMatch: ModelEntry | undefined;
    let bestScore = 0;

    for (const m of all) {
      const id = m.id.toLowerCase();
      // Entries are cast from `any[]`, so a missing name is tolerated.
      const name = (m.name ?? "").toLowerCase();
      const provider = m.provider.toLowerCase();
      const full = `${provider}/${id}`;

      let score = 0;
      if (id === query || full === query) {
        score = 100;
      } else if (id.includes(query)) {
        score = 60 + (query.length / id.length) * 30;
      } else if (full.includes(query)) {
        // Scored against the string that actually matched, so the ratio stays
        // below 1 and a substring hit can never outrank an exact match.
        score = 60 + (query.length / full.length) * 30;
      } else if (name.includes(query)) {
        score = 40 + (query.length / name.length) * 20;
      } else if (
        tokens.length > 0 &&
        tokens.every((part) => id.includes(part) || name.includes(part) || provider.includes(part))
      ) {
        score = 20;
      }

      // Strict comparison keeps the earliest candidate on ties.
      if (score > bestScore) {
        bestScore = score;
        bestMatch = m;
      }
    }

    if (bestMatch) {
      const found = registry.find(bestMatch.provider, bestMatch.id);
      if (found) return found;
    }
  }

  const modelList = all
    .map((m) => ` ${m.provider}/${m.id}`)
    .sort()
    .join("\n");
  return `Model not found: "${input}".\n\nAvailable models:\n${modelList}`;
}
|
|
75
|
+
|
|
76
|
+
/**
 * Flat model description accepted by `fuzzyResolveModelId`.
 * Same fields as a registry entry, except that the display name may be absent.
 */
export interface SimpleModelEntry {
  /** Model identifier; the part after the slash in "provider/id". */
  id: string;
  /** Optional display name; treated as an empty string when missing. */
  name?: string;
  /** Provider name; the part before the slash in "provider/id". */
  provider: string;
}
|
|
81
|
+
|
|
82
|
+
/**
 * Fuzzy-match a model query against a flat list of available models.
 *
 * Matching is case-insensitive and ignores leading/trailing whitespace in
 * `input`. The highest score wins and ties go to the earliest entry:
 * - 100: query equals the id or "provider/id"
 * - 60–90: query is a substring of the id or of "provider/id"
 * - 40–60: query is a substring of the display name
 * - 20: every token of the query (split on whitespace, "-" and "/")
 *   appears in the id, the name or the provider
 *
 * @param input - Model query: a full "provider/id", a bare id, or a fragment.
 * @param models - Candidates to search; the list is not modified.
 * @returns The best match as "provider/id" (in the entry's own casing), or
 *   `undefined` when nothing matches or the query is blank.
 */
export function fuzzyResolveModelId(input: string, models: SimpleModelEntry[]): string | undefined {
  const query = input.trim().toLowerCase();
  // An empty query is a substring of every id, so without this guard blank
  // input would silently resolve to the first entry.
  if (query.length === 0) return undefined;

  // Empty tokens (from leading/trailing separators) are dropped because an
  // empty string is contained in everything.
  const tokens = query.split(/[\s\-/]+/).filter((part) => part.length > 0);
  let bestMatch: SimpleModelEntry | undefined;
  let bestScore = 0;

  for (const m of models) {
    const id = m.id.toLowerCase();
    const name = (m.name ?? "").toLowerCase();
    const provider = m.provider.toLowerCase();
    const full = `${provider}/${id}`;

    let score = 0;
    if (id === query || full === query) {
      score = 100;
    } else if (id.includes(query)) {
      score = 60 + (query.length / id.length) * 30;
    } else if (full.includes(query)) {
      // Scored against the string that actually matched: the ratio stays below
      // 1 (so an exact match always wins) and an empty id cannot divide by zero.
      score = 60 + (query.length / full.length) * 30;
    } else if (name.includes(query)) {
      // A non-empty query contained in `name` implies `name` is non-empty.
      score = 40 + (query.length / name.length) * 20;
    } else if (
      tokens.length > 0 &&
      tokens.every((part) => id.includes(part) || name.includes(part) || provider.includes(part))
    ) {
      score = 20;
    }

    // Strict comparison keeps the earliest entry on ties.
    if (score > bestScore) {
      bestScore = score;
      bestMatch = m;
    }
  }

  return bestMatch ? `${bestMatch.provider}/${bestMatch.id}` : undefined;
}
|
|
@@ -1,187 +1,187 @@
|
|
|
1
|
-
/**
|
|
2
|
-
* Phase 4 (caveman): Output format validation for live-session workers.
|
|
3
|
-
*
|
|
4
|
-
* Validates that worker output conforms to the structured output contract
|
|
5
|
-
* for the given role. If validation fails, returns structured error info
|
|
6
|
-
* that can be used for retry or fallback.
|
|
7
|
-
*
|
|
8
|
-
* Inspired by caveman's validate.py — check structural preservation
|
|
9
|
-
* (headings, code blocks, URLs) after compression.
|
|
10
|
-
*/
|
|
11
|
-
|
|
12
|
-
/** Role-specific output format patterns — constructed fresh per call to avoid /g lastIndex leak */
|
|
13
|
-
const ROLE_PATTERN_DEFS: Record<string, () => RegExp> = {
|
|
14
|
-
explorer: () => /^(\S+:\d+|Defs:|Refs:|Callers:|Tests:|Sites:|No match\.|totals:)/m,
|
|
15
|
-
executor: () => /^(\S+:\d+(-\d+)? — .{1,80}\.|verified:|too-big\.|needs-confirm\.|ambiguous\.|regressed\.)/m,
|
|
16
|
-
reviewer: () => /^([^:\s]+:\d+:\s+\p{Emoji_Presentation}|No issues\.|totals:)/mu,
|
|
17
|
-
"security-reviewer": () => /^([^:\s]+:\d+:\s+\p{Emoji_Presentation}|No issues\.|totals:)/mu,
|
|
18
|
-
verifier: () => /^(PASS:|FAIL:)/m,
|
|
19
|
-
};
|
|
20
|
-
|
|
21
|
-
/** Fresh RegExp factories for structural preservation checks (avoids /g lastIndex leak) */
|
|
22
|
-
const makeUrlRe = () => /\bhttps?:\/\/[^\s<>)\]"',;]+/gi;
|
|
23
|
-
const makeFencedCodeRe = () => /```[\s\S]*?```/g;
|
|
24
|
-
const makeInlineCodeRe = () => /`[^`\n]+`/g;
|
|
25
|
-
const makeHeadingRe = () => /^#{1,6}\s+.+/gm;
|
|
26
|
-
|
|
27
|
-
export interface OutputValidationResult {
|
|
28
|
-
/** Whether the output passes validation */
|
|
29
|
-
valid: boolean;
|
|
30
|
-
/** Whether the output follows the role's contract format */
|
|
31
|
-
formatMatch: boolean;
|
|
32
|
-
/** Whether structural elements (code, URLs, headings) are preserved */
|
|
33
|
-
structurePreserved: boolean;
|
|
34
|
-
/** Specific issues found */
|
|
35
|
-
issues: string[];
|
|
36
|
-
}
|
|
37
|
-
|
|
38
|
-
/**
|
|
39
|
-
* Validate worker output against role-specific contract + structural preservation.
|
|
40
|
-
*/
|
|
41
|
-
export function validateWorkerOutput(role: string, output: string): OutputValidationResult {
|
|
42
|
-
const issues: string[] = [];
|
|
43
|
-
|
|
44
|
-
// Empty output always fails
|
|
45
|
-
if (!output || !output.trim()) {
|
|
46
|
-
return { valid: false, formatMatch: false, structurePreserved: false, issues: ["Empty output"] };
|
|
47
|
-
}
|
|
48
|
-
|
|
49
|
-
// Check role-specific format
|
|
50
|
-
const patternFactory = ROLE_PATTERN_DEFS[role];
|
|
51
|
-
const pattern = patternFactory ? patternFactory() : undefined;
|
|
52
|
-
const formatMatch = !pattern || pattern.test(output);
|
|
53
|
-
if (!formatMatch) {
|
|
54
|
-
issues.push(`Output does not match expected ${role} contract format`);
|
|
55
|
-
}
|
|
56
|
-
|
|
57
|
-
// Check structural preservation (code blocks, URLs, headings)
|
|
58
|
-
let structurePreserved = true;
|
|
59
|
-
const trimmedOutput = output.trim();
|
|
60
|
-
|
|
61
|
-
// Detect if output was truncated mid-code-block
|
|
62
|
-
const opens = (trimmedOutput.match(/```/g) ?? []).length;
|
|
63
|
-
if (opens % 2 !== 0) {
|
|
64
|
-
structurePreserved = false;
|
|
65
|
-
issues.push("Unclosed code block — output may be truncated");
|
|
66
|
-
}
|
|
67
|
-
|
|
68
|
-
// Check for malformed URLs
|
|
69
|
-
const urls = trimmedOutput.match(makeUrlRe()) ?? [];
|
|
70
|
-
for (const url of urls) {
|
|
71
|
-
if (url.endsWith(".") || url.endsWith(",")) {
|
|
72
|
-
structurePreserved = false;
|
|
73
|
-
issues.push(`URL with trailing punctuation: ${url.slice(-20)}`);
|
|
74
|
-
}
|
|
75
|
-
}
|
|
76
|
-
|
|
77
|
-
return {
|
|
78
|
-
valid: formatMatch && structurePreserved,
|
|
79
|
-
formatMatch,
|
|
80
|
-
structurePreserved,
|
|
81
|
-
issues,
|
|
82
|
-
};
|
|
83
|
-
}
|
|
84
|
-
|
|
85
|
-
/**
|
|
86
|
-
* Extract structured findings from reviewer output.
|
|
87
|
-
* Returns array of { file, line, severity, message } objects.
|
|
88
|
-
*/
|
|
89
|
-
export function parseReviewerFindings(output: string): Array<{ file: string; line: number; severity: string; message: string }> {
|
|
90
|
-
const findings: Array<{ file: string; line: number; severity: string; message: string }> = [];
|
|
91
|
-
const lines = output.split("\n");
|
|
92
|
-
|
|
93
|
-
const SEVERITY_MAP: Record<string, string> = {
|
|
94
|
-
"🔴": "bug",
|
|
95
|
-
"🟡": "risk",
|
|
96
|
-
"🔵": "nit",
|
|
97
|
-
"❓": "question",
|
|
98
|
-
};
|
|
99
|
-
|
|
100
|
-
for (const line of lines) {
|
|
101
|
-
// Match: path/to/file.ts:42: 🔴 bug: problem. fix.
|
|
102
|
-
const match = line.match(/^([^:\s]+):(\d+):\s+(\p{Emoji_Presentation}) (\w+):\s+(.+)/u);
|
|
103
|
-
if (match) {
|
|
104
|
-
findings.push({
|
|
105
|
-
file: match[1],
|
|
106
|
-
line: Number(match[2]),
|
|
107
|
-
severity: SEVERITY_MAP[match[3]] ?? match[3],
|
|
108
|
-
message: match[5].trim(),
|
|
109
|
-
});
|
|
110
|
-
}
|
|
111
|
-
}
|
|
112
|
-
|
|
113
|
-
return findings;
|
|
114
|
-
}
|
|
115
|
-
|
|
116
|
-
/**
|
|
117
|
-
* Extract explorer results from structured output.
|
|
118
|
-
* Returns array of { file, line, symbol, note } objects.
|
|
119
|
-
*/
|
|
120
|
-
export function parseExplorerResults(output: string): Array<{ file: string; line: number; symbol: string; note: string }> {
|
|
121
|
-
const results: Array<{ file: string; line: number; symbol: string; note: string }> = [];
|
|
122
|
-
const lines = output.split("\n");
|
|
123
|
-
|
|
124
|
-
for (const line of lines) {
|
|
125
|
-
// Match: path/to/file.ts:42 — `symbol` — note
|
|
126
|
-
const match = line.match(/^[- ]*(\S+):(\d+)\s*[—–-]\s*`([^`]+)`\s*[—–-]\s*(.+)/);
|
|
127
|
-
if (match) {
|
|
128
|
-
results.push({
|
|
129
|
-
file: match[1],
|
|
130
|
-
line: Number(match[2]),
|
|
131
|
-
symbol: match[3],
|
|
132
|
-
note: match[4].trim(),
|
|
133
|
-
});
|
|
134
|
-
}
|
|
135
|
-
}
|
|
136
|
-
|
|
137
|
-
return results;
|
|
138
|
-
}
|
|
139
|
-
|
|
140
|
-
/**
|
|
141
|
-
* Validate that compressed prose preserves structural elements from original.
|
|
142
|
-
* Returns list of specific issues (empty = valid).
|
|
143
|
-
*/
|
|
144
|
-
export function validateCompressionPreservation(original: string, compressed: string): string[] {
|
|
145
|
-
const issues: string[] = [];
|
|
146
|
-
|
|
147
|
-
// Check code blocks preserved
|
|
148
|
-
const origBlocks = original.match(makeFencedCodeRe()) ?? [];
|
|
149
|
-
const compBlocks = compressed.match(makeFencedCodeRe()) ?? [];
|
|
150
|
-
if (origBlocks.length !== compBlocks.length) {
|
|
151
|
-
issues.push(`Code block count: ${origBlocks.length} → ${compBlocks.length}`);
|
|
152
|
-
}
|
|
153
|
-
for (let i = 0; i < Math.min(origBlocks.length, compBlocks.length); i++) {
|
|
154
|
-
if (origBlocks[i] !== compBlocks[i]) {
|
|
155
|
-
issues.push(`Code block ${i + 1} content changed`);
|
|
156
|
-
}
|
|
157
|
-
}
|
|
158
|
-
|
|
159
|
-
// Check URLs preserved
|
|
160
|
-
const origUrls = new Set(original.match(makeUrlRe()) ?? []);
|
|
161
|
-
const compUrls = new Set(compressed.match(makeUrlRe()) ?? []);
|
|
162
|
-
for (const url of origUrls) {
|
|
163
|
-
if (!compUrls.has(url)) {
|
|
164
|
-
issues.push(`URL lost: ${url.slice(0, 60)}...`);
|
|
165
|
-
}
|
|
166
|
-
}
|
|
167
|
-
|
|
168
|
-
// Check inline code preserved
|
|
169
|
-
const origInline = original.match(makeInlineCodeRe()) ?? [];
|
|
170
|
-
const compInline = compressed.match(makeInlineCodeRe()) ?? [];
|
|
171
|
-
const origInlineSet = new Set(origInline);
|
|
172
|
-
const compInlineSet = new Set(compInline);
|
|
173
|
-
for (const code of origInlineSet) {
|
|
174
|
-
if (!compInlineSet.has(code)) {
|
|
175
|
-
issues.push(`Inline code lost: ${code}`);
|
|
176
|
-
}
|
|
177
|
-
}
|
|
178
|
-
|
|
179
|
-
// Check headings preserved
|
|
180
|
-
const origHeadings = original.match(makeHeadingRe()) ?? [];
|
|
181
|
-
const compHeadings = compressed.match(makeHeadingRe()) ?? [];
|
|
182
|
-
if (origHeadings.length !== compHeadings.length) {
|
|
183
|
-
issues.push(`Heading count: ${origHeadings.length} → ${compHeadings.length}`);
|
|
184
|
-
}
|
|
185
|
-
|
|
186
|
-
return issues;
|
|
187
|
-
}
|
|
1
|
+
/**
|
|
2
|
+
* Phase 4 (caveman): Output format validation for live-session workers.
|
|
3
|
+
*
|
|
4
|
+
* Validates that worker output conforms to the structured output contract
|
|
5
|
+
* for the given role. If validation fails, returns structured error info
|
|
6
|
+
* that can be used for retry or fallback.
|
|
7
|
+
*
|
|
8
|
+
* Inspired by caveman's validate.py — check structural preservation
|
|
9
|
+
* (headings, code blocks, URLs) after compression.
|
|
10
|
+
*/
|
|
11
|
+
|
|
12
|
+
/**
 * Role-specific output format patterns, keyed by worker role.
 *
 * Each entry is a factory, so every call hands back a fresh RegExp instance
 * and no regex state is shared between validations. Roles without an entry
 * have no format contract.
 */
const ROLE_PATTERN_DEFS: Record<string, () => RegExp> = {
  explorer() {
    return /^(\S+:\d+|Defs:|Refs:|Callers:|Tests:|Sites:|No match\.|totals:)/m;
  },
  executor() {
    return /^(\S+:\d+(-\d+)? — .{1,80}\.|verified:|too-big\.|needs-confirm\.|ambiguous\.|regressed\.)/m;
  },
  reviewer() {
    return /^([^:\s]+:\d+:\s+\p{Emoji_Presentation}|No issues\.|totals:)/mu;
  },
  // Same contract as `reviewer`.
  "security-reviewer"() {
    return /^([^:\s]+:\d+:\s+\p{Emoji_Presentation}|No issues\.|totals:)/mu;
  },
  verifier() {
    return /^(PASS:|FAIL:)/m;
  },
};
|
|
20
|
+
|
|
21
|
+
/**
 * RegExp factories for the structural preservation checks.
 * All of these patterns are global (`g`), so each call builds a new instance
 * and no `lastIndex` state is carried from one use to the next.
 */

/** http/https URLs, ending at whitespace or one of `< > ) ] " ' , ;`. */
function makeUrlRe(): RegExp {
  return /\bhttps?:\/\/[^\s<>)\]"',;]+/gi;
}

/** Fenced code blocks: from a triple backtick to the nearest following one. */
function makeFencedCodeRe(): RegExp {
  return /```[\s\S]*?```/g;
}

/** Inline code spans: a backtick pair on one line with at least one character inside. */
function makeInlineCodeRe(): RegExp {
  return /`[^`\n]+`/g;
}

/** Markdown ATX headings: 1–6 `#` at line start, then whitespace and text. */
function makeHeadingRe(): RegExp {
  return /^#{1,6}\s+.+/gm;
}
|
|
26
|
+
|
|
27
|
+
/** Outcome of validating one worker output with `validateWorkerOutput`. */
export interface OutputValidationResult {
  /** Overall verdict: true only when both `formatMatch` and `structurePreserved` are true. */
  valid: boolean;
  /** True when the output follows the role's contract format, or the role has no contract. */
  formatMatch: boolean;
  /** True when no structural problem (unclosed code fence, URL with trailing punctuation) was found. */
  structurePreserved: boolean;
  /** One human-readable message per problem found; empty when there is none. */
  issues: string[];
}
|
|
37
|
+
|
|
38
|
+
/**
 * Validate worker output against the role-specific contract and basic
 * structural checks.
 *
 * Checks, in order:
 * 1. Empty or whitespace-only output fails immediately.
 * 2. If `ROLE_PATTERN_DEFS` has a pattern for `role`, the output must match
 *    it; roles without a pattern pass the format check.
 * 3. An odd number of triple-backtick fences is reported as an unclosed code block.
 * 4. Every URL that ends in "." or "," is reported.
 *
 * @param role - Worker role name used to select the contract pattern.
 * @param output - Raw worker output text.
 * @returns The verdict plus one message per problem found.
 */
export function validateWorkerOutput(role: string, output: string): OutputValidationResult {
  // Empty output always fails
  if (!output || !output.trim()) {
    return { valid: false, formatMatch: false, structurePreserved: false, issues: ["Empty output"] };
  }

  const issues: string[] = [];

  // Check role-specific format.
  // Own-property lookup only: a plain index would also resolve inherited
  // Object.prototype members for roles such as "constructor" or "toString",
  // and calling those as pattern factories throws.
  const patternFactory = Object.prototype.hasOwnProperty.call(ROLE_PATTERN_DEFS, role)
    ? ROLE_PATTERN_DEFS[role]
    : undefined;
  const formatMatch = patternFactory ? patternFactory().test(output) : true;
  if (!formatMatch) {
    issues.push(`Output does not match expected ${role} contract format`);
  }

  // Check structural preservation (code blocks, URLs)
  let structurePreserved = true;
  const trimmedOutput = output.trim();

  // Detect if output was truncated mid-code-block: fences must come in pairs
  const fenceCount = (trimmedOutput.match(/```/g) ?? []).length;
  if (fenceCount % 2 !== 0) {
    structurePreserved = false;
    issues.push("Unclosed code block — output may be truncated");
  }

  // Check for malformed URLs
  for (const url of trimmedOutput.match(makeUrlRe()) ?? []) {
    if (url.endsWith(".") || url.endsWith(",")) {
      structurePreserved = false;
      // Only the tail of the URL is reported to keep the message short.
      issues.push(`URL with trailing punctuation: ${url.slice(-20)}`);
    }
  }

  return {
    valid: formatMatch && structurePreserved,
    formatMatch,
    structurePreserved,
    issues,
  };
}
|
|
84
|
+
|
|
85
|
+
/**
 * Pull structured findings out of reviewer output.
 *
 * Each line is tested on its own against the shape
 * `path/to/file.ts:42: 🔴 bug: problem. fix.`; lines that do not match are
 * ignored. The severity comes from the emoji marker (🔴 bug, 🟡 risk, 🔵 nit,
 * ❓ question); an unrecognized marker is passed through unchanged. The word
 * label after the marker is required by the pattern but not returned.
 *
 * @param output - Raw reviewer output text.
 * @returns One `{ file, line, severity, message }` object per matching line, in input order.
 */
export function parseReviewerFindings(output: string): Array<{ file: string; line: number; severity: string; message: string }> {
	type Finding = { file: string; line: number; severity: string; message: string };

	const severityByMarker: Record<string, string> = {
		"🔴": "bug",
		"🟡": "risk",
		"🔵": "nit",
		"❓": "question",
	};
	// Match: path/to/file.ts:42: 🔴 bug: problem. fix.
	const findingRe = /^([^:\s]+):(\d+):\s+(\p{Emoji_Presentation}) (\w+):\s+(.+)/u;

	return output.split("\n").flatMap((text): Finding[] => {
		const hit = findingRe.exec(text);
		if (hit === null) {
			return [];
		}
		// Group 4 (the word label) is matched but intentionally unused.
		const [, file, lineNo, marker, , body] = hit;
		return [
			{
				file,
				line: Number(lineNo),
				severity: severityByMarker[marker] ?? marker,
				message: body.trim(),
			},
		];
	});
}
|
|
115
|
+
|
|
116
|
+
/**
 * Pull structured results out of explorer output.
 *
 * Each line is tested on its own against the shape
 * ``path/to/file.ts:42 — `symbol` — note``. Leading spaces and dashes (list
 * bullets) are allowed, and each separator may be an em dash, an en dash, or
 * a hyphen. Lines that do not match are ignored.
 *
 * @param output - Raw explorer output text.
 * @returns One `{ file, line, symbol, note }` object per matching line, in input order.
 */
export function parseExplorerResults(output: string): Array<{ file: string; line: number; symbol: string; note: string }> {
	type ExplorerHit = { file: string; line: number; symbol: string; note: string };

	// Match: path/to/file.ts:42 — `symbol` — note
	const resultRe = /^[- ]*(\S+):(\d+)\s*[—–-]\s*`([^`]+)`\s*[—–-]\s*(.+)/;

	return output.split("\n").flatMap((text): ExplorerHit[] => {
		const hit = resultRe.exec(text);
		if (hit === null) {
			return [];
		}
		const [, file, lineNo, symbol, remark] = hit;
		return [{ file, line: Number(lineNo), symbol, note: remark.trim() }];
	});
}
|
|
139
|
+
|
|
140
|
+
/**
 * Compare a compressed text against its original and report structural
 * elements that were not carried over.
 *
 * Checks, in reporting order:
 * - fenced code blocks: same count, and identical content position by position;
 * - URLs: every distinct URL in the original must appear in the compressed text;
 * - inline code: every distinct inline span in the original must appear in the compressed text;
 * - headings: same count (heading text itself is not compared).
 *
 * @param original - Text before compression.
 * @param compressed - Text after compression.
 * @returns Descriptions of each problem found; an empty array means nothing was lost.
 */
export function validateCompressionPreservation(original: string, compressed: string): string[] {
	const problems: string[] = [];
	// Small local wrapper so every check reads "all matches, or none".
	const collect = (text: string, re: RegExp): string[] => text.match(re) ?? [];

	// Fenced code blocks: the count must match, and overlapping positions must be identical.
	const blocksBefore = collect(original, makeFencedCodeRe());
	const blocksAfter = collect(compressed, makeFencedCodeRe());
	if (blocksBefore.length !== blocksAfter.length) {
		problems.push(`Code block count: ${blocksBefore.length} → ${blocksAfter.length}`);
	}
	const comparable = Math.min(blocksBefore.length, blocksAfter.length);
	for (let idx = 0; idx < comparable; idx += 1) {
		if (blocksBefore[idx] !== blocksAfter[idx]) {
			problems.push(`Code block ${idx + 1} content changed`);
		}
	}

	// URLs: compared as sets, so ordering and repetition do not matter.
	const urlsBefore = new Set(collect(original, makeUrlRe()));
	const urlsAfter = new Set(collect(compressed, makeUrlRe()));
	for (const url of urlsBefore) {
		if (!urlsAfter.has(url)) {
			problems.push(`URL lost: ${url.slice(0, 60)}...`);
		}
	}

	// Inline code spans: compared as sets, like URLs.
	const inlineBefore = new Set(collect(original, makeInlineCodeRe()));
	const inlineAfter = new Set(collect(compressed, makeInlineCodeRe()));
	for (const span of inlineBefore) {
		if (!inlineAfter.has(span)) {
			problems.push(`Inline code lost: ${span}`);
		}
	}

	// Headings: only the number of headings is compared.
	const headingsBefore = collect(original, makeHeadingRe()).length;
	const headingsAfter = collect(compressed, makeHeadingRe()).length;
	if (headingsBefore !== headingsAfter) {
		problems.push(`Heading count: ${headingsBefore} → ${headingsAfter}`);
	}

	return problems;
}
|