npm - pi-crew - Versions diffs - 0.2.3 → 0.2.4 - Mend

pi-crew 0.2.3 → 0.2.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (348) hide show

package/AGENTS.md +57 -32
package/CHANGELOG.md +466 -448
package/LICENSE +21 -21
package/NOTICE.md +16 -16
package/README.md +323 -323
package/docs/FEATURE_INTAKE.md +126 -0
package/docs/HARNESS.md +86 -0
package/docs/HARNESS_BACKLOG.md +41 -0
package/docs/TEST_MATRIX.md +49 -0
package/docs/actions-reference.md +595 -595
package/docs/architecture.md +180 -180
package/docs/code-review-2026-05-11.md +592 -592
package/docs/commands-reference.md +347 -347
package/docs/comparison-pi-subagents-vs-pi-crew.md +303 -0
package/docs/decisions/0001-durable-state.md +41 -0
package/docs/decisions/0002-child-process-for-async.md +42 -0
package/docs/decisions/0003-depth-guard.md +36 -0
package/docs/decisions/0004-execfile-over-exec.md +34 -0
package/docs/decisions/0005-no-parameter-properties.md +49 -0
package/docs/decisions/0006-publish-bundled-esm.md +63 -0
package/docs/decisions/0007-active-run-binary-index.md +54 -0
package/docs/decisions/0008-child-pi-warm-pool.md +61 -0
package/docs/decisions/README.md +23 -0
package/docs/followup-review-round4-2026-05-13.md +107 -0
package/docs/implementation-plan-top3.md +333 -0
package/docs/live-mailbox-runtime.md +36 -36
package/docs/next-upgrade-roadmap.md +808 -808
package/docs/oh-my-pi-research.md +509 -0
package/docs/perf/baseline-2026-05.md +113 -0
package/docs/perf/final-report-2026-05.md +206 -0
package/docs/perf/sprint-1-report.md +71 -0
package/docs/perf/sprint-2-report.md +81 -0
package/docs/perf/sprint-2.5-report.md +53 -0
package/docs/perf/sprint-3-report.md +36 -0
package/docs/perf/sprint-4-report.md +47 -0
package/docs/perf/sprint-5-report.md +51 -0
package/docs/perf/sprint-6-report.md +94 -0
package/docs/perf/sprint-7-report.md +74 -0
package/docs/perf/upgrade-plan-2026-05.md +147 -0
package/docs/pi-subagents3-deep-analysis.md +508 -0
package/docs/product/README.md +31 -0
package/docs/product/platform.md +27 -0
package/docs/product/runtime-safety.md +37 -0
package/docs/product/team-run.md +39 -0
package/docs/product/team-tool.md +37 -0
package/docs/publishing.md +65 -65
package/docs/resource-formats.md +134 -134
package/docs/runtime-analysis-child-vs-live.md +171 -0
package/docs/runtime-flow.md +148 -148
package/docs/runtime-migration-in-process-analysis.md +250 -0
package/docs/stories/README.md +30 -0
package/docs/stories/backlog.md +36 -0
package/docs/templates/decision.md +27 -0
package/docs/templates/story.md +44 -0
package/docs/templates/validation-report.md +32 -0
package/docs/usage.md +238 -238
package/index.ts +7 -6
package/install.mjs +65 -65
package/package.json +107 -100
package/schema.json +222 -222
package/skills/child-pi-spawning/SKILL.md +213 -0
package/skills/context-artifact-hygiene/SKILL.md +32 -0
package/skills/event-log-tracing/SKILL.md +299 -0
package/skills/git-master/SKILL.md +225 -24
package/skills/live-agent-lifecycle/SKILL.md +192 -0
package/skills/mailbox-interactive/SKILL.md +300 -19
package/skills/model-routing-context/SKILL.md +94 -0
package/skills/multi-perspective-review/SKILL.md +88 -0
package/skills/read-only-explorer/SKILL.md +250 -26
package/skills/safe-bash/SKILL.md +307 -21
package/skills/verification-before-done/SKILL.md +11 -2
package/skills/widget-rendering/SKILL.md +258 -0
package/skills/workspace-isolation/SKILL.md +202 -0
package/skills/worktree-isolation/SKILL.md +202 -18
package/src/adapters/claude-adapter.ts +25 -25
package/src/adapters/codex-adapter.ts +21 -21
package/src/adapters/cursor-adapter.ts +17 -17
package/src/adapters/export-util.ts +137 -137
package/src/adapters/index.ts +15 -15
package/src/adapters/registry.ts +18 -18
package/src/adapters/types.ts +23 -23
package/src/agents/agent-config.ts +38 -38
package/src/agents/agent-serializer.ts +38 -38
package/src/agents/discover-agents.ts +121 -118
package/src/config/config.ts +740 -858
package/src/config/defaults.ts +96 -96
package/src/config/drift-detector.ts +211 -211
package/src/config/markers.ts +327 -327
package/src/config/resilient-parser.ts +109 -108
package/src/config/suggestions.ts +74 -74
package/src/config/types.ts +199 -0
package/src/extension/async-notifier.ts +123 -89
package/src/extension/autonomous-policy.ts +169 -169
package/src/extension/cross-extension-rpc.ts +104 -104
package/src/extension/help.ts +47 -47
package/src/extension/import-index.ts +69 -69
package/src/extension/management.ts +395 -382
package/src/extension/notification-router.ts +116 -116
package/src/extension/notification-sink.ts +51 -51
package/src/extension/project-init.ts +168 -168
package/src/extension/register.ts +859 -668
package/src/extension/registration/artifact-cleanup.ts +15 -15
package/src/extension/registration/command-utils.ts +54 -54
package/src/extension/registration/commands.ts +559 -452
package/src/extension/registration/compaction-guard.ts +125 -125
package/src/extension/registration/subagent-helpers.ts +102 -102
package/src/extension/registration/subagent-tools.ts +220 -159
package/src/extension/registration/team-tool.ts +159 -99
package/src/extension/registration/viewers.ts +29 -0
package/src/extension/result-watcher.ts +128 -128
package/src/extension/run-bundle-schema.ts +89 -89
package/src/extension/run-export.ts +73 -73
package/src/extension/run-import.ts +84 -84
package/src/extension/run-index.ts +94 -94
package/src/extension/run-maintenance.ts +142 -142
package/src/extension/session-summary.ts +8 -8
package/src/extension/team-manager-command.ts +96 -96
package/src/extension/team-recommendation.ts +188 -188
package/src/extension/team-tool/api.ts +5 -2
package/src/extension/team-tool/cancel.ts +224 -209
package/src/extension/team-tool/config-patch.ts +36 -36
package/src/extension/team-tool/context.ts +60 -60
package/src/extension/team-tool/doctor.ts +242 -242
package/src/extension/team-tool/handle-settings.ts +421 -195
package/src/extension/team-tool/inspect.ts +41 -41
package/src/extension/team-tool/lifecycle-actions.ts +139 -139
package/src/extension/team-tool/parallel-dispatch.ts +156 -156
package/src/extension/team-tool/plan.ts +19 -19
package/src/extension/team-tool/respond.ts +112 -111
package/src/extension/team-tool/run.ts +246 -229
package/src/extension/team-tool/status.ts +110 -110
package/src/extension/team-tool-types.ts +13 -13
package/src/extension/team-tool.ts +344 -344
package/src/extension/tool-result.ts +16 -16
package/src/extension/validate-resources.ts +77 -77
package/src/hooks/registry.ts +61 -61
package/src/hooks/types.ts +40 -40
package/src/i18n.ts +184 -184
package/src/observability/correlation.ts +35 -35
package/src/observability/event-to-metric.ts +68 -68
package/src/observability/exporters/adapter.ts +30 -30
package/src/observability/exporters/otlp-exporter.ts +106 -92
package/src/observability/exporters/prometheus-exporter.ts +54 -54
package/src/observability/metric-registry.ts +87 -87
package/src/observability/metric-retention.ts +54 -54
package/src/observability/metric-sink.ts +81 -56
package/src/observability/metrics-primitives.ts +167 -167
package/src/prompt/prompt-runtime.ts +72 -72
package/src/runtime/adaptive-plan.ts +338 -0
package/src/runtime/agent-control.ts +169 -169
package/src/runtime/agent-memory.ts +72 -72
package/src/runtime/agent-observability.ts +114 -114
package/src/runtime/async-marker.ts +26 -26
package/src/runtime/async-runner.ts +153 -153
package/src/runtime/attention-events.ts +28 -28
package/src/runtime/auto-resume.ts +100 -100
package/src/runtime/background-runner.ts +122 -89
package/src/runtime/cancellation.ts +61 -61
package/src/runtime/capability-inventory.ts +116 -116
package/src/runtime/child-pi-pool.ts +68 -0
package/src/runtime/child-pi.ts +541 -461
package/src/runtime/code-summary.ts +247 -247
package/src/runtime/compaction-summary.ts +271 -271
package/src/runtime/concurrency.ts +58 -58
package/src/runtime/crash-recovery.ts +317 -301
package/src/runtime/crew-agent-records.ts +379 -281
package/src/runtime/crew-agent-runtime.ts +60 -60
package/src/runtime/cross-extension-rpc.ts +72 -0
package/src/runtime/custom-tools/irc-tool.ts +201 -201
package/src/runtime/custom-tools/submit-result-tool.ts +90 -90
package/src/runtime/deadletter.ts +47 -47
package/src/runtime/delivery-coordinator.ts +176 -176
package/src/runtime/delta-conflict.ts +360 -360
package/src/runtime/diagnostic-export.ts +102 -102
package/src/runtime/direct-run.ts +35 -35
package/src/runtime/effectiveness.ts +82 -81
package/src/runtime/errors/crew-errors.ts +166 -0
package/src/runtime/event-stream-bridge.ts +92 -92
package/src/runtime/foreground-control.ts +82 -82
package/src/runtime/green-contract.ts +46 -46
package/src/runtime/group-join.ts +234 -106
package/src/runtime/heartbeat-watcher.ts +145 -124
package/src/runtime/iteration-hooks.ts +267 -267
package/src/runtime/live-agent-control.ts +88 -88
package/src/runtime/live-agent-manager.ts +377 -179
package/src/runtime/live-control-realtime.ts +36 -36
package/src/runtime/live-session-runtime.ts +676 -600
package/src/runtime/loop-gates.ts +129 -129
package/src/runtime/manifest-cache.ts +263 -263
package/src/runtime/mcp-proxy.ts +113 -113
package/src/runtime/metric-parser.ts +40 -40
package/src/runtime/model-fallback.ts +282 -274
package/src/runtime/model-resolver.ts +118 -0
package/src/runtime/output-validator.ts +187 -187
package/src/runtime/overflow-recovery.ts +175 -175
package/src/runtime/parallel-research.ts +44 -44
package/src/runtime/parallel-utils.ts +156 -156
package/src/runtime/parent-guard.ts +80 -80
package/src/runtime/phase-progress.ts +217 -217
package/src/runtime/pi-args.ts +165 -165
package/src/runtime/pi-json-output.ts +111 -111
package/src/runtime/pi-spawn.ts +167 -167
package/src/runtime/policy-engine.ts +79 -79
package/src/runtime/post-checks.ts +125 -125
package/src/runtime/post-exit-stdio-guard.ts +86 -86
package/src/runtime/process-status.ts +97 -73
package/src/runtime/progress-event-coalescer.ts +43 -43
package/src/runtime/recovery-recipes.ts +74 -74
package/src/runtime/retry-executor.ts +81 -81
package/src/runtime/role-permission.ts +39 -39
package/src/runtime/run-tracker.ts +99 -0
package/src/runtime/runtime-policy.ts +21 -0
package/src/runtime/runtime-resolver.ts +94 -91
package/src/runtime/scheduler.ts +294 -0
package/src/runtime/semaphore.ts +131 -131
package/src/runtime/sensitive-paths.ts +92 -92
package/src/runtime/session-usage.ts +79 -79
package/src/runtime/settings-store.ts +103 -0
package/src/runtime/sidechain-output.ts +29 -29
package/src/runtime/skill-instructions.ts +222 -222
package/src/runtime/stale-reconciler.ts +198 -189
package/src/runtime/streaming-output.ts +47 -0
package/src/runtime/subagent-manager.ts +404 -400
package/src/runtime/subprocess-tool-registry.ts +67 -67
package/src/runtime/task-display.ts +38 -38
package/src/runtime/task-graph-scheduler.ts +122 -122
package/src/runtime/task-graph.ts +207 -207
package/src/runtime/task-output-context.ts +177 -177
package/src/runtime/task-packet.ts +93 -93
package/src/runtime/task-quality.ts +207 -207
package/src/runtime/task-runner/capabilities.ts +78 -78
package/src/runtime/task-runner/live-executor.ts +131 -113
package/src/runtime/task-runner/progress.ts +119 -119
package/src/runtime/task-runner/prompt-builder.ts +139 -139
package/src/runtime/task-runner/prompt-pipeline.ts +64 -64
package/src/runtime/task-runner/result-utils.ts +14 -14
package/src/runtime/task-runner/run-projection.ts +103 -103
package/src/runtime/task-runner/state-helpers.ts +22 -22
package/src/runtime/task-runner.ts +469 -459
package/src/runtime/team-runner.ts +693 -945
package/src/runtime/usage-tracker.ts +71 -0
package/src/runtime/worker-heartbeat.ts +21 -21
package/src/runtime/worker-startup.ts +57 -57
package/src/runtime/workflow-state.ts +187 -187
package/src/runtime/yield-handler.ts +190 -190
package/src/schema/config-schema.ts +172 -168
package/src/schema/team-tool-schema.ts +126 -126
package/src/schema/validation-types.ts +151 -148
package/src/skills/discover-skills.ts +67 -67
package/src/skills/skill-templates.ts +374 -374
package/src/state/active-run-registry.ts +227 -191
package/src/state/artifact-store.ts +130 -129
package/src/state/atomic-write.ts +262 -195
package/src/state/blob-store.ts +116 -116
package/src/state/contracts.ts +111 -111
package/src/state/event-log-rotation.ts +161 -158
package/src/state/event-log.ts +383 -303
package/src/state/event-reconstructor.ts +217 -217
package/src/state/jsonl-writer.ts +82 -82
package/src/state/locks.ts +146 -146
package/src/state/mailbox.ts +446 -405
package/src/state/state-store.ts +364 -351
package/src/state/task-claims.ts +44 -44
package/src/state/types.ts +285 -285
package/src/state/usage.ts +29 -29
package/src/subagents/async-entry.ts +1 -1
package/src/subagents/index.ts +3 -3
package/src/subagents/live/control.ts +1 -1
package/src/subagents/live/manager.ts +1 -1
package/src/subagents/live/realtime.ts +1 -1
package/src/subagents/live/session-runtime.ts +1 -1
package/src/subagents/manager.ts +1 -1
package/src/subagents/spawn.ts +1 -1
package/src/teams/discover-teams.ts +116 -116
package/src/teams/team-config.ts +27 -27
package/src/teams/team-serializer.ts +38 -38
package/src/types/diff.d.ts +18 -18
package/src/ui/agent-management-overlay.ts +144 -144
package/src/ui/crew-widget.ts +487 -370
package/src/ui/dashboard-panes/agents-pane.ts +109 -28
package/src/ui/dashboard-panes/cancellation-pane.ts +42 -42
package/src/ui/dashboard-panes/capability-pane.ts +59 -59
package/src/ui/dashboard-panes/health-pane.ts +30 -30
package/src/ui/dashboard-panes/mailbox-pane.ts +35 -35
package/src/ui/dashboard-panes/progress-pane.ts +30 -30
package/src/ui/dashboard-panes/transcript-pane.ts +10 -10
package/src/ui/heartbeat-aggregator.ts +63 -63
package/src/ui/keybinding-map.ts +97 -94
package/src/ui/live-conversation-overlay.ts +152 -0
package/src/ui/live-run-sidebar.ts +180 -180
package/src/ui/mascot.ts +442 -442
package/src/ui/overlays/agent-picker-overlay.ts +57 -57
package/src/ui/overlays/confirm-overlay.ts +58 -58
package/src/ui/overlays/mailbox-compose-overlay.ts +144 -144
package/src/ui/overlays/mailbox-compose-preview.ts +63 -63
package/src/ui/overlays/mailbox-detail-overlay.ts +122 -122
package/src/ui/pi-ui-compat.ts +57 -57
package/src/ui/powerbar-publisher.ts +221 -197
package/src/ui/render-scheduler.ts +216 -143
package/src/ui/run-action-dispatcher.ts +118 -118
package/src/ui/run-dashboard.ts +526 -464
package/src/ui/run-event-bus.ts +208 -208
package/src/ui/run-snapshot-cache.ts +826 -777
package/src/ui/settings-overlay.ts +721 -0
package/src/ui/snapshot-types.ts +86 -70
package/src/ui/theme-adapter.ts +190 -190
package/src/ui/tool-progress-formatter.ts +89 -0
package/src/ui/transcript-cache.ts +94 -94
package/src/ui/transcript-viewer.ts +335 -335
package/src/utils/conflict-detect.ts +662 -0
package/src/utils/file-coalescer.ts +86 -86
package/src/utils/frontmatter.ts +68 -68
package/src/utils/fs-watch.ts +88 -31
package/src/utils/gh-protocol.ts +479 -0
package/src/utils/ids.ts +17 -17
package/src/utils/incremental-reader.ts +104 -104
package/src/utils/internal-error.ts +6 -6
package/src/utils/names.ts +27 -27
package/src/utils/paths.ts +102 -63
package/src/utils/redaction.ts +44 -44
package/src/utils/safe-paths.ts +47 -47
package/src/utils/scan-cache.ts +136 -136
package/src/utils/sse-parser.ts +134 -134
package/src/utils/task-name-generator.ts +337 -337
package/src/utils/timings.ts +33 -33
package/src/utils/visual.ts +243 -198
package/src/workflows/discover-workflows.ts +139 -139
package/src/workflows/validate-workflow.ts +40 -40
package/src/workflows/workflow-config.ts +26 -26
package/src/workflows/workflow-serializer.ts +32 -32
package/src/worktree/branch-freshness.ts +45 -45
package/src/worktree/cleanup.ts +75 -75
package/src/worktree/worktree-manager.ts +188 -188
package/teams/default.team.md +12 -12
package/teams/fast-fix.team.md +11 -11
package/teams/implementation.team.md +18 -18
package/teams/parallel-research.team.md +14 -14
package/teams/research.team.md +11 -11
package/teams/review.team.md +12 -12
package/tsconfig.json +19 -19
package/workflows/default.workflow.md +30 -30
package/workflows/fast-fix.workflow.md +23 -23
package/workflows/implementation.workflow.md +43 -43
package/workflows/parallel-research.workflow.md +46 -46
package/workflows/research.workflow.md +22 -22
package/workflows/review.workflow.md +30 -30
package/skills/task-packet/SKILL.md +0 -28
package/skills/verify-evidence/SKILL.md +0 -27

package/src/runtime/task-quality.ts CHANGED Viewed

@@ -1,207 +1,207 @@
-/**
- * Task quality scoring — simple additive heuristic for evaluating task
- * completion quality based on diagnostics, metrics, artifacts, and duration.
- *
- * Distilled from pi-autoresearch's quality scoring pattern.
- */
-import * as fs from "node:fs";
-import * as path from "node:path";
-import type { TeamTaskState } from "../state/types.ts";
-/** Letter grade for task quality. */
-export type QualityGrade = "A" | "B" | "C" | "D";
-/** Breakdown of individual quality criteria. */
-export interface QualityBreakdown {
-	/** Task has a non-empty diagnostics object. */
-	hasDiagnostics: boolean;
-	/** Task has a non-empty metrics object. */
-	hasMetrics: boolean;
-	/** Task produced files in the artifacts directory. */
-	producedArtifacts: boolean;
-	/** Task has a non-empty result/description. */
-	hasDescription: boolean;
-	/** Task duration is reasonable (> 0 and < 1 hour). */
-	durationReasonable: boolean;
-}
-/** Scored quality result for a task. */
-export interface TaskQualityScore {
-	/** Numeric score (0–5). */
-	score: number;
-	/** Individual criterion breakdown. */
-	breakdown: QualityBreakdown;
-	/** Letter grade based on score thresholds. */
-	grade: QualityGrade;
-}
-/** One hour in milliseconds. */
-const ONE_HOUR_MS = 3_600_000;
-/**
- * Determine the letter grade for a given numeric score.
- *
- * A: 4–5, B: 3, C: 2, D: 0–1
- */
-function scoreToGrade(score: number): QualityGrade {
-	if (score >= 4) return "A";
-	if (score === 3) return "B";
-	if (score === 2) return "C";
-	return "D";
-}
-/**
- * Check whether the artifacts directory contains files for the given task.
- *
- * Looks for a subdirectory named after the task ID, or files containing
- * the task ID prefix in the artifacts directory.
- */
-function hasTaskArtifacts(taskId: string, artifactsDir: string): boolean {
-	try {
-		if (!fs.existsSync(artifactsDir)) return false;
-		// Check for a task-specific subdirectory
-		const taskDir = path.join(artifactsDir, taskId);
-		if (fs.existsSync(taskDir)) {
-			const stat = fs.statSync(taskDir);
-			if (stat.isDirectory()) {
-				const entries = fs.readdirSync(taskDir);
-				return entries.length > 0;
-			}
-		}
-		// Check for files containing the task ID prefix
-		const entries = fs.readdirSync(artifactsDir);
-		const safePrefix = taskId.replace(/[^a-zA-Z0-9_-]/g, "");
-		return entries.some((entry) => entry.includes(safePrefix));
-	} catch {
-		return false;
-	}
-}
-/**
- * Check if a task result string is a non-empty description.
- *
- * A result is considered descriptive if any of these sources have non-empty content:
- * - task.resultArtifact exists with a path
- * - task.error is a non-empty string (workers often set this with result info)
- * - task.verification.satisfied is true
- * - task.diagnostics contains a 'result' string
- */
-function isResultDescriptive(task: TeamTaskState): boolean {
-	// Check resultArtifact — presence of a result artifact indicates output was produced
-	if (task.resultArtifact?.path) return true;
-	// Check error field — workers often put result info here
-	if (typeof task.error === "string" && task.error.trim().length > 0) return true;
-	// Check verification — satisfied verification indicates meaningful output
-	if (task.verification?.satisfied) return true;
-	// Check diagnostics for an explicit result string
-	if (
-		task.diagnostics &&
-		typeof task.diagnostics === "object" &&
-		typeof task.diagnostics.result === "string" &&
-		(task.diagnostics.result as string).trim().length > 0
-	) return true;
-	return false;
-}
-/**
- * Check if the task duration is reasonable (started, finished, > 0, < 1 hour).
- */
-function isDurationReasonable(task: TeamTaskState): boolean {
-	if (!task.startedAt || !task.finishedAt) return false;
-	const started = new Date(task.startedAt).getTime();
-	const finished = new Date(task.finishedAt).getTime();
-	if (Number.isNaN(started) || Number.isNaN(finished)) return false;
-	const duration = finished - started;
-	return duration > 0 && duration < ONE_HOUR_MS;
-}
-/**
- * Compute the quality score for a completed task.
- *
- * Uses simple additive scoring across 5 criteria:
- * - hasDiagnostics: +1 if task.diagnostics exists and has keys
- * - hasMetrics: +1 if task.metrics exists and has keys
- * - producedArtifacts: +1 if artifactsDir has files for this task
- * - hasDescription: +1 if task has a non-empty result/description
- * - durationReasonable: +1 if task has both startedAt and finishedAt, duration > 0 and < 1 hour
- *
- * @param task - The task state to evaluate
- * @param artifactsDir - Optional path to the run artifacts directory
- * @returns TaskQualityScore with numeric score, breakdown, and letter grade
- */
-export function computeTaskQuality(
-	task: TeamTaskState,
-	artifactsDir?: string,
-): TaskQualityScore {
-	const hasDiagnostics =
-		task.diagnostics !== undefined &&
-		typeof task.diagnostics === "object" &&
-		Object.keys(task.diagnostics).length > 0;
-	const hasMetrics =
-		task.metrics !== undefined &&
-		typeof task.metrics === "object" &&
-		Object.keys(task.metrics).length > 0;
-	const producedArtifacts =
-		artifactsDir !== undefined && hasTaskArtifacts(task.id, artifactsDir);
-	const hasDescription = isResultDescriptive(task);
-	const durationReasonable = isDurationReasonable(task);
-	const breakdown: QualityBreakdown = {
-		hasDiagnostics,
-		hasMetrics,
-		producedArtifacts,
-		hasDescription,
-		durationReasonable,
-	};
-	const score =
-		(hasDiagnostics ? 1 : 0) +
-		(hasMetrics ? 1 : 0) +
-		(producedArtifacts ? 1 : 0) +
-		(hasDescription ? 1 : 0) +
-		(durationReasonable ? 1 : 0);
-	return {
-		score,
-		breakdown,
-		grade: scoreToGrade(score),
-	};
-}
-/** Human-readable labels for each quality criterion. */
-const CRITERION_LABELS: Record<keyof QualityBreakdown, string> = {
-	hasDiagnostics: "diagnostics",
-	hasMetrics: "metrics",
-	producedArtifacts: "artifacts",
-	hasDescription: "description",
-	durationReasonable: "duration",
-};
-/**
- * Format a quality score as a human-readable one-line string.
- *
- * Format: "Quality: B (3/5: diagnostics, metrics, description)"
- *
- * @param score - The quality score to format
- * @returns Formatted string
- */
-export function formatQualityScore(score: TaskQualityScore): string {
-	const metCriteria = Object.entries(score.breakdown)
-		.filter(([, met]) => met)
-		.map(([key]) => CRITERION_LABELS[key as keyof QualityBreakdown]);
-	return `Quality: ${score.grade} (${score.score}/5${metCriteria.length > 0 ? `: ${metCriteria.join(", ")}` : ""})`;
-}
+/**
+ * Task quality scoring — simple additive heuristic for evaluating task
+ * completion quality based on diagnostics, metrics, artifacts, and duration.
+ *
+ * Distilled from pi-autoresearch's quality scoring pattern.
+ */
+import * as fs from "node:fs";
+import * as path from "node:path";
+import type { TeamTaskState } from "../state/types.ts";
+/** Letter grade for task quality. */
+export type QualityGrade = "A" | "B" | "C" | "D";
+/** Breakdown of individual quality criteria. */
+export interface QualityBreakdown {
+	/** Task has a non-empty diagnostics object. */
+	hasDiagnostics: boolean;
+	/** Task has a non-empty metrics object. */
+	hasMetrics: boolean;
+	/** Task produced files in the artifacts directory. */
+	producedArtifacts: boolean;
+	/** Task has a non-empty result/description. */
+	hasDescription: boolean;
+	/** Task duration is reasonable (> 0 and < 1 hour). */
+	durationReasonable: boolean;
+}
+/** Scored quality result for a task. */
+export interface TaskQualityScore {
+	/** Numeric score (0–5). */
+	score: number;
+	/** Individual criterion breakdown. */
+	breakdown: QualityBreakdown;
+	/** Letter grade based on score thresholds. */
+	grade: QualityGrade;
+}
+/** One hour in milliseconds. */
+const ONE_HOUR_MS = 3_600_000;
+/**
+ * Determine the letter grade for a given numeric score.
+ *
+ * A: 4–5, B: 3, C: 2, D: 0–1
+ */
+function scoreToGrade(score: number): QualityGrade {
+	if (score >= 4) return "A";
+	if (score === 3) return "B";
+	if (score === 2) return "C";
+	return "D";
+}
+/**
+ * Check whether the artifacts directory contains files for the given task.
+ *
+ * Looks for a subdirectory named after the task ID, or files containing
+ * the task ID prefix in the artifacts directory.
+ */
+function hasTaskArtifacts(taskId: string, artifactsDir: string): boolean {
+	try {
+		if (!fs.existsSync(artifactsDir)) return false;
+		// Check for a task-specific subdirectory
+		const taskDir = path.join(artifactsDir, taskId);
+		if (fs.existsSync(taskDir)) {
+			const stat = fs.statSync(taskDir);
+			if (stat.isDirectory()) {
+				const entries = fs.readdirSync(taskDir);
+				return entries.length > 0;
+			}
+		}
+		// Check for files containing the task ID prefix
+		const entries = fs.readdirSync(artifactsDir);
+		const safePrefix = taskId.replace(/[^a-zA-Z0-9_-]/g, "");
+		return entries.some((entry) => entry.includes(safePrefix));
+	} catch {
+		return false;
+	}
+}
+/**
+ * Check if a task result string is a non-empty description.
+ *
+ * A result is considered descriptive if any of these sources have non-empty content:
+ * - task.resultArtifact exists with a path
+ * - task.error is a non-empty string (workers often set this with result info)
+ * - task.verification.satisfied is true
+ * - task.diagnostics contains a 'result' string
+ */
+function isResultDescriptive(task: TeamTaskState): boolean {
+	// Check resultArtifact — presence of a result artifact indicates output was produced
+	if (task.resultArtifact?.path) return true;
+	// Check error field — workers often put result info here
+	if (typeof task.error === "string" && task.error.trim().length > 0) return true;
+	// Check verification — satisfied verification indicates meaningful output
+	if (task.verification?.satisfied) return true;
+	// Check diagnostics for an explicit result string
+	if (
+		task.diagnostics &&
+		typeof task.diagnostics === "object" &&
+		typeof task.diagnostics.result === "string" &&
+		(task.diagnostics.result as string).trim().length > 0
+	) return true;
+	return false;
+}
+/**
+ * Check if the task duration is reasonable (started, finished, > 0, < 1 hour).
+ */
+function isDurationReasonable(task: TeamTaskState): boolean {
+	if (!task.startedAt || !task.finishedAt) return false;
+	const started = new Date(task.startedAt).getTime();
+	const finished = new Date(task.finishedAt).getTime();
+	if (Number.isNaN(started) || Number.isNaN(finished)) return false;
+	const duration = finished - started;
+	return duration > 0 && duration < ONE_HOUR_MS;
+}
+/**
+ * Compute the quality score for a completed task.
+ *
+ * Uses simple additive scoring across 5 criteria:
+ * - hasDiagnostics: +1 if task.diagnostics exists and has keys
+ * - hasMetrics: +1 if task.metrics exists and has keys
+ * - producedArtifacts: +1 if artifactsDir has files for this task
+ * - hasDescription: +1 if task has a non-empty result/description
+ * - durationReasonable: +1 if task has both startedAt and finishedAt, duration > 0 and < 1 hour
+ *
+ * @param task - The task state to evaluate
+ * @param artifactsDir - Optional path to the run artifacts directory
+ * @returns TaskQualityScore with numeric score, breakdown, and letter grade
+ */
+export function computeTaskQuality(
+	task: TeamTaskState,
+	artifactsDir?: string,
+): TaskQualityScore {
+	const hasDiagnostics =
+		task.diagnostics !== undefined &&
+		typeof task.diagnostics === "object" &&
+		Object.keys(task.diagnostics).length > 0;
+	const hasMetrics =
+		task.metrics !== undefined &&
+		typeof task.metrics === "object" &&
+		Object.keys(task.metrics).length > 0;
+	const producedArtifacts =
+		artifactsDir !== undefined && hasTaskArtifacts(task.id, artifactsDir);
+	const hasDescription = isResultDescriptive(task);
+	const durationReasonable = isDurationReasonable(task);
+	const breakdown: QualityBreakdown = {
+		hasDiagnostics,
+		hasMetrics,
+		producedArtifacts,
+		hasDescription,
+		durationReasonable,
+	};
+	const score =
+		(hasDiagnostics ? 1 : 0) +
+		(hasMetrics ? 1 : 0) +
+		(producedArtifacts ? 1 : 0) +
+		(hasDescription ? 1 : 0) +
+		(durationReasonable ? 1 : 0);
+	return {
+		score,
+		breakdown,
+		grade: scoreToGrade(score),
+	};
+}
+/** Human-readable labels for each quality criterion. */
+const CRITERION_LABELS: Record<keyof QualityBreakdown, string> = {
+	hasDiagnostics: "diagnostics",
+	hasMetrics: "metrics",
+	producedArtifacts: "artifacts",
+	hasDescription: "description",
+	durationReasonable: "duration",
+};
+/**
+ * Format a quality score as a human-readable one-line string.
+ *
+ * Format: "Quality: B (3/5: diagnostics, metrics, description)"
+ *
+ * @param score - The quality score to format
+ * @returns Formatted string
+ */
+export function formatQualityScore(score: TaskQualityScore): string {
+	const metCriteria = Object.entries(score.breakdown)
+		.filter(([, met]) => met)
+		.map(([key]) => CRITERION_LABELS[key as keyof QualityBreakdown]);
+	return `Quality: ${score.grade} (${score.score}/5${metCriteria.length > 0 ? `: ${metCriteria.join(", ")}` : ""})`;
+}

package/src/runtime/task-runner/capabilities.ts CHANGED Viewed

@@ -1,78 +1,78 @@
-import type { AgentConfig } from "../../agents/agent-config.ts";
-import type { CrewRuntimeKind } from "../crew-agent-runtime.ts";
-export interface WorkerCapabilityInventory {
-	schemaVersion: 1;
-	taskId: string;
-	role: string;
-	agent: string;
-	runtime: CrewRuntimeKind;
-	permissionMode: string;
-	tools: string[];
-	extensions: string[];
-	skills: {
-		names: string[];
-		paths: string[];
-		disabled: boolean;
-	};
-	model: {
-		requested?: string;
-		agentDefault?: string;
-		fallbacks: string[];
-		teamRole?: string;
-		step?: string;
-	};
-	inheritance: {
-		projectContext: boolean;
-		skills: boolean;
-		systemPromptMode: "replace" | "append";
-	};
-}
-export interface BuildWorkerCapabilityInventoryInput {
-	taskId: string;
-	role: string;
-	agent: AgentConfig;
-	runtime: CrewRuntimeKind;
-	permissionMode: string;
-	skillNames?: string[];
-	skillPaths?: string[];
-	skillsDisabled: boolean;
-	modelOverride?: string;
-	teamRoleModel?: string;
-	stepModel?: string;
-}
-function uniqueSorted(values: readonly string[] | undefined): string[] {
-	return [...new Set((values ?? []).map((value) => value.trim()).filter(Boolean))].sort((a, b) => a.localeCompare(b));
-}
-export function buildWorkerCapabilityInventory(input: BuildWorkerCapabilityInventoryInput): WorkerCapabilityInventory {
-	return {
-		schemaVersion: 1,
-		taskId: input.taskId,
-		role: input.role,
-		agent: input.agent.name,
-		runtime: input.runtime,
-		permissionMode: input.permissionMode,
-		tools: uniqueSorted(input.agent.tools),
-		extensions: uniqueSorted(input.agent.extensions),
-		skills: {
-			names: uniqueSorted(input.skillNames),
-			paths: uniqueSorted(input.skillPaths),
-			disabled: input.skillsDisabled,
-		},
-		model: {
-			requested: input.modelOverride,
-			agentDefault: input.agent.model,
-			fallbacks: uniqueSorted(input.agent.fallbackModels),
-			teamRole: input.teamRoleModel,
-			step: input.stepModel,
-		},
-		inheritance: {
-			projectContext: input.agent.inheritProjectContext === true,
-			skills: input.agent.inheritSkills === true,
-			systemPromptMode: input.agent.systemPromptMode ?? "replace",
-		},
-	};
-}
+import type { AgentConfig } from "../../agents/agent-config.ts";
+import type { CrewRuntimeKind } from "../crew-agent-runtime.ts";
+export interface WorkerCapabilityInventory {
+	schemaVersion: 1;
+	taskId: string;
+	role: string;
+	agent: string;
+	runtime: CrewRuntimeKind;
+	permissionMode: string;
+	tools: string[];
+	extensions: string[];
+	skills: {
+		names: string[];
+		paths: string[];
+		disabled: boolean;
+	};
+	model: {
+		requested?: string;
+		agentDefault?: string;
+		fallbacks: string[];
+		teamRole?: string;
+		step?: string;
+	};
+	inheritance: {
+		projectContext: boolean;
+		skills: boolean;
+		systemPromptMode: "replace" | "append";
+	};
+}
+export interface BuildWorkerCapabilityInventoryInput {
+	taskId: string;
+	role: string;
+	agent: AgentConfig;
+	runtime: CrewRuntimeKind;
+	permissionMode: string;
+	skillNames?: string[];
+	skillPaths?: string[];
+	skillsDisabled: boolean;
+	modelOverride?: string;
+	teamRoleModel?: string;
+	stepModel?: string;
+}
+function uniqueSorted(values: readonly string[] | undefined): string[] {
+	return [...new Set((values ?? []).map((value) => value.trim()).filter(Boolean))].sort((a, b) => a.localeCompare(b));
+}
+export function buildWorkerCapabilityInventory(input: BuildWorkerCapabilityInventoryInput): WorkerCapabilityInventory {
+	return {
+		schemaVersion: 1,
+		taskId: input.taskId,
+		role: input.role,
+		agent: input.agent.name,
+		runtime: input.runtime,
+		permissionMode: input.permissionMode,
+		tools: uniqueSorted(input.agent.tools),
+		extensions: uniqueSorted(input.agent.extensions),
+		skills: {
+			names: uniqueSorted(input.skillNames),
+			paths: uniqueSorted(input.skillPaths),
+			disabled: input.skillsDisabled,
+		},
+		model: {
+			requested: input.modelOverride,
+			agentDefault: input.agent.model,
+			fallbacks: uniqueSorted(input.agent.fallbackModels),
+			teamRole: input.teamRoleModel,
+			step: input.stepModel,
+		},
+		inheritance: {
+			projectContext: input.agent.inheritProjectContext === true,
+			skills: input.agent.inheritSkills === true,
+			systemPromptMode: input.agent.systemPromptMode ?? "replace",
+		},
+	};
+}