npm - @katyella/legio - Versions diffs - 0.1.3 → 0.2.2 - Mend

@katyella/legio 0.1.3 → 0.2.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (112)

package/CHANGELOG.md +61 -3
package/README.md +21 -10
package/agents/builder.md +11 -10
package/agents/coordinator.md +36 -27
package/agents/cto.md +9 -8
package/agents/gateway.md +28 -12
package/agents/lead.md +45 -30
package/agents/merger.md +4 -4
package/agents/monitor.md +10 -9
package/agents/reviewer.md +8 -8
package/agents/scout.md +10 -10
package/agents/supervisor.md +60 -45
package/package.json +2 -2
package/src/agents/hooks-deployer.test.ts +46 -41
package/src/agents/hooks-deployer.ts +10 -9
package/src/agents/manifest.test.ts +6 -2
package/src/agents/overlay.test.ts +9 -7
package/src/agents/overlay.ts +29 -7
package/src/commands/agents.test.ts +1 -5
package/src/commands/clean.test.ts +2 -5
package/src/commands/clean.ts +25 -1
package/src/commands/completions.test.ts +1 -1
package/src/commands/completions.ts +26 -7
package/src/commands/coordinator.test.ts +87 -82
package/src/commands/coordinator.ts +94 -48
package/src/commands/costs.test.ts +2 -6
package/src/commands/dashboard.test.ts +2 -5
package/src/commands/doctor.test.ts +2 -6
package/src/commands/down.ts +3 -3
package/src/commands/errors.test.ts +2 -6
package/src/commands/feed.test.ts +2 -6
package/src/commands/gateway.test.ts +43 -17
package/src/commands/gateway.ts +101 -11
package/src/commands/hooks.test.ts +2 -5
package/src/commands/init.test.ts +4 -13
package/src/commands/inspect.test.ts +2 -6
package/src/commands/log.test.ts +2 -6
package/src/commands/logs.test.ts +2 -9
package/src/commands/mail.test.ts +76 -215
package/src/commands/mail.ts +43 -187
package/src/commands/metrics.test.ts +3 -10
package/src/commands/nudge.ts +15 -0
package/src/commands/prime.test.ts +4 -11
package/src/commands/replay.test.ts +2 -6
package/src/commands/server.test.ts +1 -5
package/src/commands/server.ts +1 -1
package/src/commands/sling.test.ts +6 -1
package/src/commands/sling.ts +42 -17
package/src/commands/spec.test.ts +2 -5
package/src/commands/status.test.ts +2 -4
package/src/commands/stop.test.ts +2 -5
package/src/commands/supervisor.ts +6 -6
package/src/commands/trace.test.ts +2 -6
package/src/commands/up.test.ts +43 -9
package/src/commands/up.ts +15 -11
package/src/commands/watchman.ts +327 -0
package/src/commands/worktree.test.ts +2 -6
package/src/config.test.ts +34 -104
package/src/config.ts +120 -32
package/src/doctor/agents.test.ts +52 -2
package/src/doctor/agents.ts +4 -2
package/src/doctor/config-check.test.ts +7 -2
package/src/doctor/consistency.test.ts +7 -2
package/src/doctor/databases.test.ts +6 -2
package/src/doctor/dependencies.test.ts +18 -13
package/src/doctor/dependencies.ts +23 -94
package/src/doctor/logs.test.ts +7 -2
package/src/doctor/merge-queue.test.ts +6 -2
package/src/doctor/structure.test.ts +7 -2
package/src/doctor/version.test.ts +7 -2
package/src/e2e/init-sling-lifecycle.test.ts +2 -5
package/src/index.ts +7 -7
package/src/mail/pending.ts +120 -0
package/src/mail/store.test.ts +89 -0
package/src/mail/store.ts +11 -0
package/src/merge/resolver.test.ts +518 -489
package/src/server/index.ts +33 -2
package/src/server/public/app.js +3 -3
package/src/server/public/components/message-bubble.js +11 -1
package/src/server/public/components/terminal-panel.js +66 -74
package/src/server/public/views/chat.js +18 -2
package/src/server/public/views/costs.js +5 -5
package/src/server/public/views/dashboard.js +80 -51
package/src/server/public/views/gateway-chat.js +37 -131
package/src/server/public/views/inspect.js +16 -4
package/src/server/public/views/issues.js +16 -12
package/src/server/routes.test.ts +55 -39
package/src/server/routes.ts +38 -26
package/src/test-helpers.ts +6 -3
package/src/tracker/beads.ts +159 -0
package/src/tracker/exec.ts +44 -0
package/src/tracker/factory.test.ts +283 -0
package/src/tracker/factory.ts +59 -0
package/src/tracker/seeds.ts +156 -0
package/src/tracker/types.ts +46 -0
package/src/types.ts +11 -2
package/src/{watchdog → watchman}/daemon.test.ts +421 -515
package/src/watchman/daemon.ts +940 -0
package/src/worktree/tmux.test.ts +2 -1
package/src/worktree/tmux.ts +4 -4
package/templates/hooks.json.tmpl +17 -17
package/src/beads/client.test.ts +0 -210
package/src/commands/merge.test.ts +0 -676
package/src/commands/watch.test.ts +0 -152
package/src/commands/watch.ts +0 -238
package/src/test-helpers.test.ts +0 -97
package/src/watchdog/daemon.ts +0 -533
package/src/watchdog/health.test.ts +0 -371
package/src/watchdog/triage.test.ts +0 -162
package/src/worktree/manager.test.ts +0 -444
package/src/{watchdog → watchman}/health.ts +0 -0
package/src/{watchdog → watchman}/triage.ts +0 -0

package/src/watchdog/health.test.ts DELETED

@@ -1,371 +0,0 @@
-import { describe, expect, test } from "vitest";
-import type { AgentSession } from "../types.ts";
-import { evaluateHealth, isProcessRunning, transitionState } from "./health.ts";
-/**
- * Tests for the ZFC-based health evaluation and state machine.
- *
- * evaluateHealth is a pure function that takes session state + tmux liveness +
- * thresholds and returns a HealthCheck. No mocks needed for the core logic.
- *
- * isProcessRunning uses process.kill(pid, 0) which is safe to test with real PIDs:
- * the current process PID (alive) and a known-dead PID (not alive).
- *
- * Note: evaluateHealth calls isProcessRunning internally. For tests that need
- * to control pid liveness independently of the actual OS process table, we set
- * session.pid to known-alive (current process) or known-dead PIDs.
- */
-const THRESHOLDS = { zombieMs: 120_000 };
-/** PID that is guaranteed to be alive during tests: our own process. */
-const ALIVE_PID = process.pid;
-/**
- * PID that is very likely dead. PID 2147483647 (max 32-bit signed int) is
- * almost never in use. If by some miracle it is, the test still works because
- * we use it only for the "pid dead" path and the test validates behavior, not
- * the exact PID value.
- */
-const DEAD_PID = 2147483647;
-function makeSession(overrides: Partial<AgentSession> = {}): AgentSession {
-	return {
-		id: "session-test",
-		agentName: "test-agent",
-		capability: "builder",
-		worktreePath: "/tmp/test",
-		branchName: "legio/test-agent/test-task",
-		beadId: "test-task",
-		tmuxSession: "legio-test-agent",
-		state: "booting",
-		pid: ALIVE_PID,
-		parentAgent: null,
-		depth: 0,
-		runId: null,
-		startedAt: new Date().toISOString(),
-		lastActivity: new Date().toISOString(),
-		escalationLevel: 0,
-		stalledSince: null,
-		...overrides,
-	};
-}
-// === isProcessRunning ===
-describe("isProcessRunning", () => {
-	test("returns true for the current process PID", () => {
-		expect(isProcessRunning(process.pid)).toBe(true);
-	});
-	test("returns false for a PID that does not exist", () => {
-		// PID 2147483647 is max 32-bit signed — extremely unlikely to be alive
-		expect(isProcessRunning(DEAD_PID)).toBe(false);
-	});
-});
-// === evaluateHealth ===
-describe("evaluateHealth", () => {
-	// --- ZFC Rule 1: tmux dead → zombie (observable state wins) ---
-	test("ZFC: tmux dead + sessions.json says working → zombie with reconciliation note", () => {
-		const session = makeSession({ state: "working" });
-		const check = evaluateHealth(session, false, THRESHOLDS);
-		expect(check.state).toBe("zombie");
-		expect(check.action).toBe("terminate");
-		expect(check.tmuxAlive).toBe(false);
-		expect(check.processAlive).toBe(false);
-		expect(check.reconciliationNote).toContain("ZFC");
-		expect(check.reconciliationNote).toContain("tmux dead");
-		expect(check.reconciliationNote).toContain('"working"');
-	});
-	test("ZFC: tmux dead + sessions.json says booting → zombie with reconciliation note", () => {
-		const session = makeSession({ state: "booting" });
-		const check = evaluateHealth(session, false, THRESHOLDS);
-		expect(check.state).toBe("zombie");
-		expect(check.action).toBe("terminate");
-		expect(check.reconciliationNote).toContain("ZFC");
-		expect(check.reconciliationNote).toContain('"booting"');
-	});
-	// --- ZFC Rule 2: tmux alive + sessions.json says zombie → investigate ---
-	test("ZFC: tmux alive + sessions.json says zombie → investigate (don't auto-kill)", () => {
-		const session = makeSession({ state: "zombie", pid: ALIVE_PID });
-		const check = evaluateHealth(session, true, THRESHOLDS);
-		expect(check.state).toBe("zombie");
-		expect(check.action).toBe("investigate");
-		expect(check.processAlive).toBe(true);
-		expect(check.reconciliationNote).toContain("ZFC");
-		expect(check.reconciliationNote).toContain("investigation needed");
-		expect(check.reconciliationNote).toContain("don't auto-kill");
-	});
-	// --- ZFC Rule 3: pid dead + tmux alive → zombie ---
-	test("ZFC: pid dead + tmux alive → zombie (agent process exited, shell survived)", () => {
-		const session = makeSession({ state: "working", pid: DEAD_PID });
-		const check = evaluateHealth(session, true, THRESHOLDS);
-		expect(check.state).toBe("zombie");
-		expect(check.action).toBe("terminate");
-		expect(check.processAlive).toBe(false);
-		expect(check.pidAlive).toBe(false);
-		expect(check.tmuxAlive).toBe(true);
-		expect(check.reconciliationNote).toContain("ZFC");
-		expect(check.reconciliationNote).toContain("pid");
-		expect(check.reconciliationNote).toContain("shell survived");
-	});
-	// --- pid null (unavailable) ---
-	test("pid null does not trigger pid-based zombie detection", () => {
-		const session = makeSession({ state: "working", pid: null });
-		const check = evaluateHealth(session, true, THRESHOLDS);
-		expect(check.state).toBe("working");
-		expect(check.action).toBe("none");
-		expect(check.pidAlive).toBeNull();
-	});
-	// --- Time-based checks (both tmux and pid alive) ---
-	test("activity older than zombieMs → zombie", () => {
-		const oldActivity = new Date(Date.now() - 200_000).toISOString();
-		const session = makeSession({ state: "working", lastActivity: oldActivity });
-		const check = evaluateHealth(session, true, THRESHOLDS);
-		expect(check.state).toBe("zombie");
-		expect(check.action).toBe("terminate");
-		expect(check.reconciliationNote).toBeNull();
-	});
-	// --- Normal state transitions ---
-	test("booting with recent activity → transitions to working", () => {
-		const recentActivity = new Date(Date.now() - 5_000).toISOString();
-		const session = makeSession({ state: "booting", lastActivity: recentActivity });
-		const check = evaluateHealth(session, true, THRESHOLDS);
-		expect(check.state).toBe("working");
-		expect(check.action).toBe("none");
-		expect(check.reconciliationNote).toBeNull();
-	});
-	test("working with recent activity → stays working", () => {
-		const recentActivity = new Date(Date.now() - 5_000).toISOString();
-		const session = makeSession({ state: "working", lastActivity: recentActivity });
-		const check = evaluateHealth(session, true, THRESHOLDS);
-		expect(check.state).toBe("working");
-		expect(check.action).toBe("none");
-	});
-	// --- Persistent capabilities (coordinator, monitor) ---
-	test("persistent capability: coordinator with stale activity → still working, no escalation", () => {
-		const staleActivity = new Date(Date.now() - 60_000).toISOString();
-		const session = makeSession({
-			capability: "coordinator",
-			state: "working",
-			lastActivity: staleActivity,
-		});
-		const check = evaluateHealth(session, true, THRESHOLDS);
-		expect(check.state).toBe("working");
-		expect(check.action).toBe("none");
-	});
-	test("persistent capability: coordinator with zombie-level staleness → still working", () => {
-		const oldActivity = new Date(Date.now() - 200_000).toISOString();
-		const session = makeSession({
-			capability: "coordinator",
-			state: "working",
-			lastActivity: oldActivity,
-		});
-		const check = evaluateHealth(session, true, THRESHOLDS);
-		expect(check.state).toBe("working");
-		expect(check.action).toBe("none");
-	});
-	test("persistent capability: monitor with stale activity → still working", () => {
-		const staleActivity = new Date(Date.now() - 60_000).toISOString();
-		const session = makeSession({
-			capability: "monitor",
-			state: "working",
-			lastActivity: staleActivity,
-		});
-		const check = evaluateHealth(session, true, THRESHOLDS);
-		expect(check.state).toBe("working");
-		expect(check.action).toBe("none");
-	});
-	test("persistent capability: gateway with stale activity → still working", () => {
-		const staleActivity = new Date(Date.now() - 60_000).toISOString();
-		const session = makeSession({
-			capability: "gateway",
-			state: "working",
-			lastActivity: staleActivity,
-		});
-		const check = evaluateHealth(session, true, THRESHOLDS);
-		expect(check.state).toBe("working");
-		expect(check.action).toBe("none");
-	});
-	test("persistent capability: coordinator booting → transitions to working", () => {
-		const session = makeSession({
-			capability: "coordinator",
-			state: "booting",
-		});
-		const check = evaluateHealth(session, true, THRESHOLDS);
-		expect(check.state).toBe("working");
-		expect(check.action).toBe("none");
-	});
-	test("persistent capability: coordinator with tmux dead → still zombie (ZFC Rule 1 applies)", () => {
-		const session = makeSession({
-			capability: "coordinator",
-			state: "working",
-		});
-		const check = evaluateHealth(session, false, THRESHOLDS);
-		expect(check.state).toBe("zombie");
-		expect(check.action).toBe("terminate");
-	});
-	test("persistent capability: coordinator with pid dead → still zombie (ZFC Rule 3 applies)", () => {
-		const session = makeSession({
-			capability: "coordinator",
-			state: "working",
-			pid: DEAD_PID,
-		});
-		const check = evaluateHealth(session, true, THRESHOLDS);
-		expect(check.state).toBe("zombie");
-		expect(check.action).toBe("terminate");
-	});
-	// --- Completed agents ---
-	test("completed agents skip monitoring", () => {
-		const session = makeSession({ state: "completed" });
-		const check = evaluateHealth(session, true, THRESHOLDS);
-		expect(check.state).toBe("completed");
-		expect(check.action).toBe("none");
-		expect(check.reconciliationNote).toBeNull();
-	});
-	// --- pidAlive field is populated ---
-	test("pidAlive reflects actual process state for alive PID", () => {
-		const session = makeSession({ pid: ALIVE_PID, state: "working" });
-		const check = evaluateHealth(session, true, THRESHOLDS);
-		expect(check.pidAlive).toBe(true);
-	});
-	test("pidAlive reflects actual process state for dead PID", () => {
-		// Use dead pid but also tmux dead to avoid pid-zombie path intercepting
-		const session = makeSession({ pid: DEAD_PID, state: "working" });
-		const check = evaluateHealth(session, false, THRESHOLDS);
-		// tmux dead takes priority, so state is zombie via ZFC Rule 1
-		expect(check.state).toBe("zombie");
-		expect(check.pidAlive).toBe(false);
-	});
-});
-// === transitionState ===
-describe("transitionState", () => {
-	test("advances from booting to working", () => {
-		const check = {
-			state: "working" as const,
-			agentName: "a",
-			timestamp: "",
-			tmuxAlive: true,
-			pidAlive: true as boolean | null,
-			lastActivity: "",
-			processAlive: true,
-			action: "none" as const,
-			reconciliationNote: null,
-		};
-		expect(transitionState("booting", check)).toBe("working");
-	});
-	test("never regresses from zombie to booting", () => {
-		const check = {
-			state: "booting" as const,
-			agentName: "a",
-			timestamp: "",
-			tmuxAlive: true,
-			pidAlive: true as boolean | null,
-			lastActivity: "",
-			processAlive: true,
-			action: "none" as const,
-			reconciliationNote: null,
-		};
-		expect(transitionState("zombie", check)).toBe("zombie");
-	});
-	test("same state stays the same", () => {
-		const check = {
-			state: "working" as const,
-			agentName: "a",
-			timestamp: "",
-			tmuxAlive: true,
-			pidAlive: true as boolean | null,
-			lastActivity: "",
-			processAlive: true,
-			action: "none" as const,
-			reconciliationNote: null,
-		};
-		expect(transitionState("working", check)).toBe("working");
-	});
-	// --- ZFC: investigate holds state ---
-	test("ZFC: investigate action holds current state (does not advance)", () => {
-		const check = {
-			state: "zombie" as const,
-			agentName: "a",
-			timestamp: "",
-			tmuxAlive: true,
-			pidAlive: true as boolean | null,
-			lastActivity: "",
-			processAlive: true,
-			action: "investigate" as const,
-			reconciliationNote: "ZFC: tmux alive but sessions.json says zombie",
-		};
-		// Even though check.state is zombie (order 4) and current is zombie (order 4),
-		// investigate should hold — not advance
-		expect(transitionState("zombie", check)).toBe("zombie");
-	});
-	test("ZFC: investigate prevents forward transition", () => {
-		const check = {
-			state: "zombie" as const,
-			agentName: "a",
-			timestamp: "",
-			tmuxAlive: true,
-			pidAlive: true as boolean | null,
-			lastActivity: "",
-			processAlive: true,
-			action: "investigate" as const,
-			reconciliationNote: "ZFC conflict",
-		};
-		// If something were at "working" and check says zombie with investigate,
-		// the state should NOT advance
-		expect(transitionState("working", check)).toBe("working");
-	});
-});

package/src/watchdog/triage.test.ts DELETED

@@ -1,162 +0,0 @@
-/**
- * Tests for Tier 1 AI-assisted triage.
- * classifyResponse and buildTriagePrompt are pure functions — tested directly.
- * triageAgent uses real filesystem (temp dirs). Claude spawn is expected to
- * fail in test environments, exercising the fallback-to-extend path.
- * spawnClaude is NOT mocked — we rely on it failing naturally in tests.
- */
-import { mkdir, mkdtemp, rm, writeFile } from "node:fs/promises";
-import { tmpdir } from "node:os";
-import { join } from "node:path";
-import { afterEach, beforeEach, describe, expect, test } from "vitest";
-import { buildTriagePrompt, classifyResponse, triageAgent } from "./triage.ts";
-describe("classifyResponse", () => {
-	test("returns 'retry' when response contains 'retry'", () => {
-		const result = classifyResponse("The operation should retry.");
-		expect(result).toBe("retry");
-	});
-	test("returns 'retry' when response contains 'recoverable'", () => {
-		const result = classifyResponse("This error is recoverable.");
-		expect(result).toBe("retry");
-	});
-	test("returns 'terminate' when response contains 'terminate'", () => {
-		const result = classifyResponse("You should terminate the agent.");
-		expect(result).toBe("terminate");
-	});
-	test("returns 'terminate' when response contains 'fatal'", () => {
-		const result = classifyResponse("This is a fatal error.");
-		expect(result).toBe("terminate");
-	});
-	test("returns 'terminate' when response contains 'failed'", () => {
-		const result = classifyResponse("The operation has failed.");
-		expect(result).toBe("terminate");
-	});
-	test("handles mixed case (e.g., 'RETRY', 'Fatal')", () => {
-		expect(classifyResponse("RETRY this operation")).toBe("retry");
-		expect(classifyResponse("Fatal error occurred")).toBe("terminate");
-		expect(classifyResponse("RecOverAble issue")).toBe("retry");
-	});
-	test("returns 'extend' when response contains none of the keywords", () => {
-		const result = classifyResponse("The agent is processing data.");
-		expect(result).toBe("extend");
-	});
-	test("returns 'extend' for empty string", () => {
-		const result = classifyResponse("");
-		expect(result).toBe("extend");
-	});
-	test("first match wins when response has multiple keywords", () => {
-		// 'retry' is checked before 'terminate'
-		const result = classifyResponse("retry this but it may terminate later");
-		expect(result).toBe("retry");
-	});
-});
-describe("buildTriagePrompt", () => {
-	test("contains agent name in output", () => {
-		const prompt = buildTriagePrompt("test-agent", "2026-02-13T10:00:00Z", "log content");
-		expect(prompt).toContain("test-agent");
-	});
-	test("contains lastActivity timestamp in output", () => {
-		const timestamp = "2026-02-13T10:00:00Z";
-		const prompt = buildTriagePrompt("test-agent", timestamp, "log content");
-		expect(prompt).toContain(timestamp);
-	});
-	test("contains log content wrapped in code fences", () => {
-		const logContent = "Error: something went wrong\nat line 42";
-		const prompt = buildTriagePrompt("test-agent", "2026-02-13T10:00:00Z", logContent);
-		expect(prompt).toContain("```");
-		expect(prompt).toContain(logContent);
-		expect(prompt.split("```").length).toBeGreaterThanOrEqual(3); // Opening and closing fences
-	});
-	test("contains classification instructions (retry/terminate/extend)", () => {
-		const prompt = buildTriagePrompt("test-agent", "2026-02-13T10:00:00Z", "log content");
-		expect(prompt).toContain("retry");
-		expect(prompt).toContain("terminate");
-		expect(prompt).toContain("extend");
-	});
-});
-describe("triageAgent", () => {
-	let tempRoot: string;
-	beforeEach(async () => {
-		tempRoot = await mkdtemp(join(tmpdir(), "triage-test-"));
-	});
-	afterEach(async () => {
-		await rm(tempRoot, { recursive: true, force: true });
-	});
-	test("returns 'extend' when no logs directory exists", async () => {
-		const result = await triageAgent({
-			agentName: "test-agent",
-			root: tempRoot,
-			lastActivity: "2026-02-13T10:00:00Z",
-		});
-		expect(result).toBe("extend");
-	});
-	test("returns 'extend' when logs directory exists but is empty", async () => {
-		const logsDir = join(tempRoot, ".legio", "logs", "test-agent");
-		await mkdir(logsDir, { recursive: true });
-		const result = await triageAgent({
-			agentName: "test-agent",
-			root: tempRoot,
-			lastActivity: "2026-02-13T10:00:00Z",
-		});
-		expect(result).toBe("extend");
-	});
-	test("returns 'extend' when logs directory has session dir but no session.log", async () => {
-		const logsDir = join(tempRoot, ".legio", "logs", "test-agent", "2026-02-13T10-00-00");
-		await mkdir(logsDir, { recursive: true });
-		await writeFile(join(logsDir, ".gitkeep"), "", "utf-8");
-		const result = await triageAgent({
-			agentName: "test-agent",
-			root: tempRoot,
-			lastActivity: "2026-02-13T10:00:00Z",
-		});
-		expect(result).toBe("extend");
-	});
-	test("returns 'extend' when session.log exists but claude binary fails", async () => {
-		const timestamp = "2026-02-13T10-00-00";
-		const sessionLogDir = join(tempRoot, ".legio", "logs", "test-agent", timestamp);
-		const sessionLogPath = join(sessionLogDir, "session.log");
-		await mkdir(sessionLogDir, { recursive: true });
-		// Create session.log with some content
-		await writeFile(
-			sessionLogPath,
-			"Agent started\nProcessing data\nError: something went wrong\n",
-			"utf-8",
-		);
-		// triageAgent will try to spawn claude which should fail or be killed by timeout.
-		// Short timeout ensures the test doesn't hang even if the claude binary
-		// exists on the system (e.g., inside a Claude Code session).
-		const result = await triageAgent({
-			agentName: "test-agent",
-			root: tempRoot,
-			lastActivity: "2026-02-13T10:00:00Z",
-			timeoutMs: 500,
-		});
-		expect(result).toBe("extend");
-	});
-});