npm - @cardor/agent-harness-kit - Versions diffs - 0.16.10 → 0.17.0 - Mend

@cardor/agent-harness-kit 0.16.10 → 0.17.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (7)

package/dist/agent-templates/builder.md +13 -11
package/dist/agent-templates/explorer.md +6 -6
package/dist/agent-templates/lead.md +5 -5
package/dist/agent-templates/reviewer.md +8 -11
package/dist/cli.js +54 -34
package/dist/cli.js.map +1 -1
package/package.json +2 -2

package/dist/agent-templates/builder.md CHANGED Viewed

@@ -38,30 +38,32 @@ These three calls are **not optional**. The dashboard cannot display what you do
 ### 1. Log every tool call you make
-After **each** tool invocation (Read, Edit, Write, Bash), immediately call:
+After **each** tool invocation (Read, Edit, Write, Bash), call:
 ```
-actions.write(actionId, 'tools_used', '<ToolName>: <args-summary> — why')
+actions.record_tool(actionId, '<ToolName>', '<args-summary>', '<why>')
 ```
 Examples:
-- `Read: src/auth/middleware.ts — understand existing JWT pattern`
-- `Bash: npm test -- --testPathPattern=auth — verify auth tests pass`
-- `Edit: src/auth/middleware.ts:45-78 — add refresh token validation`
+- `actions.record_tool(actionId, 'Read', 'src/auth/middleware.ts', 'understand existing JWT pattern')`
+- `actions.record_tool(actionId, 'Bash', 'npm test --testPathPattern=auth', 'verify auth tests pass')`
+- `actions.record_tool(actionId, 'Edit', 'src/auth/middleware.ts:45-78', 'add refresh token validation')`
 ### 2. Log every file you touch
-After **each** file modification (Edit, Write), immediately call:
+After **each** file modification (Edit, Write), call:
 ```
-actions.write(actionId, 'files_modified', '<file-path> — what changed and why')
+actions.record_file(actionId, '<file-path>', '<operation>', '<what changed and why>')
 ```
-Example: `src/auth/middleware.ts — added refresh token expiry check in validateToken()`
+Operations: `created` | `modified` | `deleted`
+Example: `actions.record_file(actionId, 'src/auth/middleware.ts', 'modified', 'added refresh token expiry check in validateToken()')`
 ### 3. Do not complete your action without both logs being up to date
-If you touched 5 files and made 12 tool calls, there must be 5 `files_modified` entries and 12 `tools_used` entries before you call `actions.complete`.
+If you touched 5 files and made 12 tool calls, there must be 5 `actions.record_file` calls and 12 `actions.record_tool` calls before you call `actions.complete`.
 ---
@@ -125,8 +127,8 @@ actions.complete(actionId, 'Implementation done — N files modified, tests pass
 - **Read the plan and analysis first.** Never implement cold.
 - **Only write to `{{writablePaths}}`.** No exceptions.
-- **Log every file you touch.** No silent modifications.
-- **Log every tool call.** Use `actions.write(actionId, 'tools_used', ...)` after each Read, Edit, Write, Bash invocation.
+- **Log every file you touch.** Call `actions.record_file(actionId, path, operation, notes)` after each Edit/Write.
+- **Log every tool call.** Call `actions.record_tool(actionId, toolName, args, summary)` after each Read, Edit, Write, Bash invocation.
 - **Leave tests green.** If tests fail after your changes, fix them before completing.
 - **Do not refactor beyond the task scope.** Implement what was asked, nothing more.
 - **If blocked, say so.** Do not invent workarounds for unclear requirements.

package/dist/agent-templates/explorer.md CHANGED Viewed

@@ -37,18 +37,18 @@ These calls are **not optional**. The dashboard cannot display what you do not r
 ### Log every tool call you make
-After **each** tool invocation (Read, Bash, grep, docs.search), immediately call:
+After **each** tool invocation (Read, Bash, grep, docs.search), call:
 ```
-actions.write(actionId, 'tools_used', '<ToolName>: <args-summary> — why')
+actions.record_tool(actionId, '<ToolName>', '<args-summary>', '<why>')
 ```
 Examples:
-- `Read: src/auth/middleware.ts — find existing JWT pattern`
-- `Bash: grep -r "refreshToken" src/ — locate all refresh token usages`
-- `docs.search: "authentication middleware" — check project docs for auth guidance`
+- `actions.record_tool(actionId, 'Read', 'src/auth/middleware.ts', 'find existing JWT pattern')`
+- `actions.record_tool(actionId, 'Bash', 'grep -r "refreshToken" src/', 'locate all refresh token usages')`
+- `actions.record_tool(actionId, 'docs.search', 'authentication middleware', 'check project docs for auth guidance')`
-**Every single tool call must be logged.** No silent reads. The audit trail in the dashboard is built entirely from these entries.
+**Every single tool call must be logged.** No silent reads. The Tools dashboard is built entirely from these `actions.record_tool` calls.
 ---

package/dist/agent-templates/lead.md CHANGED Viewed

@@ -32,16 +32,16 @@ These calls are **not optional**. The dashboard cannot display what you do not r
 ### Log every tool call you make
-After **each** tool invocation (Bash, tasks.get, tasks.claim, actions.get), immediately call:
+After **each** tool invocation (Bash, tasks.get, tasks.claim, actions.get), call:
 ```
-actions.write(actionId, 'tools_used', '<ToolName>: <args-summary> — why')
+actions.record_tool(actionId, '<ToolName>', '<args-summary>', '<why>')
 ```
 Examples:
-- `Bash: bash health.sh — verify codebase health before starting`
-- `tasks.get: pending — find next task to claim`
-- `actions.get: taskId=abc123 — read action history to resume in-progress task`
+- `actions.record_tool(actionId, 'Bash', 'bash health.sh', 'verify codebase health before starting')`
+- `actions.record_tool(actionId, 'tasks.get', 'pending', 'find next task to claim')`
+- `actions.record_tool(actionId, 'actions.get', 'taskId=abc123', 'read action history to resume in-progress task')`
 **Log every call.** This applies from the moment you have an `actionId` (after step 3 below).

package/dist/agent-templates/reviewer.md CHANGED Viewed

@@ -32,28 +32,25 @@ These calls are **not optional**. The dashboard cannot display what you do not r
 ### 1. Log every tool call you make
-After **each** tool invocation (Read, Bash), immediately call:
+After **each** tool invocation (Read, Bash), call:
 ```
-actions.write(actionId, 'tools_used', '<ToolName>: <args-summary> — why')
+actions.record_tool(actionId, '<ToolName>', '<args-summary>', '<why>')
 ```
 Examples:
-- `Read: src/auth/middleware.ts — verify refresh token logic matches criterion 2`
-- `Bash: npm test -- --testPathPattern=auth — confirm all auth tests pass`
+- `actions.record_tool(actionId, 'Read', 'src/auth/middleware.ts', 'verify refresh token logic matches criterion 2')`
+- `actions.record_tool(actionId, 'Bash', 'npm test --testPathPattern=auth', 'confirm all auth tests pass')`
 ### 2. Mark every acceptance criterion as you verify it
-For **each** criterion (0-based index), call this immediately after you evaluate it:
+For **each** criterion, call this immediately after you evaluate it using its `id` from `tasks.get`:
 ```
-tasks.acceptance_update(taskId, criterionIndex, true|false)
+tasks.acceptance.update(criterionId)
 ```
-- `true` = criterion is fully met
-- `false` = criterion is not met
-If the task has 3 criteria, you must make exactly 3 `tasks.acceptance_update` calls — one per criterion. Skipping any of them leaves the dashboard showing criteria as unverified.
+If the task has 3 criteria, you must make exactly 3 `tasks.acceptance.update` calls — one per criterion. Skipping any of them leaves the dashboard showing criteria as unverified.
 ---
@@ -124,7 +121,7 @@ Then notify lead so the builder can be re-assigned.
 - **Run health.sh before approving.** No exceptions.
 - **Check every acceptance criterion.** Not just the obvious ones.
-- **Call `tasks.acceptance_update()` for each criterion.** Both met and unmet — never skip this step.
+- **Call `tasks.acceptance.update()` for each criterion.** Never skip this step.
 - **Never self-approve partial work.** All criteria must be met, not most.
 - **Be specific when blocking.** The builder must know exactly what to fix.
 - **Do not fix issues yourself.** Your job is to verify, not to implement.

package/dist/cli.js CHANGED Viewed

@@ -149,14 +149,17 @@ If it exits non-zero, stop and report the issue. Do not proceed with tasks until
 The harness exposes tools via MCP server on port ${port}. Use these instead of reading files directly.
 \`\`\`
-actions.start      taskId agent          \u2192 start an action, returns actionId
-actions.write      actionId section text \u2192 record a section (result, tools_used, ...)
-actions.complete   actionId summary      \u2192 close the action
-actions.get        taskId               \u2192 full action history for a task
-tasks.get          [status]             \u2192 list tasks (pending | in_progress | done | blocked)
-tasks.claim        id                   \u2192 atomically claim a pending task
-tasks.update       id status            \u2192 change task status
-docs.search        query                \u2192 search ${docsPath} for relevant content
+actions.start        taskId agent                           \u2192 start an action, returns actionId
+actions.write        actionId section text                  \u2192 record a section (result, blockers, ...)
+actions.record_tool  actionId toolName [argsJson] [summary] \u2192 log a tool call to the Tools dashboard
+actions.record_file  actionId filePath operation [notes]   \u2192 log a file touch to the Files dashboard
+actions.complete     actionId summary                       \u2192 close the action
+actions.get          taskId                                 \u2192 full action history for a task
+tasks.get            [status]                               \u2192 list tasks (pending | in_progress | done | blocked)
+tasks.claim          id                                     \u2192 atomically claim a pending task
+tasks.update         id status                              \u2192 change task status
+tasks.acceptance.update criterionId                        \u2192 mark an acceptance criterion as met
+docs.search          query                                  \u2192 search ${docsPath} for relevant content
 \`\`\`
 ## Workflow
@@ -169,7 +172,8 @@ docs.search        query                \u2192 search ${docsPath} for relevant c
 2. WORK  (lead \u2192 explorer \u2192 builder \u2192 reviewer)
    - Each agent calls actions.start(taskId, agentName) \u2192 actionId
-   - Records work with actions.write(actionId, section, content)
+   - After EVERY tool call: actions.record_tool(actionId, toolName, args, summary)
+   - After EVERY file change: actions.record_file(actionId, filePath, operation, notes)
    - Closes with actions.complete(actionId, summary)
 3. CLOSE
@@ -1161,12 +1165,27 @@ async function runHealth(cwd2) {
 // src/commands/init.ts
 import { mkdirSync as mkdirSync6, writeFileSync as writeFileSync7 } from "fs";
 import { homedir } from "os";
-import { join as join9 } from "path";
+import { join as join10 } from "path";
 import * as p2 from "@clack/prompts";
 import pc6 from "picocolors";
 // src/commands/init-helpers.ts
+import { existsSync as existsSync7, readFileSync as readFileSync5 } from "fs";
+import { join as join9 } from "path";
 import pc5 from "picocolors";
+function readProjectNameFromPackageJson(cwd2) {
+  try {
+    const pkgPath2 = join9(cwd2, "package.json");
+    if (!existsSync7(pkgPath2)) return null;
+    const content = readFileSync5(pkgPath2, "utf8");
+    const pkg2 = JSON.parse(content);
+    const name = pkg2?.name;
+    if (typeof name === "string" && name.trim()) return name.trim();
+    return null;
+  } catch {
+    return null;
+  }
+}
 function applyConfigDefaults(params) {
   return {
     provider: params.provider,
@@ -1241,7 +1260,8 @@ function printWelcomeMessage(projectName) {
 // src/commands/init.ts
 async function runInit(cwd2, flags) {
-  const projectName = flags.name || "my-project";
+  const detectedName = flags.name ?? readProjectNameFromPackageJson(cwd2);
+  const projectName = detectedName || "my-project";
   printWelcomeMessage(projectName);
   let name;
   if (flags.name) {
@@ -1373,9 +1393,9 @@ async function runInit(cwd2, flags) {
     let installDir = cwd2;
     if (globalInstallation) {
       if (provider === "claude-code") {
-        installDir = join9(homedir(), ".claude");
+        installDir = join10(homedir(), ".claude");
       } else {
-        installDir = join9(homedir(), ".config", "opencode");
+        installDir = join10(homedir(), ".config", "opencode");
       }
     }
     const configContent = configTs({
@@ -1386,8 +1406,8 @@ async function runInit(cwd2, flags) {
       tasksAdapter,
       port: config.tools.mcp.port
     });
-    writeFileSync7(join9(installDir, "agent-harness-kit.config.ts"), configContent, "utf8");
-    mkdirSync6(join9(installDir, config.storage.dir), { recursive: true });
+    writeFileSync7(join10(installDir, "agent-harness-kit.config.ts"), configContent, "utf8");
+    mkdirSync6(join10(installDir, config.storage.dir), { recursive: true });
     const db = openDB(config, installDir);
     await materializer.scaffold(config, { cwd: installDir, firstTask });
     if (firstTask) {
@@ -1469,8 +1489,8 @@ async function runMigrate(cwd2, opts) {
 }
 // src/core/mcp-server.ts
-import { readdirSync, readFileSync as readFileSync5, statSync } from "fs";
-import { join as join10, resolve as resolve7 } from "path";
+import { readdirSync, readFileSync as readFileSync6, statSync } from "fs";
+import { join as join11, resolve as resolve7 } from "path";
 import { Server } from "@modelcontextprotocol/sdk/server";
 import { StdioServerTransport } from "@modelcontextprotocol/sdk/server/stdio.js";
 import {
@@ -1741,7 +1761,7 @@ function searchDocs(docsPath, query, maxResults = 10) {
     for (const file of files) {
       if (results.length >= maxResults) break;
       try {
-        const content = readFileSync5(file, "utf8");
+        const content = readFileSync6(file, "utf8");
         const lines = content.split("\n");
         for (let i = 0; i < lines.length; i++) {
           const lower = lines[i].toLowerCase();
@@ -1762,7 +1782,7 @@ function collectMarkdownFiles(dir) {
   const files = [];
   try {
     for (const entry of readdirSync(dir)) {
-      const full = join10(dir, entry);
+      const full = join11(dir, entry);
       const stat = statSync(full);
       if (stat.isDirectory()) {
         files.push(...collectMarkdownFiles(full));
@@ -1867,13 +1887,13 @@ async function runStatus(cwd2, opts) {
 }
 // src/commands/sync.ts
-import { existsSync as existsSync7, readFileSync as readFileSync6 } from "fs";
-import { join as join11, resolve as resolve8 } from "path";
+import { existsSync as existsSync8, readFileSync as readFileSync7 } from "fs";
+import { join as join12, resolve as resolve8 } from "path";
 import pc9 from "picocolors";
 async function runSync(cwd2, opts) {
   const config = await loadConfig(cwd2);
   const direction = opts.direction ?? "both";
-  const featureListPath = resolve8(join11(cwd2, config.storage.dir, "feature_list.json"));
+  const featureListPath = resolve8(join12(cwd2, config.storage.dir, "feature_list.json"));
   const db = openDB(config, cwd2);
   try {
     if (direction === "in" || direction === "both") {
@@ -1887,13 +1907,13 @@ async function runSync(cwd2, opts) {
   }
 }
 async function syncIn(featureListPath, db, dryRun) {
-  if (!existsSync7(featureListPath)) {
+  if (!existsSync8(featureListPath)) {
     console.log(pc9.dim(`feature_list.json not found at ${featureListPath} \u2014 skipping in-sync`));
     return;
   }
   let seeds;
   try {
-    seeds = JSON.parse(readFileSync6(featureListPath, "utf8"));
+    seeds = JSON.parse(readFileSync7(featureListPath, "utf8"));
   } catch (err) {
     console.error(pc9.red(`Failed to parse feature_list.json: ${err}`));
     process.exit(1);
@@ -1971,14 +1991,14 @@ async function runTaskAdd(cwd2) {
 // src/commands/task/done.ts
 import { spawnSync as spawnSync2 } from "child_process";
-import { existsSync as existsSync8 } from "fs";
+import { existsSync as existsSync9 } from "fs";
 import { resolve as resolve9 } from "path";
 import pc11 from "picocolors";
 async function runTaskDone(cwd2, idOrSlug) {
   const config = await loadConfig(cwd2);
   if (config.health.required) {
     const scriptPath = resolve9(cwd2, config.health.scriptPath);
-    if (existsSync8(scriptPath)) {
+    if (existsSync9(scriptPath)) {
       const result = spawnSync2("bash", [scriptPath], { cwd: cwd2, stdio: "pipe", encoding: "utf8" });
       if (result.status !== 0) {
         console.error(pc11.red("\u2717 Health check failed \u2014 cannot mark task as done."));
@@ -2049,10 +2069,10 @@ async function runTaskList(cwd2, opts) {
 // src/core/package-data.ts
 import { createRequire as createRequire2 } from "module";
-import { dirname as dirname5, join as join12 } from "path";
+import { dirname as dirname5, join as join13 } from "path";
 import { fileURLToPath as fileURLToPath3 } from "url";
 var require2 = createRequire2(import.meta.url);
-var pkgPath = join12(dirname5(fileURLToPath3(import.meta.url)), "..", "package.json");
+var pkgPath = join13(dirname5(fileURLToPath3(import.meta.url)), "..", "package.json");
 var pkg = require2(pkgPath);
 // src/core/update-check.ts
@@ -2101,14 +2121,14 @@ function stripAnsi2(str2) {
 }
 // src/commands/reset.ts
-import { existsSync as existsSync9, readdirSync as readdirSync2, rmSync } from "fs";
-import { join as join13, resolve as resolve10 } from "path";
+import { existsSync as existsSync10, readdirSync as readdirSync2, rmSync } from "fs";
+import { join as join14, resolve as resolve10 } from "path";
 import * as p5 from "@clack/prompts";
 import pc14 from "picocolors";
 async function resetAgentMds(cwd2, provider) {
   const agentDir = provider === "claude-code" ? ".claude/agents" : ".opencode/agents";
   const agentDirPath = resolve10(cwd2, agentDir);
-  if (!existsSync9(agentDirPath)) {
+  if (!existsSync10(agentDirPath)) {
     console.log(pc14.yellow(`  Skipping agent files \u2014 directory not found: ${agentDirPath}`));
     return;
   }
@@ -2139,7 +2159,7 @@ async function resetAgentMds(cwd2, provider) {
     }
     if (confirm3) {
       try {
-        const filePath = join13(agentDirPath, file);
+        const filePath = join14(agentDirPath, file);
         rmSync(filePath, { force: true });
         console.log(pc14.green(`  Removed ${file}`));
       } catch {
@@ -2164,7 +2184,7 @@ async function runReset(cwd2, opts) {
   let resetDb = false;
   let resetFeatureList = false;
   let resetAgentMdsFlag = false;
-  if (existsSync9(dbPath)) {
+  if (existsSync10(dbPath)) {
     if (opts.force) {
       resetDb = true;
     } else {
@@ -2179,7 +2199,7 @@ async function runReset(cwd2, opts) {
       resetDb = confirm3;
     }
   }
-  if (existsSync9(featureListPath)) {
+  if (existsSync10(featureListPath)) {
     if (opts.force) {
       resetFeatureList = true;
     } else {