npm - claude-dev-env - Versions diffs - 1.62.1 → 1.64.0 - Mend

claude-dev-env 1.62.1 → 1.64.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (19)

package/agents/code-advisor.md +22 -0
package/agents/code-verifier.md +42 -0
package/bin/install.mjs +1 -1
package/hooks/blocking/code_rules_dead_argparse_argument.py +554 -0
package/hooks/blocking/code_rules_enforcer.py +6 -0
package/hooks/blocking/config/verified_commit_constants.py +16 -0
package/hooks/blocking/test_code_rules_enforcer_dead_argparse_argument.py +534 -0
package/hooks/blocking/test_verification_verdict_store.py +232 -0
package/hooks/blocking/test_verified_commit_gate.py +43 -0
package/hooks/blocking/test_verifier_verdict_minter.py +139 -0
package/hooks/blocking/verification_verdict_store.py +165 -10
package/hooks/blocking/verified_commit_gate.py +8 -2
package/hooks/blocking/verifier_verdict_minter.py +59 -9
package/hooks/hooks_constants/dead_argparse_argument_constants.py +28 -0
package/package.json +1 -1
package/skills/autoconverge/SKILL.md +26 -1
package/skills/autoconverge/workflow/converge.contract.test.mjs +82 -18
package/skills/autoconverge/workflow/converge.mjs +46 -18
package/skills/verified-build/SKILL.md +38 -0

package/skills/autoconverge/workflow/converge.mjs CHANGED Viewed

@@ -141,15 +141,33 @@ const STANDARDS_EDIT_SCHEMA = {
   required: ['issueUrl', 'hardeningRepoPath', 'hardeningBranch', 'hardeningEdited', 'summary'],
 }
-const VERDICT_FENCE_STEPS =
-  `Compute the binding hash for the live surface by running exactly:\n` +
-  `   "C:\\Python313\\python.exe" "<REPO>/packages/claude-dev-env/hooks/blocking/verification_verdict_store.py" --manifest-hash "<REPO>"\n` +
-  `   (substitute the REPO path you resolved). That prints a single 64-char hex hash on stdout — capture it.\n` +
-  `Then END your message with a fenced verdict block exactly in this shape, on its own, carrying that hash:\n` +
-  "   ```verdict\n" +
-  `   {"all_pass": true, "findings": [], "manifest_sha256": "<that hash>"}\n` +
-  "   ```\n" +
-  `   When verification fails, set all_pass to false and list the unresolved concerns in findings; still include the manifest_sha256. The verdict fence must be the last thing in your message.`
+/**
+ * Build the verdict-fence step instructions for a verify agent, binding the
+ * surface hash by branch name rather than by a self-resolved cwd. Resolving
+ * the branch via `gh pr view` is cwd-immune: it does not matter which worktree
+ * the verify agent runs in, so a launcher session whose cwd is a different
+ * worktree cannot poison the binding hash.
+ *
+ * The returned text is a single multi-line string with three parts:
+ *   a. a `gh pr view` command that prints the PR head branch name,
+ *   b. a `verification_verdict_store.py --manifest-hash-for-branch` command
+ *      that prints the 64-char hex hash for that branch,
+ *   then the closing verdict fence that must carry the hash and end the message.
+ *
+ * The three arguments are interpolated verbatim into the `gh` command line;
+ * this function does no validation or quoting of them.
+ *
+ * `<REPO>`, `<that branch>` and `<that hash>` are literal placeholders left in
+ * the text for the agent to substitute. This function does not resolve REPO
+ * itself — presumably the prompt that embeds this text has an earlier step
+ * that does; verify against each caller.
+ *
+ * NOTE(review): the interpreter path `C:\Python313\python.exe` is hard-coded
+ * in the emitted command — confirm before reusing these instructions on a
+ * host where Python lives elsewhere.
+ * @param {string} prOwner GitHub owner of the repo that holds the branch
+ * @param {string} prRepo GitHub repo name
+ * @param {number|string} prNumber PR number used to resolve the head branch
+ * @returns {string} binding-hash and verdict-fence instructions for a verify prompt
+ */
+function buildVerdictFenceSteps(prOwner, prRepo, prNumber) {
+  return (
+    `Compute the binding hash for the live surface:\n` +
+    `   a. Resolve the PR head branch (cwd-immune): run exactly\n` +
+    `         gh pr view ${prNumber} --repo ${prOwner}/${prRepo} --json headRefName -q .headRefName\n` +
+    `      Capture the branch name printed on stdout.\n` +
+    `   b. Run exactly:\n` +
+    `         "C:\\Python313\\python.exe" "<REPO>/packages/claude-dev-env/hooks/blocking/verification_verdict_store.py" --manifest-hash-for-branch "<that branch>"\n` +
+    `      (substitute the REPO path you resolved for the script path, and the branch name for <that branch>). That prints a single 64-char hex hash on stdout — capture it.\n` +
+    `Then END your message with a fenced verdict block exactly in this shape, on its own, carrying that hash:\n` +
+    "   ```verdict\n" +
+    `   {"all_pass": true, "findings": [], "manifest_sha256": "<that hash>"}\n` +
+    "   ```\n" +
+    `   When verification fails, set all_pass to false and list the unresolved concerns in findings; still include the manifest_sha256. The verdict fence must be the last thing in your message.`
+  )
+}
 const CONVERGENCE_SUMMARY_SCHEMA = {
   type: 'object',
@@ -713,9 +731,9 @@ function verifyFixesInWorkingTree(head, findings, sourceLabel) {
     `You are the VERIFY step for ${findings.length} finding(s) (${sourceLabel}) on ${prCoordinates}, HEAD ${head}. The edit step left fixes in the working tree, uncommitted. Do NO edits of any kind — verification only; any edit invalidates the verdict you are about to emit.\n\n` +
       `Findings the working-tree fixes must address:\n${findingsBlock}\n\n` +
       `Steps:\n` +
-      `1. Resolve the worktree repo root: REPO=$(git rev-parse --show-toplevel).\n` +
+      `1. Resolve the worktree repo root for running tests: REPO=$(git rev-parse --show-toplevel).\n` +
       `2. Verify the uncommitted working-tree changes resolve every finding above: run the relevant tests and the named gates against the working tree. Read the diff (git diff) and confirm each finding is fixed test-first per CODE_RULES.\n` +
-      `3. ${VERDICT_FENCE_STEPS}`,
+      `3. ${buildVerdictFenceSteps(input.owner, input.repo, input.prNumber)}`,
     { label: `fix-verify:${sourceLabel}`, phase: 'Converge', agentType: 'code-verifier' },
   )
 }
@@ -935,9 +953,9 @@ function verifyRepairChanges(head, failures) {
     `You are the VERIFY step for the convergence repair on ${prCoordinates}, HEAD ${head}. The edit step left its repair in the working tree (a bot-thread fix uncommitted, and/or a rebase onto origin/main), unpushed. Do NO edits of any kind — verification only; any edit invalidates the verdict you are about to emit.\n\n` +
       `Concerns the working-tree repair must resolve (the gates the convergence check flagged):\n${failureBlock}\n\n` +
       `Steps:\n` +
-      `1. Resolve the worktree repo root: REPO=$(git rev-parse --show-toplevel).\n` +
+      `1. Resolve the worktree repo root for running tests: REPO=$(git rev-parse --show-toplevel).\n` +
       `2. Verify the working tree against origin/main: any bot-thread code fix is correct test-first per CODE_RULES, and a rebase (if any) left a clean, conflict-free tree. Read the diff (git diff origin/main) and run the relevant tests and named gates.\n` +
-      `3. ${VERDICT_FENCE_STEPS}`,
+      `3. ${buildVerdictFenceSteps(input.owner, input.repo, input.prNumber)}`,
     { label: 'repair-verify', phase: 'Finalize', agentType: 'code-verifier' },
   )
 }
@@ -1044,22 +1062,32 @@ function standardsFollowUpEdit(head, findings, sourceLabel) {
 /**
  * Standards-hardening verify step: a code-verifier confirms the uncommitted
  * hooks/rules change staged in the hardening repo blocks the deferred violation
- * classes, computes the binding surface hash for that repo, and ends with a
- * verdict fence as plain assistant text (NO schema) — unlocking the
+ * classes, computes the binding surface hash for that repo by branch (cwd-immune),
+ * and ends with a verdict fence as plain assistant text (NO schema) — unlocking the
  * verified-commit gate for the cross-repo hardening commit. The verifier makes
  * no edits.
  * @param {string} hardeningRepoPath absolute path of the hardening repo checkout the edit staged
+ * @param {string} hardeningBranch the branch in the hardening repo that the edit staged the change on
  * @param {string} sourceLabel short description of where the findings came from
  * @returns {Promise<string>} the verifier transcript carrying the verdict fence
  */
-function verifyHardeningChanges(hardeningRepoPath, sourceLabel) {
+function verifyHardeningChanges(hardeningRepoPath, hardeningBranch, sourceLabel) {
   return convergeAgent(
     `You are the VERIFY step for an environment-hardening change (${sourceLabel}) staged in the working tree of ${hardeningRepoPath}. The edit step left the hooks/rules edits uncommitted there. Do NO edits of any kind — verification only; any edit invalidates the verdict you are about to emit.\n\n` +
       `Concern the working-tree change must resolve: the edited hooks/rules block the code-standard violation classes from the deferred round at Write/Edit time, and a hook change carries a passing test per CODE_RULES.\n\n` +
       `Steps:\n` +
       `1. cd into ${hardeningRepoPath}, then resolve its repo root: REPO=$(git rev-parse --show-toplevel).\n` +
       `2. Verify the uncommitted working-tree change in REPO: read the diff (git diff) and run the hook/rule tests in that repo, confirming each violation class is now blocked.\n` +
-      `3. ${VERDICT_FENCE_STEPS}`,
+      `3. Compute the binding hash for the live surface:\n` +
+      `   The hardening branch is: ${hardeningBranch}\n` +
+      `   Run exactly:\n` +
+      `      "C:\\Python313\\python.exe" "<REPO>/packages/claude-dev-env/hooks/blocking/verification_verdict_store.py" --manifest-hash-for-branch "${hardeningBranch}"\n` +
+      `   (substitute the REPO path you resolved for the script path). That prints a single 64-char hex hash on stdout — capture it.\n` +
+      `   Then END your message with a fenced verdict block exactly in this shape, on its own, carrying that hash:\n` +
+      "      ```verdict\n" +
+      `      {"all_pass": true, "findings": [], "manifest_sha256": "<that hash>"}\n` +
+      "      ```\n" +
+      `      When verification fails, set all_pass to false and list the unresolved concerns in findings; still include the manifest_sha256. The verdict fence must be the last thing in your message.`,
     { label: `standards-verify:${sourceLabel}`, phase: 'Converge', agentType: 'code-verifier' },
   )
 }
@@ -1123,7 +1151,7 @@ async function spawnStandardsFollowUp(head, findings, sourceLabel) {
   if (editResult?.hardeningEdited !== true || !editResult?.hardeningRepoPath) {
     return { hardeningPrOpened: false }
   }
-  const verifyTranscript = await verifyHardeningChanges(editResult.hardeningRepoPath, sourceLabel)
+  const verifyTranscript = await verifyHardeningChanges(editResult.hardeningRepoPath, editResult.hardeningBranch, sourceLabel)
   if (!verdictPassed(verifyTranscript)) {
     return { hardeningPrOpened: false }
   }

package/skills/verified-build/SKILL.md ADDED Viewed

@@ -0,0 +1,38 @@
+---
+name: verified-build
+description: >-
+  Runs a code task through the two-phase verified workflow: scoped coder
+  agents write the changes (consulting the tool-less code-advisor when
+  stuck on a decision), then a fresh-context code-verifier agent re-derives
+  and runs every check itself. The verifier's fenced verdict is minted by
+  the verifier_verdict_minter hook and unlocks the verified_commit_gate for
+  git commit/push. Use for feature implementations, refactors, and bug
+  fixes that land behind verification. Triggers: 'verified build', 'run
+  this verified', 'two-phase build', 'build and verify', 'verified
+  implementation'.
+---
+# Verified Build
+Two phases, hook-enforced: coders write, a fresh-context verifier grades, and `git commit`/`git push` open only on a clean verdict bound to the live change surface.
+## Workflow
+Copy this checklist and check items off as you go:
+- [ ] **Record baselines.** Before any coder runs: the test command and its exact failure set, plus any other gates the repo names. Scope the test command to the modules the task touches (their test files plus tests importing the changed modules); record a full-suite baseline only when the assignments span multiple modules or multiple coders. The verifier compares against these.
+- [ ] **Scope assignments.** Split the task into file-disjoint assignments; write each as a task text with named checks.
+- [ ] **Spawn coders.** One agent per assignment (`clean-coder` or Sonnet). Tell each: on a decision it can't reasonably solve, consult the tool-less `code-advisor` agent — it returns a plan, a correction, or a stop signal — then resume.
+- [ ] **Settle the tree.** After coders finish: run formatters and any file-rewriting hooks, stage nothing, change nothing more.
+- [ ] **Spawn the verifier last.** Agent tool, `subagent_type: "code-verifier"`, with the task texts, the diff scope, and the recorded baselines. When it stops, the SubagentStop hook mints its verdict.
+- [ ] **Repair only reported findings.** On a failing verdict, spawn repair agents scoped to the findings, then re-spawn the verifier. Repeat until clean.
+- [ ] **Land right away.** One commit, push, draft PR — before anything else touches a file.
+## Gotchas
+- Any file change after the verifier stops moves the surface hash and re-locks the gate — formatter rewrites included. Settle the tree first; land right after the clean verdict.
+- The verdict covers the whole branch surface (merge base to work tree, untracked files included). There is no "verify just my part."
+- The verifier must end with a ```` ```verdict ```` fence. No fence means nothing is minted and the gate stays closed.
+- The minter keys on the agent type string `code-verifier` — spawning the same prompt under another agent type mints nothing.
+- A surface whose every change is a docs/image file (by extension), a Python file whose docstring-stripped AST is unchanged (docstring-, comment-, or formatting-only Python edits), or a pytest test file (`test_*.py`, `*_test.py`, `conftest.py`) is exempt automatically; skip the verifier for those. Comment-only edits in non-Python files are not exempt.
+- Record the test baseline before coders start. Without the exact pre-existing failure set, new breakage hides inside old noise.