npm - @linimin/pi-letscook - Versions diffs - 0.1.33 → 0.1.36 - Mend

@linimin/pi-letscook 0.1.33 → 0.1.36

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (15)

package/CHANGELOG.md +25 -0
package/README.md +48 -77
package/agents/completion-implementer.md +11 -2
package/extensions/completion/index.ts +370 -222
package/extensions/completion/role-reporting.js +107 -20
package/package.json +2 -1
package/scripts/active-slice-contract-test.sh +242 -0
package/scripts/canonical-evidence-artifact-test.sh +348 -0
package/scripts/context-proposal-test.sh +50 -49
package/scripts/evaluator-calibration-test.sh +363 -0
package/scripts/refocus-test.sh +31 -0
package/scripts/release-check.sh +5 -1
package/scripts/smoke-test.sh +56 -1
package/skills/completion-protocol/SKILL.md +4 -1
package/skills/completion-protocol/references/completion.md +24 -0

package/extensions/completion/role-reporting.js CHANGED

@@ -76,6 +76,52 @@ function parseFirstNumber(value) {
   return Number.isFinite(parsed) ? parsed : undefined;
 }
+function parseNoneLikeValue(value) {
+  const raw = asString(value);
+  if (!raw) return { noneLike: false, suffix: "" };
+  const trimmed = raw.trim();
+  const patterns = [
+    /^\(none\)(.*)$/i,
+    /^none(?:\b|$)(.*)$/i,
+    /^n\/a(?:\b|$)(.*)$/i,
+    /^na(?:\b|$)(.*)$/i,
+    /^not applicable(?:\b|$)(.*)$/i,
+  ];
+  for (const pattern of patterns) {
+    const match = trimmed.match(pattern);
+    if (match) {
+      return {
+        noneLike: true,
+        suffix: match[1] ?? "",
+      };
+    }
+  }
+  return { noneLike: false, suffix: "" };
+}
+function normalizeNoneLikeSuffix(suffix) {
+  return suffix.replace(/^[\s,.;:/-]+/, "").trim();
+}
+function isNoneLike(value) {
+  return parseNoneLikeValue(value).noneLike;
+}
+function isPureNoneLike(value) {
+  const parsed = parseNoneLikeValue(value);
+  return parsed.noneLike && normalizeNoneLikeSuffix(parsed.suffix).length === 0;
+}
+function isReviewerProceedToAuditorRoutingValue(value) {
+  const raw = asString(value);
+  if (!raw) return false;
+  return /^none\s*;\s*proceed to completion-auditor(?:[\p{P}\s]*)$/iu.test(raw);
+}
+function isReviewerNoFollowUpValue(value) {
+  return isPureNoneLike(value) || isReviewerProceedToAuditorRoutingValue(value);
+}
 function rubricVerdicts(reportFields) {
   return RUBRIC_DIMENSIONS.map((dimension) => {
     const value = reportFields[dimension];
@@ -138,22 +184,26 @@ function validateRoleReport(role, output, reportFields = parseReportFields(outpu
   if (role === "completion-reviewer") {
     validateRequiredFields(reportFields, REVIEWER_REQUIRED_FIELDS, errors, role);
     const acceptable = parseYesNo(reportFields["Acceptable as-is"]);
+    const followUpSlice = asString(reportFields["Smallest follow-up slice"]);
     if (acceptable === undefined) errors.push("Reviewer output must answer 'Acceptable as-is' with yes or no.");
     if (anyFail && acceptable === true) {
       errors.push("Reviewer output cannot mark 'Acceptable as-is: yes' when any rubric line is fail.");
     }
-    if (acceptable === false && !asString(reportFields["Smallest follow-up slice"])) {
-      errors.push("Reviewer output must include a smallest follow-up slice when acceptance is no.");
+    if (acceptable === true && followUpSlice && !isReviewerNoFollowUpValue(followUpSlice)) {
+      errors.push("Reviewer output cannot mark 'Acceptable as-is: yes' while naming a follow-up slice other than none.");
+    }
+    if (acceptable === false) {
+      if (!followUpSlice) {
+        errors.push("Reviewer output must include a smallest follow-up slice when acceptance is no.");
+      } else if (isNoneLike(followUpSlice)) {
+        errors.push("Reviewer output must name a non-none smallest follow-up slice when acceptance is no.");
+      }
     }
   } else if (role === "completion-auditor") {
     validateRequiredFields(reportFields, AUDITOR_REQUIRED_FIELDS, errors, role);
-    if (parseFirstNumber(reportFields["Blocker count"]) === undefined) {
-      errors.push("Auditor output must include a numeric Blocker count.");
-    }
-    if (parseFirstNumber(reportFields["High-value gap count"]) === undefined) {
-      errors.push("Auditor output must include a numeric High-value gap count.");
-    }
-    validateYesNoField(
+    const blockerCount = parseFirstNumber(reportFields["Blocker count"]);
+    const highValueGapCount = parseFirstNumber(reportFields["High-value gap count"]);
+    const worktreeClean = validateYesNoField(
       reportFields,
       "Tracked and unignored worktree is clean",
       errors,
@@ -171,6 +221,25 @@ function validateRoleReport(role, output, reportFields = parseReportFields(outpu
       errors,
       "Auditor output must answer 'Plan truthfully captures remaining slice backlog' with yes or no.",
     );
+    if (blockerCount === undefined) {
+      errors.push("Auditor output must include a numeric Blocker count.");
+    }
+    if (highValueGapCount === undefined) {
+      errors.push("Auditor output must include a numeric High-value gap count.");
+    }
+    const worktreeBlockers = asString(reportFields["Worktree blockers"]);
+    const nextMandatorySlice = asString(reportFields["Next mandatory slice"]);
+    const openContractIds = asString(reportFields["Open top-level contract IDs"]);
+    const hasRemainingWork = !isNoneLike(openContractIds) || (blockerCount ?? 0) > 0 || (highValueGapCount ?? 0) > 0;
+    if (worktreeClean === true && worktreeBlockers && !isPureNoneLike(worktreeBlockers)) {
+      errors.push("Auditor output cannot mark 'Tracked and unignored worktree is clean: yes' while listing worktree blockers.");
+    }
+    if (worktreeClean === false && (!worktreeBlockers || isNoneLike(worktreeBlockers))) {
+      errors.push("Auditor output must describe worktree blockers when 'Tracked and unignored worktree is clean: no'.");
+    }
+    if (hasRemainingWork && nextMandatorySlice && isNoneLike(nextMandatorySlice)) {
+      errors.push("Auditor output cannot leave 'Next mandatory slice' as none while open contracts, blockers, or high-value gaps remain.");
+    }
   } else if (role === "completion-stop-judge") {
     validateRequiredFields(reportFields, STOP_JUDGE_REQUIRED_FIELDS, errors, role);
     const canStop = validateYesNoField(
@@ -179,27 +248,45 @@ function validateRoleReport(role, output, reportFields = parseReportFields(outpu
       errors,
       "Stop-judge output must answer 'Can the project stop now' with yes or no.",
     );
-    if (anyFail && canStop === true) {
-      errors.push("Stop-judge output cannot mark 'Can the project stop now: yes' when any rubric line is fail.");
-    }
-    if (parseFirstNumber(reportFields["Blocker count"]) === undefined) {
-      errors.push("Stop-judge output must include a numeric Blocker count.");
-    }
-    if (parseFirstNumber(reportFields["High-value gap count"]) === undefined) {
-      errors.push("Stop-judge output must include a numeric High-value gap count.");
-    }
-    validateYesNoField(
+    const blockerCount = parseFirstNumber(reportFields["Blocker count"]);
+    const highValueGapCount = parseFirstNumber(reportFields["High-value gap count"]);
+    const docsParity = validateYesNoField(
       reportFields,
       "Docs/config/runbooks match shipped behavior",
       errors,
       "Stop-judge output must answer 'Docs/config/runbooks match shipped behavior' with yes or no.",
     );
-    validateYesNoField(
+    const worktreeClean = validateYesNoField(
       reportFields,
       "Tracked and unignored worktree is clean",
       errors,
       "Stop-judge output must answer 'Tracked and unignored worktree is clean' with yes or no.",
     );
+    if (anyFail && canStop === true) {
+      errors.push("Stop-judge output cannot mark 'Can the project stop now: yes' when any rubric line is fail.");
+    }
+    if (blockerCount === undefined) {
+      errors.push("Stop-judge output must include a numeric Blocker count.");
+    }
+    if (highValueGapCount === undefined) {
+      errors.push("Stop-judge output must include a numeric High-value gap count.");
+    }
+    const openContractIds = asString(reportFields["Exact remaining open top-level contract IDs"]);
+    if (canStop === true && openContractIds && !isPureNoneLike(openContractIds)) {
+      errors.push("Stop-judge output cannot mark 'Can the project stop now: yes' while naming remaining open top-level contract IDs.");
+    }
+    if (canStop === true && (blockerCount ?? 0) > 0) {
+      errors.push("Stop-judge output cannot mark 'Can the project stop now: yes' when Blocker count is greater than 0.");
+    }
+    if (canStop === true && (highValueGapCount ?? 0) > 0) {
+      errors.push("Stop-judge output cannot mark 'Can the project stop now: yes' when High-value gap count is greater than 0.");
+    }
+    if (canStop === true && docsParity === false) {
+      errors.push("Stop-judge output cannot mark 'Can the project stop now: yes' when docs/config/runbooks do not match shipped behavior.");
+    }
+    if (canStop === true && worktreeClean === false) {
+      errors.push("Stop-judge output cannot mark 'Can the project stop now: yes' when the tracked and unignored worktree is not clean.");
+    }
   }
   return { valid: errors.length === 0, errors, reportFields, rubric };

package/package.json CHANGED

@@ -1,6 +1,6 @@
 {
   "name": "@linimin/pi-letscook",
-  "version": "0.1.33",
+  "version": "0.1.36",
   "description": "Pi package for long-running completion workflows with canonical .agent state, role-based subagents, continuity, and verification helpers.",
   "license": "MIT",
   "private": false,
@@ -29,6 +29,7 @@
     "refocus-test": "bash ./scripts/refocus-test.sh",
     "context-proposal-test": "bash ./scripts/context-proposal-test.sh",
     "observability-status-test": "bash ./scripts/observability-status-test.sh",
+    "evaluator-calibration-test": "bash ./scripts/evaluator-calibration-test.sh",
     "rubric-contract-test": "bash ./scripts/rubric-contract-test.sh",
     "release-check": "bash ./scripts/release-check.sh"
   },

package/scripts/active-slice-contract-test.sh ADDED

@@ -0,0 +1,242 @@
+#!/usr/bin/env bash
+set -euo pipefail
+PKG_ROOT="$(cd "$(dirname "${BASH_SOURCE[0]}")/.." && pwd)"
+TMPDIR="$(mktemp -d)"
+trap 'rm -rf "$TMPDIR"' EXIT
+cd "$PKG_ROOT"
+node <<'NODE'
+const fs = require('node:fs');
+const read = (file) => fs.readFileSync(file, 'utf8');
+const assertIncludes = (file, snippet) => {
+  const text = read(file);
+  if (!text.includes(snippet)) {
+    throw new Error(`${file} is missing required active-slice-contract text: ${snippet}`);
+  }
+};
+assertIncludes('agents/completion-implementer.md', 'canonical implementation contract');
+assertIncludes('agents/completion-implementer.md', '`implementation_surfaces`');
+assertIncludes('agents/completion-implementer.md', '`verification_commands`');
+assertIncludes('agents/completion-implementer.md', '`basis_commit`');
+assertIncludes('agents/completion-implementer.md', '`remaining_contract_ids_before`');
+assertIncludes('agents/completion-implementer.md', '`release_blocker_count_before`');
+assertIncludes('agents/completion-implementer.md', '`high_value_gap_count_before`');
+assertIncludes('README.md', 'canonical implementation contract for selected, in-progress, committed, and done slices');
+assertIncludes('README.md', 'The selected plan slice must mirror that exact contract across goal, contract IDs, acceptance criteria');
+assertIncludes('README.md', '`basis_commit`');
+assertIncludes('README.md', '`remaining_contract_ids_before` plus `release_blocker_count_before` / `high_value_gap_count_before`');
+assertIncludes('README.md', 'Deterministic active-slice contract regression now lives in `bash scripts/active-slice-contract-test.sh`');
+assertIncludes('README.md', 'includes deterministic active-slice contract coverage plus observability coverage');
+assertIncludes('scripts/release-check.sh', 'bash ./scripts/active-slice-contract-test.sh');
+assertIncludes('.agent/verify_completion_stop.sh', 'npm run release-check >/dev/null');
+assertIncludes('extensions/completion/index.ts', "const planMirrorFields = ['locked_notes', 'must_fix_findings', 'implementation_surfaces', 'verification_commands', 'basis_commit', 'remaining_contract_ids_before', 'release_blocker_count_before', 'high_value_gap_count_before'];");
+assertIncludes('extensions/completion/index.ts', 'Selected/in-progress/committed/done .agent/active-slice.json is the canonical implementation contract.');
+assertIncludes('extensions/completion/index.ts', 'Active slice contract drift: ${activeContractDrift}');
+assertIncludes('extensions/completion/index.ts', 'Canonical active-slice contract drift is currently: ${activeContractDrift}');
+assertIncludes('extensions/completion/index.ts', '`active_slice_contract_drift_fields: ${activeContractDrift}`');
+assertIncludes('extensions/completion/index.ts', 'treat .agent/active-slice.json as the canonical implementation contract');
+assertIncludes('.agent/verify_completion_control_plane.sh', "const planMirrorFields = ['locked_notes', 'must_fix_findings', 'implementation_surfaces', 'verification_commands', 'basis_commit', 'remaining_contract_ids_before', 'release_blocker_count_before', 'high_value_gap_count_before'];");
+assertIncludes('.agent/verify_completion_control_plane.sh', 'slice_id must match a slice in .agent/plan.json when status carries an exact handoff');
+assertIncludes('.agent/verify_completion_control_plane.sh', '.agent/active-slice.json must match the selected .agent/plan.json slice across: ');
+NODE
+ROOT="$TMPDIR/repo"
+PROMPT="$TMPDIR/resume-prompt.txt"
+mkdir -p "$ROOT"
+cd "$ROOT"
+git init -q
+PI_COMPLETION_SKIP_DRIVER_KICKOFF=1 \
+pi -e "$PKG_ROOT" -p "/cook active-slice contract fixture" \
+  >"$TMPDIR/pi-active-slice-bootstrap.out" 2>"$TMPDIR/pi-active-slice-bootstrap.err"
+python3 - <<'PY'
+import json
+from pathlib import Path
+mission = 'Exercise active-slice contract parity.'
+task_type = 'completion-workflow'
+evaluation_profile = 'completion-rubric-v1'
+verification_commands = [
+    'bash .agent/verify_completion_control_plane.sh',
+    'bash scripts/active-slice-contract-test.sh',
+    'npm run release-check',
+]
+implementation_surfaces = [
+    'extensions/completion/index.ts',
+    'agents/completion-implementer.md',
+    'README.md',
+    '.agent/verify_completion_control_plane.sh',
+    'scripts/release-check.sh',
+    'scripts/active-slice-contract-test.sh',
+]
+locked_notes = [
+    'Keep scope locked to active-slice contract parity.',
+    'Do not broaden into canonical evidence artifacts.',
+]
+must_fix_findings = [
+    'Ensure release-check covers the active-slice contract regression.',
+]
+remaining_contracts = ['ACTIVE-SLICE-CONTRACT-V2', 'CANONICAL-EVIDENCE-ARTIFACTS']
+acceptance = [
+    'Selected active-slice data is treated as the canonical implementation contract.',
+    'Control-plane parity checks fail closed on active-vs-plan drift.',
+    'Release-check includes deterministic active-slice contract regression coverage.',
+]
+state = {
+    'schema_version': 1,
+    'mission_anchor': mission,
+    'current_phase': 'implement',
+    'continuation_policy': 'continue',
+    'continuation_reason': 'Fixture for active-slice contract regression coverage.',
+    'project_done': False,
+    'task_type': task_type,
+    'evaluation_profile': evaluation_profile,
+    'requires_reground': False,
+    'slices_since_last_reground': 0,
+    'remaining_release_blockers': 0,
+    'remaining_high_value_gaps': 2,
+    'unsatisfied_contract_ids': remaining_contracts,
+    'release_blocker_ids': [],
+    'next_mandatory_action': 'Implement selected slice active-slice-fixture.',
+    'next_mandatory_role': 'completion-implementer',
+    'remaining_stop_judges': 3,
+    'last_reground_at': '2026-05-03T00:00:00Z',
+    'last_auditor_verdict': None,
+    'contract_status': 'selected_slice_pending_implementation',
+    'latest_completed_slice': 'fixturebasis',
+    'latest_verified_slice': 'fixturebasis',
+}
+plan = {
+    'schema_version': 1,
+    'mission_anchor': mission,
+    'task_type': task_type,
+    'evaluation_profile': evaluation_profile,
+    'last_reground_at': '2026-05-03T00:00:00Z',
+    'plan_basis': 'active_slice_contract_fixture',
+    'candidate_slices': [
+        {
+            'slice_id': 'active-slice-fixture',
+            'goal': 'Tighten active-slice implementation contract enforcement.',
+            'acceptance_criteria': acceptance,
+            'contract_ids': ['ACTIVE-SLICE-CONTRACT-V2'],
+            'priority': 80,
+            'status': 'selected',
+            'why_now': 'Fixture for active-slice contract parity.',
+            'blocked_on': [],
+            'evidence': [],
+            'locked_notes': locked_notes,
+            'must_fix_findings': must_fix_findings,
+            'implementation_surfaces': implementation_surfaces,
+            'verification_commands': verification_commands,
+            'basis_commit': 'fixturebasis',
+            'remaining_contract_ids_before': remaining_contracts,
+            'release_blocker_count_before': 0,
+            'high_value_gap_count_before': 2,
+        }
+    ],
+}
+active = {
+    'schema_version': 1,
+    'mission_anchor': mission,
+    'task_type': task_type,
+    'evaluation_profile': evaluation_profile,
+    'status': 'selected',
+    'slice_id': 'active-slice-fixture',
+    'goal': 'Tighten active-slice implementation contract enforcement.',
+    'contract_ids': ['ACTIVE-SLICE-CONTRACT-V2'],
+    'acceptance_criteria': acceptance,
+    'blocked_on': [],
+    'locked_notes': locked_notes,
+    'must_fix_findings': must_fix_findings,
+    'implementation_surfaces': implementation_surfaces,
+    'verification_commands': verification_commands,
+    'basis_commit': 'fixturebasis',
+    'remaining_contract_ids_before': remaining_contracts,
+    'release_blocker_count_before': 0,
+    'high_value_gap_count_before': 2,
+    'priority': 80,
+    'why_now': 'Fixture for active-slice contract parity.',
+}
+Path('.agent/state.json').write_text(json.dumps(state, indent=2) + '\n')
+Path('.agent/plan.json').write_text(json.dumps(plan, indent=2) + '\n')
+Path('.agent/active-slice.json').write_text(json.dumps(active, indent=2) + '\n')
+Path('.agent/verification-evidence.json').write_text(json.dumps({
+    'schema_version': 1,
+    'artifact_type': 'completion-verification-evidence',
+    'subject_type': 'selected_slice',
+    'slice_id': active['slice_id'],
+    'goal': active['goal'],
+    'contract_ids': active['contract_ids'],
+    'basis_commit': active['basis_commit'],
+    'head_sha': active['basis_commit'],
+    'verification_commands': verification_commands,
+    'outcome': 'passed',
+    'recorded_at': '2026-05-03T00:00:00Z',
+    'summary': 'Fixture evidence matches the selected active-slice contract.',
+}, indent=2) + '\n')
+PY
+PI_COMPLETION_SKIP_DRIVER_KICKOFF=1 \
+PI_COMPLETION_TEST_DRIVER_PROMPT_PATH="$PROMPT" \
+pi -e "$PKG_ROOT" -p "/cook" \
+  >"$TMPDIR/pi-active-slice-resume.out" 2>"$TMPDIR/pi-active-slice-resume.err"
+python3 - "$PROMPT" <<'PY'
+import sys
+from pathlib import Path
+text = Path(sys.argv[1]).read_text()
+assert 'treat .agent/active-slice.json as the canonical implementation contract' in text, text
+assert 'drifts from the selected plan slice or the exact handoff is unclear' in text, text
+PY
+bash .agent/verify_completion_control_plane.sh >/dev/null
+python3 - <<'PY'
+import copy
+import json
+import subprocess
+from pathlib import Path
+plan_path = Path('.agent/plan.json')
+base_plan = json.loads(plan_path.read_text())
+cases = [
+    ('slice_id', lambda slice: slice.__setitem__('slice_id', 'different-slice')),
+    ('goal', lambda slice: slice.__setitem__('goal', 'Drifted goal')),
+    ('contract_ids', lambda slice: slice.__setitem__('contract_ids', ['OTHER-CONTRACT'])),
+    ('acceptance_criteria', lambda slice: slice.__setitem__('acceptance_criteria', ['Different criterion'])),
+    ('blocked_on', lambda slice: slice.__setitem__('blocked_on', ['fixture-blocker'])),
+    ('priority', lambda slice: slice.__setitem__('priority', 1)),
+    ('why_now', lambda slice: slice.__setitem__('why_now', 'Different why_now')),
+    ('implementation_surfaces', lambda slice: slice.pop('implementation_surfaces', None)),
+    ('verification_commands', lambda slice: slice.__setitem__('verification_commands', ['bash .agent/verify_completion_control_plane.sh'])),
+    ('locked_notes', lambda slice: slice.__setitem__('locked_notes', ['different note'])),
+    ('must_fix_findings', lambda slice: slice.__setitem__('must_fix_findings', ['different finding'])),
+    ('basis_commit', lambda slice: slice.__setitem__('basis_commit', 'differentbasis')),
+    ('remaining_contract_ids_before', lambda slice: slice.__setitem__('remaining_contract_ids_before', ['ACTIVE-SLICE-CONTRACT-V2'])),
+    ('release_blocker_count_before', lambda slice: slice.__setitem__('release_blocker_count_before', 1)),
+    ('high_value_gap_count_before', lambda slice: slice.__setitem__('high_value_gap_count_before', 99)),
+]
+for label, mutate in cases:
+    plan = copy.deepcopy(base_plan)
+    slice_data = plan['candidate_slices'][0]
+    mutate(slice_data)
+    plan_path.write_text(json.dumps(plan, indent=2) + '\n')
+    result = subprocess.run(['bash', '.agent/verify_completion_control_plane.sh'], capture_output=True, text=True)
+    combined = (result.stdout or '') + (result.stderr or '')
+    assert result.returncode != 0, f'expected verifier failure for {label}'
+    assert label in combined, f'expected verifier output to mention {label}, got: {combined}'
+plan_path.write_text(json.dumps(base_plan, indent=2) + '\n')
+PY
+echo "active-slice contract test passed: $TMPDIR"