bigpowers 2.26.0 → 2.28.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/skills-lock.json CHANGED
@@ -16,6 +16,11 @@
16
16
  "sha256": "8192ebe6f66a9f91",
17
17
  "path": "audit-code/SKILL.md"
18
18
  },
19
+ "audit-plan": {
20
+ "description": "Evaluate an incoming project plan against bigpowers principles and conventions, surface gaps, and produce a READY/NOT READY verdict before engagement begins. Use when a new project arrives, when adapting a foreign plan, or before running seed-conventions on an unfamiliar codebase.",
21
+ "sha256": "3e88b606fc8e886c",
22
+ "path": "audit-plan/SKILL.md"
23
+ },
19
24
  "build-epic": {
20
25
  "description": "Eight-step epic build cycle — reads state.yaml, execution-status.yaml, and one epic capsule; updates status via bp-yaml-set or direct edit. Resume mode runs one step per invocation. Use instead of ad-hoc execute-plan for release work.",
21
26
  "sha256": "7a376ef092fde9cc",
@@ -93,7 +98,7 @@
93
98
  },
94
99
  "elaborate-spec": {
95
100
  "description": "Refine a rough idea into a clear, detailed specification through dialogue. Does not produce code. Use when user has a vague idea, wants to think through a feature before planning, or needs to turn \"I want X\" into a concrete spec.",
96
- "sha256": "6d60cffd5139347e",
101
+ "sha256": "9edc17057449444d",
97
102
  "path": "elaborate-spec/SKILL.md"
98
103
  },
99
104
  "enforce-first": {
@@ -103,7 +108,7 @@
103
108
  },
104
109
  "evolve-skill": {
105
110
  "description": "Benchmark-gated skill evolution — consume bigpowers-benchmark report, propose plan-work change, edit skill via craft-skill, re-run benchmark, record ADR. Use when a skill underperforms on benchmark or stocktake finds systemic gap.",
106
- "sha256": "3582333ff9b15942",
111
+ "sha256": "e2d127c4ae0b5af7",
107
112
  "path": "evolve-skill/SKILL.md"
108
113
  },
109
114
  "execute-plan": {
@@ -198,7 +203,7 @@
198
203
  },
199
204
  "quick-fix": {
200
205
  "description": "\"Streamlined fast-path for trivial data-only fixes — no TDD, no branching ceremony. Collapses 6 skills into 2 for changes that are purely data with no logic risk. Aborts with fallback to investigate-bug if guardrails trigger.\"",
201
- "sha256": "6b83f22481ff4995",
206
+ "sha256": "2b9f1cd6557b6256",
202
207
  "path": "quick-fix/SKILL.md"
203
208
  },
204
209
  "release-branch": {
@@ -226,6 +231,11 @@
226
231
  "sha256": "c16bbe4854a0d665",
227
232
  "path": "respond-review/SKILL.md"
228
233
  },
234
+ "run-benchmark": {
235
+ "description": "Run skill quality benchmarks from specs/benchmarks/ definitions and write pass@k reports. Use before and after evolve-skill to prove quality changes are improvements, not regressions.",
236
+ "sha256": "e27f4e682e505b19",
237
+ "path": "run-benchmark/SKILL.md"
238
+ },
229
239
  "run-evals": {
230
240
  "description": "Eval-Driven Development — define capability and regression evals before building; code graders use verify commands, model graders use explicit rubrics; log pass@k. Use before develop-tdd on new features, or when measuring agent capability over runs.",
231
241
  "sha256": "b3cd89a7e440c94f",
@@ -233,12 +243,12 @@
233
243
  },
234
244
  "run-planning": {
235
245
  "description": "\"DISCOVER-PHASE ADVANCER — Drive the discover-phase checklist (specs/planning-status.yaml) through survey-context → scope-work → research-first → elaborate-spec → plan-release → slice-tasks. NOT a duplicate of plan-work or the planning spine; it orchestrates the pre-coding discover phase only.\"",
236
- "sha256": "eb6c9d3c0e26b7fc",
246
+ "sha256": "a2e7c028e7f817de",
237
247
  "path": "run-planning/SKILL.md"
238
248
  },
239
249
  "scope-work": {
240
250
  "description": "\"PLANNING SPINE STEP 1 of 3 — Scope the work: define what is in and out of scope and save as specs/product/SCOPE_LATEST.yaml. Use before slice-tasks or plan-release on any new initiative. Not a substitute for slice-tasks (step 2) or plan-work (step 3).\"",
241
- "sha256": "3d333e2bfa5f9998",
251
+ "sha256": "d3cb167d8a5296be",
242
252
  "path": "scope-work/SKILL.md"
243
253
  },
244
254
  "search-skills": {
@@ -268,7 +278,7 @@
268
278
  },
269
279
  "slice-tasks": {
270
280
  "description": "\"PLANNING SPINE STEP 2 of 3 — Slice the work: break a scoped PRD into vertical-slice stories in specs/epics/. Use after scope-work (step 1), before plan-work (step 3). Not a substitute for scope-work or plan-work.\"",
271
- "sha256": "bda9db54dbe791b5",
281
+ "sha256": "7948164e218541ea",
272
282
  "path": "slice-tasks/SKILL.md"
273
283
  },
274
284
  "smoke-test": {
@@ -283,7 +293,7 @@
283
293
  },
284
294
  "stocktake-skills": {
285
295
  "description": "Sequential subagent batch audit of the bigpowers skill catalog — Quick Scan (changed only) or Full (all skills). Use during sustain phase, before a major release, or when catalog drift is suspected.",
286
- "sha256": "c58bf4f70ff02cd3",
296
+ "sha256": "6e73b2d2cf0cfbe1",
287
297
  "path": "stocktake-skills/SKILL.md"
288
298
  },
289
299
  "survey-context": {
@@ -18,6 +18,12 @@ Produce **epic capsule story tasks** in `specs/epics/eNN-slug/` — vertical sli
18
18
 
19
19
  ## Process
20
20
 
21
+ 0. **Read planning-context.yaml** — If `specs/planning-context.yaml` exists, read it first:
22
+ ```bash
23
+ test -f specs/planning-context.yaml && echo "Context found" || echo "No context — starting fresh"
24
+ ```
25
+ Use `feature_name`, `constraints`, and `out_of_scope` to inform slice boundaries. `key_decisions` in the file may constrain how stories are cut (e.g., "no external deps" constrains slice 2). If the file is absent, skip this step and proceed normally.
26
+
21
27
  1. **Read context** — Read `specs/product/SCOPE_LATEST.yaml` and/or `specs/release-plan.yaml`. Understand what the epic delivers end-to-end.
22
28
 
23
29
  2. **Cut tracer-bullet slices** — Identify the thinnest possible vertical path through the stack that delivers user value. Start with this slice; it will catch integration issues first. For example:
@@ -15,7 +15,8 @@ Audit SKILL.md catalog for drift, stale triggers, missing HARD GATEs, and INDEX
15
15
  | Mode | Scope |
16
16
  |------|-------|
17
17
  | **Quick Scan** | Skills changed since last tag or in current diff |
18
- | **Full** | All 62 skills per SKILL-INDEX.md + catalog audit |
18
+ | **Full** | All skills per SKILL-INDEX.md + catalog audit |
19
+ | **--verify** | Run `bash scripts/run-skill-verify.sh` and append health results to the stocktake report |
19
20
 
20
21
  ## Process
21
22
 
@@ -27,6 +28,7 @@ Audit SKILL.md catalog for drift, stale triggers, missing HARD GATEs, and INDEX
27
28
  - Skills with zero calls (potential dead weight)
28
29
  - Skills with high average time (candidates for `evolve-skill`)
29
30
  5. Critical findings → `plan-work` story; cosmetic → `evolve-skill` candidate.
31
+ 6. **--verify mode:** Run `bash scripts/run-skill-verify.sh` and append a `## Verify Health` section to the stocktake report: `"N/TOTAL PASS, M FAIL, K SKIP"` (where TOTAL is the number of skills checked). FAIL skills are critical findings and go straight to `plan-work`.
30
32
 
31
33
  ### Skill timing data (`metrics.skill_timings`)
32
34