npm - @riddledc/riddle-proof-packs - Versions diffs - 0.4.0 → 0.4.1 - Mend

@riddledc/riddle-proof-packs 0.4.0 → 0.4.1

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package versions as they appear in their respective public registries.

Files changed (12)

package/dist/index.cjs CHANGED Viewed

@@ -1665,7 +1665,7 @@ var ratchet_loop_mix_level_search_default = {
       },
       {
         type: "window_call",
-        label: "run-ratchet-loop-mix-level-search",
+        label: "test-claim-candidates-mix-level-search",
         path: "__NEON_MIX_PROOF__.runRatchetLoop",
         args: [
           {
@@ -1679,8 +1679,7 @@ var ratchet_loop_mix_level_search_default = {
             maxIterations: 6,
             monitorProfile: "smallSpeaker",
             restore: true,
-            applyBest: false,
-            minImprovement: 0.1
+            applyBest: false
           }
         ],
         store_return_to: "__neonMixProof.ratchetLoop",
@@ -1697,10 +1696,13 @@ var ratchet_loop_mix_level_search_default = {
             path: "strategy"
           },
           {
-            path: "improvement"
+            path: "best.claimVerdict.status"
           },
           {
-            path: "best.candidate.track"
+            path: "best.claimCandidate.action.track"
+          },
+          {
+            path: "supportedClaimCandidateCount"
           }
         ]
       },
@@ -1750,16 +1752,18 @@ var ratchet_loop_mix_level_search_default = {
     pack_id: "neon_step_sequencer",
     pack_public_name: "Neon Step Sequencer Pack",
     evidence_role_pattern: "interaction_snapshots",
-    purpose: "Run a bounded automated ratchet loop using the Neon mix-level-search strategy.",
+    purpose: "Run a bounded loop that tests Neon mix-level change-claim candidates using the mix-level-search strategy.",
     required_receipts: [
       "ratchet loop returns ok",
       "baseline proof-window summary is captured",
-      "candidate attempts are captured",
-      "best candidate or human-review status is captured"
+      "claim candidates are captured",
+      "each candidate records claim receipts",
+      "best supported claim candidate or human-review status is captured",
+      "state restoration receipt is captured"
     ],
     does_not_prove: [
       "subjective mix quality",
-      "that the best objective candidate should be kept",
+      "that a supported claim candidate should be kept",
       "all possible mix edits"
     ]
   }

package/dist/index.js CHANGED Viewed

@@ -1630,7 +1630,7 @@ var ratchet_loop_mix_level_search_default = {
       },
       {
         type: "window_call",
-        label: "run-ratchet-loop-mix-level-search",
+        label: "test-claim-candidates-mix-level-search",
         path: "__NEON_MIX_PROOF__.runRatchetLoop",
         args: [
           {
@@ -1644,8 +1644,7 @@ var ratchet_loop_mix_level_search_default = {
             maxIterations: 6,
             monitorProfile: "smallSpeaker",
             restore: true,
-            applyBest: false,
-            minImprovement: 0.1
+            applyBest: false
           }
         ],
         store_return_to: "__neonMixProof.ratchetLoop",
@@ -1662,10 +1661,13 @@ var ratchet_loop_mix_level_search_default = {
             path: "strategy"
           },
           {
-            path: "improvement"
+            path: "best.claimVerdict.status"
           },
           {
-            path: "best.candidate.track"
+            path: "best.claimCandidate.action.track"
+          },
+          {
+            path: "supportedClaimCandidateCount"
           }
         ]
       },
@@ -1715,16 +1717,18 @@ var ratchet_loop_mix_level_search_default = {
     pack_id: "neon_step_sequencer",
     pack_public_name: "Neon Step Sequencer Pack",
     evidence_role_pattern: "interaction_snapshots",
-    purpose: "Run a bounded automated ratchet loop using the Neon mix-level-search strategy.",
+    purpose: "Run a bounded loop that tests Neon mix-level change-claim candidates using the mix-level-search strategy.",
     required_receipts: [
       "ratchet loop returns ok",
       "baseline proof-window summary is captured",
-      "candidate attempts are captured",
-      "best candidate or human-review status is captured"
+      "claim candidates are captured",
+      "each candidate records claim receipts",
+      "best supported claim candidate or human-review status is captured",
+      "state restoration receipt is captured"
     ],
     does_not_prove: [
       "subjective mix quality",
-      "that the best objective candidate should be kept",
+      "that a supported claim candidate should be kept",
       "all possible mix edits"
     ]
   }

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@riddledc/riddle-proof-packs",
-  "version": "0.4.0",
+  "version": "0.4.1",
   "description": "Reusable proof pack profiles and metadata helpers for the Riddle proof framework.",
   "license": "MIT",
   "author": "RiddleDC",

package/packs/neon-step-sequencer/README.md CHANGED Viewed

@@ -33,7 +33,7 @@ This pack is the first app-specific lab for the open Riddle Proof architecture.
 The loop is not mix-specific as a proof concept. The proof concept is a bounded ratchet loop: propose a candidate, apply it, collect evidence, classify the result, restore or keep state, and repeat until the budget is exhausted.
-This pack's first concrete strategy is `mix-level-search`, which tries small level edits against Neon proof windows and returns objective evidence for the best candidate. It still does not decide subjective mix taste; the output is a listening and review packet.
+This pack's first concrete strategy is `mix-level-search`, which turns small level edits into change-claim candidates. Each candidate says what action will be attempted, what receipts must support the claim, and what evidence should be reviewed afterward. The loop may include a ranking metric to order review, but the verdict comes from receipts and invariants, not from a universal mix-quality number. It still does not decide subjective mix taste; the output is a listening and review packet.
 ## Example evidence
@@ -42,7 +42,7 @@ The `examples/` directory contains four local Playwright proof results captured
 - `run-001-fast-mix-health`: passing `current_target` audit with proof contract, source readiness, mix RMS `0.1234`, peak `0.8321`, and no clipping.
 - `run-002-mix-change`: passing `interaction_snapshots` proof where a bass-level edit moved bass RMS from `0.0507` to `0.1071` and mix RMS from `0.073` to `0.1264` without clipping.
 - `run-003-full-matrix`: passing `current_target` viewport matrix across desktop, phone, iPad Mini, and iPad with `0 px` horizontal overflow.
-- `run-004-ratchet-loop-mix-level-search`: passing `interaction_snapshots` proof where a bounded loop tested six mix-level candidates and returned `chord -0.10` as the best objective candidate without keeping the edit.
+- `run-004-ratchet-loop-mix-level-search`: passing `interaction_snapshots` proof where a bounded loop tested six mix-level change-claim candidates, found a supported `chord -0.10` candidate, recorded receipt-level verdicts, and restored app state without keeping the edit.
 ## Naming note

package/packs/neon-step-sequencer/case-study/findings.md CHANGED Viewed

@@ -41,7 +41,7 @@ Profile render window, song fixture, or authoring guide.
 ### Subjective boundary
-Metrics pass, but deciding whether the mix is better requires listening.
+Receipts can support that a requested mix-level change happened and stayed inside guardrails, but deciding whether the mix is musically better requires listening.
 Likely change:
@@ -93,9 +93,9 @@ Pack summary guidance first; Riddle Proof core only if a general display primiti
 ### Run 004 proved the bounded loop shape without making it mix-specific
 - run: `run-004-ratchet-loop-mix-level-search`
-- claim: a bounded ratchet loop can try candidate edits, collect proof-window evidence, rank candidates, and restore state.
-- observed evidence: `mix-level-search` tested `6` candidates; baseline score was `28.83345`; best score was `27.0708`; best candidate was `chord -0.10` to level `0.28`; loop status was `candidate_found`; console fatal count was `0`.
-- classification: none; passing `interaction_snapshots` proof with subjective listening caveat.
+- claim: a bounded ratchet loop can try change-claim candidates, collect proof-window evidence, record receipt verdicts, select a supported candidate for review, and restore state.
+- observed evidence: `mix-level-search` tested `6` candidates; baseline candidate-ranking metric was `28.8336`; best candidate-ranking metric was `27.07095`; best supported claim candidate was `chord -0.10` to level `0.28`; loop status was `claim_candidate_supported`; receipt checks covered edit acceptance, contract level agreement, rendered target metric movement, required instrument activity, no clipping, and no low-level proof window; console fatal count was `0`.
+- classification: none; passing `interaction_snapshots` proof with subjective listening caveat. The ranking metric is a review-order hint, not a proof verdict.
 - smallest layer changed: generic app proof-contract loop plus one Neon strategy.
 - change made: added `runRatchetLoop` with a `mix-level-search` strategy and a proof-pack profile that calls it.
 - rerun: passed on May 24, 2026.
@@ -108,6 +108,6 @@ Pack summary guidance first; Riddle Proof core only if a general display primiti
 - observed evidence: complete passing artifacts were written, but the wrapper process lingered after artifact write and had to be stopped.
 - classification: `proof_insufficient` for operator ergonomics, not a Neon product regression.
 - smallest layer changed: none in this pack.
-- change made: documented the issue and used an outer timeout for the matrix run.
-- rerun: not yet rerun after a runner fix.
+- change made: fixed the local Playwright runner timeout cleanup in `@riddledc/riddle-proof-runner-playwright`.
+- rerun: later runner smoke tests and the published `0.4.3` package exited cleanly.
 - next sharper question: should the local runner force-close browser handles or expose a clearer artifact-written exit phase?

package/packs/neon-step-sequencer/case-study/ratchet-card.md CHANGED Viewed

@@ -33,7 +33,7 @@ The project shows that a complex audio app can improve proof confidence mostly b
 - Run 001: a `current_target` audit connected the Neon route, proof contract, source readiness, and offline mix-health metrics.
 - Run 002: an `interaction_snapshots` proof showed a bass-level edit moving bass RMS from `0.0507` to `0.1071` and mix RMS from `0.073` to `0.1264` without clipping.
 - Run 003: a `current_target` matrix passed across desktop, phone, iPad Mini, and iPad with `0 px` horizontal overflow.
-- Run 004: a bounded loop tested six `mix-level-search` candidates, returned `chord -0.10` as the best objective candidate, and restored app state.
+- Run 004: a bounded loop tested six `mix-level-search` change-claim candidates, returned `chord -0.10` as a supported review candidate with receipt-level evidence, and restored app state.
 ## Honest boundary

package/packs/neon-step-sequencer/case-study/ratchet-log.md CHANGED Viewed

@@ -177,7 +177,7 @@ Can the pack explore song/mix combinations and produce a prioritized confidence
 Claim:
-Neon can run a bounded ratchet loop that proposes mix-level candidates, applies each candidate, captures proof-window evidence, ranks candidates by objective metrics, and restores app state.
+Neon can run a bounded ratchet loop that proposes mix-level change-claim candidates, applies each candidate action, captures proof-window evidence, records receipt-level verdicts, selects a supported candidate for review, and restores app state.
 Profile:
@@ -185,16 +185,16 @@ Profile:
 Evidence to capture:
-- baseline proof-window score
-- per-candidate proof-window score
-- best candidate and objective improvement
+- baseline candidate-ranking metric
+- per-candidate receipt verdicts
+- supported claim candidate and ranking metric delta
 - state restoration receipt
 - compact caveats for human handoff
 Possible outcomes:
-- `candidate_found`: at least one candidate improves objective metrics.
-- `needs_human_review`: evidence is valid but no objective candidate clears the threshold.
+- `claim_candidate_supported`: at least one candidate has the receipts needed to support its change claim.
+- `needs_human_review`: evidence is valid but no candidate has enough receipts to support the proposed claim automatically.
 - `proof_insufficient`: the app contract or proof window does not provide enough evidence.
 - `profile_calibration`: the chosen tracks, windows, or thresholds do not fit the target.
@@ -206,17 +206,18 @@ Observed evidence:
 - strategy `mix-level-search`
 - tested `6` candidates across `bass`, `chord`, `guitar`, and `rhythmSynth`
-- baseline score `28.83345`
-- best score `27.0708`
-- objective improvement `1.7627`
-- best candidate `chord -0.10` to level `0.28`
-- loop status `candidate_found`
+- baseline candidate-ranking metric `28.8336`
+- best candidate-ranking metric `27.07095`
+- ranking metric delta `1.7627`
+- best supported claim candidate `chord -0.10` to level `0.28`
+- claim receipts recorded for edit acceptance, contract level agreement, rendered target metric movement, required instrument activity, no clipping, and no low-level proof window
+- loop status `claim_candidate_supported`
 - app state restored after the run
 - console fatal count `0`
 Failure classification:
-None. This was a passing `interaction_snapshots` loop proof, with an explicit listening-review caveat.
+None. This was a passing `interaction_snapshots` loop proof, with an explicit listening-review caveat and a ranking metric that is only a review-order hint.
 Smallest layer changed:

package/packs/neon-step-sequencer/case-study/reusable-lessons.md CHANGED Viewed

@@ -28,4 +28,4 @@ Most ratchet steps should change profile JSON, pack docs, app proof contracts, o
 ## Loops are generic
-A ratchet loop should be domain-neutral: propose a candidate, apply it, collect evidence, classify the result, restore or keep state, and repeat within a budget. Neon `mix-level-search` is a strategy plugged into that loop, not the loop's identity.
+A ratchet loop should be domain-neutral: propose a claim candidate, apply its action, collect evidence, classify receipt-level support, restore or keep state, and repeat within a budget. Neon `mix-level-search` is a strategy plugged into that loop, not the loop's identity.

package/packs/neon-step-sequencer/examples/README.md CHANGED Viewed

@@ -11,7 +11,7 @@ The raw `profile-result.json` files are real runner outputs. They intentionally
 | `run-001-fast-mix-health` | `current_target` | passed | The current Neon target exposes a proof contract, source receipts, and a bounded offline mix-health render. |
 | `run-002-mix-change` | `interaction_snapshots` | passed | A bass-level edit changes rendered bass and mix metrics without clipping. |
 | `run-003-full-matrix` | `current_target` | passed | The mix-health proof holds across desktop, phone, iPad Mini, and iPad viewports. |
-| `run-004-ratchet-loop-mix-level-search` | `interaction_snapshots` | passed | A bounded ratchet loop tests mix-level candidates, returns the best objective candidate, and restores app state. |
+| `run-004-ratchet-loop-mix-level-search` | `interaction_snapshots` | passed | A bounded ratchet loop tests mix-level change-claim candidates, records receipt verdicts, chooses a supported candidate for review, and restores app state. |
 ## What these examples do not prove
@@ -20,3 +20,4 @@ The raw `profile-result.json` files are real runner outputs. They intentionally
 - They do not prove production CDN asset availability; these were local dev-server runs.
 - They do not prove a reference/candidate release delta. The mix-change run uses pre-action/post-action snapshots inside one proof run, not a separate baseline deployment.
 - The ratchet-loop run does not prove that the loop primitive is mix-specific; `mix-level-search` is only this pack's first concrete strategy.
+- The ratchet-loop run does not prove that the supported candidate should be kept. Its ranking metric is a review-order hint, not a taste verdict.