npm - @ryuenn3123/agentic-senior-core - Versions diffs - 3.0.37 → 3.0.39 - Mend

@ryuenn3123/agentic-senior-core 3.0.37 → 3.0.39

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (66) hide show

package/.agent-context/prompts/bootstrap-design.md +109 -146
package/.agent-context/rules/frontend-architecture.md +92 -108
package/.agent-context/state/README.md +26 -0
package/.agent-context/state/architecture-map.md +32 -17
package/.agent-context/state/dependency-map.md +31 -22
package/.cursor/mcp.json +10 -0
package/.cursor/rules/agentic-senior-core.mdc +48 -0
package/.cursorrules +22 -88
package/.gemini/instructions.md +25 -16
package/.github/copilot-instructions.md +25 -16
package/.github/instructions/agentic-senior-core.instructions.md +47 -0
package/.instructions.md +98 -207
package/.windsurf/rules/agentic-senior-core.md +43 -0
package/.windsurfrules +22 -88
package/AGENTS.md +23 -26
package/CLAUDE.md +43 -0
package/CONTRIBUTING.md +7 -2
package/GEMINI.md +43 -0
package/README.md +25 -7
package/lib/cli/backup.mjs +4 -4
package/lib/cli/commands/init/project-context.mjs +101 -0
package/lib/cli/commands/init/runtime-environment.mjs +59 -0
package/lib/cli/commands/init/setup-decisions.mjs +83 -0
package/lib/cli/commands/init.mjs +33 -250
package/lib/cli/commands/optimize.mjs +1 -1
package/lib/cli/commands/upgrade.mjs +34 -16
package/lib/cli/compiler.mjs +59 -17
package/lib/cli/constants.mjs +5 -0
package/lib/cli/detector.mjs +4 -0
package/lib/cli/init-detection-flow.mjs +9 -1
package/lib/cli/init-selection.mjs +0 -5
package/lib/cli/preflight.mjs +3 -3
package/lib/cli/project-scaffolder/design-contract/validation.mjs +789 -0
package/lib/cli/project-scaffolder/design-contract.mjs +119 -924
package/lib/cli/project-scaffolder/prompt-builders.mjs +69 -84
package/lib/cli/project-scaffolder.mjs +0 -2
package/lib/cli/utils/filesystem.mjs +79 -0
package/lib/cli/utils/managed-surface.mjs +237 -0
package/lib/cli/utils/prompting.mjs +44 -0
package/lib/cli/utils.mjs +33 -335
package/package.json +21 -2
package/scripts/bump-version.mjs +15 -13
package/scripts/clean-local-artifacts.mjs +76 -0
package/scripts/docs-quality-drift-report.mjs +5 -0
package/scripts/frontend-usability-audit.mjs +23 -19
package/scripts/governance-weekly-report.mjs +37 -15
package/scripts/single-source-lazy-loading-audit.mjs +24 -0
package/scripts/sync-thin-adapters.mjs +99 -129
package/scripts/v3-purge-audit.mjs +5 -0
package/scripts/validate/config.mjs +10 -0
package/scripts/validate/coverage-checks.mjs +55 -0
package/scripts/validate.mjs +20 -0
package/.agent-context/marketplace/trust-tiers.json +0 -114
package/.agent-context/state/benchmark-analysis.json +0 -431
package/.agent-context/state/benchmark-evidence-bundle.json +0 -1040
package/.agent-context/state/benchmark-history.json +0 -75
package/.agent-context/state/benchmark-trend-report.csv +0 -5
package/.agent-context/state/benchmark-trend-report.json +0 -140
package/.agent-context/state/benchmark-writer-judge-matrix.json +0 -462
package/.agent-context/state/memory-continuity-benchmark.json +0 -132
package/.agent-context/state/onboarding-report.json +0 -102
package/.agent-context/state/quality-trend-report.json +0 -89
package/.agent-context/state/token-optimization-benchmark.json +0 -130
package/.agent-context/state/weekly-governance-report.json +0 -329
package/lib/cli/compatibility.mjs +0 -124
package/scripts/validate-evidence-bundle.mjs +0 -76

package/.agent-context/state/benchmark-history.json DELETED Viewed

@@ -1,75 +0,0 @@
-{
-  "generatedAt": "2026-04-17T03:20:15.400Z",
-  "reportName": "benchmark-history",
-  "maxEntries": 90,
-  "history": [
-    {
-      "generatedAt": "2026-04-17T02:54:01.239Z",
-      "releaseVersion": "2.0.26",
-      "fixtureCount": 12,
-      "top1Accuracy": 0.9167,
-      "manualCorrectionRate": 0.0833,
-      "benchmarkGatePassed": true,
-      "intelligencePassed": true,
-      "staleWatchlistCount": 0,
-      "reliabilityPassed": true,
-      "reliabilityRiskLevel": "monitor",
-      "incorrectDetectionRate": 0.0833,
-      "lowConfidenceRate": 0.0833,
-      "vulnerabilityTotal": null,
-      "criticalVulnerabilityCount": null,
-      "forbiddenContentPassed": true
-    },
-    {
-      "generatedAt": "2026-04-17T02:54:57.419Z",
-      "releaseVersion": "2.0.26",
-      "fixtureCount": 12,
-      "top1Accuracy": 0.9167,
-      "manualCorrectionRate": 0.0833,
-      "benchmarkGatePassed": true,
-      "intelligencePassed": true,
-      "staleWatchlistCount": 0,
-      "reliabilityPassed": true,
-      "reliabilityRiskLevel": "monitor",
-      "incorrectDetectionRate": 0.0833,
-      "lowConfidenceRate": 0.0833,
-      "vulnerabilityTotal": null,
-      "criticalVulnerabilityCount": null,
-      "forbiddenContentPassed": true
-    },
-    {
-      "generatedAt": "2026-04-17T03:19:31.047Z",
-      "releaseVersion": "2.0.26",
-      "fixtureCount": 12,
-      "top1Accuracy": 0.9167,
-      "manualCorrectionRate": 0.0833,
-      "benchmarkGatePassed": true,
-      "intelligencePassed": true,
-      "staleWatchlistCount": 0,
-      "reliabilityPassed": true,
-      "reliabilityRiskLevel": "monitor",
-      "incorrectDetectionRate": 0.0833,
-      "lowConfidenceRate": 0.0833,
-      "vulnerabilityTotal": null,
-      "criticalVulnerabilityCount": null,
-      "forbiddenContentPassed": true
-    },
-    {
-      "generatedAt": "2026-04-17T03:20:15.400Z",
-      "releaseVersion": "2.0.26",
-      "fixtureCount": 12,
-      "top1Accuracy": 0.9167,
-      "manualCorrectionRate": 0.0833,
-      "benchmarkGatePassed": true,
-      "intelligencePassed": true,
-      "staleWatchlistCount": 0,
-      "reliabilityPassed": true,
-      "reliabilityRiskLevel": "monitor",
-      "incorrectDetectionRate": 0.0833,
-      "lowConfidenceRate": 0.0833,
-      "vulnerabilityTotal": null,
-      "criticalVulnerabilityCount": null,
-      "forbiddenContentPassed": true
-    }
-  ]
-}

package/.agent-context/state/benchmark-trend-report.csv DELETED Viewed

@@ -1,5 +0,0 @@
-snapshotIndex,generatedAt,releaseVersion,top1Accuracy,manualCorrectionRate,incorrectDetectionRate,lowConfidenceRate,staleWatchlistCount,vulnerabilityTotal,criticalVulnerabilityCount,benchmarkGatePassed,intelligencePassed,reliabilityPassed,reliabilityRiskLevel
-"1","2026-04-17T02:54:01.239Z","2.0.26","0.9167","0.0833","0.0833","0.0833","0",,,"true","true","true","monitor"
-"2","2026-04-17T02:54:57.419Z","2.0.26","0.9167","0.0833","0.0833","0.0833","0",,,"true","true","true","monitor"
-"3","2026-04-17T03:19:31.047Z","2.0.26","0.9167","0.0833","0.0833","0.0833","0",,,"true","true","true","monitor"
-"4","2026-04-17T03:20:15.400Z","2.0.26","0.9167","0.0833","0.0833","0.0833","0",,,"true","true","true","monitor"

package/.agent-context/state/benchmark-trend-report.json DELETED Viewed

@@ -1,140 +0,0 @@
-{
-  "generatedAt": "2026-04-17T03:20:15.400Z",
-  "reportName": "benchmark-trend-report",
-  "releaseVersion": "2.0.26",
-  "historyCount": 4,
-  "releaseDelta": {
-    "currentReleaseVersion": "2.0.26",
-    "previousReleaseVersion": "2.0.26",
-    "comparedSnapshot": {
-      "currentGeneratedAt": "2026-04-17T03:20:15.400Z",
-      "previousGeneratedAt": "2026-04-17T03:19:31.047Z"
-    },
-    "top1AccuracyDelta": 0,
-    "manualCorrectionRateDelta": 0,
-    "staleWatchlistCountDelta": 0,
-    "vulnerabilityTotalDelta": 0,
-    "summary": [
-      "top1Accuracy: +0",
-      "manualCorrectionRate: +0",
-      "staleWatchlistCount: +0",
-      "vulnerabilityTotal: +0"
-    ]
-  },
-  "trendTable": [
-    {
-      "snapshotIndex": 1,
-      "generatedAt": "2026-04-17T02:54:01.239Z",
-      "releaseVersion": "2.0.26",
-      "top1Accuracy": 0.9167,
-      "manualCorrectionRate": 0.0833,
-      "incorrectDetectionRate": 0.0833,
-      "lowConfidenceRate": 0.0833,
-      "staleWatchlistCount": 0,
-      "vulnerabilityTotal": null,
-      "criticalVulnerabilityCount": null,
-      "benchmarkGatePassed": true,
-      "intelligencePassed": true,
-      "reliabilityPassed": true,
-      "reliabilityRiskLevel": "monitor"
-    },
-    {
-      "snapshotIndex": 2,
-      "generatedAt": "2026-04-17T02:54:57.419Z",
-      "releaseVersion": "2.0.26",
-      "top1Accuracy": 0.9167,
-      "manualCorrectionRate": 0.0833,
-      "incorrectDetectionRate": 0.0833,
-      "lowConfidenceRate": 0.0833,
-      "staleWatchlistCount": 0,
-      "vulnerabilityTotal": null,
-      "criticalVulnerabilityCount": null,
-      "benchmarkGatePassed": true,
-      "intelligencePassed": true,
-      "reliabilityPassed": true,
-      "reliabilityRiskLevel": "monitor"
-    },
-    {
-      "snapshotIndex": 3,
-      "generatedAt": "2026-04-17T03:19:31.047Z",
-      "releaseVersion": "2.0.26",
-      "top1Accuracy": 0.9167,
-      "manualCorrectionRate": 0.0833,
-      "incorrectDetectionRate": 0.0833,
-      "lowConfidenceRate": 0.0833,
-      "staleWatchlistCount": 0,
-      "vulnerabilityTotal": null,
-      "criticalVulnerabilityCount": null,
-      "benchmarkGatePassed": true,
-      "intelligencePassed": true,
-      "reliabilityPassed": true,
-      "reliabilityRiskLevel": "monitor"
-    },
-    {
-      "snapshotIndex": 4,
-      "generatedAt": "2026-04-17T03:20:15.400Z",
-      "releaseVersion": "2.0.26",
-      "top1Accuracy": 0.9167,
-      "manualCorrectionRate": 0.0833,
-      "incorrectDetectionRate": 0.0833,
-      "lowConfidenceRate": 0.0833,
-      "staleWatchlistCount": 0,
-      "vulnerabilityTotal": null,
-      "criticalVulnerabilityCount": null,
-      "benchmarkGatePassed": true,
-      "intelligencePassed": true,
-      "reliabilityPassed": true,
-      "reliabilityRiskLevel": "monitor"
-    }
-  ],
-  "chartSeries": {
-    "generatedAt": [
-      "2026-04-17T02:54:01.239Z",
-      "2026-04-17T02:54:57.419Z",
-      "2026-04-17T03:19:31.047Z",
-      "2026-04-17T03:20:15.400Z"
-    ],
-    "top1Accuracy": [
-      0.9167,
-      0.9167,
-      0.9167,
-      0.9167
-    ],
-    "manualCorrectionRate": [
-      0.0833,
-      0.0833,
-      0.0833,
-      0.0833
-    ],
-    "incorrectDetectionRate": [
-      0.0833,
-      0.0833,
-      0.0833,
-      0.0833
-    ],
-    "lowConfidenceRate": [
-      0.0833,
-      0.0833,
-      0.0833,
-      0.0833
-    ],
-    "staleWatchlistCount": [
-      0,
-      0,
-      0,
-      0
-    ],
-    "vulnerabilityTotal": [
-      null,
-      null,
-      null,
-      null
-    ]
-  },
-  "artifacts": {
-    "historyPath": ".agent-context/state/benchmark-history.json",
-    "jsonPath": ".agent-context/state/benchmark-trend-report.json",
-    "csvPath": ".agent-context/state/benchmark-trend-report.csv",
-    "writeMode": "stdout-and-file"
-  }
-}

package/.agent-context/state/benchmark-writer-judge-matrix.json DELETED Viewed

@@ -1,462 +0,0 @@
-{
-  "generatedAt": "2026-04-14T06:57:14.623Z",
-  "reportName": "benchmark-writer-judge-matrix",
-  "phase": "v2.5.1",
-  "passed": true,
-  "failureCount": 0,
-  "methodology": {
-    "blindReviewMode": true,
-    "writerLaneModelCount": 3,
-    "judgeLaneModelCount": 2,
-    "scenarioCount": 4,
-    "writerWeights": {
-      "quality": 40,
-      "efficiency": 20,
-      "reliability": 25,
-      "freshness": 15
-    },
-    "judgeWeights": {
-      "clarity": 35,
-      "correctness": 35,
-      "risk": 20,
-      "consistency": 10
-    }
-  },
-  "coreSignals": {
-    "top1Accuracy": 0.9167,
-    "manualCorrectionRate": 0.0833,
-    "nativeSavingsPercent": 81.52,
-    "benchmarkGatePassed": true,
-    "benchmarkGateFailureCount": 0,
-    "intelligenceFailureCount": 0,
-    "staleWatchlistCount": 0,
-    "top1AccuracyMet": true,
-    "manualCorrectionMet": true
-  },
-  "writerDirectory": [
-    {
-      "writerToken": "W1",
-      "writerModel": {
-        "id": "writer-copilot-balanced",
-        "provider": "github-copilot",
-        "profile": "balanced"
-      },
-      "averageCompositeScore": 93.7
-    },
-    {
-      "writerToken": "W2",
-      "writerModel": {
-        "id": "writer-claude-architect",
-        "provider": "anthropic",
-        "profile": "architect"
-      },
-      "averageCompositeScore": 92.8
-    },
-    {
-      "writerToken": "W3",
-      "writerModel": {
-        "id": "writer-gemini-ops",
-        "provider": "google",
-        "profile": "operations"
-      },
-      "averageCompositeScore": 92.65
-    }
-  ],
-  "comparisonMatrix": [
-    {
-      "scenarioId": "planning",
-      "scenarioCategory": "planning",
-      "writerToken": "W1",
-      "writerModelId": null,
-      "judgeModelId": "judge-claude-audit",
-      "blindPairId": "planning:W1:judge-claude-audit",
-      "writerCompositeScore": 92.12,
-      "judgeCompositeScore": 94.12,
-      "scoreThreshold": 75,
-      "leniencyWindow": 2,
-      "meetsScoreThreshold": true,
-      "meetsCoreSignals": true,
-      "verdict": "pass"
-    },
-    {
-      "scenarioId": "planning",
-      "scenarioCategory": "planning",
-      "writerToken": "W1",
-      "writerModelId": null,
-      "judgeModelId": "judge-gpt-risk",
-      "blindPairId": "planning:W1:judge-gpt-risk",
-      "writerCompositeScore": 92.12,
-      "judgeCompositeScore": 94.12,
-      "scoreThreshold": 75,
-      "leniencyWindow": 2,
-      "meetsScoreThreshold": true,
-      "meetsCoreSignals": true,
-      "verdict": "pass"
-    },
-    {
-      "scenarioId": "refactor",
-      "scenarioCategory": "refactor",
-      "writerToken": "W1",
-      "writerModelId": null,
-      "judgeModelId": "judge-claude-audit",
-      "blindPairId": "refactor:W1:judge-claude-audit",
-      "writerCompositeScore": 95.26,
-      "judgeCompositeScore": 93.26,
-      "scoreThreshold": 75,
-      "leniencyWindow": 2,
-      "meetsScoreThreshold": true,
-      "meetsCoreSignals": true,
-      "verdict": "pass"
-    },
-    {
-      "scenarioId": "refactor",
-      "scenarioCategory": "refactor",
-      "writerToken": "W1",
-      "writerModelId": null,
-      "judgeModelId": "judge-gpt-risk",
-      "blindPairId": "refactor:W1:judge-gpt-risk",
-      "writerCompositeScore": 95.26,
-      "judgeCompositeScore": 93.26,
-      "scoreThreshold": 75,
-      "leniencyWindow": 2,
-      "meetsScoreThreshold": true,
-      "meetsCoreSignals": true,
-      "verdict": "pass"
-    },
-    {
-      "scenarioId": "security",
-      "scenarioCategory": "security",
-      "writerToken": "W1",
-      "writerModelId": null,
-      "judgeModelId": "judge-claude-audit",
-      "blindPairId": "security:W1:judge-claude-audit",
-      "writerCompositeScore": 94.42,
-      "judgeCompositeScore": 92.42,
-      "scoreThreshold": 75,
-      "leniencyWindow": 2,
-      "meetsScoreThreshold": true,
-      "meetsCoreSignals": true,
-      "verdict": "pass"
-    },
-    {
-      "scenarioId": "security",
-      "scenarioCategory": "security",
-      "writerToken": "W1",
-      "writerModelId": null,
-      "judgeModelId": "judge-gpt-risk",
-      "blindPairId": "security:W1:judge-gpt-risk",
-      "writerCompositeScore": 94.42,
-      "judgeCompositeScore": 93.42,
-      "scoreThreshold": 75,
-      "leniencyWindow": 2,
-      "meetsScoreThreshold": true,
-      "meetsCoreSignals": true,
-      "verdict": "pass"
-    },
-    {
-      "scenarioId": "delivery",
-      "scenarioCategory": "delivery",
-      "writerToken": "W1",
-      "writerModelId": null,
-      "judgeModelId": "judge-claude-audit",
-      "blindPairId": "delivery:W1:judge-claude-audit",
-      "writerCompositeScore": 92.99,
-      "judgeCompositeScore": 93.99,
-      "scoreThreshold": 75,
-      "leniencyWindow": 2,
-      "meetsScoreThreshold": true,
-      "meetsCoreSignals": true,
-      "verdict": "pass"
-    },
-    {
-      "scenarioId": "delivery",
-      "scenarioCategory": "delivery",
-      "writerToken": "W1",
-      "writerModelId": null,
-      "judgeModelId": "judge-gpt-risk",
-      "blindPairId": "delivery:W1:judge-gpt-risk",
-      "writerCompositeScore": 92.99,
-      "judgeCompositeScore": 92.99,
-      "scoreThreshold": 75,
-      "leniencyWindow": 2,
-      "meetsScoreThreshold": true,
-      "meetsCoreSignals": true,
-      "verdict": "pass"
-    },
-    {
-      "scenarioId": "planning",
-      "scenarioCategory": "planning",
-      "writerToken": "W2",
-      "writerModelId": null,
-      "judgeModelId": "judge-claude-audit",
-      "blindPairId": "planning:W2:judge-claude-audit",
-      "writerCompositeScore": 93.12,
-      "judgeCompositeScore": 94.12,
-      "scoreThreshold": 75,
-      "leniencyWindow": 2,
-      "meetsScoreThreshold": true,
-      "meetsCoreSignals": true,
-      "verdict": "pass"
-    },
-    {
-      "scenarioId": "planning",
-      "scenarioCategory": "planning",
-      "writerToken": "W2",
-      "writerModelId": null,
-      "judgeModelId": "judge-gpt-risk",
-      "blindPairId": "planning:W2:judge-gpt-risk",
-      "writerCompositeScore": 93.12,
-      "judgeCompositeScore": 94.12,
-      "scoreThreshold": 75,
-      "leniencyWindow": 2,
-      "meetsScoreThreshold": true,
-      "meetsCoreSignals": true,
-      "verdict": "pass"
-    },
-    {
-      "scenarioId": "refactor",
-      "scenarioCategory": "refactor",
-      "writerToken": "W2",
-      "writerModelId": null,
-      "judgeModelId": "judge-claude-audit",
-      "blindPairId": "refactor:W2:judge-claude-audit",
-      "writerCompositeScore": 93.06,
-      "judgeCompositeScore": 95.06,
-      "scoreThreshold": 75,
-      "leniencyWindow": 2,
-      "meetsScoreThreshold": true,
-      "meetsCoreSignals": true,
-      "verdict": "pass"
-    },
-    {
-      "scenarioId": "refactor",
-      "scenarioCategory": "refactor",
-      "writerToken": "W2",
-      "writerModelId": null,
-      "judgeModelId": "judge-gpt-risk",
-      "blindPairId": "refactor:W2:judge-gpt-risk",
-      "writerCompositeScore": 93.06,
-      "judgeCompositeScore": 95.06,
-      "scoreThreshold": 75,
-      "leniencyWindow": 2,
-      "meetsScoreThreshold": true,
-      "meetsCoreSignals": true,
-      "verdict": "pass"
-    },
-    {
-      "scenarioId": "security",
-      "scenarioCategory": "security",
-      "writerToken": "W2",
-      "writerModelId": null,
-      "judgeModelId": "judge-claude-audit",
-      "blindPairId": "security:W2:judge-claude-audit",
-      "writerCompositeScore": 91.82,
-      "judgeCompositeScore": 90.82,
-      "scoreThreshold": 75,
-      "leniencyWindow": 2,
-      "meetsScoreThreshold": true,
-      "meetsCoreSignals": true,
-      "verdict": "pass"
-    },
-    {
-      "scenarioId": "security",
-      "scenarioCategory": "security",
-      "writerToken": "W2",
-      "writerModelId": null,
-      "judgeModelId": "judge-gpt-risk",
-      "blindPairId": "security:W2:judge-gpt-risk",
-      "writerCompositeScore": 91.82,
-      "judgeCompositeScore": 89.82,
-      "scoreThreshold": 75,
-      "leniencyWindow": 2,
-      "meetsScoreThreshold": true,
-      "meetsCoreSignals": true,
-      "verdict": "pass"
-    },
-    {
-      "scenarioId": "delivery",
-      "scenarioCategory": "delivery",
-      "writerToken": "W2",
-      "writerModelId": null,
-      "judgeModelId": "judge-claude-audit",
-      "blindPairId": "delivery:W2:judge-claude-audit",
-      "writerCompositeScore": 93.19,
-      "judgeCompositeScore": 93.19,
-      "scoreThreshold": 75,
-      "leniencyWindow": 2,
-      "meetsScoreThreshold": true,
-      "meetsCoreSignals": true,
-      "verdict": "pass"
-    },
-    {
-      "scenarioId": "delivery",
-      "scenarioCategory": "delivery",
-      "writerToken": "W2",
-      "writerModelId": null,
-      "judgeModelId": "judge-gpt-risk",
-      "blindPairId": "delivery:W2:judge-gpt-risk",
-      "writerCompositeScore": 93.19,
-      "judgeCompositeScore": 94.19,
-      "scoreThreshold": 75,
-      "leniencyWindow": 2,
-      "meetsScoreThreshold": true,
-      "meetsCoreSignals": true,
-      "verdict": "pass"
-    },
-    {
-      "scenarioId": "planning",
-      "scenarioCategory": "planning",
-      "writerToken": "W3",
-      "writerModelId": null,
-      "judgeModelId": "judge-claude-audit",
-      "blindPairId": "planning:W3:judge-claude-audit",
-      "writerCompositeScore": 93.27,
-      "judgeCompositeScore": 93.27,
-      "scoreThreshold": 75,
-      "leniencyWindow": 2,
-      "meetsScoreThreshold": true,
-      "meetsCoreSignals": true,
-      "verdict": "pass"
-    },
-    {
-      "scenarioId": "planning",
-      "scenarioCategory": "planning",
-      "writerToken": "W3",
-      "writerModelId": null,
-      "judgeModelId": "judge-gpt-risk",
-      "blindPairId": "planning:W3:judge-gpt-risk",
-      "writerCompositeScore": 93.27,
-      "judgeCompositeScore": 93.27,
-      "scoreThreshold": 75,
-      "leniencyWindow": 2,
-      "meetsScoreThreshold": true,
-      "meetsCoreSignals": true,
-      "verdict": "pass"
-    },
-    {
-      "scenarioId": "refactor",
-      "scenarioCategory": "refactor",
-      "writerToken": "W3",
-      "writerModelId": null,
-      "judgeModelId": "judge-claude-audit",
-      "blindPairId": "refactor:W3:judge-claude-audit",
-      "writerCompositeScore": 94.01,
-      "judgeCompositeScore": 95.01,
-      "scoreThreshold": 75,
-      "leniencyWindow": 2,
-      "meetsScoreThreshold": true,
-      "meetsCoreSignals": true,
-      "verdict": "pass"
-    },
-    {
-      "scenarioId": "refactor",
-      "scenarioCategory": "refactor",
-      "writerToken": "W3",
-      "writerModelId": null,
-      "judgeModelId": "judge-gpt-risk",
-      "blindPairId": "refactor:W3:judge-gpt-risk",
-      "writerCompositeScore": 94.01,
-      "judgeCompositeScore": 95.01,
-      "scoreThreshold": 75,
-      "leniencyWindow": 2,
-      "meetsScoreThreshold": true,
-      "meetsCoreSignals": true,
-      "verdict": "pass"
-    },
-    {
-      "scenarioId": "security",
-      "scenarioCategory": "security",
-      "writerToken": "W3",
-      "writerModelId": null,
-      "judgeModelId": "judge-claude-audit",
-      "blindPairId": "security:W3:judge-claude-audit",
-      "writerCompositeScore": 92.37,
-      "judgeCompositeScore": 92.37,
-      "scoreThreshold": 75,
-      "leniencyWindow": 2,
-      "meetsScoreThreshold": true,
-      "meetsCoreSignals": true,
-      "verdict": "pass"
-    },
-    {
-      "scenarioId": "security",
-      "scenarioCategory": "security",
-      "writerToken": "W3",
-      "writerModelId": null,
-      "judgeModelId": "judge-gpt-risk",
-      "blindPairId": "security:W3:judge-gpt-risk",
-      "writerCompositeScore": 92.37,
-      "judgeCompositeScore": 94.37,
-      "scoreThreshold": 75,
-      "leniencyWindow": 2,
-      "meetsScoreThreshold": true,
-      "meetsCoreSignals": true,
-      "verdict": "pass"
-    },
-    {
-      "scenarioId": "delivery",
-      "scenarioCategory": "delivery",
-      "writerToken": "W3",
-      "writerModelId": null,
-      "judgeModelId": "judge-claude-audit",
-      "blindPairId": "delivery:W3:judge-claude-audit",
-      "writerCompositeScore": 90.94,
-      "judgeCompositeScore": 89.94,
-      "scoreThreshold": 75,
-      "leniencyWindow": 2,
-      "meetsScoreThreshold": true,
-      "meetsCoreSignals": true,
-      "verdict": "pass"
-    },
-    {
-      "scenarioId": "delivery",
-      "scenarioCategory": "delivery",
-      "writerToken": "W3",
-      "writerModelId": null,
-      "judgeModelId": "judge-gpt-risk",
-      "blindPairId": "delivery:W3:judge-gpt-risk",
-      "writerCompositeScore": 90.94,
-      "judgeCompositeScore": 92.94,
-      "scoreThreshold": 75,
-      "leniencyWindow": 2,
-      "meetsScoreThreshold": true,
-      "meetsCoreSignals": true,
-      "verdict": "pass"
-    }
-  ],
-  "summary": {
-    "passCount": 24,
-    "failCount": 0,
-    "passRatePercent": 100
-  },
-  "executions": [
-    {
-      "scriptPath": "scripts/detection-benchmark.mjs",
-      "exitCode": 0,
-      "parseError": null,
-      "reportName": null,
-      "passed": null
-    },
-    {
-      "scriptPath": "scripts/token-optimization-benchmark.mjs",
-      "exitCode": 0,
-      "parseError": null,
-      "reportName": "token-optimization-benchmark",
-      "passed": null
-    },
-    {
-      "scriptPath": "scripts/benchmark-gate.mjs",
-      "exitCode": 0,
-      "parseError": null,
-      "reportName": "benchmark-gate",
-      "passed": true
-    },
-    {
-      "scriptPath": "scripts/benchmark-intelligence.mjs",
-      "exitCode": 0,
-      "parseError": null,
-      "reportName": "benchmark-intelligence",
-      "passed": true
-    }
-  ]
-}