@vibecheckai/cli 3.5.0 → 3.5.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (326) hide show
  1. package/bin/registry.js +174 -449
  2. package/bin/runners/cli-utils.js +33 -2
  3. package/bin/runners/context/generators/cursor.js +2 -49
  4. package/bin/runners/context/generators/mcp.js +13 -15
  5. package/bin/runners/context/proof-context.js +1 -248
  6. package/bin/runners/lib/analysis-core.js +180 -198
  7. package/bin/runners/lib/analyzers.js +241 -2212
  8. package/bin/runners/lib/cli-output.js +210 -242
  9. package/bin/runners/lib/detectors-v2.js +785 -547
  10. package/bin/runners/lib/entitlements-v2.js +431 -161
  11. package/bin/runners/lib/error-handler.js +9 -16
  12. package/bin/runners/lib/global-flags.js +0 -37
  13. package/bin/runners/lib/html-proof-report.js +700 -350
  14. package/bin/runners/lib/missions/plan.js +6 -46
  15. package/bin/runners/lib/missions/templates.js +0 -232
  16. package/bin/runners/lib/route-truth.js +322 -1167
  17. package/bin/runners/lib/scan-output.js +467 -493
  18. package/bin/runners/lib/ship-output.js +27 -280
  19. package/bin/runners/lib/terminal-ui.js +700 -310
  20. package/bin/runners/lib/truth.js +321 -1004
  21. package/bin/runners/lib/unified-output.js +158 -162
  22. package/bin/runners/lib/upsell.js +204 -104
  23. package/bin/runners/runAIAgent.js +10 -5
  24. package/bin/runners/runAllowlist.js +324 -0
  25. package/bin/runners/runAuth.js +94 -344
  26. package/bin/runners/runCheckpoint.js +45 -43
  27. package/bin/runners/runContext.js +24 -139
  28. package/bin/runners/runDoctor.js +101 -136
  29. package/bin/runners/runEvidencePack.js +219 -0
  30. package/bin/runners/runFix.js +71 -82
  31. package/bin/runners/runGuard.js +119 -606
  32. package/bin/runners/runInit.js +60 -22
  33. package/bin/runners/runInstall.js +281 -0
  34. package/bin/runners/runLabs.js +341 -0
  35. package/bin/runners/runMcp.js +62 -139
  36. package/bin/runners/runPolish.js +83 -282
  37. package/bin/runners/runPromptFirewall.js +12 -5
  38. package/bin/runners/runProve.js +58 -33
  39. package/bin/runners/runReality.js +58 -81
  40. package/bin/runners/runReport.js +7 -34
  41. package/bin/runners/runRuntime.js +8 -5
  42. package/bin/runners/runScan.js +844 -219
  43. package/bin/runners/runShip.js +59 -721
  44. package/bin/runners/runValidate.js +11 -24
  45. package/bin/runners/runWatch.js +76 -131
  46. package/bin/vibecheck.js +69 -295
  47. package/mcp-server/ARCHITECTURE.md +339 -0
  48. package/mcp-server/__tests__/cache.test.ts +313 -0
  49. package/mcp-server/__tests__/executor.test.ts +239 -0
  50. package/mcp-server/__tests__/fixtures/exclusion-test/.cache/webpack/cache.pack +1 -0
  51. package/mcp-server/__tests__/fixtures/exclusion-test/.next/server/chunk.js +3 -0
  52. package/mcp-server/__tests__/fixtures/exclusion-test/.turbo/cache.json +3 -0
  53. package/mcp-server/__tests__/fixtures/exclusion-test/.venv/lib/env.py +3 -0
  54. package/mcp-server/__tests__/fixtures/exclusion-test/dist/bundle.js +3 -0
  55. package/mcp-server/__tests__/fixtures/exclusion-test/package.json +5 -0
  56. package/mcp-server/__tests__/fixtures/exclusion-test/src/app.ts +5 -0
  57. package/mcp-server/__tests__/fixtures/exclusion-test/venv/lib/config.py +4 -0
  58. package/mcp-server/__tests__/ids.test.ts +345 -0
  59. package/mcp-server/__tests__/integration/tools.test.ts +410 -0
  60. package/mcp-server/__tests__/registry.test.ts +365 -0
  61. package/mcp-server/__tests__/sandbox.test.ts +323 -0
  62. package/mcp-server/__tests__/schemas.test.ts +372 -0
  63. package/mcp-server/benchmarks/run-benchmarks.ts +304 -0
  64. package/mcp-server/examples/doctor.request.json +14 -0
  65. package/mcp-server/examples/doctor.response.json +53 -0
  66. package/mcp-server/examples/error.response.json +15 -0
  67. package/mcp-server/examples/scan.request.json +14 -0
  68. package/mcp-server/examples/scan.response.json +108 -0
  69. package/mcp-server/handlers/tool-handler.ts +671 -0
  70. package/mcp-server/index-v1.js +698 -0
  71. package/mcp-server/index-v3.ts +293 -0
  72. package/mcp-server/index.js +1080 -1757
  73. package/mcp-server/index.old.js +4137 -0
  74. package/mcp-server/lib/cache.ts +341 -0
  75. package/mcp-server/lib/errors.ts +346 -0
  76. package/mcp-server/lib/executor.ts +792 -0
  77. package/mcp-server/lib/ids.ts +238 -0
  78. package/mcp-server/lib/logger.ts +368 -0
  79. package/mcp-server/lib/metrics.ts +365 -0
  80. package/mcp-server/lib/sandbox.ts +337 -0
  81. package/mcp-server/lib/validator.ts +229 -0
  82. package/mcp-server/package-lock.json +165 -0
  83. package/mcp-server/package.json +32 -7
  84. package/mcp-server/premium-tools.js +2 -2
  85. package/mcp-server/registry/tools.json +476 -0
  86. package/mcp-server/schemas/error-envelope.schema.json +125 -0
  87. package/mcp-server/schemas/finding.schema.json +167 -0
  88. package/mcp-server/schemas/report-artifact.schema.json +88 -0
  89. package/mcp-server/schemas/run-request.schema.json +75 -0
  90. package/mcp-server/schemas/verdict.schema.json +168 -0
  91. package/mcp-server/tier-auth.d.ts +71 -0
  92. package/mcp-server/tier-auth.js +371 -183
  93. package/mcp-server/truth-context.js +90 -131
  94. package/mcp-server/truth-firewall-tools.js +1000 -1611
  95. package/mcp-server/tsconfig.json +34 -0
  96. package/mcp-server/vibecheck-tools.js +2 -2
  97. package/mcp-server/vitest.config.ts +16 -0
  98. package/package.json +3 -4
  99. package/bin/runners/lib/agent-firewall/ai/false-positive-analyzer.js +0 -474
  100. package/bin/runners/lib/agent-firewall/change-packet/builder.js +0 -488
  101. package/bin/runners/lib/agent-firewall/change-packet/schema.json +0 -228
  102. package/bin/runners/lib/agent-firewall/change-packet/store.js +0 -200
  103. package/bin/runners/lib/agent-firewall/claims/claim-types.js +0 -21
  104. package/bin/runners/lib/agent-firewall/claims/extractor.js +0 -303
  105. package/bin/runners/lib/agent-firewall/claims/patterns.js +0 -24
  106. package/bin/runners/lib/agent-firewall/critic/index.js +0 -151
  107. package/bin/runners/lib/agent-firewall/critic/judge.js +0 -432
  108. package/bin/runners/lib/agent-firewall/critic/prompts.js +0 -305
  109. package/bin/runners/lib/agent-firewall/evidence/auth-evidence.js +0 -88
  110. package/bin/runners/lib/agent-firewall/evidence/contract-evidence.js +0 -75
  111. package/bin/runners/lib/agent-firewall/evidence/env-evidence.js +0 -127
  112. package/bin/runners/lib/agent-firewall/evidence/resolver.js +0 -102
  113. package/bin/runners/lib/agent-firewall/evidence/route-evidence.js +0 -213
  114. package/bin/runners/lib/agent-firewall/evidence/side-effect-evidence.js +0 -145
  115. package/bin/runners/lib/agent-firewall/fs-hook/daemon.js +0 -19
  116. package/bin/runners/lib/agent-firewall/fs-hook/installer.js +0 -87
  117. package/bin/runners/lib/agent-firewall/fs-hook/watcher.js +0 -184
  118. package/bin/runners/lib/agent-firewall/git-hook/pre-commit.js +0 -163
  119. package/bin/runners/lib/agent-firewall/ide-extension/cursor.js +0 -107
  120. package/bin/runners/lib/agent-firewall/ide-extension/vscode.js +0 -68
  121. package/bin/runners/lib/agent-firewall/ide-extension/windsurf.js +0 -66
  122. package/bin/runners/lib/agent-firewall/interceptor/base.js +0 -304
  123. package/bin/runners/lib/agent-firewall/interceptor/cursor.js +0 -35
  124. package/bin/runners/lib/agent-firewall/interceptor/vscode.js +0 -35
  125. package/bin/runners/lib/agent-firewall/interceptor/windsurf.js +0 -34
  126. package/bin/runners/lib/agent-firewall/lawbook/distributor.js +0 -465
  127. package/bin/runners/lib/agent-firewall/lawbook/evaluator.js +0 -604
  128. package/bin/runners/lib/agent-firewall/lawbook/index.js +0 -304
  129. package/bin/runners/lib/agent-firewall/lawbook/registry.js +0 -514
  130. package/bin/runners/lib/agent-firewall/lawbook/schema.js +0 -420
  131. package/bin/runners/lib/agent-firewall/learning/learning-engine.js +0 -849
  132. package/bin/runners/lib/agent-firewall/logger.js +0 -141
  133. package/bin/runners/lib/agent-firewall/policy/default-policy.json +0 -90
  134. package/bin/runners/lib/agent-firewall/policy/engine.js +0 -103
  135. package/bin/runners/lib/agent-firewall/policy/loader.js +0 -451
  136. package/bin/runners/lib/agent-firewall/policy/rules/auth-drift.js +0 -50
  137. package/bin/runners/lib/agent-firewall/policy/rules/contract-drift.js +0 -50
  138. package/bin/runners/lib/agent-firewall/policy/rules/fake-success.js +0 -86
  139. package/bin/runners/lib/agent-firewall/policy/rules/ghost-env.js +0 -162
  140. package/bin/runners/lib/agent-firewall/policy/rules/ghost-route.js +0 -189
  141. package/bin/runners/lib/agent-firewall/policy/rules/scope.js +0 -93
  142. package/bin/runners/lib/agent-firewall/policy/rules/unsafe-side-effect.js +0 -57
  143. package/bin/runners/lib/agent-firewall/policy/schema.json +0 -183
  144. package/bin/runners/lib/agent-firewall/policy/verdict.js +0 -54
  145. package/bin/runners/lib/agent-firewall/proposal/extractor.js +0 -394
  146. package/bin/runners/lib/agent-firewall/proposal/index.js +0 -212
  147. package/bin/runners/lib/agent-firewall/proposal/schema.js +0 -251
  148. package/bin/runners/lib/agent-firewall/proposal/validator.js +0 -386
  149. package/bin/runners/lib/agent-firewall/reality/index.js +0 -332
  150. package/bin/runners/lib/agent-firewall/reality/state.js +0 -625
  151. package/bin/runners/lib/agent-firewall/reality/watcher.js +0 -322
  152. package/bin/runners/lib/agent-firewall/risk/index.js +0 -173
  153. package/bin/runners/lib/agent-firewall/risk/scorer.js +0 -328
  154. package/bin/runners/lib/agent-firewall/risk/thresholds.js +0 -321
  155. package/bin/runners/lib/agent-firewall/risk/vectors.js +0 -421
  156. package/bin/runners/lib/agent-firewall/simulator/diff-simulator.js +0 -472
  157. package/bin/runners/lib/agent-firewall/simulator/import-resolver.js +0 -346
  158. package/bin/runners/lib/agent-firewall/simulator/index.js +0 -181
  159. package/bin/runners/lib/agent-firewall/simulator/route-validator.js +0 -380
  160. package/bin/runners/lib/agent-firewall/time-machine/incident-correlator.js +0 -661
  161. package/bin/runners/lib/agent-firewall/time-machine/index.js +0 -267
  162. package/bin/runners/lib/agent-firewall/time-machine/replay-engine.js +0 -436
  163. package/bin/runners/lib/agent-firewall/time-machine/state-reconstructor.js +0 -490
  164. package/bin/runners/lib/agent-firewall/time-machine/timeline-builder.js +0 -530
  165. package/bin/runners/lib/agent-firewall/truthpack/index.js +0 -67
  166. package/bin/runners/lib/agent-firewall/truthpack/loader.js +0 -137
  167. package/bin/runners/lib/agent-firewall/unblock/planner.js +0 -337
  168. package/bin/runners/lib/agent-firewall/utils/ignore-checker.js +0 -118
  169. package/bin/runners/lib/api-client.js +0 -269
  170. package/bin/runners/lib/audit-logger.js +0 -532
  171. package/bin/runners/lib/authority/authorities/architecture.js +0 -364
  172. package/bin/runners/lib/authority/authorities/compliance.js +0 -341
  173. package/bin/runners/lib/authority/authorities/human.js +0 -343
  174. package/bin/runners/lib/authority/authorities/quality.js +0 -420
  175. package/bin/runners/lib/authority/authorities/security.js +0 -228
  176. package/bin/runners/lib/authority/index.js +0 -293
  177. package/bin/runners/lib/authority-badge.js +0 -425
  178. package/bin/runners/lib/bundle/bundle-intelligence.js +0 -846
  179. package/bin/runners/lib/cli-charts.js +0 -368
  180. package/bin/runners/lib/cli-config-display.js +0 -405
  181. package/bin/runners/lib/cli-demo.js +0 -275
  182. package/bin/runners/lib/cli-errors.js +0 -438
  183. package/bin/runners/lib/cli-help-formatter.js +0 -439
  184. package/bin/runners/lib/cli-interactive-menu.js +0 -509
  185. package/bin/runners/lib/cli-prompts.js +0 -441
  186. package/bin/runners/lib/cli-scan-cards.js +0 -362
  187. package/bin/runners/lib/compliance-reporter.js +0 -710
  188. package/bin/runners/lib/conductor/index.js +0 -671
  189. package/bin/runners/lib/easy/README.md +0 -123
  190. package/bin/runners/lib/easy/index.js +0 -140
  191. package/bin/runners/lib/easy/interactive-wizard.js +0 -788
  192. package/bin/runners/lib/easy/one-click-firewall.js +0 -564
  193. package/bin/runners/lib/easy/zero-config-reality.js +0 -714
  194. package/bin/runners/lib/engines/accessibility-engine.js +0 -390
  195. package/bin/runners/lib/engines/api-consistency-engine.js +0 -467
  196. package/bin/runners/lib/engines/ast-cache.js +0 -99
  197. package/bin/runners/lib/engines/async-patterns-engine.js +0 -444
  198. package/bin/runners/lib/engines/bundle-size-engine.js +0 -433
  199. package/bin/runners/lib/engines/code-quality-engine.js +0 -255
  200. package/bin/runners/lib/engines/confidence-scoring.js +0 -276
  201. package/bin/runners/lib/engines/console-logs-engine.js +0 -115
  202. package/bin/runners/lib/engines/context-detection.js +0 -264
  203. package/bin/runners/lib/engines/cross-file-analysis-engine.js +0 -533
  204. package/bin/runners/lib/engines/database-patterns-engine.js +0 -429
  205. package/bin/runners/lib/engines/dead-code-engine.js +0 -198
  206. package/bin/runners/lib/engines/deprecated-api-engine.js +0 -226
  207. package/bin/runners/lib/engines/duplicate-code-engine.js +0 -354
  208. package/bin/runners/lib/engines/empty-catch-engine.js +0 -260
  209. package/bin/runners/lib/engines/env-variables-engine.js +0 -458
  210. package/bin/runners/lib/engines/error-handling-engine.js +0 -437
  211. package/bin/runners/lib/engines/false-positive-prevention.js +0 -630
  212. package/bin/runners/lib/engines/file-filter.js +0 -131
  213. package/bin/runners/lib/engines/framework-adapters/index.js +0 -607
  214. package/bin/runners/lib/engines/framework-detection.js +0 -508
  215. package/bin/runners/lib/engines/hardcoded-secrets-engine.js +0 -251
  216. package/bin/runners/lib/engines/import-order-engine.js +0 -429
  217. package/bin/runners/lib/engines/mock-data-engine.js +0 -315
  218. package/bin/runners/lib/engines/naming-conventions-engine.js +0 -544
  219. package/bin/runners/lib/engines/noise-reduction-engine.js +0 -452
  220. package/bin/runners/lib/engines/orchestrator.js +0 -334
  221. package/bin/runners/lib/engines/parallel-processor.js +0 -71
  222. package/bin/runners/lib/engines/performance-issues-engine.js +0 -405
  223. package/bin/runners/lib/engines/react-patterns-engine.js +0 -457
  224. package/bin/runners/lib/engines/security-vulnerabilities-engine.js +0 -571
  225. package/bin/runners/lib/engines/todo-fixme-engine.js +0 -115
  226. package/bin/runners/lib/engines/type-aware-engine.js +0 -376
  227. package/bin/runners/lib/engines/unsafe-regex-engine.js +0 -225
  228. package/bin/runners/lib/engines/vibecheck-engines/README.md +0 -53
  229. package/bin/runners/lib/engines/vibecheck-engines/index.js +0 -124
  230. package/bin/runners/lib/engines/vibecheck-engines/lib/ai-hallucination-engine.js +0 -806
  231. package/bin/runners/lib/engines/vibecheck-engines/lib/hardcoded-secrets-engine.js +0 -439
  232. package/bin/runners/lib/engines/vibecheck-engines/lib/smart-fix-engine.js +0 -577
  233. package/bin/runners/lib/engines/vibecheck-engines/lib/vibe-score-engine.js +0 -543
  234. package/bin/runners/lib/engines/vibecheck-engines/package.json +0 -13
  235. package/bin/runners/lib/engines/vibecheck-engines.js +0 -514
  236. package/bin/runners/lib/enhanced-features/index.js +0 -305
  237. package/bin/runners/lib/enhanced-output.js +0 -631
  238. package/bin/runners/lib/enterprise.js +0 -300
  239. package/bin/runners/lib/exit-codes.js +0 -275
  240. package/bin/runners/lib/fingerprint.js +0 -377
  241. package/bin/runners/lib/firewall/command-validator.js +0 -351
  242. package/bin/runners/lib/firewall/config.js +0 -341
  243. package/bin/runners/lib/firewall/content-validator.js +0 -519
  244. package/bin/runners/lib/firewall/index.js +0 -101
  245. package/bin/runners/lib/firewall/path-validator.js +0 -256
  246. package/bin/runners/lib/help-formatter.js +0 -413
  247. package/bin/runners/lib/intelligence/cross-repo-intelligence.js +0 -817
  248. package/bin/runners/lib/logger.js +0 -38
  249. package/bin/runners/lib/mcp-utils.js +0 -425
  250. package/bin/runners/lib/output/index.js +0 -1022
  251. package/bin/runners/lib/policy-engine.js +0 -652
  252. package/bin/runners/lib/polish/autofix/accessibility-fixes.js +0 -333
  253. package/bin/runners/lib/polish/autofix/async-handlers.js +0 -273
  254. package/bin/runners/lib/polish/autofix/dead-code.js +0 -280
  255. package/bin/runners/lib/polish/autofix/imports-optimizer.js +0 -344
  256. package/bin/runners/lib/polish/autofix/index.js +0 -200
  257. package/bin/runners/lib/polish/autofix/remove-consoles.js +0 -209
  258. package/bin/runners/lib/polish/autofix/strengthen-types.js +0 -245
  259. package/bin/runners/lib/polish/backend-checks.js +0 -148
  260. package/bin/runners/lib/polish/documentation-checks.js +0 -111
  261. package/bin/runners/lib/polish/frontend-checks.js +0 -168
  262. package/bin/runners/lib/polish/index.js +0 -71
  263. package/bin/runners/lib/polish/infrastructure-checks.js +0 -131
  264. package/bin/runners/lib/polish/library-detection.js +0 -175
  265. package/bin/runners/lib/polish/performance-checks.js +0 -100
  266. package/bin/runners/lib/polish/security-checks.js +0 -148
  267. package/bin/runners/lib/polish/utils.js +0 -203
  268. package/bin/runners/lib/prompt-builder.js +0 -540
  269. package/bin/runners/lib/proof-certificate.js +0 -634
  270. package/bin/runners/lib/reality/accessibility-audit.js +0 -946
  271. package/bin/runners/lib/reality/api-contract-validator.js +0 -1012
  272. package/bin/runners/lib/reality/chaos-engineering.js +0 -1084
  273. package/bin/runners/lib/reality/performance-tracker.js +0 -1077
  274. package/bin/runners/lib/reality/scenario-generator.js +0 -1404
  275. package/bin/runners/lib/reality/visual-regression.js +0 -852
  276. package/bin/runners/lib/reality-profiler.js +0 -717
  277. package/bin/runners/lib/replay/flight-recorder-viewer.js +0 -1160
  278. package/bin/runners/lib/review/ai-code-review.js +0 -832
  279. package/bin/runners/lib/rules/custom-rule-engine.js +0 -985
  280. package/bin/runners/lib/sbom-generator.js +0 -641
  281. package/bin/runners/lib/scan-output-enhanced.js +0 -512
  282. package/bin/runners/lib/security/owasp-scanner.js +0 -939
  283. package/bin/runners/lib/ship-output-enterprise.js +0 -239
  284. package/bin/runners/lib/unified-cli-output.js +0 -777
  285. package/bin/runners/lib/validators/contract-validator.js +0 -283
  286. package/bin/runners/lib/validators/dead-export-detector.js +0 -279
  287. package/bin/runners/lib/validators/dep-audit.js +0 -245
  288. package/bin/runners/lib/validators/env-validator.js +0 -319
  289. package/bin/runners/lib/validators/index.js +0 -120
  290. package/bin/runners/lib/validators/license-checker.js +0 -252
  291. package/bin/runners/lib/validators/route-validator.js +0 -290
  292. package/bin/runners/runAgent.d.ts +0 -5
  293. package/bin/runners/runAgent.js +0 -164
  294. package/bin/runners/runApprove.js +0 -1233
  295. package/bin/runners/runAuthority.js +0 -528
  296. package/bin/runners/runClassify.js +0 -862
  297. package/bin/runners/runConductor.js +0 -772
  298. package/bin/runners/runContainer.js +0 -366
  299. package/bin/runners/runContext.d.ts +0 -4
  300. package/bin/runners/runEasy.js +0 -410
  301. package/bin/runners/runFirewall.d.ts +0 -5
  302. package/bin/runners/runFirewall.js +0 -137
  303. package/bin/runners/runFirewallHook.d.ts +0 -5
  304. package/bin/runners/runFirewallHook.js +0 -59
  305. package/bin/runners/runIaC.js +0 -372
  306. package/bin/runners/runPolish.d.ts +0 -4
  307. package/bin/runners/runProof.zip +0 -0
  308. package/bin/runners/runTruth.d.ts +0 -5
  309. package/bin/runners/runTruth.js +0 -104
  310. package/bin/runners/runVibe.js +0 -791
  311. package/mcp-server/HARDENING_SUMMARY.md +0 -299
  312. package/mcp-server/agent-firewall-interceptor.js +0 -500
  313. package/mcp-server/authority-tools.js +0 -569
  314. package/mcp-server/conductor/conflict-resolver.js +0 -588
  315. package/mcp-server/conductor/execution-planner.js +0 -544
  316. package/mcp-server/conductor/index.js +0 -377
  317. package/mcp-server/conductor/lock-manager.js +0 -615
  318. package/mcp-server/conductor/request-queue.js +0 -550
  319. package/mcp-server/conductor/session-manager.js +0 -500
  320. package/mcp-server/conductor/tools.js +0 -510
  321. package/mcp-server/lib/api-client.cjs +0 -13
  322. package/mcp-server/lib/logger.cjs +0 -30
  323. package/mcp-server/logger.js +0 -173
  324. package/mcp-server/tools-v3.js +0 -1039
  325. package/mcp-server/tools.js +0 -495
  326. package/mcp-server/vibecheck-mcp-server-3.2.0.tgz +0 -0
@@ -1,432 +0,0 @@
1
- /**
2
- * Critic LLM Judge
3
- *
4
- * The "savage" judge that evaluates proposal quality.
5
- * Detects hand-waving, vague intent, and unverified assumptions.
6
- *
7
- * Philosophy: "If this change cannot be proven safe by the repository, block it."
8
- */
9
-
10
- "use strict";
11
-
12
- const {
13
- CRITIC_SYSTEM_PROMPT,
14
- buildEvaluationPrompt,
15
- buildVaguenessPrompt,
16
- buildVerificationPrompt,
17
- parseCriticResponse,
18
- } = require("./prompts");
19
-
20
- /**
21
- * @typedef {Object} CriticVerdict
22
- * @property {string} verdict - ALLOW, BLOCK, or REQUIRE_CONFIRMATION
23
- * @property {number} confidence - Confidence in verdict (0-1)
24
- * @property {Array} reasoning - Reasons for the verdict
25
- * @property {Array} violations - Specific violations found
26
- * @property {Array} recommendations - Suggestions for improvement
27
- */
28
-
29
/**
 * Default LLM client configuration.
 *
 * Frozen so that no consumer can accidentally mutate the defaults shared by
 * every judge instance; callers override values by passing options that are
 * spread on top of a copy of this object.
 *
 * - model:       model identifier forwarded to the LLM client
 * - temperature: kept low for consistent judgments
 * - maxTokens:   response size cap forwarded to the LLM client
 * - timeout:     presumably a per-request budget in milliseconds — TODO confirm
 *                the unit against the LLM client implementation
 */
const DEFAULT_CONFIG = Object.freeze({
  model: "gpt-4-turbo-preview",
  temperature: 0.1, // Low temperature for consistent judgments
  maxTokens: 1000,
  timeout: 30000,
});
38
-
39
/**
 * Critic Judge.
 *
 * Evaluates a proposal either through a pluggable LLM client or, when no
 * client is configured (or the call fails), through deterministic rule-based
 * checks implemented in this class.
 */
class CriticJudge {
  /**
   * @param {Object} [options] - Overrides merged on top of DEFAULT_CONFIG
   * @param {Function} [options.llmClient] - Function invoked by callLLM
   * @param {boolean} [options.enabled] - Pass `false` to disable the LLM path
   * @param {string} [options.fallbackMode] - "conservative" (default) falls
   *   back to rule-based evaluation when the LLM call fails; any other value
   *   yields a low-confidence ALLOW
   */
  constructor(options = {}) {
    this.config = { ...DEFAULT_CONFIG, ...options };
    this.llmClient = options.llmClient || null;
    this.enabled = options.enabled !== false;
    this.fallbackMode = options.fallbackMode || "conservative";
  }

  /**
   * Set the LLM client
   * @param {Function} client - LLM client function
   */
  setClient(client) {
    this.llmClient = client;
  }

  /**
   * Check if critic is available
   * @returns {boolean} True when the critic is enabled and a client is set
   */
  isAvailable() {
    return this.enabled && this.llmClient !== null;
  }

  /**
   * Evaluate a proposal
   * @param {Object} params - Evaluation parameters (proposal,
   *   validationResults, riskScore, simulationResult, realityState)
   * @returns {Promise<CriticVerdict>} Critic verdict
   */
  async evaluate(params = {}) {
    const {
      proposal,
      validationResults = {},
      riskScore = {},
      simulationResult = {},
      realityState = {},
    } = params;

    // Without an LLM client the rule-based checks are the only judge.
    if (!this.isAvailable()) {
      return this.ruleBasedEvaluation(params);
    }

    try {
      const prompt = buildEvaluationPrompt({
        proposal,
        validationResults,
        riskScore,
        simulationResult,
        realityState,
      });
      const response = await this.callLLM(prompt);
      const verdict = parseCriticResponse(response);
      return this.validateVerdict(verdict);
    } catch (error) {
      console.warn(`Critic LLM evaluation failed: ${error.message}`);

      if (this.fallbackMode === "conservative") {
        return this.ruleBasedEvaluation(params);
      }

      // Non-conservative mode: deliberately permissive, flagged by the low confidence.
      return {
        verdict: "ALLOW",
        confidence: 0.3,
        reasoning: ["Critic unavailable, using permissive fallback"],
        violations: [],
        recommendations: ["Consider manual review"],
      };
    }
  }

  /**
   * Check for vagueness in proposal
   * @param {Object} proposal - Proposal to check
   * @returns {Promise<Object>} Vagueness analysis
   */
  async checkVagueness(proposal) {
    if (!this.isAvailable()) {
      return this.ruleBasedVaguenessCheck(proposal);
    }

    try {
      const prompt = buildVaguenessPrompt(proposal);
      const response = await this.callLLM(prompt);
      return parseCriticResponse(response);
    } catch (error) {
      // Surface the failure the same way evaluate() does instead of hiding it.
      console.warn(`Critic LLM vagueness check failed: ${error.message}`);
      return this.ruleBasedVaguenessCheck(proposal);
    }
  }

  /**
   * Verify assumptions against reality
   * @param {Array} assumptions - Assumptions to verify
   * @param {Object} realityState - Repository state
   * @returns {Promise<Object>} Verification results
   */
  async verifyAssumptions(assumptions, realityState) {
    if (!this.isAvailable()) {
      return this.ruleBasedAssumptionVerification(assumptions, realityState);
    }

    try {
      const prompt = buildVerificationPrompt(assumptions, realityState);
      const response = await this.callLLM(prompt);
      return parseCriticResponse(response);
    } catch (error) {
      // Surface the failure the same way evaluate() does instead of hiding it.
      console.warn(`Critic LLM assumption verification failed: ${error.message}`);
      return this.ruleBasedAssumptionVerification(assumptions, realityState);
    }
  }

  /**
   * Call the LLM
   *
   * The client receives `{ systemPrompt, userPrompt, model, temperature,
   * maxTokens }`. When `config.timeout` is a positive finite number the call
   * is abandoned (rejected) after that many milliseconds; the underlying
   * request is not cancelled, only no longer awaited.
   *
   * @param {string} prompt - User prompt
   * @returns {Promise<string>} LLM response
   * @throws {Error} When no client is configured or the call times out
   */
  async callLLM(prompt) {
    if (!this.llmClient) {
      throw new Error("LLM client not configured");
    }

    const request = Promise.resolve(
      this.llmClient({
        systemPrompt: CRITIC_SYSTEM_PROMPT,
        userPrompt: prompt,
        model: this.config.model,
        temperature: this.config.temperature,
        maxTokens: this.config.maxTokens,
      })
    );

    const { timeout } = this.config;
    const hasDeadline =
      typeof timeout === "number" && Number.isFinite(timeout) && timeout > 0;
    if (!hasDeadline) {
      return request;
    }

    let timer;
    const deadline = new Promise((_, reject) => {
      timer = setTimeout(
        () => reject(new Error(`LLM request timed out after ${timeout}ms`)),
        timeout
      );
    });

    try {
      return await Promise.race([request, deadline]);
    } finally {
      // Always release the timer so a fast response does not keep the process alive.
      clearTimeout(timer);
    }
  }

  /**
   * Validate and normalize verdict
   *
   * Unknown verdict strings become "BLOCK"; confidence is clamped to [0, 1]
   * and defaults to 0.5 when it is missing, non-numeric, or NaN; list fields
   * default to empty arrays.
   *
   * @param {Object} verdict - Raw verdict
   * @returns {CriticVerdict} Validated verdict
   * @throws {TypeError} When the raw verdict is null or undefined
   */
  validateVerdict(verdict) {
    if (verdict == null) {
      throw new TypeError("Critic response did not contain a verdict object");
    }

    const validVerdicts = ["ALLOW", "BLOCK", "REQUIRE_CONFIRMATION"];
    const rawConfidence = verdict.confidence;
    const usableConfidence =
      typeof rawConfidence === "number" && !Number.isNaN(rawConfidence);
    const listOrEmpty = (value) => (Array.isArray(value) ? value : []);

    return {
      verdict: validVerdicts.includes(verdict.verdict) ? verdict.verdict : "BLOCK",
      confidence: usableConfidence
        ? Math.max(0, Math.min(1, rawConfidence))
        : 0.5,
      reasoning: listOrEmpty(verdict.reasoning),
      violations: listOrEmpty(verdict.violations),
      recommendations: listOrEmpty(verdict.recommendations),
    };
  }

  /**
   * Rule-based evaluation fallback
   *
   * Severity only ever escalates: ALLOW -> REQUIRE_CONFIRMATION -> BLOCK, and
   * confidence never decreases as further violations are found.
   *
   * @param {Object} params - Evaluation parameters
   * @returns {CriticVerdict} Verdict
   */
  ruleBasedEvaluation(params) {
    const { proposal, validationResults, riskScore, simulationResult } = params || {};

    // This method is the last line of defence when the LLM path fails, so a
    // missing proposal must produce a verdict rather than a TypeError.
    if (proposal == null || typeof proposal !== "object") {
      return {
        verdict: "BLOCK",
        confidence: 0.9,
        reasoning: ["No proposal was provided to evaluate"],
        violations: ["Missing proposal"],
        recommendations: ["Provide a structured proposal before proceeding"],
      };
    }

    const violations = [];
    const reasoning = [];
    let verdict = "ALLOW";
    let confidence = 0.7;

    // Check simulation result
    if (simulationResult && !simulationResult.passed) {
      violations.push("Simulation failed");
      reasoning.push("Change would break imports or routes");
      verdict = "BLOCK";
      confidence = Math.max(confidence, 0.9);
    }

    // Check risk score
    if (riskScore?.total >= 80) {
      violations.push(`High risk score: ${riskScore.total}`);
      reasoning.push("Risk score exceeds safe threshold");
      verdict = verdict === "BLOCK" ? "BLOCK" : "REQUIRE_CONFIRMATION";
      confidence = Math.max(confidence, 0.8);
    }

    // Check unverified assumptions
    if (validationResults?.invalid?.length > 0) {
      for (const invalid of validationResults.invalid) {
        violations.push(
          `Unverified assumption: ${invalid?.assumption?.key || invalid?.assumption?.type}`
        );
      }
      reasoning.push(`${validationResults.invalid.length} assumptions could not be verified`);
      verdict = "BLOCK";
      // Keep the higher confidence if an earlier check already raised it.
      confidence = Math.max(confidence, 0.85);
    }

    // Check vagueness
    const vaguenessCheck = this.ruleBasedVaguenessCheck(proposal);
    if (vaguenessCheck.specificityScore < 4) {
      violations.push("Proposal is too vague");
      reasoning.push(`Specificity score: ${vaguenessCheck.specificityScore}/10`);
      if (verdict === "ALLOW") verdict = "REQUIRE_CONFIRMATION";
    }

    // Check for sensitive domains without explicit acknowledgment
    const sensitiveDomains = ["auth", "payments", "database"];
    const operations = Array.isArray(proposal.operations) ? proposal.operations : [];
    const touchesSensitive = operations.some((op) => {
      const path = String(op?.path || "").toLowerCase();
      return sensitiveDomains.some((domain) => path.includes(domain));
    });

    if (touchesSensitive && !proposal.riskAcknowledgment) {
      violations.push("Touches sensitive domains without risk acknowledgment");
      reasoning.push("Changes to auth/payments/database require explicit acknowledgment");
      if (verdict === "ALLOW") verdict = "REQUIRE_CONFIRMATION";
    }

    // No violations = allow
    if (violations.length === 0) {
      reasoning.push("No violations detected");
    }

    return {
      verdict,
      confidence,
      reasoning,
      violations,
      recommendations: violations.length > 0
        ? ["Address violations before proceeding", "Add missing assumptions"]
        : [],
    };
  }

  /**
   * Rule-based vagueness check
   *
   * Starts at a specificity score of 10 and subtracts points for a one-word
   * generic intent, a missing/short summary, missing assumptions, many
   * operations with little explanation, and vague words in the summary. The
   * score is floored at 1.
   *
   * @param {Object} proposal - Proposal to check
   * @returns {Object} `{ specificityScore, vagueTerms, suggestions }`
   */
  ruleBasedVaguenessCheck(proposal) {
    const subject = proposal ?? {};
    const intent = typeof subject.intent === "string" ? subject.intent : "";
    // A non-string summary cannot be analysed, so it is treated as missing.
    const summary = typeof subject.summary === "string" ? subject.summary : "";

    const vagueTerms = [];
    let specificityScore = 10;

    // Check intent: only a single generic verb with no qualifier is penalised.
    const vagueIntents = ["fix", "update", "change", "modify", "improve", "refactor", "adjust"];
    const intentWords = intent.toLowerCase().split("_");
    if (intentWords.length === 1 && vagueIntents.includes(intentWords[0])) {
      vagueTerms.push(intent);
      specificityScore -= 3;
    }

    // Check summary
    if (!summary) {
      specificityScore -= 2;
    } else if (summary.length < 20) {
      specificityScore -= 1;
    }

    // Check assumptions
    if (!subject.assumptions || subject.assumptions.length === 0) {
      specificityScore -= 2;
    }

    // Check operation count vs explanation
    const opCount = (subject.operations || []).length;
    if (opCount > 3 && summary.length < 50) {
      specificityScore -= 2;
    }

    // Check for vague words in summary. Whole-word matching is required:
    // plain substring search would flag "fetch" (contains "etc") or
    // "awesome" (contains "some").
    const vagueWords = ["some", "various", "etc", "stuff", "things", "somehow"];
    const loweredSummary = summary.toLowerCase();
    for (const word of vagueWords) {
      if (new RegExp(`\\b${word}\\b`).test(loweredSummary)) {
        vagueTerms.push(word);
        specificityScore -= 1;
      }
    }

    specificityScore = Math.max(1, specificityScore);

    return {
      specificityScore,
      vagueTerms,
      suggestions: vagueTerms.length > 0
        ? [`Replace vague terms: ${vagueTerms.join(", ")}`, "Add specific details"]
        : [],
    };
  }

  /**
   * Rule-based assumption verification
   *
   * Supports assumption types "env", "route", "service" and "file"; any other
   * type is reported as unverified. `envVars` and `files` may be a Set/Map
   * (anything with `.has`), an array, or a plain object keyed by name.
   *
   * @param {Array} assumptions - Assumptions to verify
   * @param {Object} realityState - Repository state
   * @returns {Object} `{ results, overallVerificationRate }`; the rate is 1
   *   when there are no assumptions
   */
  ruleBasedAssumptionVerification(assumptions, realityState) {
    const items = Array.isArray(assumptions) ? assumptions : [];
    const listOf = (value) => (Array.isArray(value) ? value : []);

    // Membership test tolerant of the container shape (e.g. a Set that was
    // serialised to an array).
    const contains = (collection, key) => {
      if (collection == null) return false;
      if (typeof collection.has === "function") return collection.has(key);
      if (Array.isArray(collection)) return collection.includes(key);
      if (typeof collection === "object") {
        return Object.prototype.hasOwnProperty.call(collection, key);
      }
      return false;
    };

    const results = [];
    let verifiedCount = 0;

    for (const rawAssumption of items) {
      const assumption = rawAssumption ?? {};
      let verified = false;
      let evidence = null;
      let reason = "";

      switch (assumption.type) {
        case "env": {
          if (contains(realityState?.envVars, assumption.key)) {
            verified = true;
            evidence = `Found in env vars: ${assumption.key}`;
          } else {
            reason = `Env var '${assumption.key}' not found in declared variables`;
          }
          break;
        }

        case "route": {
          // A route matches on path; the method only matters when the assumption names one.
          const routeExists = listOf(realityState?.routes).some(
            (r) =>
              r?.path === assumption.path &&
              (r?.method === assumption.method || !assumption.method)
          );
          if (routeExists) {
            verified = true;
            evidence = `Route ${assumption.method || "GET"} ${assumption.path} is registered`;
          } else {
            reason = `Route ${assumption.path} not found in registered routes`;
          }
          break;
        }

        case "service": {
          const serviceExists = listOf(realityState?.services).some(
            (s) => s?.name === assumption.key || s?.name === assumption.name
          );
          if (serviceExists) {
            verified = true;
            evidence = `Service ${assumption.key || assumption.name} is registered`;
          } else {
            reason = `Service ${assumption.key || assumption.name} not found`;
          }
          break;
        }

        case "file": {
          // Normalise Windows separators before the lookup.
          const normalizedPath = assumption.path?.replace(/\\/g, "/");
          if (contains(realityState?.files, normalizedPath)) {
            verified = true;
            evidence = `File ${assumption.path} exists`;
          } else {
            reason = `File ${assumption.path} not found`;
          }
          break;
        }

        default:
          reason = `Unknown assumption type: ${assumption.type}`;
      }

      if (verified) verifiedCount++;

      results.push({
        // `name` is included because service assumptions may be identified by it alone.
        assumption: assumption.key || assumption.path || assumption.name || assumption.type,
        verified,
        evidence,
        reason,
      });
    }

    return {
      results,
      overallVerificationRate: items.length > 0
        ? verifiedCount / items.length
        : 1,
    };
  }
}
413
-
414
/**
 * Factory for critic judges.
 * @param {Object} options - Configuration options handed to the CriticJudge constructor
 * @returns {CriticJudge} Newly constructed judge
 */
function createJudge(options = {}) {
  const judge = new CriticJudge(options);
  return judge;
}
422
-
423
/**
 * Module-level judge built with no options, created once when the module loads.
 */
const defaultJudge = createJudge();

// Public surface: the class, the factory, and the shared instance.
module.exports = { CriticJudge, createJudge, defaultJudge };