@vibecheckai/cli 3.5.0 → 3.5.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/bin/registry.js +174 -449
- package/bin/runners/cli-utils.js +33 -2
- package/bin/runners/context/generators/cursor.js +2 -49
- package/bin/runners/context/generators/mcp.js +13 -15
- package/bin/runners/context/proof-context.js +1 -248
- package/bin/runners/lib/analysis-core.js +180 -198
- package/bin/runners/lib/analyzers.js +241 -2212
- package/bin/runners/lib/cli-output.js +210 -242
- package/bin/runners/lib/detectors-v2.js +785 -547
- package/bin/runners/lib/entitlements-v2.js +431 -161
- package/bin/runners/lib/error-handler.js +9 -16
- package/bin/runners/lib/global-flags.js +0 -37
- package/bin/runners/lib/html-proof-report.js +700 -350
- package/bin/runners/lib/missions/plan.js +6 -46
- package/bin/runners/lib/missions/templates.js +0 -232
- package/bin/runners/lib/route-truth.js +322 -1167
- package/bin/runners/lib/scan-output.js +467 -493
- package/bin/runners/lib/ship-output.js +27 -280
- package/bin/runners/lib/terminal-ui.js +700 -310
- package/bin/runners/lib/truth.js +321 -1004
- package/bin/runners/lib/unified-output.js +158 -162
- package/bin/runners/lib/upsell.js +204 -104
- package/bin/runners/runAIAgent.js +10 -5
- package/bin/runners/runAllowlist.js +324 -0
- package/bin/runners/runAuth.js +94 -344
- package/bin/runners/runCheckpoint.js +45 -43
- package/bin/runners/runContext.js +24 -139
- package/bin/runners/runDoctor.js +101 -136
- package/bin/runners/runEvidencePack.js +219 -0
- package/bin/runners/runFix.js +71 -82
- package/bin/runners/runGuard.js +119 -606
- package/bin/runners/runInit.js +60 -22
- package/bin/runners/runInstall.js +281 -0
- package/bin/runners/runLabs.js +341 -0
- package/bin/runners/runMcp.js +62 -139
- package/bin/runners/runPolish.js +83 -282
- package/bin/runners/runPromptFirewall.js +12 -5
- package/bin/runners/runProve.js +58 -33
- package/bin/runners/runReality.js +58 -81
- package/bin/runners/runReport.js +7 -34
- package/bin/runners/runRuntime.js +8 -5
- package/bin/runners/runScan.js +844 -219
- package/bin/runners/runShip.js +59 -721
- package/bin/runners/runValidate.js +11 -24
- package/bin/runners/runWatch.js +76 -131
- package/bin/vibecheck.js +69 -295
- package/mcp-server/ARCHITECTURE.md +339 -0
- package/mcp-server/__tests__/cache.test.ts +313 -0
- package/mcp-server/__tests__/executor.test.ts +239 -0
- package/mcp-server/__tests__/fixtures/exclusion-test/.cache/webpack/cache.pack +1 -0
- package/mcp-server/__tests__/fixtures/exclusion-test/.next/server/chunk.js +3 -0
- package/mcp-server/__tests__/fixtures/exclusion-test/.turbo/cache.json +3 -0
- package/mcp-server/__tests__/fixtures/exclusion-test/.venv/lib/env.py +3 -0
- package/mcp-server/__tests__/fixtures/exclusion-test/dist/bundle.js +3 -0
- package/mcp-server/__tests__/fixtures/exclusion-test/package.json +5 -0
- package/mcp-server/__tests__/fixtures/exclusion-test/src/app.ts +5 -0
- package/mcp-server/__tests__/fixtures/exclusion-test/venv/lib/config.py +4 -0
- package/mcp-server/__tests__/ids.test.ts +345 -0
- package/mcp-server/__tests__/integration/tools.test.ts +410 -0
- package/mcp-server/__tests__/registry.test.ts +365 -0
- package/mcp-server/__tests__/sandbox.test.ts +323 -0
- package/mcp-server/__tests__/schemas.test.ts +372 -0
- package/mcp-server/benchmarks/run-benchmarks.ts +304 -0
- package/mcp-server/examples/doctor.request.json +14 -0
- package/mcp-server/examples/doctor.response.json +53 -0
- package/mcp-server/examples/error.response.json +15 -0
- package/mcp-server/examples/scan.request.json +14 -0
- package/mcp-server/examples/scan.response.json +108 -0
- package/mcp-server/handlers/tool-handler.ts +671 -0
- package/mcp-server/index-v1.js +698 -0
- package/mcp-server/index-v3.ts +293 -0
- package/mcp-server/index.js +1080 -1757
- package/mcp-server/index.old.js +4137 -0
- package/mcp-server/lib/cache.ts +341 -0
- package/mcp-server/lib/errors.ts +346 -0
- package/mcp-server/lib/executor.ts +792 -0
- package/mcp-server/lib/ids.ts +238 -0
- package/mcp-server/lib/logger.ts +368 -0
- package/mcp-server/lib/metrics.ts +365 -0
- package/mcp-server/lib/sandbox.ts +337 -0
- package/mcp-server/lib/validator.ts +229 -0
- package/mcp-server/package-lock.json +165 -0
- package/mcp-server/package.json +32 -7
- package/mcp-server/premium-tools.js +2 -2
- package/mcp-server/registry/tools.json +476 -0
- package/mcp-server/schemas/error-envelope.schema.json +125 -0
- package/mcp-server/schemas/finding.schema.json +167 -0
- package/mcp-server/schemas/report-artifact.schema.json +88 -0
- package/mcp-server/schemas/run-request.schema.json +75 -0
- package/mcp-server/schemas/verdict.schema.json +168 -0
- package/mcp-server/tier-auth.d.ts +71 -0
- package/mcp-server/tier-auth.js +371 -183
- package/mcp-server/truth-context.js +90 -131
- package/mcp-server/truth-firewall-tools.js +1000 -1611
- package/mcp-server/tsconfig.json +34 -0
- package/mcp-server/vibecheck-tools.js +2 -2
- package/mcp-server/vitest.config.ts +16 -0
- package/package.json +3 -4
- package/bin/runners/lib/agent-firewall/ai/false-positive-analyzer.js +0 -474
- package/bin/runners/lib/agent-firewall/change-packet/builder.js +0 -488
- package/bin/runners/lib/agent-firewall/change-packet/schema.json +0 -228
- package/bin/runners/lib/agent-firewall/change-packet/store.js +0 -200
- package/bin/runners/lib/agent-firewall/claims/claim-types.js +0 -21
- package/bin/runners/lib/agent-firewall/claims/extractor.js +0 -303
- package/bin/runners/lib/agent-firewall/claims/patterns.js +0 -24
- package/bin/runners/lib/agent-firewall/critic/index.js +0 -151
- package/bin/runners/lib/agent-firewall/critic/judge.js +0 -432
- package/bin/runners/lib/agent-firewall/critic/prompts.js +0 -305
- package/bin/runners/lib/agent-firewall/evidence/auth-evidence.js +0 -88
- package/bin/runners/lib/agent-firewall/evidence/contract-evidence.js +0 -75
- package/bin/runners/lib/agent-firewall/evidence/env-evidence.js +0 -127
- package/bin/runners/lib/agent-firewall/evidence/resolver.js +0 -102
- package/bin/runners/lib/agent-firewall/evidence/route-evidence.js +0 -213
- package/bin/runners/lib/agent-firewall/evidence/side-effect-evidence.js +0 -145
- package/bin/runners/lib/agent-firewall/fs-hook/daemon.js +0 -19
- package/bin/runners/lib/agent-firewall/fs-hook/installer.js +0 -87
- package/bin/runners/lib/agent-firewall/fs-hook/watcher.js +0 -184
- package/bin/runners/lib/agent-firewall/git-hook/pre-commit.js +0 -163
- package/bin/runners/lib/agent-firewall/ide-extension/cursor.js +0 -107
- package/bin/runners/lib/agent-firewall/ide-extension/vscode.js +0 -68
- package/bin/runners/lib/agent-firewall/ide-extension/windsurf.js +0 -66
- package/bin/runners/lib/agent-firewall/interceptor/base.js +0 -304
- package/bin/runners/lib/agent-firewall/interceptor/cursor.js +0 -35
- package/bin/runners/lib/agent-firewall/interceptor/vscode.js +0 -35
- package/bin/runners/lib/agent-firewall/interceptor/windsurf.js +0 -34
- package/bin/runners/lib/agent-firewall/lawbook/distributor.js +0 -465
- package/bin/runners/lib/agent-firewall/lawbook/evaluator.js +0 -604
- package/bin/runners/lib/agent-firewall/lawbook/index.js +0 -304
- package/bin/runners/lib/agent-firewall/lawbook/registry.js +0 -514
- package/bin/runners/lib/agent-firewall/lawbook/schema.js +0 -420
- package/bin/runners/lib/agent-firewall/learning/learning-engine.js +0 -849
- package/bin/runners/lib/agent-firewall/logger.js +0 -141
- package/bin/runners/lib/agent-firewall/policy/default-policy.json +0 -90
- package/bin/runners/lib/agent-firewall/policy/engine.js +0 -103
- package/bin/runners/lib/agent-firewall/policy/loader.js +0 -451
- package/bin/runners/lib/agent-firewall/policy/rules/auth-drift.js +0 -50
- package/bin/runners/lib/agent-firewall/policy/rules/contract-drift.js +0 -50
- package/bin/runners/lib/agent-firewall/policy/rules/fake-success.js +0 -86
- package/bin/runners/lib/agent-firewall/policy/rules/ghost-env.js +0 -162
- package/bin/runners/lib/agent-firewall/policy/rules/ghost-route.js +0 -189
- package/bin/runners/lib/agent-firewall/policy/rules/scope.js +0 -93
- package/bin/runners/lib/agent-firewall/policy/rules/unsafe-side-effect.js +0 -57
- package/bin/runners/lib/agent-firewall/policy/schema.json +0 -183
- package/bin/runners/lib/agent-firewall/policy/verdict.js +0 -54
- package/bin/runners/lib/agent-firewall/proposal/extractor.js +0 -394
- package/bin/runners/lib/agent-firewall/proposal/index.js +0 -212
- package/bin/runners/lib/agent-firewall/proposal/schema.js +0 -251
- package/bin/runners/lib/agent-firewall/proposal/validator.js +0 -386
- package/bin/runners/lib/agent-firewall/reality/index.js +0 -332
- package/bin/runners/lib/agent-firewall/reality/state.js +0 -625
- package/bin/runners/lib/agent-firewall/reality/watcher.js +0 -322
- package/bin/runners/lib/agent-firewall/risk/index.js +0 -173
- package/bin/runners/lib/agent-firewall/risk/scorer.js +0 -328
- package/bin/runners/lib/agent-firewall/risk/thresholds.js +0 -321
- package/bin/runners/lib/agent-firewall/risk/vectors.js +0 -421
- package/bin/runners/lib/agent-firewall/simulator/diff-simulator.js +0 -472
- package/bin/runners/lib/agent-firewall/simulator/import-resolver.js +0 -346
- package/bin/runners/lib/agent-firewall/simulator/index.js +0 -181
- package/bin/runners/lib/agent-firewall/simulator/route-validator.js +0 -380
- package/bin/runners/lib/agent-firewall/time-machine/incident-correlator.js +0 -661
- package/bin/runners/lib/agent-firewall/time-machine/index.js +0 -267
- package/bin/runners/lib/agent-firewall/time-machine/replay-engine.js +0 -436
- package/bin/runners/lib/agent-firewall/time-machine/state-reconstructor.js +0 -490
- package/bin/runners/lib/agent-firewall/time-machine/timeline-builder.js +0 -530
- package/bin/runners/lib/agent-firewall/truthpack/index.js +0 -67
- package/bin/runners/lib/agent-firewall/truthpack/loader.js +0 -137
- package/bin/runners/lib/agent-firewall/unblock/planner.js +0 -337
- package/bin/runners/lib/agent-firewall/utils/ignore-checker.js +0 -118
- package/bin/runners/lib/api-client.js +0 -269
- package/bin/runners/lib/audit-logger.js +0 -532
- package/bin/runners/lib/authority/authorities/architecture.js +0 -364
- package/bin/runners/lib/authority/authorities/compliance.js +0 -341
- package/bin/runners/lib/authority/authorities/human.js +0 -343
- package/bin/runners/lib/authority/authorities/quality.js +0 -420
- package/bin/runners/lib/authority/authorities/security.js +0 -228
- package/bin/runners/lib/authority/index.js +0 -293
- package/bin/runners/lib/authority-badge.js +0 -425
- package/bin/runners/lib/bundle/bundle-intelligence.js +0 -846
- package/bin/runners/lib/cli-charts.js +0 -368
- package/bin/runners/lib/cli-config-display.js +0 -405
- package/bin/runners/lib/cli-demo.js +0 -275
- package/bin/runners/lib/cli-errors.js +0 -438
- package/bin/runners/lib/cli-help-formatter.js +0 -439
- package/bin/runners/lib/cli-interactive-menu.js +0 -509
- package/bin/runners/lib/cli-prompts.js +0 -441
- package/bin/runners/lib/cli-scan-cards.js +0 -362
- package/bin/runners/lib/compliance-reporter.js +0 -710
- package/bin/runners/lib/conductor/index.js +0 -671
- package/bin/runners/lib/easy/README.md +0 -123
- package/bin/runners/lib/easy/index.js +0 -140
- package/bin/runners/lib/easy/interactive-wizard.js +0 -788
- package/bin/runners/lib/easy/one-click-firewall.js +0 -564
- package/bin/runners/lib/easy/zero-config-reality.js +0 -714
- package/bin/runners/lib/engines/accessibility-engine.js +0 -390
- package/bin/runners/lib/engines/api-consistency-engine.js +0 -467
- package/bin/runners/lib/engines/ast-cache.js +0 -99
- package/bin/runners/lib/engines/async-patterns-engine.js +0 -444
- package/bin/runners/lib/engines/bundle-size-engine.js +0 -433
- package/bin/runners/lib/engines/code-quality-engine.js +0 -255
- package/bin/runners/lib/engines/confidence-scoring.js +0 -276
- package/bin/runners/lib/engines/console-logs-engine.js +0 -115
- package/bin/runners/lib/engines/context-detection.js +0 -264
- package/bin/runners/lib/engines/cross-file-analysis-engine.js +0 -533
- package/bin/runners/lib/engines/database-patterns-engine.js +0 -429
- package/bin/runners/lib/engines/dead-code-engine.js +0 -198
- package/bin/runners/lib/engines/deprecated-api-engine.js +0 -226
- package/bin/runners/lib/engines/duplicate-code-engine.js +0 -354
- package/bin/runners/lib/engines/empty-catch-engine.js +0 -260
- package/bin/runners/lib/engines/env-variables-engine.js +0 -458
- package/bin/runners/lib/engines/error-handling-engine.js +0 -437
- package/bin/runners/lib/engines/false-positive-prevention.js +0 -630
- package/bin/runners/lib/engines/file-filter.js +0 -131
- package/bin/runners/lib/engines/framework-adapters/index.js +0 -607
- package/bin/runners/lib/engines/framework-detection.js +0 -508
- package/bin/runners/lib/engines/hardcoded-secrets-engine.js +0 -251
- package/bin/runners/lib/engines/import-order-engine.js +0 -429
- package/bin/runners/lib/engines/mock-data-engine.js +0 -315
- package/bin/runners/lib/engines/naming-conventions-engine.js +0 -544
- package/bin/runners/lib/engines/noise-reduction-engine.js +0 -452
- package/bin/runners/lib/engines/orchestrator.js +0 -334
- package/bin/runners/lib/engines/parallel-processor.js +0 -71
- package/bin/runners/lib/engines/performance-issues-engine.js +0 -405
- package/bin/runners/lib/engines/react-patterns-engine.js +0 -457
- package/bin/runners/lib/engines/security-vulnerabilities-engine.js +0 -571
- package/bin/runners/lib/engines/todo-fixme-engine.js +0 -115
- package/bin/runners/lib/engines/type-aware-engine.js +0 -376
- package/bin/runners/lib/engines/unsafe-regex-engine.js +0 -225
- package/bin/runners/lib/engines/vibecheck-engines/README.md +0 -53
- package/bin/runners/lib/engines/vibecheck-engines/index.js +0 -124
- package/bin/runners/lib/engines/vibecheck-engines/lib/ai-hallucination-engine.js +0 -806
- package/bin/runners/lib/engines/vibecheck-engines/lib/hardcoded-secrets-engine.js +0 -439
- package/bin/runners/lib/engines/vibecheck-engines/lib/smart-fix-engine.js +0 -577
- package/bin/runners/lib/engines/vibecheck-engines/lib/vibe-score-engine.js +0 -543
- package/bin/runners/lib/engines/vibecheck-engines/package.json +0 -13
- package/bin/runners/lib/engines/vibecheck-engines.js +0 -514
- package/bin/runners/lib/enhanced-features/index.js +0 -305
- package/bin/runners/lib/enhanced-output.js +0 -631
- package/bin/runners/lib/enterprise.js +0 -300
- package/bin/runners/lib/exit-codes.js +0 -275
- package/bin/runners/lib/fingerprint.js +0 -377
- package/bin/runners/lib/firewall/command-validator.js +0 -351
- package/bin/runners/lib/firewall/config.js +0 -341
- package/bin/runners/lib/firewall/content-validator.js +0 -519
- package/bin/runners/lib/firewall/index.js +0 -101
- package/bin/runners/lib/firewall/path-validator.js +0 -256
- package/bin/runners/lib/help-formatter.js +0 -413
- package/bin/runners/lib/intelligence/cross-repo-intelligence.js +0 -817
- package/bin/runners/lib/logger.js +0 -38
- package/bin/runners/lib/mcp-utils.js +0 -425
- package/bin/runners/lib/output/index.js +0 -1022
- package/bin/runners/lib/policy-engine.js +0 -652
- package/bin/runners/lib/polish/autofix/accessibility-fixes.js +0 -333
- package/bin/runners/lib/polish/autofix/async-handlers.js +0 -273
- package/bin/runners/lib/polish/autofix/dead-code.js +0 -280
- package/bin/runners/lib/polish/autofix/imports-optimizer.js +0 -344
- package/bin/runners/lib/polish/autofix/index.js +0 -200
- package/bin/runners/lib/polish/autofix/remove-consoles.js +0 -209
- package/bin/runners/lib/polish/autofix/strengthen-types.js +0 -245
- package/bin/runners/lib/polish/backend-checks.js +0 -148
- package/bin/runners/lib/polish/documentation-checks.js +0 -111
- package/bin/runners/lib/polish/frontend-checks.js +0 -168
- package/bin/runners/lib/polish/index.js +0 -71
- package/bin/runners/lib/polish/infrastructure-checks.js +0 -131
- package/bin/runners/lib/polish/library-detection.js +0 -175
- package/bin/runners/lib/polish/performance-checks.js +0 -100
- package/bin/runners/lib/polish/security-checks.js +0 -148
- package/bin/runners/lib/polish/utils.js +0 -203
- package/bin/runners/lib/prompt-builder.js +0 -540
- package/bin/runners/lib/proof-certificate.js +0 -634
- package/bin/runners/lib/reality/accessibility-audit.js +0 -946
- package/bin/runners/lib/reality/api-contract-validator.js +0 -1012
- package/bin/runners/lib/reality/chaos-engineering.js +0 -1084
- package/bin/runners/lib/reality/performance-tracker.js +0 -1077
- package/bin/runners/lib/reality/scenario-generator.js +0 -1404
- package/bin/runners/lib/reality/visual-regression.js +0 -852
- package/bin/runners/lib/reality-profiler.js +0 -717
- package/bin/runners/lib/replay/flight-recorder-viewer.js +0 -1160
- package/bin/runners/lib/review/ai-code-review.js +0 -832
- package/bin/runners/lib/rules/custom-rule-engine.js +0 -985
- package/bin/runners/lib/sbom-generator.js +0 -641
- package/bin/runners/lib/scan-output-enhanced.js +0 -512
- package/bin/runners/lib/security/owasp-scanner.js +0 -939
- package/bin/runners/lib/ship-output-enterprise.js +0 -239
- package/bin/runners/lib/unified-cli-output.js +0 -777
- package/bin/runners/lib/validators/contract-validator.js +0 -283
- package/bin/runners/lib/validators/dead-export-detector.js +0 -279
- package/bin/runners/lib/validators/dep-audit.js +0 -245
- package/bin/runners/lib/validators/env-validator.js +0 -319
- package/bin/runners/lib/validators/index.js +0 -120
- package/bin/runners/lib/validators/license-checker.js +0 -252
- package/bin/runners/lib/validators/route-validator.js +0 -290
- package/bin/runners/runAgent.d.ts +0 -5
- package/bin/runners/runAgent.js +0 -164
- package/bin/runners/runApprove.js +0 -1233
- package/bin/runners/runAuthority.js +0 -528
- package/bin/runners/runClassify.js +0 -862
- package/bin/runners/runConductor.js +0 -772
- package/bin/runners/runContainer.js +0 -366
- package/bin/runners/runContext.d.ts +0 -4
- package/bin/runners/runEasy.js +0 -410
- package/bin/runners/runFirewall.d.ts +0 -5
- package/bin/runners/runFirewall.js +0 -137
- package/bin/runners/runFirewallHook.d.ts +0 -5
- package/bin/runners/runFirewallHook.js +0 -59
- package/bin/runners/runIaC.js +0 -372
- package/bin/runners/runPolish.d.ts +0 -4
- package/bin/runners/runProof.zip +0 -0
- package/bin/runners/runTruth.d.ts +0 -5
- package/bin/runners/runTruth.js +0 -104
- package/bin/runners/runVibe.js +0 -791
- package/mcp-server/HARDENING_SUMMARY.md +0 -299
- package/mcp-server/agent-firewall-interceptor.js +0 -500
- package/mcp-server/authority-tools.js +0 -569
- package/mcp-server/conductor/conflict-resolver.js +0 -588
- package/mcp-server/conductor/execution-planner.js +0 -544
- package/mcp-server/conductor/index.js +0 -377
- package/mcp-server/conductor/lock-manager.js +0 -615
- package/mcp-server/conductor/request-queue.js +0 -550
- package/mcp-server/conductor/session-manager.js +0 -500
- package/mcp-server/conductor/tools.js +0 -510
- package/mcp-server/lib/api-client.cjs +0 -13
- package/mcp-server/lib/logger.cjs +0 -30
- package/mcp-server/logger.js +0 -173
- package/mcp-server/tools-v3.js +0 -1039
- package/mcp-server/tools.js +0 -495
- package/mcp-server/vibecheck-mcp-server-3.2.0.tgz +0 -0
|
@@ -1,432 +0,0 @@
|
|
|
1
|
-
/**
|
|
2
|
-
* Critic LLM Judge
|
|
3
|
-
*
|
|
4
|
-
* The "savage" judge that evaluates proposal quality.
|
|
5
|
-
* Detects hand-waving, vague intent, and unverified assumptions.
|
|
6
|
-
*
|
|
7
|
-
* Philosophy: "If this change cannot be proven safe by the repository, block it."
|
|
8
|
-
*/
|
|
9
|
-
|
|
10
|
-
"use strict";
|
|
11
|
-
|
|
12
|
-
const {
|
|
13
|
-
CRITIC_SYSTEM_PROMPT,
|
|
14
|
-
buildEvaluationPrompt,
|
|
15
|
-
buildVaguenessPrompt,
|
|
16
|
-
buildVerificationPrompt,
|
|
17
|
-
parseCriticResponse,
|
|
18
|
-
} = require("./prompts");
|
|
19
|
-
|
|
20
|
-
/**
|
|
21
|
-
* @typedef {Object} CriticVerdict
|
|
22
|
-
* @property {string} verdict - ALLOW, BLOCK, or REQUIRE_CONFIRMATION
|
|
23
|
-
* @property {number} confidence - Confidence in verdict (0-1)
|
|
24
|
-
* @property {Array} reasoning - Reasons for the verdict
|
|
25
|
-
* @property {Array} violations - Specific violations found
|
|
26
|
-
* @property {Array} recommendations - Suggestions for improvement
|
|
27
|
-
*/
|
|
28
|
-
|
|
29
|
-
/**
 * Default LLM client configuration.
 *
 * Frozen so the shared defaults cannot be mutated by accident. CriticJudge
 * spreads these values into a fresh per-instance config object, so freezing
 * does not restrict per-instance overrides.
 */
const DEFAULT_CONFIG = Object.freeze({
  model: "gpt-4-turbo-preview",
  temperature: 0.1, // Low temperature for consistent judgments
  maxTokens: 1000,
  timeout: 30000, // presumably milliseconds — confirm against the LLM client
});
|
|
38
|
-
|
|
39
|
-
/**
 * Critic judge: grades a change proposal and returns a verdict
 * (ALLOW, BLOCK or REQUIRE_CONFIRMATION).
 *
 * When the judge is enabled and an LLM client is configured, prompts built by
 * ./prompts are sent to that client. Otherwise, or when the LLM call fails,
 * the deterministic rule-based checks in this class are used instead.
 */
class CriticJudge {
  /**
   * @param {Object} [options] - Values merged over DEFAULT_CONFIG
   * @param {Function} [options.llmClient] - Function called with the request object built in callLLM
   * @param {boolean} [options.enabled=true] - Pass false to force rule-based evaluation
   * @param {string} [options.fallbackMode="conservative"] - What evaluate() does when the LLM call fails
   */
  constructor(options = {}) {
    this.config = { ...DEFAULT_CONFIG, ...options };
    this.llmClient = options.llmClient || null;
    this.enabled = options.enabled !== false;
    this.fallbackMode = options.fallbackMode || "conservative";
  }

  /**
   * Set the LLM client
   * @param {Function} client - LLM client function
   */
  setClient(client) {
    this.llmClient = client;
  }

  /**
   * Check if the LLM-backed critic can be used
   * @returns {boolean} True when the judge is enabled and a client is set
   */
  isAvailable() {
    return this.enabled && this.llmClient !== null;
  }

  /**
   * Evaluate a proposal
   * @param {Object} params - Evaluation parameters
   * @param {Object} params.proposal - Proposal under review
   * @param {Object} [params.validationResults] - Assumption validation output
   * @param {Object} [params.riskScore] - Risk score (reads `total`)
   * @param {Object} [params.simulationResult] - Simulation output (reads `passed`)
   * @param {Object} [params.realityState] - Repository state passed to the prompt builder
   * @returns {Promise<CriticVerdict>} Critic verdict
   */
  async evaluate(params) {
    const {
      proposal,
      validationResults = {},
      riskScore = {},
      simulationResult = {},
      realityState = {},
    } = params;

    // Without an LLM client (or when disabled) only the rules can judge.
    if (!this.isAvailable()) {
      return this.ruleBasedEvaluation(params);
    }

    try {
      const prompt = buildEvaluationPrompt({
        proposal,
        validationResults,
        riskScore,
        simulationResult,
        realityState,
      });
      const response = await this.callLLM(prompt);
      const verdict = parseCriticResponse(response);
      return this.validateVerdict(verdict);
    } catch (error) {
      console.warn(`Critic LLM evaluation failed: ${error.message}`);

      if (this.fallbackMode === "conservative") {
        return this.ruleBasedEvaluation(params);
      }

      // NOTE(review): any non-"conservative" mode fails open with a
      // low-confidence ALLOW when the LLM call breaks.
      return {
        verdict: "ALLOW",
        confidence: 0.3,
        reasoning: ["Critic unavailable, using permissive fallback"],
        violations: [],
        recommendations: ["Consider manual review"],
      };
    }
  }

  /**
   * Check for vagueness in proposal
   * @param {Object} proposal - Proposal to check
   * @returns {Promise<Object>} Vagueness analysis (parsed LLM response, or the
   *   rule-based analysis when the LLM is unavailable or fails)
   */
  async checkVagueness(proposal) {
    if (!this.isAvailable()) {
      return this.ruleBasedVaguenessCheck(proposal);
    }

    try {
      const prompt = buildVaguenessPrompt(proposal);
      const response = await this.callLLM(prompt);
      return parseCriticResponse(response);
    } catch (error) {
      // Report the failure the same way evaluate() does instead of hiding it.
      console.warn(`Critic LLM vagueness check failed: ${error.message}`);
      return this.ruleBasedVaguenessCheck(proposal);
    }
  }

  /**
   * Verify assumptions against reality
   * @param {Array} assumptions - Assumptions to verify
   * @param {Object} realityState - Repository state
   * @returns {Promise<Object>} Verification results (parsed LLM response, or
   *   the rule-based results when the LLM is unavailable or fails)
   */
  async verifyAssumptions(assumptions, realityState) {
    if (!this.isAvailable()) {
      return this.ruleBasedAssumptionVerification(assumptions, realityState);
    }

    try {
      const prompt = buildVerificationPrompt(assumptions, realityState);
      const response = await this.callLLM(prompt);
      return parseCriticResponse(response);
    } catch (error) {
      // Report the failure the same way evaluate() does instead of hiding it.
      console.warn(`Critic LLM assumption verification failed: ${error.message}`);
      return this.ruleBasedAssumptionVerification(assumptions, realityState);
    }
  }

  /**
   * Call the LLM, giving up after `config.timeout` milliseconds.
   * @param {string} prompt - User prompt
   * @returns {Promise<string>} LLM response
   * @throws {Error} When no client is configured, the client fails, or the
   *   call does not settle within the configured timeout
   */
  async callLLM(prompt) {
    if (!this.llmClient) {
      throw new Error("LLM client not configured");
    }

    const { model, temperature, maxTokens, timeout } = this.config;
    const request = this.llmClient({
      systemPrompt: CRITIC_SYSTEM_PROMPT,
      userPrompt: prompt,
      model,
      temperature,
      maxTokens,
    });

    // Only arm a timer for delays setTimeout can represent (max 2^31 - 1 ms).
    const hasDeadline =
      typeof timeout === "number" &&
      Number.isFinite(timeout) &&
      timeout > 0 &&
      timeout <= 0x7fffffff;
    if (!hasDeadline) {
      return request;
    }

    let timer;
    const deadline = new Promise((_, reject) => {
      timer = setTimeout(
        () => reject(new Error(`LLM request timed out after ${timeout}ms`)),
        timeout
      );
    });

    try {
      return await Promise.race([request, deadline]);
    } finally {
      // Always release the timer so it cannot keep the process alive.
      clearTimeout(timer);
    }
  }

  /**
   * Validate and normalize verdict
   * @param {Object} verdict - Raw verdict
   * @returns {CriticVerdict} Validated verdict; an unknown verdict becomes
   *   BLOCK, a missing or NaN confidence becomes 0.5, and non-array list
   *   fields become empty arrays
   */
  validateVerdict(verdict) {
    const validVerdicts = ["ALLOW", "BLOCK", "REQUIRE_CONFIRMATION"];
    const listOrEmpty = (value) => (Array.isArray(value) ? value : []);

    // typeof NaN is "number", so NaN must be rejected explicitly.
    const hasConfidence =
      typeof verdict.confidence === "number" && !Number.isNaN(verdict.confidence);

    return {
      verdict: validVerdicts.includes(verdict.verdict) ? verdict.verdict : "BLOCK",
      confidence: hasConfidence
        ? Math.max(0, Math.min(1, verdict.confidence))
        : 0.5,
      reasoning: listOrEmpty(verdict.reasoning),
      violations: listOrEmpty(verdict.violations),
      recommendations: listOrEmpty(verdict.recommendations),
    };
  }

  /**
   * Rule-based evaluation fallback
   * @param {Object} params - Evaluation parameters (same shape as evaluate())
   * @returns {CriticVerdict} Verdict
   */
  ruleBasedEvaluation(params) {
    const { proposal, validationResults, riskScore, simulationResult } = params;

    const violations = [];
    const reasoning = [];
    let verdict = "ALLOW";
    let confidence = 0.7;

    // A provided simulation result without a truthy `passed` counts as failed.
    if (simulationResult && !simulationResult.passed) {
      violations.push("Simulation failed");
      reasoning.push("Change would break imports or routes");
      verdict = "BLOCK";
      confidence = 0.9;
    }

    // High risk escalates to confirmation but never downgrades a BLOCK.
    if (riskScore?.total >= 80) {
      violations.push(`High risk score: ${riskScore.total}`);
      reasoning.push("Risk score exceeds safe threshold");
      verdict = verdict === "BLOCK" ? "BLOCK" : "REQUIRE_CONFIRMATION";
      confidence = Math.max(confidence, 0.8);
    }

    // Unverified assumptions always block.
    if (validationResults?.invalid?.length > 0) {
      for (const invalid of validationResults.invalid) {
        violations.push(`Unverified assumption: ${invalid.assumption?.key || invalid.assumption?.type}`);
      }
      reasoning.push(`${validationResults.invalid.length} assumptions could not be verified`);
      verdict = "BLOCK";
      // Keep the higher confidence already earned by an earlier check.
      confidence = Math.max(confidence, 0.85);
    }

    // Vague proposals need a human to confirm.
    const vaguenessCheck = this.ruleBasedVaguenessCheck(proposal);
    if (vaguenessCheck.specificityScore < 4) {
      violations.push("Proposal is too vague");
      reasoning.push(`Specificity score: ${vaguenessCheck.specificityScore}/10`);
      if (verdict === "ALLOW") verdict = "REQUIRE_CONFIRMATION";
    }

    // Sensitive domains are detected by substring match on operation paths.
    const sensitiveDomains = ["auth", "payments", "database"];
    const touchesSensitive = (proposal.operations || []).some((op) => {
      const path = (op.path || "").toLowerCase();
      return sensitiveDomains.some((d) => path.includes(d));
    });

    if (touchesSensitive && !proposal.riskAcknowledgment) {
      violations.push("Touches sensitive domains without risk acknowledgment");
      reasoning.push("Changes to auth/payments/database require explicit acknowledgment");
      if (verdict === "ALLOW") verdict = "REQUIRE_CONFIRMATION";
    }

    if (violations.length === 0) {
      reasoning.push("No violations detected");
    }

    return {
      verdict,
      confidence,
      reasoning,
      violations,
      recommendations: violations.length > 0
        ? ["Address violations before proceeding", "Add missing assumptions"]
        : [],
    };
  }

  /**
   * Rule-based vagueness check
   *
   * Starts from a specificity score of 10 and subtracts points for a
   * single-word generic intent, a missing or short summary, missing
   * assumptions, many operations with little explanation, and vague words in
   * the summary. The score never drops below 1.
   *
   * @param {Object} proposal - Proposal to check
   * @returns {Object} Vagueness analysis: `specificityScore`, `vagueTerms`, `suggestions`
   */
  ruleBasedVaguenessCheck(proposal) {
    const vagueTerms = [];
    let specificityScore = 10;

    // Intents are underscore-separated; only a lone generic verb is penalized.
    const vagueIntents = ["fix", "update", "change", "modify", "improve", "refactor", "adjust"];
    const intentWords = (proposal.intent || "").toLowerCase().split("_");

    if (intentWords.length === 1 && vagueIntents.includes(intentWords[0])) {
      vagueTerms.push(proposal.intent);
      specificityScore -= 3;
    }

    if (!proposal.summary) {
      specificityScore -= 2;
    } else if (proposal.summary.length < 20) {
      specificityScore -= 1;
    }

    if (!proposal.assumptions || proposal.assumptions.length === 0) {
      specificityScore -= 2;
    }

    // Many operations need a correspondingly detailed summary.
    const opCount = (proposal.operations || []).length;
    if (opCount > 3 && (!proposal.summary || proposal.summary.length < 50)) {
      specificityScore -= 2;
    }

    // Match whole words only, so "fetch" is not flagged for "etc" and
    // "awesome" is not flagged for "some".
    const vagueWords = ["some", "various", "etc", "stuff", "things", "somehow"];
    if (proposal.summary) {
      for (const word of vagueWords) {
        if (new RegExp(`\\b${word}\\b`, "i").test(proposal.summary)) {
          vagueTerms.push(word);
          specificityScore -= 1;
        }
      }
    }

    specificityScore = Math.max(1, specificityScore);

    return {
      specificityScore,
      vagueTerms,
      suggestions: vagueTerms.length > 0
        ? [`Replace vague terms: ${vagueTerms.join(", ")}`, "Add specific details"]
        : [],
    };
  }

  /**
   * Rule-based assumption verification
   * @param {Array} assumptions - Assumptions to verify; anything that is not
   *   an array is treated as an empty list
   * @param {Object} realityState - Repository state; reads `envVars` and
   *   `files` through `.has()` and `routes` and `services` through `.some()`
   * @returns {Object} `results` (one entry per assumption) and
   *   `overallVerificationRate` (1 when there are no assumptions)
   */
  ruleBasedAssumptionVerification(assumptions, realityState) {
    const pending = Array.isArray(assumptions) ? assumptions : [];
    const results = [];
    let verifiedCount = 0;

    for (const assumption of pending) {
      let verified = false;
      let evidence = null;
      let reason = "";

      switch (assumption.type) {
        case "env": {
          if (realityState?.envVars?.has(assumption.key)) {
            verified = true;
            evidence = `Found in env vars: ${assumption.key}`;
          } else {
            reason = `Env var '${assumption.key}' not found in declared variables`;
          }
          break;
        }

        case "route": {
          // An assumption without a method matches a route with any method.
          const routeExists = realityState?.routes?.some((r) =>
            r.path === assumption.path &&
            (r.method === assumption.method || !assumption.method)
          );
          if (routeExists) {
            verified = true;
            evidence = `Route ${assumption.method || "GET"} ${assumption.path} is registered`;
          } else {
            reason = `Route ${assumption.path} not found in registered routes`;
          }
          break;
        }

        case "service": {
          const serviceExists = realityState?.services?.some((s) =>
            s.name === assumption.key || s.name === assumption.name
          );
          if (serviceExists) {
            verified = true;
            evidence = `Service ${assumption.key || assumption.name} is registered`;
          } else {
            reason = `Service ${assumption.key || assumption.name} not found`;
          }
          break;
        }

        case "file": {
          // Backslashes are converted to forward slashes before the lookup.
          if (realityState?.files?.has(assumption.path?.replace(/\\/g, "/"))) {
            verified = true;
            evidence = `File ${assumption.path} exists`;
          } else {
            reason = `File ${assumption.path} not found`;
          }
          break;
        }

        default:
          reason = `Unknown assumption type: ${assumption.type}`;
      }

      if (verified) verifiedCount++;

      results.push({
        assumption: assumption.key || assumption.path || assumption.type,
        verified,
        evidence,
        reason,
      });
    }

    return {
      results,
      overallVerificationRate: pending.length > 0
        ? verifiedCount / pending.length
        : 1,
    };
  }
}
|
|
413
|
-
|
|
414
|
-
/**
 * Factory wrapper around the CriticJudge constructor.
 * @param {Object} options - Configuration options forwarded unchanged
 * @returns {CriticJudge} Newly constructed judge
 */
function createJudge(options = {}) {
  const judge = new CriticJudge(options);
  return judge;
}
|
|
422
|
-
|
|
423
|
-
/**
 * Shared judge built with default options. No LLM client is attached, so it
 * uses the rule-based paths until setClient() is called.
 */
const defaultJudge = createJudge({});

module.exports = { CriticJudge, createJudge, defaultJudge };
|