@vibecheckai/cli 3.0.4 → 3.0.7

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (108)
  1. package/bin/dev/run-v2-torture.js +30 -0
  2. package/bin/runners/context/index.js +1 -1
  3. package/bin/runners/lib/analyzers.js +38 -0
  4. package/bin/runners/lib/assets/vibecheck-logo.png +0 -0
  5. package/bin/runners/lib/contracts/auth-contract.js +8 -0
  6. package/bin/runners/lib/contracts/env-contract.js +3 -0
  7. package/bin/runners/lib/contracts/external-contract.js +10 -2
  8. package/bin/runners/lib/contracts/route-contract.js +7 -0
  9. package/bin/runners/lib/contracts.js +804 -0
  10. package/bin/runners/lib/detectors-v2.js +703 -0
  11. package/bin/runners/lib/drift.js +425 -0
  12. package/bin/runners/lib/entitlements-v2.js +3 -1
  13. package/bin/runners/lib/entitlements.js +11 -3
  14. package/bin/runners/lib/env-resolver.js +417 -0
  15. package/bin/runners/lib/extractors/client-calls.js +990 -0
  16. package/bin/runners/lib/extractors/fastify-route-dump.js +573 -0
  17. package/bin/runners/lib/extractors/fastify-routes.js +426 -0
  18. package/bin/runners/lib/extractors/index.js +363 -0
  19. package/bin/runners/lib/extractors/next-routes.js +524 -0
  20. package/bin/runners/lib/extractors/proof-graph.js +431 -0
  21. package/bin/runners/lib/extractors/route-matcher.js +451 -0
  22. package/bin/runners/lib/extractors/truthpack-v2.js +377 -0
  23. package/bin/runners/lib/extractors/ui-bindings.js +547 -0
  24. package/bin/runners/lib/findings-schema.js +281 -0
  25. package/bin/runners/lib/html-report.js +650 -0
  26. package/bin/runners/lib/missions/templates.js +45 -0
  27. package/bin/runners/lib/policy.js +295 -0
  28. package/bin/runners/lib/reality/correlation-detectors.js +359 -0
  29. package/bin/runners/lib/reality/index.js +318 -0
  30. package/bin/runners/lib/reality/request-hashing.js +416 -0
  31. package/bin/runners/lib/reality/request-mapper.js +453 -0
  32. package/bin/runners/lib/reality/safety-rails.js +463 -0
  33. package/bin/runners/lib/reality/semantic-snapshot.js +408 -0
  34. package/bin/runners/lib/reality/toast-detector.js +393 -0
  35. package/bin/runners/lib/report-html.js +5 -0
  36. package/bin/runners/lib/report-templates.js +5 -0
  37. package/bin/runners/lib/report.js +135 -0
  38. package/bin/runners/lib/route-truth.js +10 -10
  39. package/bin/runners/lib/schema-validator.js +350 -0
  40. package/bin/runners/lib/schemas/contracts.schema.json +160 -0
  41. package/bin/runners/lib/schemas/finding.schema.json +100 -0
  42. package/bin/runners/lib/schemas/mission-pack.schema.json +206 -0
  43. package/bin/runners/lib/schemas/proof-graph.schema.json +176 -0
  44. package/bin/runners/lib/schemas/reality-report.schema.json +162 -0
  45. package/bin/runners/lib/schemas/share-pack.schema.json +180 -0
  46. package/bin/runners/lib/schemas/ship-report.schema.json +117 -0
  47. package/bin/runners/lib/schemas/truthpack-v2.schema.json +303 -0
  48. package/bin/runners/lib/schemas/validator.js +438 -0
  49. package/bin/runners/lib/ui.js +562 -0
  50. package/bin/runners/lib/verdict-engine.js +628 -0
  51. package/bin/runners/runAIAgent.js +228 -1
  52. package/bin/runners/runBadge.js +181 -1
  53. package/bin/runners/runCtx.js +7 -2
  54. package/bin/runners/runCtxDiff.js +301 -0
  55. package/bin/runners/runGuard.js +168 -0
  56. package/bin/runners/runInitGha.js +78 -15
  57. package/bin/runners/runLabs.js +341 -0
  58. package/bin/runners/runLaunch.js +180 -1
  59. package/bin/runners/runMdc.js +203 -1
  60. package/bin/runners/runProof.zip +0 -0
  61. package/bin/runners/runProve.js +23 -0
  62. package/bin/runners/runReplay.js +114 -84
  63. package/bin/runners/runScan.js +111 -32
  64. package/bin/runners/runShip.js +23 -2
  65. package/bin/runners/runTruthpack.js +9 -7
  66. package/bin/runners/runValidate.js +161 -1
  67. package/bin/vibecheck.js +416 -770
  68. package/mcp-server/.guardrail/audit/audit.log.jsonl +2 -0
  69. package/mcp-server/.specs/architecture.mdc +90 -0
  70. package/mcp-server/.specs/security.mdc +30 -0
  71. package/mcp-server/README.md +252 -0
  72. package/mcp-server/agent-checkpoint.js +364 -0
  73. package/mcp-server/architect-tools.js +707 -0
  74. package/mcp-server/audit-mcp.js +206 -0
  75. package/mcp-server/codebase-architect-tools.js +838 -0
  76. package/mcp-server/consolidated-tools.js +804 -0
  77. package/mcp-server/hygiene-tools.js +428 -0
  78. package/mcp-server/index-v1.js +698 -0
  79. package/mcp-server/index.js +2092 -0
  80. package/mcp-server/index.old.js +4137 -0
  81. package/mcp-server/intelligence-tools.js +664 -0
  82. package/mcp-server/intent-drift-tools.js +873 -0
  83. package/mcp-server/mdc-generator.js +298 -0
  84. package/mcp-server/package-lock.json +165 -0
  85. package/mcp-server/package.json +47 -0
  86. package/mcp-server/premium-tools.js +1275 -0
  87. package/mcp-server/test-mcp.js +108 -0
  88. package/mcp-server/test-tools.js +36 -0
  89. package/mcp-server/tier-auth.js +147 -0
  90. package/mcp-server/tools/index.js +72 -0
  91. package/mcp-server/tools-reorganized.ts +244 -0
  92. package/mcp-server/truth-context.js +581 -0
  93. package/mcp-server/truth-firewall-tools.js +1500 -0
  94. package/mcp-server/vibecheck-2.0-tools.js +748 -0
  95. package/mcp-server/vibecheck-tools.js +1075 -0
  96. package/package.json +10 -8
  97. package/bin/guardrail.js +0 -834
  98. package/bin/runners/runAudit.js +0 -2
  99. package/bin/runners/runAutopilot.js +0 -2
  100. package/bin/runners/runCertify.js +0 -2
  101. package/bin/runners/runDashboard.js +0 -10
  102. package/bin/runners/runEnhancedShip.js +0 -2
  103. package/bin/runners/runFixPacks.js +0 -2
  104. package/bin/runners/runNaturalLanguage.js +0 -3
  105. package/bin/runners/runProof.js +0 -2
  106. package/bin/runners/runRealitySniff.js +0 -2
  107. package/bin/runners/runUpgrade.js +0 -2
  108. package/bin/runners/runVerifyAgentOutput.js +0 -2
@@ -0,0 +1,408 @@
1
+ /**
2
+ * Semantic Snapshot v2
3
+ *
4
+ * Creates stable, lightweight UI fingerprints for meaningful change detection.
5
+ * Captures accessible DOM features while filtering noise.
6
+ */
7
+
8
+ "use strict";
9
+
10
+ const crypto = require("crypto");
11
+
12
+ // =============================================================================
13
+ // CONSTANTS
14
+ // =============================================================================
15
+
// Lower-case tag names listed for exclusion from snapshots.
// NOTE(review): the in-browser capture script keeps its own copy of this
// list (which additionally contains "svg"); confirm which list is canonical.
const IGNORE_TAGS = new Set([
  "script",
  "style",
  "link",
  "meta",
  "noscript",
  "template",
]);

// CSS selectors listed for exclusion. They look like framework/overlay
// scaffolding (Next.js portals, build indicators) — TODO confirm with the
// consumer of this export, since nothing in this file reads the list.
const IGNORE_SELECTORS = [
  "[data-hydration]",
  "[data-nextjs-scroll-focus-boundary]",
  "nextjs-portal",
  "[data-overlay-container]",
  "#__next-build-watcher",
  "#__next-prerender-indicator",
];

// ARIA roles considered meaningful. Exported for consumers; not read here.
const MEANINGFUL_ROLES = new Set([
  "button",
  "link",
  "textbox",
  "checkbox",
  "radio",
  "combobox",
  "listbox",
  "menu",
  "menuitem",
  "tab",
  "tabpanel",
  "dialog",
  "alert",
  "alertdialog",
  "status",
  "progressbar",
  "form",
  "navigation",
  "main",
  "region",
  "banner",
  "contentinfo",
]);

// Whole-string clock time such as "9:05", "12:30:45" or "12:30 PM".
const TIMESTAMP_REGEX = /^\d{1,2}:\d{2}(:\d{2})?\s*(AM|PM)?$/i;

// Whole-string duration such as "1.5s", "200 ms" or "30 seconds".
const TIMER_REGEX = /^\d+(\.\d+)?\s*(s|ms|sec|seconds?)$/i;
38
+
39
+ // =============================================================================
40
+ // SEMANTIC SNAPSHOT CAPTURE (runs in browser context)
41
+ // =============================================================================
42
+
/**
 * Browser-side capture script for the semantic snapshot.
 *
 * The string contains a single parenthesised function expression,
 * `captureSemanticSnapshot(options)`. It is NOT invoked inside the string, so
 * whoever injects it (e.g. through Playwright's page.evaluate) has to call the
 * resulting function — TODO confirm how the caller invokes it.
 *
 * Options (all optional):
 *   - regions          selectors tried in order; the first match is walked
 *   - includeDialogs   also walk open dialogs/modals found anywhere in the page
 *   - maxTextLength    accessible names are truncated to this many characters
 *   - ignoreTimestamps drop nodes whose name is only a clock time or a timer
 *
 * Returns `{ nodes, counts, errorCount, disabledCount, region, url, timestamp }`.
 *
 * Because this is a template literal, every regex backslash is doubled and the
 * script body must not contain backticks or dollar-brace sequences.
 */
const CAPTURE_SCRIPT = `
(function captureSemanticSnapshot(options = {}) {
  const {
    regions = ['main', '#__next', '[role="main"]', 'body'],
    includeDialogs = true,
    maxTextLength = 80,
    ignoreTimestamps = true,
  } = options;

  const IGNORE_TAGS = new Set(['script', 'style', 'link', 'meta', 'noscript', 'template', 'svg']);
  const TIMESTAMP_RE = /^\\d{1,2}:\\d{2}(:\\d{2})?\\s*(AM|PM)?$/i;
  const TIMER_RE = /^\\d+(\\.\\d+)?\\s*(s|ms|sec|seconds?)$/i;

  // Implicit roles for tags whose role does not depend on attributes.
  // <input> is handled separately because its role depends on its type.
  const TAG_ROLES = new Map([
    ['button', 'button'], ['a', 'link'], ['select', 'combobox'],
    ['textarea', 'textbox'], ['nav', 'navigation'], ['main', 'main'],
    ['header', 'banner'], ['footer', 'contentinfo'], ['dialog', 'dialog'],
    ['form', 'form'], ['img', 'img'],
  ]);

  // Elements already visited. A dialog that lives inside the main region is
  // matched again by the dialog query; this keeps it from being counted twice.
  const seen = new Set();

  // label[for] index (first label per target wins, like querySelector).
  // Looking labels up by key avoids building a selector from an arbitrary id,
  // which throws when the id contains a quote.
  const labelsByFor = new Map();
  for (const label of document.querySelectorAll('label[for]')) {
    const target = label.getAttribute('for');
    if (target && !labelsByFor.has(target)) labelsByFor.set(target, label);
  }

  function normalizeText(text) {
    if (!text) return '';
    let t = text.trim().replace(/\\s+/g, ' ');
    if (t.length > maxTextLength) t = t.slice(0, maxTextLength) + '...';
    return t;
  }

  function isTimestamp(text) {
    if (!ignoreTimestamps) return false;
    return TIMESTAMP_RE.test(text) || TIMER_RE.test(text);
  }

  function getAccessibleName(el) {
    // aria-label takes precedence
    const ariaLabel = el.getAttribute('aria-label');
    if (ariaLabel) return normalizeText(ariaLabel);

    // aria-labelledby is a space-separated list of ids; join the referenced text
    const labelledBy = el.getAttribute('aria-labelledby');
    if (labelledBy) {
      const refs = labelledBy.trim().split(/\\s+/)
        .map((id) => document.getElementById(id))
        .filter(Boolean);
      if (refs.length > 0) {
        return normalizeText(refs.map((ref) => ref.textContent || '').join(' '));
      }
    }

    // Associated <label for="...">
    if (el.id) {
      const label = labelsByFor.get(el.id);
      if (label) return normalizeText(label.textContent);
    }

    // Fallback to text content for buttons/links
    if (['BUTTON', 'A'].includes(el.tagName)) {
      return normalizeText(el.textContent);
    }
    return '';
  }

  function getRole(el) {
    const explicit = el.getAttribute('role');
    if (explicit) return explicit;

    const tag = el.tagName.toLowerCase();
    if (tag === 'input') {
      // Must run before the generic tag lookup, otherwise every input is a textbox.
      const type = (el.type || '').toLowerCase();
      if (type === 'checkbox') return 'checkbox';
      if (type === 'radio') return 'radio';
      if (type === 'submit' || type === 'button') return 'button';
      return 'textbox';
    }
    return TAG_ROLES.get(tag) || null;
  }

  // Builds the snapshot node for a visible element, or null when the element's
  // name is just a timestamp/timer.
  function extractNode(el) {
    const role = getRole(el);
    const name = getAccessibleName(el);

    // Skip if text looks like timestamp
    if (name && isTimestamp(name)) return null;

    const node = {
      tag: el.tagName.toLowerCase(),
      role: role,
      name: name || undefined,
      disabled: el.disabled || el.getAttribute('aria-disabled') === 'true' || undefined,
      invalid: el.getAttribute('aria-invalid') === 'true' || undefined,
      href: el.tagName === 'A' ? el.getAttribute('href')?.split('?')[0] : undefined,
      type: el.tagName === 'INPUT' ? el.type : undefined,
      checked: (el.type === 'checkbox' || el.type === 'radio') ? el.checked : undefined,
      value: el.tagName === 'INPUT' && el.type !== 'password' ? (el.value?.slice(0, 50) || undefined) : undefined,
    };

    // Clean undefined
    Object.keys(node).forEach(k => node[k] === undefined && delete node[k]);

    return node;
  }

  // Records one element (when it carries a role or a name) and then its subtree.
  function visit(el, nodes, depth) {
    if (!el || el.nodeType !== 1 || seen.has(el)) return;
    seen.add(el);

    // These conditions hide the whole subtree, so do not descend.
    if (IGNORE_TAGS.has(el.tagName.toLowerCase())) return;
    if (el.hidden || el.getAttribute('aria-hidden') === 'true') return;
    const style = window.getComputedStyle(el);
    if (style.display === 'none') return;

    // visibility:hidden can be overridden by a descendant, so only the element
    // itself is skipped and the walk continues below it.
    if (style.visibility !== 'hidden') {
      const node = extractNode(el);
      if (node && (node.role || node.name)) {
        nodes.push(node);
      }
    }
    walkTree(el, nodes, depth + 1);
  }

  function walkTree(root, nodes = [], depth = 0) {
    if (depth > 20) return nodes; // Depth cap for very deep trees

    for (const el of root.children || []) {
      visit(el, nodes, depth);
    }
    return nodes;
  }

  // Find main region
  let mainRegion = null;
  for (const selector of regions) {
    mainRegion = document.querySelector(selector);
    if (mainRegion) break;
  }

  const nodes = [];
  if (mainRegion) {
    walkTree(mainRegion, nodes);
  }

  // Add dialogs/modals. The dialog element itself is visited too, so a dialog
  // rendered outside the main region still shows up in counts.dialog.
  if (includeDialogs) {
    const dialogs = document.querySelectorAll('[role="dialog"], [aria-modal="true"], [data-state="open"]');
    for (const dialog of dialogs) {
      visit(dialog, nodes, 0);
    }
  }

  // Count by role
  const counts = {};
  for (const n of nodes) {
    if (n.role) {
      counts[n.role] = (counts[n.role] || 0) + 1;
    }
  }

  // Count errors
  const errorCount = nodes.filter(n => n.invalid).length;
  const disabledCount = nodes.filter(n => n.disabled).length;

  return {
    nodes: nodes,
    counts: counts,
    errorCount: errorCount,
    disabledCount: disabledCount,
    region: mainRegion?.tagName?.toLowerCase() || 'body',
    url: window.location.pathname + window.location.search,
    timestamp: Date.now(),
  };
})
`;
201
+
/**
 * Compute a short, order-independent fingerprint of a semantic snapshot.
 *
 * Only nodes that carry a role or a name take part, each reduced to
 * `role:name:d?:i?` (disabled / invalid flags). Node strings are sorted and
 * the keys of `counts` are sorted too, so the hash does not depend on the
 * order in which the DOM was traversed. `url` is included; `timestamp` is not.
 *
 * A snapshot without a `nodes` array is hashed as if it had no nodes instead
 * of throwing, matching the tolerance of diffSnapshots.
 *
 * @param {{nodes?: Array<object>, counts?: object, url?: string}} snapshot
 * @returns {string} "sha256:" followed by the first 16 hex chars of the digest
 */
function computeSemanticHash(snapshot) {
  const nodes = Array.isArray(snapshot?.nodes) ? snapshot.nodes : [];

  const significantNodes = nodes
    .filter((n) => n && (n.role || n.name))
    .map((n) => `${n.role || ""}:${n.name || ""}:${n.disabled ? "d" : ""}:${n.invalid ? "i" : ""}`)
    .sort();

  // JSON.stringify follows key insertion order, which for `counts` is the DOM
  // traversal order. Sort the keys so equal counts always serialize equally.
  const rawCounts = snapshot?.counts;
  const counts =
    rawCounts && typeof rawCounts === "object" && !Array.isArray(rawCounts)
      ? Object.fromEntries(
          Object.entries(rawCounts).sort(([a], [b]) => (a < b ? -1 : a > b ? 1 : 0))
        )
      : rawCounts;

  const content = JSON.stringify({
    nodes: significantNodes,
    counts,
    url: snapshot?.url,
  });

  return "sha256:" + crypto.createHash("sha256").update(content).digest("hex").slice(0, 16);
}
220
+
/**
 * Group snapshot nodes by their `role:name` identity key, keeping every
 * occurrence in original order.
 */
function groupNodesByKey(nodes) {
  const groups = new Map();
  for (const node of nodes || []) {
    if (!node) continue;
    const key = `${node.role || ""}:${node.name || ""}`;
    const bucket = groups.get(key);
    if (bucket) {
      bucket.push(node);
    } else {
      groups.set(key, [node]);
    }
  }
  return groups;
}

/** Human-readable label for a node: "<role or tag>: <name or (unnamed)>". */
function describeNode(node) {
  return `${node.role || node.tag}: ${node.name || "(unnamed)"}`;
}

/** List the state flags (disabled / invalid / checked) that differ between two nodes. */
function describeStateChanges(beforeNode, afterNode) {
  const changes = [];
  // Flags are compared as booleans so that `false` and a missing property are
  // treated as the same state.
  if (Boolean(beforeNode.disabled) !== Boolean(afterNode.disabled)) {
    changes.push(afterNode.disabled ? "disabled" : "enabled");
  }
  if (Boolean(beforeNode.invalid) !== Boolean(afterNode.invalid)) {
    changes.push(afterNode.invalid ? "invalid" : "valid");
  }
  if (Boolean(beforeNode.checked) !== Boolean(afterNode.checked)) {
    changes.push(afterNode.checked ? "checked" : "unchecked");
  }
  return changes;
}

/**
 * Compare two semantic snapshots and generate a diff.
 *
 * Nodes are matched on `role:name`. When several nodes share a key they are
 * paired in order of appearance; surplus nodes on either side are reported as
 * added / removed, so duplicates (e.g. a second identical "Delete" button)
 * are no longer collapsed into one entry.
 *
 * @param {object} before snapshot taken before the action (null/undefined is treated as empty)
 * @param {object} after  snapshot taken after the action (null/undefined is treated as empty)
 * @returns {{added: string[], removed: string[], changed: string[],
 *            routeChanged: boolean, errorsChanged: boolean, errorDelta: number,
 *            dialogOpened: boolean, dialogClosed: boolean}}
 */
function diffSnapshots(before, after) {
  const prev = before ?? {};
  const next = after ?? {};

  const diff = {
    added: [],
    removed: [],
    changed: [],
  };

  const beforeGroups = groupNodesByKey(prev.nodes);
  const afterGroups = groupNodesByKey(next.nodes);

  // Added nodes and state changes
  for (const [key, afterNodes] of afterGroups) {
    const beforeNodes = beforeGroups.get(key) ?? [];
    afterNodes.forEach((node, index) => {
      const beforeNode = beforeNodes[index];
      if (!beforeNode) {
        diff.added.push(describeNode(node));
        return;
      }
      const changes = describeStateChanges(beforeNode, node);
      if (changes.length > 0) {
        diff.changed.push(`${describeNode(node)} -> ${changes.join(", ")}`);
      }
    });
  }

  // Removed nodes: everything on the before side without a partner
  for (const [key, beforeNodes] of beforeGroups) {
    const survivors = afterGroups.get(key)?.length ?? 0;
    for (const node of beforeNodes.slice(survivors)) {
      diff.removed.push(describeNode(node));
    }
  }

  // Route change
  diff.routeChanged = prev.url !== next.url;

  // Error count change. Derived from the delta so that a missing count and 0
  // are not reported as a change with delta 0.
  diff.errorDelta = (next.errorCount || 0) - (prev.errorCount || 0);
  diff.errorsChanged = diff.errorDelta !== 0;

  // Dialog changes
  const beforeDialogCount = prev.counts?.dialog || 0;
  const afterDialogCount = next.counts?.dialog || 0;
  diff.dialogOpened = afterDialogCount > beforeDialogCount;
  diff.dialogClosed = afterDialogCount < beforeDialogCount;

  return diff;
}
290
+
/**
 * Calculate a "meaningful change" score from a snapshot diff plus UI signals.
 *
 * Each detected kind of change adds a fixed weight and a reason string; the
 * total is capped at 1.0. The change is `meaningful` when the score reaches
 * 0.6 or the route changed.
 *
 * @param {object} diff result of diffSnapshots (missing arrays count as empty)
 * @param {Array<{kind?: string}>} [signals] toast/alert signals; non-arrays count as none
 * @returns {{score: number, meaningful: boolean, reasons: string[]}}
 */
function calculateChangeScore(diff, signals = []) {
  const signalList = Array.isArray(signals) ? signals : [];
  const added = diff.added ?? [];
  const removed = diff.removed ?? [];
  const changed = diff.changed ?? [];

  const hasSignal = (kind) => signalList.some((s) => s?.kind === kind);

  let score = 0;
  const reasons = [];

  // Route change is always meaningful
  if (diff.routeChanged) {
    score += 1.0;
    reasons.push("route_changed");
  }

  // Dialog opened/closed
  if (diff.dialogOpened) {
    score += 0.8;
    reasons.push("dialog_opened");
  }
  if (diff.dialogClosed) {
    score += 0.8;
    reasons.push("dialog_closed");
  }

  // Toast signals
  const toastSuccess = hasSignal("toast_success");
  const toastError = hasSignal("toast_error");
  const toastAny = signalList.some(
    (s) => typeof s?.kind === "string" && s.kind.startsWith("toast_")
  );

  if (toastSuccess) {
    score += 0.6;
    reasons.push("toast_success");
  }
  if (toastError) {
    score += 0.6;
    reasons.push("toast_error");
  } else if (toastAny && !toastSuccess) {
    // Some other toast kind: weaker evidence than an explicit success/error
    score += 0.5;
    reasons.push("toast_appeared");
  }

  // Alert banner (role=alert, aria-live)
  if (hasSignal("alert_appeared")) {
    score += 0.7;
    reasons.push("alert_banner");
  }

  // Form errors changed
  if (diff.errorsChanged) {
    score += 0.7;
    reasons.push(diff.errorDelta > 0 ? "form_errors_appeared" : "form_errors_cleared");
  }

  // Significant semantic diff
  const significantChanges = added.length + removed.length + changed.length;
  if (significantChanges > 2) {
    score += 0.7;
    reasons.push("semantic_hash_changed");
  } else if (significantChanges > 0) {
    score += 0.3;
    reasons.push("minor_semantic_change");
  }

  // Key control state changed (disabled/enabled). Entries look like
  // "<role>: <name> -> <state>, <state>"; only the state list after the last
  // arrow is inspected, so a node NAME containing "enabled"/"disabled" does
  // not trigger this rule.
  const controlStateChanged = changed.some((entry) => {
    const text = String(entry);
    const arrowAt = text.lastIndexOf(" -> ");
    const states = (arrowAt === -1 ? text : text.slice(arrowAt + 4)).split(", ");
    return states.includes("enabled") || states.includes("disabled");
  });
  if (controlStateChanged) {
    score += 0.6;
    reasons.push("control_state_changed");
  }

  // Cap at 1.0
  score = Math.min(score, 1.0);

  return {
    score,
    meaningful: score >= 0.6 || diff.routeChanged,
    reasons,
  };
}
370
+
/**
 * Build the UI change report for one before/after snapshot pair.
 *
 * Hashes both snapshots, diffs them, scores the diff together with the given
 * signals, and returns everything in one flat object. Each diff list in
 * `semanticDiffSummary` is limited to its first 10 entries.
 *
 * @param {object} before snapshot captured before the action
 * @param {object} after  snapshot captured after the action
 * @param {Array<object>} [signals] extra signals forwarded to calculateChangeScore
 * @returns {object} report with score, meaningful, reasons, both hashes,
 *                   the truncated diff summary and the diff's boolean flags
 */
function createUIChangeReport(before, after, signals = []) {
  const SUMMARY_LIMIT = 10;
  const head = (entries) => entries.slice(0, SUMMARY_LIMIT);

  const beforeSemanticHash = computeSemanticHash(before);
  const afterSemanticHash = computeSemanticHash(after);
  const delta = diffSnapshots(before, after);
  const verdict = calculateChangeScore(delta, signals);

  return {
    score: verdict.score,
    meaningful: verdict.meaningful,
    reasons: verdict.reasons,
    beforeSemanticHash,
    afterSemanticHash,
    semanticDiffSummary: {
      added: head(delta.added),
      removed: head(delta.removed),
      changed: head(delta.changed),
    },
    routeChanged: delta.routeChanged,
    dialogOpened: delta.dialogOpened,
    dialogClosed: delta.dialogClosed,
    errorsChanged: delta.errorsChanged,
    errorDelta: delta.errorDelta,
  };
}
398
+
399
+ module.exports = {
400
+ CAPTURE_SCRIPT,
401
+ computeSemanticHash,
402
+ diffSnapshots,
403
+ calculateChangeScore,
404
+ createUIChangeReport,
405
+ IGNORE_TAGS,
406
+ IGNORE_SELECTORS,
407
+ MEANINGFUL_ROLES,
408
+ };