thumbgate 0.9.10

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (364) hide show
  1. package/.claude-plugin/README.md +134 -0
  2. package/.claude-plugin/bundle/icon.png +0 -0
  3. package/.claude-plugin/bundle/icon.svg +18 -0
  4. package/.claude-plugin/bundle/server/index.js +24 -0
  5. package/.claude-plugin/marketplace.json +36 -0
  6. package/.claude-plugin/plugin.json +21 -0
  7. package/.well-known/mcp/server-card.json +231 -0
  8. package/LICENSE +21 -0
  9. package/README.md +375 -0
  10. package/adapters/README.md +9 -0
  11. package/adapters/amp/skills/thumbgate-feedback/SKILL.md +22 -0
  12. package/adapters/chatgpt/INSTALL.md +83 -0
  13. package/adapters/chatgpt/openapi.yaml +1281 -0
  14. package/adapters/claude/.mcp.json +14 -0
  15. package/adapters/codex/config.toml +9 -0
  16. package/adapters/gemini/function-declarations.json +224 -0
  17. package/adapters/mcp/server-stdio.js +788 -0
  18. package/adapters/opencode/opencode.json +15 -0
  19. package/bin/cli.js +1484 -0
  20. package/bin/memory.sh +64 -0
  21. package/bin/obsidian-sync.sh +20 -0
  22. package/bin/postinstall.js +37 -0
  23. package/config/build-metadata.json +4 -0
  24. package/config/e2e-critical-flows.json +45 -0
  25. package/config/gate-templates.json +77 -0
  26. package/config/gates/claim-verification.json +29 -0
  27. package/config/gates/computer-use.json +39 -0
  28. package/config/gates/default.json +117 -0
  29. package/config/github-about.json +25 -0
  30. package/config/mcp-allowlists.json +135 -0
  31. package/config/model-tiers.json +33 -0
  32. package/config/partner-routing.json +132 -0
  33. package/config/policy-bundles/constrained-v1.json +64 -0
  34. package/config/policy-bundles/default-v1.json +91 -0
  35. package/config/rubrics/default-v1.json +52 -0
  36. package/config/skill-packs/react-testing.json +23 -0
  37. package/config/skill-packs/stripe-integration/references/api-spec.json +1 -0
  38. package/config/skill-packs/stripe-integration/references/webhook-guide.md +3 -0
  39. package/config/skill-specs/pr-reviewer.json +9 -0
  40. package/config/skill-specs/release-status.json +9 -0
  41. package/config/skill-specs/ticket-triage.json +9 -0
  42. package/config/subagent-profiles.json +32 -0
  43. package/config/tessl-tiles.json +29 -0
  44. package/config/thumbgate-settings.managed.json +12 -0
  45. package/openapi/openapi.yaml +1281 -0
  46. package/package.json +283 -0
  47. package/plugins/amp-skill/INSTALL.md +52 -0
  48. package/plugins/amp-skill/SKILL.md +64 -0
  49. package/plugins/claude-codex-bridge/.claude-plugin/plugin.json +22 -0
  50. package/plugins/claude-codex-bridge/.mcp.json +12 -0
  51. package/plugins/claude-codex-bridge/INSTALL.md +43 -0
  52. package/plugins/claude-codex-bridge/README.md +46 -0
  53. package/plugins/claude-codex-bridge/scripts/codex-bridge.js +288 -0
  54. package/plugins/claude-codex-bridge/skills/adversarial-review/SKILL.md +24 -0
  55. package/plugins/claude-codex-bridge/skills/result/SKILL.md +22 -0
  56. package/plugins/claude-codex-bridge/skills/review/SKILL.md +28 -0
  57. package/plugins/claude-codex-bridge/skills/second-pass/SKILL.md +27 -0
  58. package/plugins/claude-codex-bridge/skills/setup/SKILL.md +21 -0
  59. package/plugins/claude-codex-bridge/skills/status/SKILL.md +19 -0
  60. package/plugins/claude-skill/INSTALL.md +55 -0
  61. package/plugins/claude-skill/SKILL.md +46 -0
  62. package/plugins/codex-profile/.codex-plugin/plugin.json +43 -0
  63. package/plugins/codex-profile/.mcp.json +12 -0
  64. package/plugins/codex-profile/AGENTS.md +20 -0
  65. package/plugins/codex-profile/INSTALL.md +66 -0
  66. package/plugins/codex-profile/README.md +37 -0
  67. package/plugins/cursor-marketplace/.cursor-plugin/plugin.json +23 -0
  68. package/plugins/cursor-marketplace/CHANGELOG.md +30 -0
  69. package/plugins/cursor-marketplace/LICENSE +21 -0
  70. package/plugins/cursor-marketplace/README.md +124 -0
  71. package/plugins/cursor-marketplace/agents/reliability-reviewer.md +31 -0
  72. package/plugins/cursor-marketplace/assets/logo-400x400.png +0 -0
  73. package/plugins/cursor-marketplace/commands/capture-feedback.md +33 -0
  74. package/plugins/cursor-marketplace/commands/check-gates.md +25 -0
  75. package/plugins/cursor-marketplace/commands/show-lessons.md +27 -0
  76. package/plugins/cursor-marketplace/hooks/hooks.json +10 -0
  77. package/plugins/cursor-marketplace/mcp.json +12 -0
  78. package/plugins/cursor-marketplace/rules/feedback-capture.mdc +34 -0
  79. package/plugins/cursor-marketplace/rules/pre-action-gates.mdc +30 -0
  80. package/plugins/cursor-marketplace/rules/session-continuity.mdc +28 -0
  81. package/plugins/cursor-marketplace/scripts/gate-check.sh +11 -0
  82. package/plugins/cursor-marketplace/skills/capture-feedback/SKILL.md +47 -0
  83. package/plugins/cursor-marketplace/skills/prevention-rules/SKILL.md +31 -0
  84. package/plugins/cursor-marketplace/skills/recall-context/SKILL.md +30 -0
  85. package/plugins/cursor-marketplace/skills/search-lessons/SKILL.md +33 -0
  86. package/plugins/gemini-extension/INSTALL.md +92 -0
  87. package/plugins/gemini-extension/gemini_prompt.txt +14 -0
  88. package/plugins/gemini-extension/tool_contract.json +45 -0
  89. package/plugins/opencode-profile/INSTALL.md +57 -0
  90. package/public/assets/instagram-card.png +0 -0
  91. package/public/assets/tiktok-agent-memory.mp4 +0 -0
  92. package/public/blog.html +400 -0
  93. package/public/dashboard.html +1093 -0
  94. package/public/guide.html +317 -0
  95. package/public/index.html +1014 -0
  96. package/public/learn/agent-harness-pattern.html +180 -0
  97. package/public/learn/ai-agent-persistent-memory.html +202 -0
  98. package/public/learn/learn.css +45 -0
  99. package/public/learn/mcp-pre-action-gates-explained.html +172 -0
  100. package/public/learn/stop-ai-agent-force-push.html +134 -0
  101. package/public/learn/vibe-coding-safety-net.html +142 -0
  102. package/public/learn.html +213 -0
  103. package/public/lessons.html +650 -0
  104. package/public/vercel.json +8 -0
  105. package/scripts/__pycache__/train_from_feedback.cpython-312.pyc +0 -0
  106. package/scripts/a2ui-engine.js +73 -0
  107. package/scripts/access-anomaly-detector.js +12 -0
  108. package/scripts/adk-consolidator.js +266 -0
  109. package/scripts/agent-readiness.js +220 -0
  110. package/scripts/agent-security-hardening.js +227 -0
  111. package/scripts/agentic-data-pipeline.js +847 -0
  112. package/scripts/analytics-report.js +328 -0
  113. package/scripts/analytics-window.js +158 -0
  114. package/scripts/async-job-runner.js +1001 -0
  115. package/scripts/audit-trail.js +398 -0
  116. package/scripts/auto-promote-gates.js +299 -0
  117. package/scripts/auto-wire-hooks.js +312 -0
  118. package/scripts/autonomous-sales-agent.js +39 -0
  119. package/scripts/autoresearch-runner.js +216 -0
  120. package/scripts/background-agent-governance.js +237 -0
  121. package/scripts/behavioral-extraction.js +97 -0
  122. package/scripts/belief-update.js +84 -0
  123. package/scripts/billing.js +2438 -0
  124. package/scripts/bot-detector.js +50 -0
  125. package/scripts/budget-guard.js +173 -0
  126. package/scripts/build-claude-mcpb.js +189 -0
  127. package/scripts/build-metadata.js +97 -0
  128. package/scripts/check-congruence.js +322 -0
  129. package/scripts/cli-feedback.js +135 -0
  130. package/scripts/cli-telemetry.js +87 -0
  131. package/scripts/cloudflare-dynamic-sandbox.js +315 -0
  132. package/scripts/code-reasoning.js +350 -0
  133. package/scripts/codegraph-context.js +466 -0
  134. package/scripts/commercial-offer.js +56 -0
  135. package/scripts/computer-use-firewall.js +250 -0
  136. package/scripts/context-engine.js +694 -0
  137. package/scripts/contextfs.js +1287 -0
  138. package/scripts/conversation-context.js +119 -0
  139. package/scripts/creator-campaigns.js +239 -0
  140. package/scripts/daemon-manager.js +108 -0
  141. package/scripts/daily-digest.js +11 -0
  142. package/scripts/dashboard-render-spec.js +395 -0
  143. package/scripts/dashboard.js +1058 -0
  144. package/scripts/data-governance.js +173 -0
  145. package/scripts/delegation-runtime.js +900 -0
  146. package/scripts/deploy-gcp.sh +44 -0
  147. package/scripts/deploy-policy.js +263 -0
  148. package/scripts/disagreement-mining.js +315 -0
  149. package/scripts/dispatch-brief.js +159 -0
  150. package/scripts/distribution-surfaces.js +44 -0
  151. package/scripts/dpo-optimizer.js +209 -0
  152. package/scripts/ephemeral-agent-store.js +219 -0
  153. package/scripts/eval-harness.js +56 -0
  154. package/scripts/evolution-state.js +241 -0
  155. package/scripts/experiment-tracker.js +267 -0
  156. package/scripts/export-databricks-bundle.js +242 -0
  157. package/scripts/export-dpo-pairs.js +345 -0
  158. package/scripts/export-kto-pairs.js +310 -0
  159. package/scripts/export-training.js +448 -0
  160. package/scripts/failure-diagnostics.js +558 -0
  161. package/scripts/feedback-attribution.js +313 -0
  162. package/scripts/feedback-fallback.js +111 -0
  163. package/scripts/feedback-history-distiller.js +391 -0
  164. package/scripts/feedback-inbox-read.js +162 -0
  165. package/scripts/feedback-loop.js +1887 -0
  166. package/scripts/feedback-paths.js +145 -0
  167. package/scripts/feedback-quality.js +139 -0
  168. package/scripts/feedback-root-consolidator.js +238 -0
  169. package/scripts/feedback-schema.js +426 -0
  170. package/scripts/feedback-session.js +286 -0
  171. package/scripts/feedback-to-memory.js +185 -0
  172. package/scripts/feedback-to-rules.js +163 -0
  173. package/scripts/filesystem-search.js +404 -0
  174. package/scripts/funnel-analytics.js +35 -0
  175. package/scripts/gate-satisfy.js +42 -0
  176. package/scripts/gate-stats.js +116 -0
  177. package/scripts/gate-templates.js +70 -0
  178. package/scripts/gates-engine.js +816 -0
  179. package/scripts/generate-paperbanana-diagrams.sh +99 -0
  180. package/scripts/generate-pretool-hook.sh +40 -0
  181. package/scripts/github-about.js +350 -0
  182. package/scripts/github-outreach.js +65 -0
  183. package/scripts/gtm-revenue-loop.js +520 -0
  184. package/scripts/hallucination-detector.js +226 -0
  185. package/scripts/hf-papers.js +317 -0
  186. package/scripts/history-distiller.js +200 -0
  187. package/scripts/hook-auto-capture.sh +95 -0
  188. package/scripts/hook-stop-pr-thread-check.sh +68 -0
  189. package/scripts/hook-stop-self-score.sh +51 -0
  190. package/scripts/hook-stop-verify-deploy.sh +31 -0
  191. package/scripts/hook-thumbgate-cache-updater.js +48 -0
  192. package/scripts/hook-verify-before-done.sh +20 -0
  193. package/scripts/hosted-config.js +170 -0
  194. package/scripts/hybrid-feedback-context.js +676 -0
  195. package/scripts/install-mcp.js +159 -0
  196. package/scripts/intent-router.js +392 -0
  197. package/scripts/internal-agent-bootstrap.js +490 -0
  198. package/scripts/jsonl-watcher.js +155 -0
  199. package/scripts/lesson-db.js +613 -0
  200. package/scripts/lesson-inference.js +315 -0
  201. package/scripts/lesson-retrieval.js +95 -0
  202. package/scripts/lesson-rotation.js +137 -0
  203. package/scripts/lesson-search.js +644 -0
  204. package/scripts/lesson-synthesis.js +196 -0
  205. package/scripts/license.js +50 -0
  206. package/scripts/local-model-profile.js +383 -0
  207. package/scripts/markdown-escape.js +12 -0
  208. package/scripts/marketing-experiment.js +671 -0
  209. package/scripts/mcp-config.js +149 -0
  210. package/scripts/mcp-policy.js +99 -0
  211. package/scripts/memalign-recall.js +111 -0
  212. package/scripts/memory-firewall.js +222 -0
  213. package/scripts/memory-migration.js +296 -0
  214. package/scripts/meta-policy.js +194 -0
  215. package/scripts/metered-billing.js +16 -0
  216. package/scripts/model-tier-router.js +301 -0
  217. package/scripts/money-watcher.js +71 -0
  218. package/scripts/multi-hop-recall.js +240 -0
  219. package/scripts/natural-language-harness.js +330 -0
  220. package/scripts/obsidian-export.js +712 -0
  221. package/scripts/operational-dashboard.js +103 -0
  222. package/scripts/operational-summary.js +93 -0
  223. package/scripts/optimize-context.js +17 -0
  224. package/scripts/org-dashboard.js +201 -0
  225. package/scripts/partner-orchestration.js +146 -0
  226. package/scripts/per-step-scoring.js +165 -0
  227. package/scripts/perplexity-marketing.js +466 -0
  228. package/scripts/pii-scanner.js +153 -0
  229. package/scripts/plan-gate.js +154 -0
  230. package/scripts/post-everywhere.js +308 -0
  231. package/scripts/post-to-x-retry.sh +22 -0
  232. package/scripts/post-to-x.js +369 -0
  233. package/scripts/pr-manager.js +236 -0
  234. package/scripts/predictive-insights.js +356 -0
  235. package/scripts/principle-extractor.js +162 -0
  236. package/scripts/pro-features.js +40 -0
  237. package/scripts/pro-local-dashboard.js +174 -0
  238. package/scripts/problem-detail.js +53 -0
  239. package/scripts/product-feedback.js +134 -0
  240. package/scripts/profile-router.js +245 -0
  241. package/scripts/prompt-dlp.js +221 -0
  242. package/scripts/prompt-guard.js +83 -0
  243. package/scripts/prove-adapters.js +863 -0
  244. package/scripts/prove-attribution.js +365 -0
  245. package/scripts/prove-automation.js +653 -0
  246. package/scripts/prove-autoresearch.js +304 -0
  247. package/scripts/prove-claim-verification.js +277 -0
  248. package/scripts/prove-cloudflare-sandbox.js +163 -0
  249. package/scripts/prove-data-pipeline.js +410 -0
  250. package/scripts/prove-data-quality.js +227 -0
  251. package/scripts/prove-evolution.js +352 -0
  252. package/scripts/prove-harnesses.js +287 -0
  253. package/scripts/prove-intelligence.js +259 -0
  254. package/scripts/prove-lancedb.js +371 -0
  255. package/scripts/prove-local-intelligence.js +342 -0
  256. package/scripts/prove-loop-closure.js +263 -0
  257. package/scripts/prove-predictive-insights.js +357 -0
  258. package/scripts/prove-runtime.js +350 -0
  259. package/scripts/prove-seo-gsd.js +234 -0
  260. package/scripts/prove-settings.js +279 -0
  261. package/scripts/prove-subway-upgrades.js +277 -0
  262. package/scripts/prove-tessl.js +229 -0
  263. package/scripts/prove-training-export.js +327 -0
  264. package/scripts/prove-workflow-contract.js +116 -0
  265. package/scripts/prove-xmemory.js +332 -0
  266. package/scripts/publish-decision.js +133 -0
  267. package/scripts/pulse.js +80 -0
  268. package/scripts/rate-limiter.js +125 -0
  269. package/scripts/reddit-dm-outreach.js +182 -0
  270. package/scripts/reddit-monitor-cron.sh +26 -0
  271. package/scripts/reflector-agent.js +221 -0
  272. package/scripts/reminder-engine.js +132 -0
  273. package/scripts/revenue-status.js +472 -0
  274. package/scripts/risk-scorer.js +458 -0
  275. package/scripts/rlaif-self-audit.js +129 -0
  276. package/scripts/rubric-engine.js +230 -0
  277. package/scripts/schedule-manager.js +251 -0
  278. package/scripts/secret-scanner.js +414 -0
  279. package/scripts/self-heal.js +147 -0
  280. package/scripts/self-healing-check.js +188 -0
  281. package/scripts/semantic-layer.js +98 -0
  282. package/scripts/seo-gsd.js +1153 -0
  283. package/scripts/settings-hierarchy.js +214 -0
  284. package/scripts/shieldcortex-memory-firewall-runner.mjs +53 -0
  285. package/scripts/skill-exporter.js +262 -0
  286. package/scripts/skill-generator.js +446 -0
  287. package/scripts/skill-materializer.js +134 -0
  288. package/scripts/skill-packs.js +136 -0
  289. package/scripts/skill-proposer.js +99 -0
  290. package/scripts/skill-quality-tracker.js +284 -0
  291. package/scripts/slo-alert-engine.js +14 -0
  292. package/scripts/slow-loop.js +72 -0
  293. package/scripts/social-analytics/db/schema.sql +32 -0
  294. package/scripts/social-analytics/digest.js +256 -0
  295. package/scripts/social-analytics/generate-instagram-card.js +97 -0
  296. package/scripts/social-analytics/instagram-thumbgate-post.js +73 -0
  297. package/scripts/social-analytics/mcp-server.js +289 -0
  298. package/scripts/social-analytics/normalizer.js +580 -0
  299. package/scripts/social-analytics/notify.js +162 -0
  300. package/scripts/social-analytics/poll-all.js +107 -0
  301. package/scripts/social-analytics/pollers/github.js +195 -0
  302. package/scripts/social-analytics/pollers/instagram.js +253 -0
  303. package/scripts/social-analytics/pollers/linkedin.js +330 -0
  304. package/scripts/social-analytics/pollers/plausible.js +247 -0
  305. package/scripts/social-analytics/pollers/reddit.js +306 -0
  306. package/scripts/social-analytics/pollers/threads.js +233 -0
  307. package/scripts/social-analytics/pollers/tiktok.js +203 -0
  308. package/scripts/social-analytics/pollers/x.js +227 -0
  309. package/scripts/social-analytics/pollers/youtube.js +304 -0
  310. package/scripts/social-analytics/pollers/zernio.js +180 -0
  311. package/scripts/social-analytics/publish-instagram-thumbgate.js +85 -0
  312. package/scripts/social-analytics/publishers/devto.js +122 -0
  313. package/scripts/social-analytics/publishers/instagram.js +317 -0
  314. package/scripts/social-analytics/publishers/linkedin.js +294 -0
  315. package/scripts/social-analytics/publishers/reddit.js +390 -0
  316. package/scripts/social-analytics/publishers/threads.js +275 -0
  317. package/scripts/social-analytics/publishers/tiktok.js +217 -0
  318. package/scripts/social-analytics/publishers/x.js +259 -0
  319. package/scripts/social-analytics/publishers/youtube.js +223 -0
  320. package/scripts/social-analytics/publishers/zernio.js +209 -0
  321. package/scripts/social-analytics/run-digest.js +34 -0
  322. package/scripts/social-analytics/store.js +257 -0
  323. package/scripts/social-analytics/utm.js +143 -0
  324. package/scripts/social-pipeline.js +2628 -0
  325. package/scripts/social-quality-gate.js +18 -0
  326. package/scripts/social-reply-monitor.js +445 -0
  327. package/scripts/status-dashboard.js +155 -0
  328. package/scripts/statusline-lesson.js +16 -0
  329. package/scripts/statusline-tower.js +8 -0
  330. package/scripts/statusline.sh +116 -0
  331. package/scripts/stripe-live-status.js +115 -0
  332. package/scripts/subagent-profiles.js +79 -0
  333. package/scripts/sync-gh-secrets-from-env.sh +70 -0
  334. package/scripts/sync-github-about.js +52 -0
  335. package/scripts/sync-version.js +451 -0
  336. package/scripts/synthetic-dpo.js +234 -0
  337. package/scripts/telemetry-analytics.js +821 -0
  338. package/scripts/tessl-export.js +371 -0
  339. package/scripts/test-coverage.js +120 -0
  340. package/scripts/thompson-sampling.js +417 -0
  341. package/scripts/thumbgate-search.js +189 -0
  342. package/scripts/tool-kpi-tracker.js +12 -0
  343. package/scripts/tool-registry.js +811 -0
  344. package/scripts/train_from_feedback.py +910 -0
  345. package/scripts/user-profile.js +78 -0
  346. package/scripts/validate-feedback.js +580 -0
  347. package/scripts/validate-workflow-contract.js +287 -0
  348. package/scripts/vector-store.js +198 -0
  349. package/scripts/verification-loop.js +291 -0
  350. package/scripts/verify-obsidian-setup.sh +269 -0
  351. package/scripts/verify-run.js +269 -0
  352. package/scripts/webhook-delivery.js +62 -0
  353. package/scripts/weekly-auto-post.js +124 -0
  354. package/scripts/workflow-runs.js +154 -0
  355. package/scripts/workflow-sprint-intake.js +475 -0
  356. package/scripts/workspace-evolver.js +374 -0
  357. package/scripts/x-autonomous-marketing.js +139 -0
  358. package/scripts/xmemory-lite.js +405 -0
  359. package/skills/agent-memory/SKILL.md +97 -0
  360. package/skills/solve-architecture-autonomy/SKILL.md +17 -0
  361. package/skills/solve-architecture-autonomy/tool.js +33 -0
  362. package/skills/thumbgate/SKILL.md +114 -0
  363. package/skills/thumbgate-feedback/SKILL.md +49 -0
  364. package/src/api/server.js +4208 -0
@@ -0,0 +1,226 @@
1
+ #!/usr/bin/env node
2
+ 'use strict';
3
+
4
+ /**
5
+ * Hallucination Detector — claim verification, confidence-weighted gates,
6
+ * retrieval-grounded verification.
7
+ *
8
+ * Turns ThumbGate from "block known-bad patterns" into "detect and block
9
+ * hallucinated claims" using 3 techniques from hallucination detection research.
10
+ */
11
+
12
+ const { constructContextPack } = require('./contextfs');
13
+ const { matchSkillPacks } = require('./skill-packs');
14
+
15
+ // ---------------------------------------------------------------------------
16
+ // 1. Claim Decomposition & Verification
17
+ // ---------------------------------------------------------------------------
18
+
19
// Phrase detectors for outcome claims. Each entry names the claim category a
// phrase signals (`type`) and the evidence keys (`verifyWith`) that must all be
// present before a claim of that category is treated as verified.
const CLAIM_PATTERNS = [
  {
    pattern: /\b(?:deployed|shipped|live|released)\b/i,
    type: 'deployment',
    verifyWith: ['health_check', 'version_match'],
  },
  {
    pattern: /\b(?:tests?\s+pass|all\s+tests?\s+(?:pass|green))\b/i,
    type: 'test_result',
    verifyWith: ['test_output', 'exit_code'],
  },
  {
    pattern: /\b(?:merged|PR\s+merged)\b/i,
    type: 'pr_merge',
    verifyWith: ['pr_state', 'ci_status'],
  },
  {
    pattern: /\b(?:fixed|resolved|bug\s+fix)\b/i,
    type: 'fix_claim',
    verifyWith: ['test_evidence', 'reproduction_check'],
  },
  {
    pattern: /\b(?:published|npm\s+publish)\b/i,
    type: 'publish',
    verifyWith: ['registry_check', 'version_match'],
  },
  {
    pattern: /\b(?:no\s+(?:errors?|failures?|issues?))\b/i,
    type: 'clean_state',
    verifyWith: ['log_check', 'status_check'],
  },
];
27
+
28
/**
 * Scan agent output for phrases that assert a verifiable outcome.
 *
 * Each CLAIM_PATTERNS entry is tried once against the text. The patterns
 * defined in this file carry no global flag, so at most the first occurrence
 * per pattern is reported.
 *
 * @param {*} agentOutput - Agent text; falsy values are treated as ''.
 * @returns {Array<{claim: string, type: string, verifyWith: string[], context: string}>}
 *   One record per matching pattern, in CLAIM_PATTERNS order. `context` is the
 *   period-delimited sentence around the phrase, trimmed and capped at 200
 *   characters. `verifyWith` is the pattern entry's own array, not a copy.
 */
function decomposeClaims(agentOutput) {
  const text = String(agentOutput || '');
  if (!text.trim()) return [];

  return CLAIM_PATTERNS.flatMap(({ pattern, type, verifyWith }) => {
    pattern.lastIndex = 0;
    const found = text.match(pattern);
    if (!found) return [];

    return found.map((phrase) => {
      // Widen the hit to its sentence: from just after the previous period
      // up to and including the next one (or to the end of the text).
      const at = text.indexOf(phrase);
      const sentenceStart = Math.max(0, text.lastIndexOf('.', at) + 1);
      const nextPeriod = text.indexOf('.', at + phrase.length);
      const sentenceEnd = nextPeriod > at ? nextPeriod + 1 : undefined;

      return {
        claim: phrase,
        type,
        verifyWith,
        context: text.slice(sentenceStart, sentenceEnd).trim().slice(0, 200),
      };
    });
  });
}
60
+
61
/**
 * Check a decomposed claim against the evidence that is actually available.
 *
 * A requirement listed in `claim.verifyWith` counts as satisfied only when the
 * matching evidence value is exactly `true` or a non-empty string.
 *
 * @param {{claim: string, type: string, verifyWith: string[]}} claim
 *   Claim record; every key in `verifyWith` is looked up in `evidence`.
 * @param {Object<string, (boolean|string)>} [evidence={}]
 *   Map of evidence key to value. `null` or an omitted argument is treated as
 *   "no evidence" rather than raising a TypeError.
 * @returns {{claim: string, type: string, verified: boolean,
 *   verifiedEvidence: string[], missingEvidence: string[],
 *   confidence: number, verdict: ('grounded'|'partial'|'hallucination')}}
 *   `confidence` is the percentage of requirements satisfied, and 0 when the
 *   claim lists no requirements.
 */
function verifyClaim(claim, evidence = {}) {
  // The default parameter covers `undefined`; `null` needs its own guard.
  const available = evidence === null ? {} : evidence;
  const required = claim.verifyWith;
  const verifiedEvidence = [];
  const missingEvidence = [];

  for (const key of required) {
    const value = available[key];
    const satisfied = value === true || (typeof value === 'string' && value.length > 0);
    (satisfied ? verifiedEvidence : missingEvidence).push(key);
  }

  const verified = missingEvidence.length === 0;

  let verdict;
  if (verified) verdict = 'grounded';
  else if (missingEvidence.length === required.length) verdict = 'hallucination';
  else verdict = 'partial';

  return {
    claim: claim.claim,
    type: claim.type,
    verified,
    verifiedEvidence,
    missingEvidence,
    confidence: required.length > 0 ? Math.round((verifiedEvidence.length / required.length) * 100) : 0,
    verdict,
  };
}
88
+
89
+ // ---------------------------------------------------------------------------
90
+ // 2. Confidence-Weighted Gate Decisions
91
+ // ---------------------------------------------------------------------------
92
+
93
// Default gate action per confidence tier, together with the inclusive
// sample-count range that each tier describes.
const CONFIDENCE_THRESHOLDS = {
  none: {
    action: 'block',
    minSamples: 0,
    maxSamples: 0,
  },
  low: {
    action: 'block',
    minSamples: 1,
    maxSamples: 4,
  },
  medium: {
    action: 'warn',
    minSamples: 5,
    maxSamples: 19,
  },
  high: {
    action: 'allow',
    minSamples: 20,
    maxSamples: Infinity,
  },
};
99
+
100
/**
 * Turn a sample count and a reliability estimate into a gate action.
 *
 * The tier depends on the sample count alone: exactly 0 is `none`, otherwise
 * up to 4 is `low`, up to 19 is `medium`, and anything larger is `high`. The
 * tier picks the default action from CONFIDENCE_THRESHOLDS. Reliability can
 * then only tighten it: below 0.3 always blocks, and below 0.5 turns a
 * high-tier decision into a warning.
 *
 * @param {object} [stats={}] - May be omitted entirely. A `confidence` key is
 *   accepted for compatibility but is not consulted.
 * @param {number} [stats.reliability] - Anything that is not a finite number
 *   (missing, NaN, Infinity, non-numeric) falls back to 0.5.
 * @param {number} [stats.samples] - Observation count; falsy values count as 0.
 * @returns {{tier: string, action: string, reliability: number,
 *   samples: number, reasoning: string}} `reliability` is rounded to three
 *   decimals; `reasoning` is a human-readable summary of the decision.
 */
function confidenceWeightedDecision({ reliability, samples } = {}) {
  const s = samples || 0;

  let tier;
  if (s === 0) tier = 'none';
  else if (s <= 4) tier = 'low';
  else if (s <= 19) tier = 'medium';
  else tier = 'high';

  // `typeof NaN === 'number'`, so a plain typeof check would let NaN through,
  // skip both overrides below and leak NaN into the reported values.
  const rel = Number.isFinite(reliability) ? reliability : 0.5;

  let action = CONFIDENCE_THRESHOLDS[tier].action;
  if (rel < 0.3) {
    // Poor reliability blocks regardless of how many samples back it.
    action = 'block';
  } else if (rel < 0.5 && tier === 'high') {
    action = 'warn';
  }

  return {
    tier,
    action,
    reliability: Math.round(rel * 1000) / 1000,
    samples: s,
    reasoning: `${tier} confidence (${s} samples, ${Math.round(rel * 100)}% reliability) → ${action}`,
  };
}
129
+
130
+ // ---------------------------------------------------------------------------
131
+ // 3. Retrieval-Grounded Verification
132
+ // ---------------------------------------------------------------------------
133
+
134
/**
 * Check whether a proposed action collides with recalled "never ..." rules.
 *
 * Asks constructContextPack for items from the `rules` and `memoryError`
 * namespaces and scans the lower-cased `structuredContext.rawContent` of each
 * item for "never <10-80 chars>" phrases. A phrase is a contradiction when at
 * least two of its words longer than three characters occur as substrings of
 * the lower-cased action text. Each contradiction costs 25 grounding points,
 * floored at 0.
 *
 * An empty action, or a retrieval that throws, yields a grounded result with
 * no `packItemCount` key.
 *
 * @param {*} proposedAction - Action text; falsy values are treated as ''.
 * @param {object} [options]
 * @param {number} [options.maxItems=5] - Forwarded to constructContextPack.
 * @param {number} [options.maxChars=3000] - Forwarded to constructContextPack.
 * @returns {{grounded: boolean, contradictions: Array<{rule: string, source: *, matchStrength: number}>,
 *   relevantRules: Array<{title: *, score: number, namespace: *}>,
 *   groundingScore: number, packItemCount: (number|undefined)}}
 */
function retrievalGroundedCheck(proposedAction, { maxItems = 5, maxChars = 3000 } = {}) {
  const nothingToCheck = () => ({ grounded: true, contradictions: [], relevantRules: [], groundingScore: 100 });

  const actionText = String(proposedAction || '').toLowerCase();
  if (!actionText.trim()) return nothingToCheck();

  // Retrieve relevant context
  let pack;
  try {
    pack = constructContextPack({ query: proposedAction, maxItems, maxChars, namespaces: ['rules', 'memoryError'] });
  } catch {
    // Best-effort by design: a retrieval failure is reported as "grounded"
    // instead of propagating. NOTE(review): this is fail-open — confirm that
    // is the intended posture for a safety gate.
    return nothingToCheck();
  }

  // A pack without an items array is handled like an empty pack.
  const items = pack && Array.isArray(pack.items) ? pack.items : [];
  const contradictions = [];
  const relevantRules = [];

  for (const item of items) {
    if (!item || typeof item !== 'object') continue;

    // Only string content can be scanned; other values are treated as empty.
    const raw = item.structuredContext && item.structuredContext.rawContent;
    const content = typeof raw === 'string' ? raw.toLowerCase() : '';

    // Check for NEVER rules that contradict the action
    const neverMatches = content.match(/never\s+(.{10,80})/gi) || [];
    for (const neverRule of neverMatches) {
      const ruleAction = neverRule.replace(/^never\s+/i, '').trim();
      // Short words are skipped as too generic to signal a real overlap.
      const ruleTokens = ruleAction.split(/\s+/).filter((t) => t.length > 3);
      const matchCount = ruleTokens.filter((t) => actionText.includes(t)).length;
      if (matchCount >= 2) {
        contradictions.push({
          rule: neverRule.trim(),
          source: item.title,
          matchStrength: Math.round((matchCount / ruleTokens.length) * 100),
        });
      }
    }

    // Track all relevant rules
    if (item.score > 0) {
      relevantRules.push({ title: item.title, score: item.score, namespace: item.namespace });
    }
  }

  return {
    grounded: contradictions.length === 0,
    contradictions,
    relevantRules,
    groundingScore: Math.max(0, 100 - contradictions.length * 25),
    packItemCount: items.length,
  };
}
191
+
192
/**
 * Run the whole pipeline over one piece of agent output: extract claims with
 * decomposeClaims, verify each with verifyClaim, and ground the raw output
 * with retrievalGroundedCheck.
 *
 * @param {*} agentOutput - Passed unchanged to decomposeClaims and
 *   retrievalGroundedCheck.
 * @param {object} [evidence={}] - Evidence map handed to every verifyClaim call.
 * @returns {{claims: Array, grounding: object, summary: object, checkedAt: string}}
 *   `summary.overallVerdict` is `hallucination_detected` as soon as any claim
 *   has the `hallucination` verdict; otherwise it follows `grounding.grounded`.
 *   `summary.claimPassRate` is a percentage with one decimal, and 100 when
 *   there are no claims. `checkedAt` is an ISO-8601 timestamp.
 */
function fullHallucinationCheck(agentOutput, evidence = {}) {
  const claimResults = decomposeClaims(agentOutput).map((c) => verifyClaim(c, evidence));
  const grounding = retrievalGroundedCheck(agentOutput);

  // Tally both categories in one pass over the results.
  let verifiedCount = 0;
  let hallucinationCount = 0;
  for (const result of claimResults) {
    if (result.verified) verifiedCount += 1;
    if (result.verdict === 'hallucination') hallucinationCount += 1;
  }
  const totalClaims = claimResults.length;

  let claimPassRate = 100;
  if (totalClaims > 0) {
    claimPassRate = Math.round((verifiedCount / totalClaims) * 1000) / 10;
  }

  let overallVerdict;
  if (hallucinationCount > 0) {
    overallVerdict = 'hallucination_detected';
  } else if (grounding.grounded) {
    overallVerdict = 'grounded';
  } else {
    overallVerdict = 'contradiction_detected';
  }

  const summary = {
    totalClaims,
    verified: verifiedCount,
    hallucinated: hallucinationCount,
    partial: totalClaims - verifiedCount - hallucinationCount,
    claimPassRate,
    groundingScore: grounding.groundingScore,
    overallVerdict,
  };

  return {
    claims: claimResults,
    grounding,
    summary,
    checkedAt: new Date().toISOString(),
  };
}
220
+
221
+ module.exports = {
222
+ CLAIM_PATTERNS, CONFIDENCE_THRESHOLDS,
223
+ decomposeClaims, verifyClaim,
224
+ confidenceWeightedDecision,
225
+ retrievalGroundedCheck, fullHallucinationCheck,
226
+ };
@@ -0,0 +1,317 @@
1
+ 'use strict';
2
+
3
+ const { URL, URLSearchParams } = require('node:url');
4
+ const {
5
+ NAMESPACES,
6
+ upsertContextObject,
7
+ recordProvenance,
8
+ constructTemplatedPack,
9
+ } = require('./contextfs');
10
+
11
+ const DEFAULT_HF_PAPERS_API_BASE = process.env.HF_PAPERS_API_BASE || 'https://huggingface.co/api';
12
+ const DEFAULT_LIMIT = 5;
13
+
14
/**
 * Reduce an author list to an array of trimmed, non-empty name strings.
 *
 * Entries may be plain strings or objects carrying a string `name`; anything
 * else, and anything that trims down to an empty string, is dropped.
 *
 * @param {*} authors - Candidate author list; non-arrays yield `[]`.
 * @returns {string[]} Author names in their original order.
 */
function normalizeAuthors(authors) {
  if (!Array.isArray(authors)) {
    return [];
  }

  const names = [];
  for (const entry of authors) {
    let name = '';
    if (typeof entry === 'string') {
      name = entry.trim();
    } else if (entry && typeof entry.name === 'string') {
      name = entry.name.trim();
    }
    if (name) {
      names.push(name);
    }
  }
  return names;
}
24
+
25
/**
 * Reduce a tag list to unique, trimmed, non-empty strings.
 *
 * Entries may be plain strings or objects exposing a string `label` or, failing
 * that, a string `name`. Duplicates are removed, keeping first-seen order.
 *
 * @param {*} tags - Candidate tag list; non-arrays yield `[]`.
 * @returns {string[]} De-duplicated tag strings.
 */
function normalizeTags(tags) {
  if (!Array.isArray(tags)) {
    return [];
  }

  const unique = new Set();
  for (const entry of tags) {
    let text = '';
    if (typeof entry === 'string') {
      text = entry.trim();
    } else if (entry && typeof entry.label === 'string') {
      // A string label wins over name even when it trims to nothing.
      text = entry.label.trim();
    } else if (entry && typeof entry.name === 'string') {
      text = entry.name.trim();
    }
    if (text) {
      unique.add(text);
    }
  }
  return Array.from(unique);
}
36
+
37
/**
 * Normalize a raw paper record into the flat shape used by this module.
 *
 * A record may carry the paper fields directly or nest them under `paper`.
 * For every field the nested object is consulted first and the outer record
 * second; the first truthy value wins.
 *
 * @param {object} [record={}] - Raw record. Non-object input (including
 *   `null`) is treated as an empty record instead of throwing.
 * @returns {{paperId: string, title: string, summary: string, url: (string|null),
 *   authors: string[], tags: string[], publishedAt: *, source: string}}
 *   Normalized paper; `title` is never empty.
 */
function normalizePaper(record = {}) {
  // `typeof null === 'object'`, so both levels need an explicit null check;
  // otherwise a null record or `{ paper: null }` crashes on property access.
  const outer = record !== null && typeof record === 'object' ? record : {};
  const paper = outer.paper !== null && typeof outer.paper === 'object' ? outer.paper : outer;

  // First truthy value among `keys`, checking the nested paper before the record.
  const firstTruthy = (keys) => {
    for (const holder of [paper, outer]) {
      for (const key of keys) {
        if (holder[key]) return holder[key];
      }
    }
    return undefined;
  };

  const paperId = String(
    firstTruthy(['id', 'paper_id', 'paperId', 'arxiv_id', 'arxivId']) || ''
  ).trim();
  const title = String(
    firstTruthy(['title']) || (paperId ? `Paper ${paperId}` : 'Untitled paper')
  ).trim();
  const summary = String(firstTruthy(['summary', 'abstract']) || '').trim();
  // Without an explicit URL, fall back to an arXiv link built from the id.
  const url = String(
    firstTruthy(['url', 'paper_url']) || (paperId ? `https://arxiv.org/abs/${paperId}` : '')
  ).trim();

  return {
    paperId,
    title,
    summary,
    url: url || null,
    authors: normalizeAuthors(firstTruthy(['authors'])),
    tags: normalizeTags(firstTruthy(['tags', 'categories'])),
    publishedAt: firstTruthy(['publishedAt', 'published_at']) || null,
    source: 'huggingface-papers',
  };
}
83
+
84
/**
 * Pull the list of paper records out of an API payload.
 *
 * Accepts a bare array, an object holding the list under `papers`, `items`,
 * `results` or `dailyPapers` (checked in that order), or an object with a
 * single `paper` object, which is wrapped in a one-element array.
 *
 * @param {*} payload - Parsed response body.
 * @returns {Array} The extracted records, or `[]` when none are found.
 */
function extractPaperItems(payload) {
  if (Array.isArray(payload)) {
    return payload;
  }
  if (!payload || typeof payload !== 'object') {
    return [];
  }

  const listKeys = ['papers', 'items', 'results', 'dailyPapers'];
  for (const key of listKeys) {
    if (Array.isArray(payload[key])) {
      return payload[key];
    }
  }

  const single = payload.paper;
  return single && typeof single === 'object' ? [single] : [];
}
94
+
95
/**
 * Build the candidate search URLs for a query, one per known API route.
 *
 * Trailing slashes are stripped from the base before each route path is
 * appended, and the query string of every URL is replaced with that route's
 * own parameters.
 *
 * @param {object} options
 * @param {string} options.query - Search text.
 * @param {number} [options.limit=DEFAULT_LIMIT] - Result cap, sent as a string.
 * @param {string} [options.baseUrl=DEFAULT_HF_PAPERS_API_BASE] - API root.
 * @returns {string[]} URLs for `/daily_papers`, `/papers/search` and `/papers`, in that order.
 */
function buildSearchUrls({ query, limit = DEFAULT_LIMIT, baseUrl = DEFAULT_HF_PAPERS_API_BASE }) {
  const root = String(baseUrl || DEFAULT_HF_PAPERS_API_BASE).replace(/\/+$/, '');
  const limitText = String(limit);

  // The search route names its query parameter `q`; the others use `query`.
  const routeTable = [
    { pathname: '/daily_papers', params: { query, limit: limitText } },
    { pathname: '/papers/search', params: { q: query, limit: limitText } },
    { pathname: '/papers', params: { query, limit: limitText } },
  ];

  const urls = [];
  for (const { pathname, params } of routeTable) {
    const target = new URL(root + pathname);
    target.search = new URLSearchParams(params).toString();
    urls.push(target.toString());
  }
  return urls;
}
109
+
110
/**
 * GET a URL with a JSON `accept` header and return the parsed body.
 *
 * @param {string} url - Address to request.
 * @param {Function} [fetchImpl=global.fetch] - fetch-compatible function.
 * @returns {Promise<*>} Whatever `response.json()` yields.
 * @throws {Error} When `fetchImpl` is not a function, or when the response is
 *   not ok; in the latter case the error carries the HTTP code as `status`.
 */
async function readJson(url, fetchImpl = global.fetch) {
  if (typeof fetchImpl !== 'function') {
    throw new Error('A fetch implementation is required');
  }

  const requestInit = { headers: { accept: 'application/json' } };
  const response = await fetchImpl(url, requestInit);

  if (response.ok) {
    return response.json();
  }

  // Attach the status code so callers can branch on it.
  const failure = new Error(`HF papers request failed: ${response.status} ${response.statusText}`);
  failure.status = response.status;
  throw failure;
}
129
+
130
/**
 * Search for papers, trying each candidate route until one yields results.
 *
 * Routes come from buildSearchUrls and are requested one at a time. The first
 * route that produces at least one normalized paper wins. A failing route
 * (404 or any other error) is remembered and the next route is tried; if no
 * route produces papers, the last remembered error is thrown, otherwise `[]`
 * is returned.
 *
 * @param {object} [options]
 * @param {string} options.query - Search text; required after trimming.
 * @param {number} [options.limit=DEFAULT_LIMIT] - Maximum papers to return.
 *   Values that are zero, non-numeric or below 1 are normalized to a usable
 *   limit, and that same value caps the returned list.
 * @param {string} [options.baseUrl=DEFAULT_HF_PAPERS_API_BASE] - API root.
 * @param {Function} [options.fetchImpl=global.fetch] - fetch-compatible function.
 * @returns {Promise<object[]>} Normalized papers, at most the effective limit.
 * @throws {Error} When the query is empty, or when no route returned papers
 *   and at least one request failed.
 */
async function searchPapers({
  query,
  limit = DEFAULT_LIMIT,
  baseUrl = DEFAULT_HF_PAPERS_API_BASE,
  fetchImpl = global.fetch,
} = {}) {
  const normalizedQuery = String(query || '').trim();
  if (!normalizedQuery) {
    throw new Error('searchPapers requires query');
  }

  // Normalize once so the limit sent to the API and the limit used to cap the
  // result list cannot disagree. Slicing with the raw value returned nothing
  // for 0/null and dropped trailing items for negative numbers.
  const effectiveLimit = Math.max(1, Number(limit) || DEFAULT_LIMIT);

  const urls = buildSearchUrls({
    query: normalizedQuery,
    limit: effectiveLimit,
    baseUrl,
  });

  let lastError = null;
  for (const url of urls) {
    try {
      const payload = await readJson(url, fetchImpl);
      const papers = extractPaperItems(payload)
        .map((item) => normalizePaper(item))
        .filter((paper) => paper.paperId || paper.title);

      if (papers.length > 0) {
        return papers.slice(0, effectiveLimit);
      }
    } catch (error) {
      // Every failure is deferred, not just 404s: keep it and move on to the
      // next route. It only surfaces if no route ends up returning papers.
      lastError = error;
    }
  }

  if (lastError) throw lastError;
  return [];
}
169
+
170
/**
 * Render a paper as a small Markdown document.
 *
 * The paper is passed through normalizePaper first. The output has a title
 * heading, a block of metadata lines (optional ones appear only when present),
 * and an "Abstract" section that falls back to a placeholder sentence.
 *
 * @param {object} paper - Raw or already-normalized paper record.
 * @returns {string} Markdown text ending with a newline.
 */
function paperToMarkdown(paper) {
  const {
    title,
    paperId,
    source,
    url,
    publishedAt,
    authors,
    tags,
    summary,
  } = normalizePaper(paper);

  const header = [
    `# ${title}`,
    '',
    `Paper ID: ${paperId || 'unknown'}`,
    `Source: ${source}`,
  ];

  // Optional metadata lines, in fixed order; absent values produce no line.
  const optional = [
    url ? `URL: ${url}` : null,
    publishedAt ? `Published: ${publishedAt}` : null,
    authors.length > 0 ? `Authors: ${authors.join(', ')}` : null,
    tags.length > 0 ? `Tags: ${tags.join(', ')}` : null,
  ].filter((line) => line !== null);

  const abstract = ['', '## Abstract', '', summary || 'No abstract available.', ''];

  return header.concat(optional, abstract).join('\n');
}
195
+
196
/**
 * Reduce a paper to the three fields used when citing it.
 *
 * @param {object} paper - Paper with `paperId`, `title` and `url`.
 * @returns {{paperId: *, title: *, url: *}} Citation; a falsy `paperId` becomes `null`.
 */
function buildCitation(paper) {
  const { paperId, title, url } = paper;
  return { paperId: paperId || null, title, url };
}
203
+
204
/**
 * Store each normalized paper as a context object and log one provenance event.
 *
 * Every paper is upserted into the research namespace with its Markdown
 * rendering as content. Afterwards a single `hf_papers_ingested` provenance
 * record summarizes the batch.
 *
 * @param {object[]} papers - Papers in the shape produced by normalizePaper.
 * @param {string} query - Search text that produced the papers.
 * @returns {Array} The upsertContextObject result for each paper, in order.
 */
function ingestNormalizedPapers(papers, query) {
  const storePaper = (paper) => {
    // Fixed marker tags plus the paper's own tags, de-duplicated and sorted.
    const tagPool = ['research', 'paper', 'hf-papers'].concat(
      paper.tags.map((tag) => String(tag))
    );
    const normalizedTags = Array.from(new Set(tagPool)).sort();

    const metadata = {
      provider: 'huggingface',
      paperId: paper.paperId || null,
      url: paper.url,
      authors: paper.authors,
      publishedAt: paper.publishedAt,
      query,
    };

    return upsertContextObject({
      namespace: NAMESPACES.research,
      title: `Paper: ${paper.title}`,
      content: paperToMarkdown(paper),
      tags: normalizedTags,
      source: 'hf-papers',
      metadata,
    });
  };

  const ingested = papers.map((paper) => storePaper(paper));

  const dedupedCount = ingested.reduce(
    (total, entry) => (entry.deduped ? total + 1 : total),
    0
  );
  const paperIds = papers
    .map((paper) => paper.paperId)
    .filter(Boolean);

  recordProvenance({
    type: 'hf_papers_ingested',
    query,
    count: ingested.length,
    dedupedCount,
    paperIds,
  });

  return ingested;
}
240
+
241
/**
 * Search for papers and ingest whatever the search returns.
 *
 * @param {object} [options]
 * @param {string} options.query - Search text.
 * @param {number} [options.limit=DEFAULT_LIMIT] - Maximum papers requested.
 * @param {string} [options.baseUrl=DEFAULT_HF_PAPERS_API_BASE] - API root.
 * @param {Function} [options.fetchImpl=global.fetch] - fetch-compatible function.
 * @param {Function} [options.searchPapersImpl=searchPapers] - Search function,
 *   called with `{ query, limit, baseUrl, fetchImpl }`.
 * @returns {Promise<{query: *, limit: *, papers: Array, ingested: Array}>}
 *   The inputs echoed back together with the found and ingested papers.
 */
async function ingestPaperSearch({
  query,
  limit = DEFAULT_LIMIT,
  baseUrl = DEFAULT_HF_PAPERS_API_BASE,
  fetchImpl = global.fetch,
  searchPapersImpl = searchPapers,
} = {}) {
  const searchOptions = { query, limit, baseUrl, fetchImpl };
  const papers = await searchPapersImpl(searchOptions);

  return {
    query,
    limit,
    papers,
    ingested: ingestNormalizedPapers(papers, query),
  };
}
263
+
264
/**
 * Ingest papers for a query, then assemble a numbered brief from a templated pack.
 *
 * After ingestion a pack is built via constructTemplatedPack. Each pack item
 * becomes one brief line: its position, its title, and the first six lines of
 * its raw content joined with spaces.
 *
 * @param {object} [options]
 * @param {string} options.query - Search text.
 * @param {number} [options.limit=DEFAULT_LIMIT] - Maximum papers requested.
 * @param {string} [options.template='research-brief'] - Pack template name.
 * @param {string} [options.baseUrl=DEFAULT_HF_PAPERS_API_BASE] - API root.
 * @param {Function} [options.fetchImpl=global.fetch] - fetch-compatible function.
 * @param {Function} [options.searchPapersImpl=searchPapers] - Search function.
 * @returns {Promise<object>} Brief with `query`, `limit`, `source`, `template`,
 *   `ingestedCount`, `packId`, `citations`, `brief` and `pack`.
 */
async function buildResearchBrief({
  query,
  limit = DEFAULT_LIMIT,
  template = 'research-brief',
  baseUrl = DEFAULT_HF_PAPERS_API_BASE,
  fetchImpl = global.fetch,
  searchPapersImpl = searchPapers,
} = {}) {
  const ingestion = await ingestPaperSearch({
    query,
    limit,
    baseUrl,
    fetchImpl,
    searchPapersImpl,
  });
  const pack = constructTemplatedPack({ template, query });
  const citations = ingestion.papers.map(buildCitation);

  const briefLines = [];
  pack.items.forEach((item, position) => {
    // Items without structured raw content contribute only their title.
    const raw = (item.structuredContext && item.structuredContext.rawContent) || '';
    const digest = String(raw)
      .split('\n')
      .slice(0, 6)
      .join(' ')
      .trim();
    briefLines.push(`${position + 1}. ${item.title} ${digest}`.trim());
  });
  const brief = briefLines.join('\n');

  return {
    query,
    limit,
    source: 'huggingface-papers',
    template,
    ingestedCount: ingestion.ingested.length,
    packId: pack.packId,
    citations,
    brief,
    pack,
  };
}
304
+
305
+ module.exports = {
306
+ DEFAULT_HF_PAPERS_API_BASE,
307
+ buildResearchBrief,
308
+ buildSearchUrls,
309
+ extractPaperItems,
310
+ ingestNormalizedPapers,
311
+ ingestPaperSearch,
312
+ normalizeAuthors,
313
+ normalizePaper,
314
+ normalizeTags,
315
+ paperToMarkdown,
316
+ searchPapers,
317
+ };