thumbgate 1.4.2 → 1.4.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (279) hide show
  1. package/.claude-plugin/README.md +45 -34
  2. package/.claude-plugin/marketplace.json +3 -3
  3. package/.claude-plugin/plugin.json +3 -3
  4. package/.well-known/llms.txt +1 -1
  5. package/.well-known/mcp/server-card.json +1 -1
  6. package/README.md +26 -2
  7. package/adapters/README.md +4 -1
  8. package/adapters/claude/.mcp.json +2 -2
  9. package/adapters/codex/config.toml +2 -2
  10. package/adapters/mcp/server-stdio.js +10 -4
  11. package/adapters/opencode/opencode.json +1 -1
  12. package/bin/cli.js +246 -90
  13. package/config/mcp-allowlists.json +11 -3
  14. package/package.json +184 -21
  15. package/scripts/audit-trail.js +25 -15
  16. package/scripts/auto-wire-hooks.js +127 -0
  17. package/scripts/cli-demo.js +102 -0
  18. package/scripts/cli-schema.js +285 -0
  19. package/scripts/cli-status.js +166 -0
  20. package/scripts/cross-encoder-reranker.js +235 -0
  21. package/scripts/explore-subcommands.js +277 -0
  22. package/scripts/explore.js +569 -0
  23. package/scripts/feedback-loop.js +20 -6
  24. package/scripts/lesson-inference.js +7 -1
  25. package/scripts/lesson-reranker.js +263 -0
  26. package/scripts/lesson-retrieval.js +34 -17
  27. package/scripts/lesson-search.js +69 -0
  28. package/scripts/perplexity-client.js +210 -0
  29. package/scripts/reflector-agent.js +2 -2
  30. package/scripts/statusline-local-stats.js +3 -1
  31. package/scripts/statusline.sh +12 -11
  32. package/src/api/server.js +178 -17
  33. package/src/index.js +3 -0
  34. package/.claude-plugin/bundle/icon.png +0 -0
  35. package/.claude-plugin/bundle/icon.svg +0 -18
  36. package/.claude-plugin/bundle/server/index.js +0 -24
  37. package/adapters/chatgpt/INSTALL.md +0 -138
  38. package/bin/memory.sh +0 -64
  39. package/bin/obsidian-sync.sh +0 -20
  40. package/plugins/amp-skill/INSTALL.md +0 -52
  41. package/plugins/amp-skill/SKILL.md +0 -64
  42. package/plugins/claude-codex-bridge/.claude-plugin/plugin.json +0 -22
  43. package/plugins/claude-codex-bridge/.mcp.json +0 -14
  44. package/plugins/claude-codex-bridge/INSTALL.md +0 -43
  45. package/plugins/claude-codex-bridge/README.md +0 -46
  46. package/plugins/claude-codex-bridge/scripts/codex-bridge.js +0 -286
  47. package/plugins/claude-codex-bridge/skills/adversarial-review/SKILL.md +0 -24
  48. package/plugins/claude-codex-bridge/skills/result/SKILL.md +0 -22
  49. package/plugins/claude-codex-bridge/skills/review/SKILL.md +0 -28
  50. package/plugins/claude-codex-bridge/skills/second-pass/SKILL.md +0 -27
  51. package/plugins/claude-codex-bridge/skills/setup/SKILL.md +0 -21
  52. package/plugins/claude-codex-bridge/skills/status/SKILL.md +0 -19
  53. package/plugins/claude-skill/INSTALL.md +0 -55
  54. package/plugins/claude-skill/SKILL.md +0 -46
  55. package/plugins/codex-profile/.codex-plugin/plugin.json +0 -43
  56. package/plugins/codex-profile/.mcp.json +0 -14
  57. package/plugins/codex-profile/AGENTS.md +0 -20
  58. package/plugins/codex-profile/INSTALL.md +0 -89
  59. package/plugins/codex-profile/README.md +0 -61
  60. package/plugins/cursor-marketplace/.cursor-plugin/plugin.json +0 -23
  61. package/plugins/cursor-marketplace/CHANGELOG.md +0 -30
  62. package/plugins/cursor-marketplace/LICENSE +0 -21
  63. package/plugins/cursor-marketplace/README.md +0 -124
  64. package/plugins/cursor-marketplace/agents/reliability-reviewer.md +0 -31
  65. package/plugins/cursor-marketplace/assets/logo-400x400.png +0 -0
  66. package/plugins/cursor-marketplace/commands/capture-feedback.md +0 -33
  67. package/plugins/cursor-marketplace/commands/check-gates.md +0 -25
  68. package/plugins/cursor-marketplace/commands/show-lessons.md +0 -27
  69. package/plugins/cursor-marketplace/hooks/hooks.json +0 -10
  70. package/plugins/cursor-marketplace/mcp.json +0 -14
  71. package/plugins/cursor-marketplace/rules/feedback-capture.mdc +0 -34
  72. package/plugins/cursor-marketplace/rules/pre-action-gates.mdc +0 -30
  73. package/plugins/cursor-marketplace/rules/session-continuity.mdc +0 -28
  74. package/plugins/cursor-marketplace/scripts/gate-check.sh +0 -21
  75. package/plugins/cursor-marketplace/skills/capture-feedback/SKILL.md +0 -48
  76. package/plugins/cursor-marketplace/skills/prevention-rules/SKILL.md +0 -31
  77. package/plugins/cursor-marketplace/skills/recall-context/SKILL.md +0 -30
  78. package/plugins/cursor-marketplace/skills/search-lessons/SKILL.md +0 -33
  79. package/plugins/gemini-extension/INSTALL.md +0 -92
  80. package/plugins/gemini-extension/gemini_prompt.txt +0 -14
  81. package/plugins/gemini-extension/tool_contract.json +0 -45
  82. package/plugins/opencode-profile/INSTALL.md +0 -57
  83. package/public/assets/instagram-card.png +0 -0
  84. package/public/assets/tiktok-agent-memory.mp4 +0 -0
  85. package/public/blog.html +0 -474
  86. package/public/compare/mem0.html +0 -189
  87. package/public/compare/speclock.html +0 -180
  88. package/public/compare.html +0 -310
  89. package/public/dashboard.html +0 -1100
  90. package/public/guide.html +0 -317
  91. package/public/guides/claude-code-prevent-repeated-mistakes.html +0 -161
  92. package/public/guides/codex-cli-guardrails.html +0 -158
  93. package/public/guides/cursor-prevent-repeated-mistakes.html +0 -161
  94. package/public/guides/pre-action-gates.html +0 -162
  95. package/public/guides/stop-repeated-ai-agent-mistakes.html +0 -159
  96. package/public/index.html +0 -1128
  97. package/public/js/buyer-intent.js +0 -252
  98. package/public/learn/agent-harness-pattern.html +0 -180
  99. package/public/learn/ai-agent-persistent-memory.html +0 -203
  100. package/public/learn/learn.css +0 -45
  101. package/public/learn/mcp-pre-action-gates-explained.html +0 -172
  102. package/public/learn/stop-ai-agent-force-push.html +0 -134
  103. package/public/learn/vibe-coding-safety-net.html +0 -142
  104. package/public/learn.html +0 -274
  105. package/public/lessons.html +0 -967
  106. package/public/llm-context.md +0 -140
  107. package/public/pro.html +0 -1087
  108. package/public/vercel.json +0 -8
  109. package/scripts/a2ui-engine.js +0 -73
  110. package/scripts/adk-consolidator.js +0 -274
  111. package/scripts/agent-security-hardening.js +0 -225
  112. package/scripts/ai-search-visibility.js +0 -142
  113. package/scripts/autonomous-sales-agent.js +0 -39
  114. package/scripts/autoresearch-runner.js +0 -216
  115. package/scripts/background-agent-governance.js +0 -229
  116. package/scripts/behavioral-extraction.js +0 -93
  117. package/scripts/budget-enforcer.js +0 -173
  118. package/scripts/budget-guard.js +0 -173
  119. package/scripts/build-claude-mcpb.js +0 -255
  120. package/scripts/build-codex-plugin.js +0 -152
  121. package/scripts/capture-railway-diagnostics.sh +0 -97
  122. package/scripts/changeset-check.js +0 -372
  123. package/scripts/check-congruence.js +0 -443
  124. package/scripts/computer-use-firewall.js +0 -280
  125. package/scripts/content-engine/linkedin-content-generator.js +0 -154
  126. package/scripts/content-engine/output/linkedin-memento-validation.md +0 -17
  127. package/scripts/content-engine/output/linkedin-posts-2026-04-09.md +0 -175
  128. package/scripts/content-engine/reddit-thread-finder.js +0 -154
  129. package/scripts/context-engine.js +0 -710
  130. package/scripts/daily-digest.js +0 -11
  131. package/scripts/data-governance.js +0 -173
  132. package/scripts/deploy-gcp.sh +0 -44
  133. package/scripts/deploy-policy.js +0 -249
  134. package/scripts/disagreement-mining.js +0 -315
  135. package/scripts/dpo-optimizer.js +0 -206
  136. package/scripts/ensure-repo-bootstrap.js +0 -130
  137. package/scripts/ephemeral-agent-store.js +0 -212
  138. package/scripts/eval-harness.js +0 -56
  139. package/scripts/export-kto-pairs.js +0 -309
  140. package/scripts/export-training.js +0 -446
  141. package/scripts/feedback-fallback.js +0 -111
  142. package/scripts/feedback-inbox-read.js +0 -162
  143. package/scripts/feedback-root-consolidator.js +0 -233
  144. package/scripts/feedback-to-memory.js +0 -185
  145. package/scripts/gate-satisfy.js +0 -42
  146. package/scripts/generate-paperbanana-diagrams.sh +0 -99
  147. package/scripts/generate-pretool-hook.sh +0 -40
  148. package/scripts/github-about.js +0 -430
  149. package/scripts/github-outreach.js +0 -65
  150. package/scripts/gtm-revenue-loop.js +0 -535
  151. package/scripts/hallucination-detector.js +0 -226
  152. package/scripts/hf-papers.js +0 -317
  153. package/scripts/hook-auto-capture.sh +0 -100
  154. package/scripts/hook-stop-pr-thread-check.sh +0 -68
  155. package/scripts/hook-stop-self-score.sh +0 -51
  156. package/scripts/hook-stop-verify-deploy.sh +0 -31
  157. package/scripts/hook-verify-before-done.sh +0 -20
  158. package/scripts/managed-dpo-export.js +0 -91
  159. package/scripts/markdown-escape.js +0 -12
  160. package/scripts/marketing-experiment.js +0 -657
  161. package/scripts/memalign-recall.js +0 -111
  162. package/scripts/memory-migration.js +0 -296
  163. package/scripts/meta-policy.js +0 -190
  164. package/scripts/metered-billing.js +0 -16
  165. package/scripts/model-tier-router.js +0 -310
  166. package/scripts/money-watcher.js +0 -218
  167. package/scripts/multi-hop-recall.js +0 -240
  168. package/scripts/per-step-scoring.js +0 -163
  169. package/scripts/perplexity-marketing.js +0 -466
  170. package/scripts/pii-scanner.js +0 -153
  171. package/scripts/plan-gate.js +0 -154
  172. package/scripts/post-everywhere.js +0 -341
  173. package/scripts/post-to-x-retry.sh +0 -22
  174. package/scripts/post-to-x.js +0 -369
  175. package/scripts/pr-manager.js +0 -421
  176. package/scripts/principle-extractor.js +0 -162
  177. package/scripts/pro-features.js +0 -41
  178. package/scripts/prompt-dlp.js +0 -222
  179. package/scripts/prove-adapters.js +0 -860
  180. package/scripts/prove-attribution.js +0 -361
  181. package/scripts/prove-automation.js +0 -651
  182. package/scripts/prove-autoresearch.js +0 -304
  183. package/scripts/prove-claim-verification.js +0 -277
  184. package/scripts/prove-cloudflare-sandbox.js +0 -161
  185. package/scripts/prove-data-pipeline.js +0 -408
  186. package/scripts/prove-data-quality.js +0 -227
  187. package/scripts/prove-evolution.js +0 -352
  188. package/scripts/prove-harnesses.js +0 -287
  189. package/scripts/prove-intelligence.js +0 -257
  190. package/scripts/prove-lancedb.js +0 -425
  191. package/scripts/prove-local-intelligence.js +0 -340
  192. package/scripts/prove-loop-closure.js +0 -263
  193. package/scripts/prove-packaged-runtime.js +0 -326
  194. package/scripts/prove-predictive-insights.js +0 -355
  195. package/scripts/prove-runtime.js +0 -363
  196. package/scripts/prove-seo-gsd.js +0 -234
  197. package/scripts/prove-settings.js +0 -279
  198. package/scripts/prove-subway-upgrades.js +0 -277
  199. package/scripts/prove-tessl.js +0 -229
  200. package/scripts/prove-training-export.js +0 -325
  201. package/scripts/prove-workflow-contract.js +0 -112
  202. package/scripts/prove-xmemory.js +0 -332
  203. package/scripts/publish-decision.js +0 -159
  204. package/scripts/ralph-loop.js +0 -376
  205. package/scripts/ralph-mode-ci.js +0 -331
  206. package/scripts/reddit-dm-outreach.js +0 -192
  207. package/scripts/reddit-monitor-cron.sh +0 -26
  208. package/scripts/reminder-engine.js +0 -132
  209. package/scripts/revenue-status.js +0 -472
  210. package/scripts/rotate-stripe-webhook-secret.js +0 -314
  211. package/scripts/schedule-manager.js +0 -249
  212. package/scripts/self-healing-check.js +0 -193
  213. package/scripts/shieldcortex-memory-firewall-runner.mjs +0 -53
  214. package/scripts/skill-exporter.js +0 -260
  215. package/scripts/skill-materializer.js +0 -134
  216. package/scripts/skill-packs.js +0 -136
  217. package/scripts/skill-proposer.js +0 -99
  218. package/scripts/skill-quality-tracker.js +0 -282
  219. package/scripts/slow-loop.js +0 -72
  220. package/scripts/social-analytics/db/analytics.sqlite +0 -0
  221. package/scripts/social-analytics/db/schema.sql +0 -32
  222. package/scripts/social-analytics/digest.js +0 -256
  223. package/scripts/social-analytics/engagement-audit.js +0 -185
  224. package/scripts/social-analytics/generate-instagram-card.js +0 -97
  225. package/scripts/social-analytics/instagram-thumbgate-post.js +0 -111
  226. package/scripts/social-analytics/install-growth-automation.js +0 -114
  227. package/scripts/social-analytics/load-env.js +0 -77
  228. package/scripts/social-analytics/mcp-server.js +0 -289
  229. package/scripts/social-analytics/normalizer.js +0 -580
  230. package/scripts/social-analytics/notify.js +0 -162
  231. package/scripts/social-analytics/poll-all.js +0 -107
  232. package/scripts/social-analytics/pollers/github.js +0 -195
  233. package/scripts/social-analytics/pollers/instagram.js +0 -253
  234. package/scripts/social-analytics/pollers/linkedin.js +0 -340
  235. package/scripts/social-analytics/pollers/plausible.js +0 -245
  236. package/scripts/social-analytics/pollers/reddit.js +0 -306
  237. package/scripts/social-analytics/pollers/threads.js +0 -233
  238. package/scripts/social-analytics/pollers/tiktok.js +0 -203
  239. package/scripts/social-analytics/pollers/x.js +0 -227
  240. package/scripts/social-analytics/pollers/youtube.js +0 -304
  241. package/scripts/social-analytics/pollers/zernio.js +0 -183
  242. package/scripts/social-analytics/publish-instagram-thumbgate.js +0 -104
  243. package/scripts/social-analytics/publish-thumbgate-launch.js +0 -322
  244. package/scripts/social-analytics/publishers/devto.js +0 -122
  245. package/scripts/social-analytics/publishers/instagram.js +0 -317
  246. package/scripts/social-analytics/publishers/linkedin.js +0 -294
  247. package/scripts/social-analytics/publishers/reddit.js +0 -385
  248. package/scripts/social-analytics/publishers/threads.js +0 -275
  249. package/scripts/social-analytics/publishers/tiktok.js +0 -217
  250. package/scripts/social-analytics/publishers/x.js +0 -259
  251. package/scripts/social-analytics/publishers/youtube.js +0 -223
  252. package/scripts/social-analytics/publishers/zernio.js +0 -539
  253. package/scripts/social-analytics/reconcile-thumbgate-campaign.js +0 -165
  254. package/scripts/social-analytics/run-digest.js +0 -34
  255. package/scripts/social-analytics/schedule-thumbgate-campaign.js +0 -275
  256. package/scripts/social-analytics/store.js +0 -455
  257. package/scripts/social-analytics/sync-launch-assets.js +0 -185
  258. package/scripts/social-analytics/utm.js +0 -143
  259. package/scripts/social-pipeline.js +0 -2626
  260. package/scripts/social-post-hourly.js +0 -228
  261. package/scripts/social-quality-gate.js +0 -134
  262. package/scripts/social-reply-monitor.js +0 -592
  263. package/scripts/status-dashboard.js +0 -155
  264. package/scripts/stripe-live-status.js +0 -115
  265. package/scripts/subagent-profiles.js +0 -79
  266. package/scripts/sync-branch-protection.js +0 -340
  267. package/scripts/sync-gh-secrets-from-env.sh +0 -70
  268. package/scripts/sync-github-about.js +0 -55
  269. package/scripts/sync-version.js +0 -479
  270. package/scripts/synthetic-dpo.js +0 -234
  271. package/scripts/tessl-export.js +0 -369
  272. package/scripts/test-coverage.js +0 -128
  273. package/scripts/thumbgate_session_start.sh +0 -32
  274. package/scripts/train_from_feedback.py +0 -929
  275. package/scripts/validate-feedback.js +0 -581
  276. package/scripts/verify-obsidian-setup.sh +0 -269
  277. package/scripts/verify-run.js +0 -269
  278. package/scripts/weekly-auto-post.js +0 -124
  279. package/scripts/x-autonomous-marketing.js +0 -139
@@ -1,581 +0,0 @@
1
- 'use strict';
2
- /**
3
- * Feedback Data Quality Validator
4
- *
5
- * Implements a 4-level validation pipeline:
6
- * 1. Schema validation (required fields, value ranges)
7
- * 2. Semantic validation (logical consistency)
8
- * 3. Anomaly detection (suspicious patterns, sensitive data)
9
- * 4. Self-correction (auto-correct fixable errors)
10
- *
11
- * Ported from Subway_RN_Demo with ThumbGate schema adaptations:
12
- * - Uses 'signal' (not 'feedback') with values 'positive'/'negative'
13
- * - Uses 'id' as required field (not 'source')
14
- * - THUMBGATE_FEEDBACK_DIR env var for path resolution
15
- *
16
- * Usage (CLI):
17
- * echo '{"signal":"positive",...}' | node validate-feedback.js
18
- * node validate-feedback.js --audit # Audit existing feedback log
19
- * node validate-feedback.js --stats # Show quality statistics
20
- *
21
- * Usage (module):
22
- * const { validateEntry } = require('./validate-feedback');
23
- *
24
- * LOCAL ONLY - Do not commit feedback log data to repository
25
- */
26
-
27
- const fs = require('fs');
28
- const path = require('path');
29
- const { resolveFeedbackDir } = require('./feedback-paths');
30
-
31
- // =============================================================================
32
- // PATH RESOLUTION
33
- // =============================================================================
34
-
35
// Feedback directory as resolved once, when this module is first loaded.
const DEFAULT_FEEDBACK_DIR = resolveFeedbackDir();

/**
 * Resolve the feedback directory at call time.
 *
 * Delegates to resolveFeedbackDir() on every call rather than reusing
 * DEFAULT_FEEDBACK_DIR.
 * NOTE(review): presumably so a changed THUMBGATE_FEEDBACK_DIR is picked up — confirm
 * against ./feedback-paths.
 *
 * @returns {*} Whatever resolveFeedbackDir() returns; callers use it as a directory path.
 */
function getFeedbackDir() {
  const feedbackDir = resolveFeedbackDir();
  return feedbackDir;
}
40
-
41
/**
 * Build the paths of the files this validator reads and writes, all located
 * directly inside the directory returned by getFeedbackDir().
 *
 * @returns {{FEEDBACK_LOG: string, VALIDATION_LOG: string, QUALITY_REPORT: string}}
 *   Paths of the feedback log, the validation-issues log and the quality report.
 */
function getFeedbackPaths() {
  const baseDir = getFeedbackDir();
  const inBaseDir = (fileName) => path.join(baseDir, fileName);

  return {
    FEEDBACK_LOG: inBaseDir('feedback-log.jsonl'),
    VALIDATION_LOG: inBaseDir('validation-issues.jsonl'),
    QUALITY_REPORT: inBaseDir('quality-report.json'),
  };
}
49
-
50
- // =============================================================================
51
- // SCHEMA VALIDATION (Level 1)
52
- // =============================================================================
53
-
54
const REQUIRED_FIELDS = ['timestamp', 'signal', 'id'];
const VALID_SIGNAL_VALUES = ['positive', 'negative'];
const VALID_REWARD_RANGE = [-1, 1];

/**
 * Level 1 validation: required fields, allowed signal values, reward range and
 * timestamp format.
 *
 * @param {Object} entry - Feedback entry to check.
 * @returns {Array<{level: string, field: string, message: string, suggestion: string}>}
 *   One issue per problem found; an empty array when the entry passes.
 */
function validateSchema(entry) {
  const issues = [];

  // Check required fields. A key that is present but holds null/undefined carries
  // no value, so it is reported as missing instead of silently passing.
  for (const field of REQUIRED_FIELDS) {
    if (entry[field] === undefined || entry[field] === null) {
      issues.push({
        level: 'error',
        field,
        message: `Missing required field: ${field}`,
        suggestion: `Add "${field}" to the feedback entry`,
      });
    }
  }

  // Validate signal value
  if (entry.signal && !VALID_SIGNAL_VALUES.includes(entry.signal)) {
    issues.push({
      level: 'warning',
      field: 'signal',
      message: `Invalid signal value: "${entry.signal}"`,
      suggestion: `Use one of: ${VALID_SIGNAL_VALUES.join(', ')}`,
    });
  }

  // Validate reward range. Number.isFinite rejects non-numbers and NaN; NaN would
  // otherwise pass because every comparison against it is false.
  if ('reward' in entry) {
    const [minReward, maxReward] = VALID_REWARD_RANGE;
    const rewardInRange =
      Number.isFinite(entry.reward) && entry.reward >= minReward && entry.reward <= maxReward;

    if (!rewardInRange) {
      issues.push({
        level: 'error',
        field: 'reward',
        message: `Reward out of range: ${entry.reward}`,
        suggestion: `Reward must be between ${minReward} and ${maxReward}`,
      });
    }
  }

  // Validate timestamp format
  if (entry.timestamp) {
    const timestampMs = new Date(entry.timestamp).getTime();
    if (Number.isNaN(timestampMs)) {
      issues.push({
        level: 'error',
        field: 'timestamp',
        message: `Invalid timestamp format: "${entry.timestamp}"`,
        suggestion: 'Use ISO 8601 format: YYYY-MM-DDTHH:MM:SSZ',
      });
    } else if (timestampMs > Date.now()) {
      issues.push({
        level: 'warning',
        field: 'timestamp',
        message: 'Timestamp is in the future',
        suggestion: 'Check system clock synchronization',
      });
    }
  }

  return issues;
}
121
-
122
- // =============================================================================
123
- // SEMANTIC VALIDATION (Level 2)
124
- // =============================================================================
125
-
126
// Minimum trimmed context length below which the context is reported as too short.
const MIN_CONTEXT_LENGTH = 5;

// Placeholder words, each paired with a case-insensitive whole-word pattern so that
// words merely containing one of them (e.g. "latest", "contest") are not flagged.
const PLACEHOLDER_PATTERNS = ['TODO', 'FIXME', 'placeholder', 'test', 'example'].map((word) => ({
  word,
  pattern: new RegExp(`\\b${word}\\b`, 'i'),
}));

// Tool names that do not trigger the "uncommon tool" info issue.
const KNOWN_TOOL_NAMES = ['Read', 'Write', 'Edit', 'Bash', 'Glob', 'Grep', 'Task', 'WebFetch'];

/**
 * Level 2 validation: logical consistency between fields.
 *
 * Checks that the reward sign agrees with the signal, that a string context is
 * long enough and free of placeholder words, and that tool_name is a known tool.
 *
 * @param {Object} entry - Feedback entry to check.
 * @returns {Array<Object>} Issues with level, field, message, explanation and suggestion.
 */
function validateSemantics(entry) {
  const issues = [];
  const hasNumericReward = typeof entry.reward === 'number';

  // Signal-reward consistency
  if (entry.signal === 'positive' && hasNumericReward && entry.reward < 0) {
    issues.push({
      level: 'error',
      field: 'reward',
      message: 'Positive signal but negative reward',
      explanation: 'Semantic inconsistency: positive signal should have reward >= 0',
      suggestion: 'Either change signal to "negative" or reward to positive value',
    });
  }

  if (entry.signal === 'negative' && hasNumericReward && entry.reward > 0) {
    issues.push({
      level: 'error',
      field: 'reward',
      message: 'Negative signal but positive reward',
      explanation: 'Semantic inconsistency: negative signal should have reward <= 0',
      suggestion: 'Either change signal to "positive" or reward to negative value',
    });
  }

  // Context validation (only string contexts are inspected)
  if (typeof entry.context === 'string') {
    // Empty or too short context; the suggestion quotes the threshold actually enforced
    if (entry.context.trim().length < MIN_CONTEXT_LENGTH) {
      issues.push({
        level: 'warning',
        field: 'context',
        message: 'Context too short to be meaningful',
        explanation: 'Short context reduces ML training value',
        suggestion: `Provide more descriptive context (at least ${MIN_CONTEXT_LENGTH} characters)`,
      });
    }

    // Check for placeholder text; only the first matching placeholder is reported
    const placeholder = PLACEHOLDER_PATTERNS.find(({ pattern }) => pattern.test(entry.context));
    if (placeholder) {
      issues.push({
        level: 'warning',
        field: 'context',
        message: `Context contains placeholder text: "${placeholder.word}"`,
        explanation: 'Placeholder text may indicate incomplete entry',
        suggestion: 'Replace with actual context or remove entry',
      });
    }
  }

  // Tool-name validation
  if (entry.tool_name && !KNOWN_TOOL_NAMES.includes(entry.tool_name)) {
    issues.push({
      level: 'info',
      field: 'tool_name',
      message: `Uncommon tool: "${entry.tool_name}"`,
      explanation: 'Tool not in standard list - may be valid but unusual',
      suggestion: 'Verify tool name is correct',
    });
  }

  return issues;
}
198
-
199
- // =============================================================================
200
- // ANOMALY DETECTION (Level 3)
201
- // =============================================================================
202
-
203
// Two entries closer together than this many milliseconds count towards a burst.
const BURST_WINDOW_MS = 60000;

// Patterns hinting at credentials in free text. None carries the g/y flag, so
// calling .test() on these shared instances keeps no state between calls.
const SENSITIVE_PATTERNS = [
  /api[_-]?key/i,
  /password/i,
  /secret/i,
  /token/i,
  /bearer/i,
  /\b[A-Za-z0-9]{32,}\b/, // Long alphanumeric strings (possible keys)
];

/**
 * Level 3 validation: suspicious patterns relative to other entries, plus
 * sensitive-data detection in the entry's own context.
 *
 * @param {Object} entry - Feedback entry to check.
 * @param {Array<Object>} [allEntries] - Entries to compare against; anything that is
 *   not an array is treated as an empty list. May contain `entry` itself.
 * @returns {Array<Object>} Issues with level, type ('anomaly' or 'security'),
 *   message, explanation and suggestion.
 */
function detectAnomalies(entry, allEntries) {
  const entries = Array.isArray(allEntries) ? allEntries : [];
  const issues = [];

  // Rapid feedback burst (more than 5 in 1 minute). The count includes `entry`
  // itself whenever it is part of allEntries.
  if (entry.timestamp && entries.length > 0) {
    const entryTime = new Date(entry.timestamp).getTime();
    const recentEntries = entries.filter(
      (e) => Math.abs(entryTime - new Date(e.timestamp).getTime()) < BURST_WINDOW_MS
    );

    if (recentEntries.length > 5) {
      issues.push({
        level: 'warning',
        type: 'anomaly',
        message: 'Feedback burst detected',
        explanation: `${recentEntries.length} entries within 1 minute - unusual pattern`,
        suggestion: 'Verify this is not automated noise or duplicate entries',
      });
    }
  }

  // Same feedback repeated exactly (duplicate detection). The entry is skipped by
  // identity: when the caller passes the list the entry came from, it would
  // otherwise always match itself and be reported as its own duplicate.
  if (entry.context && entries.length > 0) {
    const duplicates = entries.filter(
      (e) =>
        e !== entry &&
        e.context === entry.context &&
        e.signal === entry.signal &&
        e.tool_name === entry.tool_name
    );

    if (duplicates.length > 0) {
      issues.push({
        level: 'warning',
        type: 'anomaly',
        message: 'Duplicate feedback entry',
        explanation: `Found ${duplicates.length} identical entries`,
        suggestion: 'Consider deduplication or review capture logic',
      });
    }
  }

  // Feedback balance check (session imbalance)
  if (entries.length >= 10) {
    const positiveCount = entries.filter((e) => e.signal === 'positive').length;
    const ratio = positiveCount / entries.length;

    if (ratio > 0.95) {
      issues.push({
        level: 'info',
        type: 'anomaly',
        message: 'Feedback heavily skewed positive',
        explanation: `${(ratio * 100).toFixed(1)}% positive - may indicate capture bias`,
        suggestion: 'Review if negative cases are being properly captured',
      });
    } else if (ratio < 0.05) {
      issues.push({
        level: 'warning',
        type: 'anomaly',
        message: 'Feedback heavily skewed negative',
        explanation: `${((1 - ratio) * 100).toFixed(1)}% negative - unusual pattern`,
        suggestion: 'Check for systematic issues or misconfigured error detection',
      });
    }
  }

  // Sensitive data leakage detection; only the first matching pattern is reported
  if (entry.context) {
    const matched = SENSITIVE_PATTERNS.find((pattern) => pattern.test(entry.context));
    if (matched) {
      issues.push({
        level: 'error',
        type: 'security',
        message: 'Potential sensitive data in context',
        explanation: `Pattern matched: ${matched.toString()}`,
        suggestion: 'Redact sensitive information before logging',
      });
    }
  }

  return issues;
}
297
-
298
- // =============================================================================
299
- // SELF-CORRECTION (Level 4)
300
- // =============================================================================
301
-
302
/**
 * Level 4: derive automatic corrections from error-level issues.
 *
 * Two kinds of correction are produced:
 *  - reward: reset to 1 / -1 / 0 according to the entry's signal;
 *  - timestamp: filled with the current time when the entry has none.
 *
 * At most one correction is emitted per field, even when several error issues
 * point at the same field (e.g. a reward that is both out of range and
 * inconsistent with the signal).
 *
 * @param {Object} entry - The entry the issues were raised for.
 * @param {Array<Object>} issues - Issues produced by the validation levels.
 * @returns {Array<{field: string, original: *, corrected: *, reason: string}>}
 */
function generateCorrections(entry, issues) {
  const corrections = [];
  const correctedFields = new Set();

  for (const issue of issues) {
    if (issue.level !== 'error' || correctedFields.has(issue.field)) {
      continue;
    }

    // Auto-correct reward to match signal
    if (issue.field === 'reward' && entry.signal) {
      let correctedReward = 0;
      if (entry.signal === 'positive') {
        correctedReward = 1;
      } else if (entry.signal === 'negative') {
        correctedReward = -1;
      }

      corrections.push({
        field: 'reward',
        original: entry.reward,
        corrected: correctedReward,
        reason: 'Auto-corrected to match signal type',
      });
      correctedFields.add('reward');
    }

    // Auto-add missing timestamp (a malformed but present timestamp is left alone)
    if (issue.field === 'timestamp' && !entry.timestamp) {
      corrections.push({
        field: 'timestamp',
        original: null,
        corrected: new Date().toISOString(),
        reason: 'Added missing timestamp',
      });
      correctedFields.add('timestamp');
    }
  }

  return corrections;
}
333
-
334
/**
 * Produce a corrected copy of an entry.
 *
 * The input entry is left untouched. The copy receives each correction's value
 * under the corrected field, is flagged with `_corrected: true`, and keeps the
 * list of applied corrections under `_corrections`.
 *
 * @param {Object} entry - Original feedback entry.
 * @param {Array<{field: string, corrected: *}>} corrections - Corrections to apply, in order.
 * @returns {Object} Shallow copy of `entry` with the corrections applied.
 */
function applyCorrections(entry, corrections) {
  const patched = { ...entry };

  corrections.forEach((correction) => {
    patched[correction.field] = correction.corrected;
  });

  patched._corrected = true;
  patched._corrections = corrections;
  return patched;
}
343
-
344
- // =============================================================================
345
- // MAIN VALIDATION PIPELINE
346
- // =============================================================================
347
-
348
/**
 * Run the full validation pipeline on a single entry.
 *
 * The levels run in order: schema, semantics, anomaly detection, then
 * correction generation over all collected issues. The entry counts as valid
 * when no issue has level 'error'.
 *
 * @param {Object} entry - Feedback entry to validate.
 * @param {Array<Object>} [allEntries] - Entries used for anomaly detection; anything
 *   that is not an array is treated as an empty list.
 * @returns {{valid: boolean, entry: Object, issues: Array<Object>,
 *   corrections: Array<Object>, correctedEntry: (Object|null)}}
 *   `correctedEntry` is null when no correction was generated.
 */
function validateEntry(entry, allEntries) {
  const history = Array.isArray(allEntries) ? allEntries : [];

  // Levels 1-3, collected in pipeline order
  const issues = [
    ...validateSchema(entry),
    ...validateSemantics(entry),
    ...detectAnomalies(entry, history),
  ];

  // Level 4
  const corrections = generateCorrections(entry, issues);

  return {
    valid: issues.every((issue) => issue.level !== 'error'),
    entry,
    issues,
    corrections,
    correctedEntry: corrections.length > 0 ? applyCorrections(entry, corrections) : null,
  };
}
381
-
382
- // =============================================================================
383
- // FEEDBACK LOG UTILITIES
384
- // =============================================================================
385
-
386
/**
 * Load every entry of the feedback log (JSON Lines: one JSON object per line).
 *
 * Blank lines and lines that are not valid JSON are skipped on purpose, so one
 * corrupt line does not make the whole log unreadable. Lines that parse to
 * something other than a plain object (numbers, strings, booleans, null,
 * arrays) are skipped too: they are not feedback entries, and primitives would
 * make the validators throw on their `field in entry` checks.
 *
 * @returns {Array<Object>} Parsed entries in file order; empty when the log does not exist.
 */
function loadFeedbackLog() {
  const { FEEDBACK_LOG } = getFeedbackPaths();
  if (!fs.existsSync(FEEDBACK_LOG)) return [];

  const entries = [];
  for (const line of fs.readFileSync(FEEDBACK_LOG, 'utf8').split('\n')) {
    if (!line.trim()) {
      continue;
    }

    let parsed;
    try {
      parsed = JSON.parse(line);
    } catch {
      continue; // best-effort: ignore unparseable lines
    }

    if (parsed !== null && typeof parsed === 'object' && !Array.isArray(parsed)) {
      entries.push(parsed);
    }
  }
  return entries;
}
404
-
405
- // =============================================================================
406
- // AUDIT MODE
407
- // =============================================================================
408
-
409
/**
 * Audit the whole feedback log.
 *
 * Validates every entry against the full log, writes the collected issues to
 * the validation log (only when there are any) and a summary to the quality
 * report, then prints the summary to stdout. Prints a notice and returns early
 * when the log holds no entries.
 *
 * @returns {void}
 */
function auditFeedbackLog() {
  const { VALIDATION_LOG, QUALITY_REPORT } = getFeedbackPaths();
  console.log('Auditing feedback log...\n');

  const entries = loadFeedbackLog();
  if (entries.length === 0) {
    console.log('No entries to audit.');
    return;
  }

  const results = {
    total: entries.length,
    valid: 0,
    invalid: 0,
    corrected: 0,
    issuesByLevel: { error: 0, warning: 0, info: 0 },
    issuesByField: {},
  };

  const validationIssues = [];

  for (const entry of entries) {
    const validation = validateEntry(entry, entries);

    if (validation.valid) {
      results.valid++;
    } else {
      results.invalid++;
    }

    if (validation.corrections.length > 0) {
      results.corrected++;
    }

    for (const issue of validation.issues) {
      results.issuesByLevel[issue.level] = (results.issuesByLevel[issue.level] || 0) + 1;
      if (issue.field) {
        results.issuesByField[issue.field] = (results.issuesByField[issue.field] || 0) + 1;
      }

      validationIssues.push({
        timestamp: entry.timestamp,
        entryId: entry.id,
        ...issue,
      });
    }
  }

  // Make sure the output directory exists once, before either file is written
  const dir = getFeedbackDir();
  if (!fs.existsSync(dir)) fs.mkdirSync(dir, { recursive: true });

  // Save validation issues log (skipped when there is nothing to record)
  const wroteIssueLog = validationIssues.length > 0;
  if (wroteIssueLog) {
    const issueLog = validationIssues.map((i) => JSON.stringify(i)).join('\n');
    fs.writeFileSync(VALIDATION_LOG, issueLog + '\n');
  }

  // Save quality report
  const report = {
    ...results,
    validityRate: ((results.valid / results.total) * 100).toFixed(2) + '%',
    auditedAt: new Date().toISOString(),
  };
  fs.writeFileSync(QUALITY_REPORT, JSON.stringify(report, null, 2) + '\n');

  // Print summary
  console.log(`Total entries: ${results.total}`);
  console.log(`Valid: ${results.valid} (${report.validityRate})`);
  console.log(`Invalid: ${results.invalid}`);
  console.log(`Auto-correctable: ${results.corrected}`);
  console.log('\nIssues by level:');
  console.log(` Errors: ${results.issuesByLevel.error || 0}`);
  console.log(` Warnings: ${results.issuesByLevel.warning || 0}`);
  console.log(` Info: ${results.issuesByLevel.info || 0}`);

  if (Object.keys(results.issuesByField).length > 0) {
    console.log('\nTop issue fields:');
    const sorted = Object.entries(results.issuesByField)
      .sort((a, b) => b[1] - a[1])
      .slice(0, 5);
    for (const [field, count] of sorted) {
      console.log(` ${field}: ${count}`);
    }
  }

  // Only claim the issue log was saved when it was actually written in this run
  if (wroteIssueLog) {
    console.log(`\nValidation issues saved to: ${VALIDATION_LOG}`);
  } else {
    console.log('\nNo validation issues found; validation log not written.');
  }
  console.log(`Quality report saved to: ${QUALITY_REPORT}`);
}
498
-
499
/**
 * Print the quality report written by the last audit, or a hint to run
 * `--audit` first when no report file exists.
 *
 * @returns {void}
 */
function showStats() {
  const reportPath = getFeedbackPaths().QUALITY_REPORT;

  if (fs.existsSync(reportPath)) {
    const report = JSON.parse(fs.readFileSync(reportPath, 'utf8'));
    console.log('Feedback Quality Statistics\n');
    console.log(JSON.stringify(report, null, 2));
    return;
  }

  console.log('No quality report found. Run --audit first.');
}
510
-
511
- // =============================================================================
512
- // CLI ENTRY POINT
513
- // =============================================================================
514
-
515
/**
 * CLI entry point.
 *
 *   --audit   audit the existing feedback log
 *   --stats   print the last quality report
 *   (stdin)   validate one JSON entry piped on stdin and print the (possibly
 *             corrected) entry as JSON on stdout; issues go to stderr
 *
 * With no flag and no piped input, prints usage. Exits with status 1 when the
 * piped input is not valid JSON or when validation itself throws.
 *
 * @returns {Promise<void>}
 */
async function main() {
  const args = process.argv.slice(2);

  if (args.includes('--audit')) {
    auditFeedbackLog();
    return;
  }
  if (args.includes('--stats')) {
    showStats();
    return;
  }

  // Read from stdin (piped input)
  let input = '';
  if (!process.stdin.isTTY) {
    // Decode as a stream: concatenating raw Buffer chunks stringifies each chunk
    // separately and corrupts multi-byte characters split across chunk boundaries.
    process.stdin.setEncoding('utf8');
    for await (const chunk of process.stdin) {
      input += chunk;
    }
  }

  if (!input.trim()) {
    console.log('Feedback Data Quality Validator');
    console.log('\nUsage:');
    console.log(" echo '{\"signal\":\"positive\",...}' | node validate-feedback.js");
    console.log(' node validate-feedback.js --audit # Audit existing log');
    console.log(' node validate-feedback.js --stats # Show statistics');
    return;
  }

  let entry;
  try {
    entry = JSON.parse(input);
  } catch (e) {
    console.error(`[VALIDATION] Invalid JSON: ${e.message}`);
    process.exit(1);
  }

  // Kept separate from the parse step so a failure inside validation is not
  // misreported as invalid JSON.
  let result;
  try {
    result = validateEntry(entry, loadFeedbackLog());
  } catch (e) {
    console.error(`[VALIDATION] Validation failed: ${e.message}`);
    process.exit(1);
  }

  if (!result.valid) {
    console.error('[VALIDATION] Issues found:');
    for (const issue of result.issues) {
      console.error(` [${issue.level}] ${issue.message}`);
    }
  }

  // The entry is emitted whether or not it is valid, corrected when possible
  console.log(JSON.stringify(result.correctedEntry || result.entry));
}
561
-
562
- // =============================================================================
563
- // MODULE EXPORTS
564
- // =============================================================================
565
-
566
- module.exports = {
567
- validateEntry,
568
- validateSchema,
569
- validateSemantics,
570
- detectAnomalies,
571
- generateCorrections,
572
- applyCorrections,
573
- loadFeedbackLog,
574
- auditFeedbackLog,
575
- showStats,
576
- };
577
-
578
- // Run CLI only when invoked directly
579
- if (require.main === module) {
580
- main().catch(console.error);
581
- }