thumbgate 0.9.10
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.claude-plugin/README.md +134 -0
- package/.claude-plugin/bundle/icon.png +0 -0
- package/.claude-plugin/bundle/icon.svg +18 -0
- package/.claude-plugin/bundle/server/index.js +24 -0
- package/.claude-plugin/marketplace.json +36 -0
- package/.claude-plugin/plugin.json +21 -0
- package/.well-known/mcp/server-card.json +231 -0
- package/LICENSE +21 -0
- package/README.md +375 -0
- package/adapters/README.md +9 -0
- package/adapters/amp/skills/thumbgate-feedback/SKILL.md +22 -0
- package/adapters/chatgpt/INSTALL.md +83 -0
- package/adapters/chatgpt/openapi.yaml +1281 -0
- package/adapters/claude/.mcp.json +14 -0
- package/adapters/codex/config.toml +9 -0
- package/adapters/gemini/function-declarations.json +224 -0
- package/adapters/mcp/server-stdio.js +788 -0
- package/adapters/opencode/opencode.json +15 -0
- package/bin/cli.js +1484 -0
- package/bin/memory.sh +64 -0
- package/bin/obsidian-sync.sh +20 -0
- package/bin/postinstall.js +37 -0
- package/config/build-metadata.json +4 -0
- package/config/e2e-critical-flows.json +45 -0
- package/config/gate-templates.json +77 -0
- package/config/gates/claim-verification.json +29 -0
- package/config/gates/computer-use.json +39 -0
- package/config/gates/default.json +117 -0
- package/config/github-about.json +25 -0
- package/config/mcp-allowlists.json +135 -0
- package/config/model-tiers.json +33 -0
- package/config/partner-routing.json +132 -0
- package/config/policy-bundles/constrained-v1.json +64 -0
- package/config/policy-bundles/default-v1.json +91 -0
- package/config/rubrics/default-v1.json +52 -0
- package/config/skill-packs/react-testing.json +23 -0
- package/config/skill-packs/stripe-integration/references/api-spec.json +1 -0
- package/config/skill-packs/stripe-integration/references/webhook-guide.md +3 -0
- package/config/skill-specs/pr-reviewer.json +9 -0
- package/config/skill-specs/release-status.json +9 -0
- package/config/skill-specs/ticket-triage.json +9 -0
- package/config/subagent-profiles.json +32 -0
- package/config/tessl-tiles.json +29 -0
- package/config/thumbgate-settings.managed.json +12 -0
- package/openapi/openapi.yaml +1281 -0
- package/package.json +283 -0
- package/plugins/amp-skill/INSTALL.md +52 -0
- package/plugins/amp-skill/SKILL.md +64 -0
- package/plugins/claude-codex-bridge/.claude-plugin/plugin.json +22 -0
- package/plugins/claude-codex-bridge/.mcp.json +12 -0
- package/plugins/claude-codex-bridge/INSTALL.md +43 -0
- package/plugins/claude-codex-bridge/README.md +46 -0
- package/plugins/claude-codex-bridge/scripts/codex-bridge.js +288 -0
- package/plugins/claude-codex-bridge/skills/adversarial-review/SKILL.md +24 -0
- package/plugins/claude-codex-bridge/skills/result/SKILL.md +22 -0
- package/plugins/claude-codex-bridge/skills/review/SKILL.md +28 -0
- package/plugins/claude-codex-bridge/skills/second-pass/SKILL.md +27 -0
- package/plugins/claude-codex-bridge/skills/setup/SKILL.md +21 -0
- package/plugins/claude-codex-bridge/skills/status/SKILL.md +19 -0
- package/plugins/claude-skill/INSTALL.md +55 -0
- package/plugins/claude-skill/SKILL.md +46 -0
- package/plugins/codex-profile/.codex-plugin/plugin.json +43 -0
- package/plugins/codex-profile/.mcp.json +12 -0
- package/plugins/codex-profile/AGENTS.md +20 -0
- package/plugins/codex-profile/INSTALL.md +66 -0
- package/plugins/codex-profile/README.md +37 -0
- package/plugins/cursor-marketplace/.cursor-plugin/plugin.json +23 -0
- package/plugins/cursor-marketplace/CHANGELOG.md +30 -0
- package/plugins/cursor-marketplace/LICENSE +21 -0
- package/plugins/cursor-marketplace/README.md +124 -0
- package/plugins/cursor-marketplace/agents/reliability-reviewer.md +31 -0
- package/plugins/cursor-marketplace/assets/logo-400x400.png +0 -0
- package/plugins/cursor-marketplace/commands/capture-feedback.md +33 -0
- package/plugins/cursor-marketplace/commands/check-gates.md +25 -0
- package/plugins/cursor-marketplace/commands/show-lessons.md +27 -0
- package/plugins/cursor-marketplace/hooks/hooks.json +10 -0
- package/plugins/cursor-marketplace/mcp.json +12 -0
- package/plugins/cursor-marketplace/rules/feedback-capture.mdc +34 -0
- package/plugins/cursor-marketplace/rules/pre-action-gates.mdc +30 -0
- package/plugins/cursor-marketplace/rules/session-continuity.mdc +28 -0
- package/plugins/cursor-marketplace/scripts/gate-check.sh +11 -0
- package/plugins/cursor-marketplace/skills/capture-feedback/SKILL.md +47 -0
- package/plugins/cursor-marketplace/skills/prevention-rules/SKILL.md +31 -0
- package/plugins/cursor-marketplace/skills/recall-context/SKILL.md +30 -0
- package/plugins/cursor-marketplace/skills/search-lessons/SKILL.md +33 -0
- package/plugins/gemini-extension/INSTALL.md +92 -0
- package/plugins/gemini-extension/gemini_prompt.txt +14 -0
- package/plugins/gemini-extension/tool_contract.json +45 -0
- package/plugins/opencode-profile/INSTALL.md +57 -0
- package/public/assets/instagram-card.png +0 -0
- package/public/assets/tiktok-agent-memory.mp4 +0 -0
- package/public/blog.html +400 -0
- package/public/dashboard.html +1093 -0
- package/public/guide.html +317 -0
- package/public/index.html +1014 -0
- package/public/learn/agent-harness-pattern.html +180 -0
- package/public/learn/ai-agent-persistent-memory.html +202 -0
- package/public/learn/learn.css +45 -0
- package/public/learn/mcp-pre-action-gates-explained.html +172 -0
- package/public/learn/stop-ai-agent-force-push.html +134 -0
- package/public/learn/vibe-coding-safety-net.html +142 -0
- package/public/learn.html +213 -0
- package/public/lessons.html +650 -0
- package/public/vercel.json +8 -0
- package/scripts/__pycache__/train_from_feedback.cpython-312.pyc +0 -0
- package/scripts/a2ui-engine.js +73 -0
- package/scripts/access-anomaly-detector.js +12 -0
- package/scripts/adk-consolidator.js +266 -0
- package/scripts/agent-readiness.js +220 -0
- package/scripts/agent-security-hardening.js +227 -0
- package/scripts/agentic-data-pipeline.js +847 -0
- package/scripts/analytics-report.js +328 -0
- package/scripts/analytics-window.js +158 -0
- package/scripts/async-job-runner.js +1001 -0
- package/scripts/audit-trail.js +398 -0
- package/scripts/auto-promote-gates.js +299 -0
- package/scripts/auto-wire-hooks.js +312 -0
- package/scripts/autonomous-sales-agent.js +39 -0
- package/scripts/autoresearch-runner.js +216 -0
- package/scripts/background-agent-governance.js +237 -0
- package/scripts/behavioral-extraction.js +97 -0
- package/scripts/belief-update.js +84 -0
- package/scripts/billing.js +2438 -0
- package/scripts/bot-detector.js +50 -0
- package/scripts/budget-guard.js +173 -0
- package/scripts/build-claude-mcpb.js +189 -0
- package/scripts/build-metadata.js +97 -0
- package/scripts/check-congruence.js +322 -0
- package/scripts/cli-feedback.js +135 -0
- package/scripts/cli-telemetry.js +87 -0
- package/scripts/cloudflare-dynamic-sandbox.js +315 -0
- package/scripts/code-reasoning.js +350 -0
- package/scripts/codegraph-context.js +466 -0
- package/scripts/commercial-offer.js +56 -0
- package/scripts/computer-use-firewall.js +250 -0
- package/scripts/context-engine.js +694 -0
- package/scripts/contextfs.js +1287 -0
- package/scripts/conversation-context.js +119 -0
- package/scripts/creator-campaigns.js +239 -0
- package/scripts/daemon-manager.js +108 -0
- package/scripts/daily-digest.js +11 -0
- package/scripts/dashboard-render-spec.js +395 -0
- package/scripts/dashboard.js +1058 -0
- package/scripts/data-governance.js +173 -0
- package/scripts/delegation-runtime.js +900 -0
- package/scripts/deploy-gcp.sh +44 -0
- package/scripts/deploy-policy.js +263 -0
- package/scripts/disagreement-mining.js +315 -0
- package/scripts/dispatch-brief.js +159 -0
- package/scripts/distribution-surfaces.js +44 -0
- package/scripts/dpo-optimizer.js +209 -0
- package/scripts/ephemeral-agent-store.js +219 -0
- package/scripts/eval-harness.js +56 -0
- package/scripts/evolution-state.js +241 -0
- package/scripts/experiment-tracker.js +267 -0
- package/scripts/export-databricks-bundle.js +242 -0
- package/scripts/export-dpo-pairs.js +345 -0
- package/scripts/export-kto-pairs.js +310 -0
- package/scripts/export-training.js +448 -0
- package/scripts/failure-diagnostics.js +558 -0
- package/scripts/feedback-attribution.js +313 -0
- package/scripts/feedback-fallback.js +111 -0
- package/scripts/feedback-history-distiller.js +391 -0
- package/scripts/feedback-inbox-read.js +162 -0
- package/scripts/feedback-loop.js +1887 -0
- package/scripts/feedback-paths.js +145 -0
- package/scripts/feedback-quality.js +139 -0
- package/scripts/feedback-root-consolidator.js +238 -0
- package/scripts/feedback-schema.js +426 -0
- package/scripts/feedback-session.js +286 -0
- package/scripts/feedback-to-memory.js +185 -0
- package/scripts/feedback-to-rules.js +163 -0
- package/scripts/filesystem-search.js +404 -0
- package/scripts/funnel-analytics.js +35 -0
- package/scripts/gate-satisfy.js +42 -0
- package/scripts/gate-stats.js +116 -0
- package/scripts/gate-templates.js +70 -0
- package/scripts/gates-engine.js +816 -0
- package/scripts/generate-paperbanana-diagrams.sh +99 -0
- package/scripts/generate-pretool-hook.sh +40 -0
- package/scripts/github-about.js +350 -0
- package/scripts/github-outreach.js +65 -0
- package/scripts/gtm-revenue-loop.js +520 -0
- package/scripts/hallucination-detector.js +226 -0
- package/scripts/hf-papers.js +317 -0
- package/scripts/history-distiller.js +200 -0
- package/scripts/hook-auto-capture.sh +95 -0
- package/scripts/hook-stop-pr-thread-check.sh +68 -0
- package/scripts/hook-stop-self-score.sh +51 -0
- package/scripts/hook-stop-verify-deploy.sh +31 -0
- package/scripts/hook-thumbgate-cache-updater.js +48 -0
- package/scripts/hook-verify-before-done.sh +20 -0
- package/scripts/hosted-config.js +170 -0
- package/scripts/hybrid-feedback-context.js +676 -0
- package/scripts/install-mcp.js +159 -0
- package/scripts/intent-router.js +392 -0
- package/scripts/internal-agent-bootstrap.js +490 -0
- package/scripts/jsonl-watcher.js +155 -0
- package/scripts/lesson-db.js +613 -0
- package/scripts/lesson-inference.js +315 -0
- package/scripts/lesson-retrieval.js +95 -0
- package/scripts/lesson-rotation.js +137 -0
- package/scripts/lesson-search.js +644 -0
- package/scripts/lesson-synthesis.js +196 -0
- package/scripts/license.js +50 -0
- package/scripts/local-model-profile.js +383 -0
- package/scripts/markdown-escape.js +12 -0
- package/scripts/marketing-experiment.js +671 -0
- package/scripts/mcp-config.js +149 -0
- package/scripts/mcp-policy.js +99 -0
- package/scripts/memalign-recall.js +111 -0
- package/scripts/memory-firewall.js +222 -0
- package/scripts/memory-migration.js +296 -0
- package/scripts/meta-policy.js +194 -0
- package/scripts/metered-billing.js +16 -0
- package/scripts/model-tier-router.js +301 -0
- package/scripts/money-watcher.js +71 -0
- package/scripts/multi-hop-recall.js +240 -0
- package/scripts/natural-language-harness.js +330 -0
- package/scripts/obsidian-export.js +712 -0
- package/scripts/operational-dashboard.js +103 -0
- package/scripts/operational-summary.js +93 -0
- package/scripts/optimize-context.js +17 -0
- package/scripts/org-dashboard.js +201 -0
- package/scripts/partner-orchestration.js +146 -0
- package/scripts/per-step-scoring.js +165 -0
- package/scripts/perplexity-marketing.js +466 -0
- package/scripts/pii-scanner.js +153 -0
- package/scripts/plan-gate.js +154 -0
- package/scripts/post-everywhere.js +308 -0
- package/scripts/post-to-x-retry.sh +22 -0
- package/scripts/post-to-x.js +369 -0
- package/scripts/pr-manager.js +236 -0
- package/scripts/predictive-insights.js +356 -0
- package/scripts/principle-extractor.js +162 -0
- package/scripts/pro-features.js +40 -0
- package/scripts/pro-local-dashboard.js +174 -0
- package/scripts/problem-detail.js +53 -0
- package/scripts/product-feedback.js +134 -0
- package/scripts/profile-router.js +245 -0
- package/scripts/prompt-dlp.js +221 -0
- package/scripts/prompt-guard.js +83 -0
- package/scripts/prove-adapters.js +863 -0
- package/scripts/prove-attribution.js +365 -0
- package/scripts/prove-automation.js +653 -0
- package/scripts/prove-autoresearch.js +304 -0
- package/scripts/prove-claim-verification.js +277 -0
- package/scripts/prove-cloudflare-sandbox.js +163 -0
- package/scripts/prove-data-pipeline.js +410 -0
- package/scripts/prove-data-quality.js +227 -0
- package/scripts/prove-evolution.js +352 -0
- package/scripts/prove-harnesses.js +287 -0
- package/scripts/prove-intelligence.js +259 -0
- package/scripts/prove-lancedb.js +371 -0
- package/scripts/prove-local-intelligence.js +342 -0
- package/scripts/prove-loop-closure.js +263 -0
- package/scripts/prove-predictive-insights.js +357 -0
- package/scripts/prove-runtime.js +350 -0
- package/scripts/prove-seo-gsd.js +234 -0
- package/scripts/prove-settings.js +279 -0
- package/scripts/prove-subway-upgrades.js +277 -0
- package/scripts/prove-tessl.js +229 -0
- package/scripts/prove-training-export.js +327 -0
- package/scripts/prove-workflow-contract.js +116 -0
- package/scripts/prove-xmemory.js +332 -0
- package/scripts/publish-decision.js +133 -0
- package/scripts/pulse.js +80 -0
- package/scripts/rate-limiter.js +125 -0
- package/scripts/reddit-dm-outreach.js +182 -0
- package/scripts/reddit-monitor-cron.sh +26 -0
- package/scripts/reflector-agent.js +221 -0
- package/scripts/reminder-engine.js +132 -0
- package/scripts/revenue-status.js +472 -0
- package/scripts/risk-scorer.js +458 -0
- package/scripts/rlaif-self-audit.js +129 -0
- package/scripts/rubric-engine.js +230 -0
- package/scripts/schedule-manager.js +251 -0
- package/scripts/secret-scanner.js +414 -0
- package/scripts/self-heal.js +147 -0
- package/scripts/self-healing-check.js +188 -0
- package/scripts/semantic-layer.js +98 -0
- package/scripts/seo-gsd.js +1153 -0
- package/scripts/settings-hierarchy.js +214 -0
- package/scripts/shieldcortex-memory-firewall-runner.mjs +53 -0
- package/scripts/skill-exporter.js +262 -0
- package/scripts/skill-generator.js +446 -0
- package/scripts/skill-materializer.js +134 -0
- package/scripts/skill-packs.js +136 -0
- package/scripts/skill-proposer.js +99 -0
- package/scripts/skill-quality-tracker.js +284 -0
- package/scripts/slo-alert-engine.js +14 -0
- package/scripts/slow-loop.js +72 -0
- package/scripts/social-analytics/db/schema.sql +32 -0
- package/scripts/social-analytics/digest.js +256 -0
- package/scripts/social-analytics/generate-instagram-card.js +97 -0
- package/scripts/social-analytics/instagram-thumbgate-post.js +73 -0
- package/scripts/social-analytics/mcp-server.js +289 -0
- package/scripts/social-analytics/normalizer.js +580 -0
- package/scripts/social-analytics/notify.js +162 -0
- package/scripts/social-analytics/poll-all.js +107 -0
- package/scripts/social-analytics/pollers/github.js +195 -0
- package/scripts/social-analytics/pollers/instagram.js +253 -0
- package/scripts/social-analytics/pollers/linkedin.js +330 -0
- package/scripts/social-analytics/pollers/plausible.js +247 -0
- package/scripts/social-analytics/pollers/reddit.js +306 -0
- package/scripts/social-analytics/pollers/threads.js +233 -0
- package/scripts/social-analytics/pollers/tiktok.js +203 -0
- package/scripts/social-analytics/pollers/x.js +227 -0
- package/scripts/social-analytics/pollers/youtube.js +304 -0
- package/scripts/social-analytics/pollers/zernio.js +180 -0
- package/scripts/social-analytics/publish-instagram-thumbgate.js +85 -0
- package/scripts/social-analytics/publishers/devto.js +122 -0
- package/scripts/social-analytics/publishers/instagram.js +317 -0
- package/scripts/social-analytics/publishers/linkedin.js +294 -0
- package/scripts/social-analytics/publishers/reddit.js +390 -0
- package/scripts/social-analytics/publishers/threads.js +275 -0
- package/scripts/social-analytics/publishers/tiktok.js +217 -0
- package/scripts/social-analytics/publishers/x.js +259 -0
- package/scripts/social-analytics/publishers/youtube.js +223 -0
- package/scripts/social-analytics/publishers/zernio.js +209 -0
- package/scripts/social-analytics/run-digest.js +34 -0
- package/scripts/social-analytics/store.js +257 -0
- package/scripts/social-analytics/utm.js +143 -0
- package/scripts/social-pipeline.js +2628 -0
- package/scripts/social-quality-gate.js +18 -0
- package/scripts/social-reply-monitor.js +445 -0
- package/scripts/status-dashboard.js +155 -0
- package/scripts/statusline-lesson.js +16 -0
- package/scripts/statusline-tower.js +8 -0
- package/scripts/statusline.sh +116 -0
- package/scripts/stripe-live-status.js +115 -0
- package/scripts/subagent-profiles.js +79 -0
- package/scripts/sync-gh-secrets-from-env.sh +70 -0
- package/scripts/sync-github-about.js +52 -0
- package/scripts/sync-version.js +451 -0
- package/scripts/synthetic-dpo.js +234 -0
- package/scripts/telemetry-analytics.js +821 -0
- package/scripts/tessl-export.js +371 -0
- package/scripts/test-coverage.js +120 -0
- package/scripts/thompson-sampling.js +417 -0
- package/scripts/thumbgate-search.js +189 -0
- package/scripts/tool-kpi-tracker.js +12 -0
- package/scripts/tool-registry.js +811 -0
- package/scripts/train_from_feedback.py +910 -0
- package/scripts/user-profile.js +78 -0
- package/scripts/validate-feedback.js +580 -0
- package/scripts/validate-workflow-contract.js +287 -0
- package/scripts/vector-store.js +198 -0
- package/scripts/verification-loop.js +291 -0
- package/scripts/verify-obsidian-setup.sh +269 -0
- package/scripts/verify-run.js +269 -0
- package/scripts/webhook-delivery.js +62 -0
- package/scripts/weekly-auto-post.js +124 -0
- package/scripts/workflow-runs.js +154 -0
- package/scripts/workflow-sprint-intake.js +475 -0
- package/scripts/workspace-evolver.js +374 -0
- package/scripts/x-autonomous-marketing.js +139 -0
- package/scripts/xmemory-lite.js +405 -0
- package/skills/agent-memory/SKILL.md +97 -0
- package/skills/solve-architecture-autonomy/SKILL.md +17 -0
- package/skills/solve-architecture-autonomy/tool.js +33 -0
- package/skills/thumbgate/SKILL.md +114 -0
- package/skills/thumbgate-feedback/SKILL.md +49 -0
- package/src/api/server.js +4208 -0
|
@@ -0,0 +1,458 @@
|
|
|
1
|
+
#!/usr/bin/env node
|
|
2
|
+
'use strict';
|
|
3
|
+
|
|
4
|
+
const fs = require('fs');
|
|
5
|
+
const path = require('path');
|
|
6
|
+
|
|
7
|
+
// Package root: the parent of the directory that contains this script.
const PROJECT_ROOT = path.join(__dirname, '..');

// Fallback feedback directory, used when neither an explicit directory nor
// THUMBGATE_FEEDBACK_DIR is supplied (see resolveFeedbackDir).
const DEFAULT_FEEDBACK_DIR = path.join(PROJECT_ROOT, '.claude', 'memory', 'feedback');

// Default file locations inside the feedback directory.
const DEFAULT_MODEL_PATH = path.join(DEFAULT_FEEDBACK_DIR, 'risk-model.json');
const DEFAULT_SEQUENCE_PATH = path.join(DEFAULT_FEEDBACK_DIR, 'feedback-sequences.jsonl');
|
|
11
|
+
|
|
12
|
+
// Closed set of domain names. Each one becomes a one-hot `domain:<name>`
// feature in extractFeatureMap; the order here fixes the feature order.
const DOMAIN_FEATURES = [
  'general', 'testing', 'security', 'performance',
  'ui-components', 'api-integration', 'git-workflow', 'documentation',
  'debugging', 'architecture', 'data-modeling',
];
|
|
25
|
+
|
|
26
|
+
// Whole-word, case-insensitive keyword detectors applied to a row's context
// text. None of them carries the `g` flag, so `.test()` keeps no state
// between calls.

// Words that hint at a failure or a rejected outcome.
const RISK_WORD_RE = /\b(fail|error|wrong|missing|skip|regress|unsafe|blocked|rejected)\b/i;

// Words that hint at verification evidence being mentioned.
const VERIFY_WORD_RE = /\b(test|verify|coverage|evidence|log|proof)\b/i;

// Words that hint at safety or guardrail concerns.
const SAFETY_WORD_RE = /\b(budget|path|guardrail|safe|security|risk)\b/i;

// Words that hint at a successful outcome.
const SUCCESS_WORD_RE = /\b(pass|worked|fixed|success|verified)\b/i;
|
|
30
|
+
|
|
31
|
+
/**
 * Choose the feedback directory to work with.
 *
 * Precedence: explicit argument, then the THUMBGATE_FEEDBACK_DIR environment
 * variable, then DEFAULT_FEEDBACK_DIR. Empty strings count as "not provided".
 *
 * @param {string} [feedbackDir] - Caller-supplied directory, if any.
 * @returns {string} The directory path to use.
 */
function resolveFeedbackDir(feedbackDir) {
  if (feedbackDir) {
    return feedbackDir;
  }
  const fromEnvironment = process.env.THUMBGATE_FEEDBACK_DIR;
  if (fromEnvironment) {
    return fromEnvironment;
  }
  return DEFAULT_FEEDBACK_DIR;
}
|
|
34
|
+
|
|
35
|
+
/**
 * Read a JSON Lines file into an array of parsed values.
 *
 * A missing or blank file yields an empty array. Lines that are not valid
 * JSON are skipped rather than raising, and so are lines that parse to a
 * falsy value (null, 0, false, "").
 *
 * @param {string} filePath - Path of the .jsonl file.
 * @returns {Array<*>} Parsed truthy records, in file order.
 */
function readJSONL(filePath) {
  if (!fs.existsSync(filePath)) {
    return [];
  }

  const text = fs.readFileSync(filePath, 'utf8').trim();
  if (text === '') {
    return [];
  }

  const records = [];
  for (const line of text.split('\n')) {
    let parsed = null;
    try {
      parsed = JSON.parse(line);
    } catch {
      // Best effort: a malformed line must not discard the rest of the file.
      parsed = null;
    }
    if (parsed) {
      records.push(parsed);
    }
  }
  return records;
}
|
|
50
|
+
|
|
51
|
+
/**
 * Arithmetic mean of a list of numeric-like values.
 *
 * Falsy entries (null, undefined, '', 0) contribute 0 to the sum but still
 * count toward the divisor.
 *
 * @param {Array<*>} values - Values to average.
 * @returns {number} The mean, or 0 for a non-array or an empty array.
 */
function average(values) {
  if (!Array.isArray(values) || values.length === 0) {
    return 0;
  }
  let total = 0;
  for (const value of values) {
    total += Number(value || 0);
  }
  return total / values.length;
}
|
|
55
|
+
|
|
56
|
+
/**
 * Largest value in a list, with a floor of 0.
 *
 * The running maximum starts at 0, so a list made up only of negative
 * numbers yields 0. Falsy entries are treated as 0.
 *
 * @param {Array<*>} values - Values to scan.
 * @returns {number} The maximum (never below 0), or 0 for a non-array or an empty array.
 */
function max(values) {
  if (!Array.isArray(values) || values.length === 0) {
    return 0;
  }
  let largest = 0;
  for (const value of values) {
    largest = Math.max(largest, Number(value || 0));
  }
  return largest;
}
|
|
60
|
+
|
|
61
|
+
/**
 * Count the entries whose numeric value is strictly below zero.
 *
 * @param {Array<*>} [values] - Values to inspect; a falsy argument counts as empty.
 * @returns {number} Number of negative entries.
 */
function countNegatives(values) {
  const list = values || [];
  return list.reduce(
    (count, value) => (Number(value) < 0 ? count + 1 : count),
    0,
  );
}
|
|
64
|
+
|
|
65
|
+
/**
 * Count the entries whose numeric value is strictly above zero.
 *
 * @param {Array<*>} [values] - Values to inspect; a falsy argument counts as empty.
 * @returns {number} Number of positive entries.
 */
function countPositives(values) {
  const list = values || [];
  return list.reduce(
    (count, value) => (Number(value) > 0 ? count + 1 : count),
    0,
  );
}
|
|
68
|
+
|
|
69
|
+
/**
 * Pass arrays through unchanged and replace anything else with a new empty array.
 *
 * @param {*} value - Candidate value.
 * @returns {Array<*>} `value` itself when it is an array, otherwise `[]`.
 */
function toArray(value) {
  if (Array.isArray(value)) {
    return value;
  }
  return [];
}
|
|
72
|
+
|
|
73
|
+
/**
 * Collect the most frequent normalized values of one field across rows.
 *
 * For `key === 'targetTags'` the values come from `row.targetTags` (falling
 * back to `row.tags`); for any other key the single truthy `row[key]` is
 * used. Values are trimmed and lower-cased, and empty ones are ignored.
 *
 * @param {Array<Object>} rows - Feedback rows.
 * @param {string} key - Field to tally.
 * @param {number} limit - Maximum number of entries to return.
 * @returns {string[]} Values ordered by descending count, ties broken alphabetically.
 */
function buildVocabulary(rows, key, limit) {
  const valuesOf = (row) => {
    if (key === 'targetTags') {
      return toArray(row.targetTags || row.tags);
    }
    return row[key] ? [row[key]] : [];
  };

  const frequency = new Map();
  rows.forEach((row) => {
    valuesOf(row).forEach((rawValue) => {
      const term = String(rawValue || '').trim().toLowerCase();
      if (term) {
        frequency.set(term, (frequency.get(term) || 0) + 1);
      }
    });
  });

  const ranked = Array.from(frequency.entries());
  ranked.sort((a, b) => {
    const byCount = b[1] - a[1];
    return byCount !== 0 ? byCount : a[0].localeCompare(b[0]);
  });
  return ranked.slice(0, limit).map((entry) => entry[0]);
}
|
|
91
|
+
|
|
92
|
+
/**
 * Build the registry that fixes which categorical features exist.
 *
 * @param {Array<Object>} rows - Feedback rows the vocabularies are drawn from.
 * @param {Object} [options]
 * @param {number} [options.maxTags] - Tag vocabulary size; falsy values fall back to 8.
 * @param {number} [options.maxSkills] - Skill vocabulary size; falsy values fall back to 4.
 * @returns {{topTags: string[], topSkills: string[], domains: string[]}}
 *   `domains` is the shared DOMAIN_FEATURES array itself, not a copy.
 */
function buildFeatureRegistry(rows, options = {}) {
  const tagLimit = options.maxTags || 8;
  const topTags = buildVocabulary(rows, 'targetTags', tagLimit);

  const skillLimit = options.maxSkills || 4;
  const topSkills = buildVocabulary(rows, 'skill', skillLimit);

  return { topTags, topSkills, domains: DOMAIN_FEATURES };
}
|
|
99
|
+
|
|
100
|
+
/**
 * Reduce a feedback row to a binary risk target.
 *
 * Checked in order:
 *   1. a numeric `targetRisk` (1 when above zero, otherwise 0);
 *   2. `accepted === false` (1);
 *   3. `label`, falling back to `signal`, equal to "negative" ignoring case (1).
 * Anything else is 0.
 *
 * @param {Object} row - Feedback row.
 * @returns {0|1} 1 for high risk, 0 otherwise.
 */
function deriveTargetRisk(row) {
  const { targetRisk } = row;
  if (typeof targetRisk === 'number') {
    return targetRisk > 0 ? 1 : 0;
  }

  if (row.accepted === false) {
    return 1;
  }

  const outcome = String(row.label || row.signal || '').toLowerCase();
  if (outcome === 'negative') {
    return 1;
  }
  return 0;
}
|
|
106
|
+
|
|
107
|
+
/**
 * Mean share of negative outcomes across all action patterns.
 *
 * Each value of `actionPatterns` is read for `positive` and `negative`
 * counts. A pattern with no positive total contributes a rate of 0.
 *
 * @param {Object<string, {positive?: number, negative?: number}>} [actionPatterns]
 * @returns {number} Average per-pattern negative rate, or 0 when there are no patterns.
 */
function deriveActionNegativeRate(actionPatterns) {
  const patterns = Object.values(actionPatterns || {});
  if (patterns.length === 0) {
    return 0;
  }

  const negativeShares = [];
  for (const pattern of patterns) {
    const positives = Number(pattern.positive || 0);
    const negatives = Number(pattern.negative || 0);
    const observed = positives + negatives;
    negativeShares.push(observed > 0 ? negatives / observed : 0);
  }
  return average(negativeShares);
}
|
|
118
|
+
|
|
119
|
+
/**
 * Flatten one feedback row into a map of numeric features.
 *
 * The base features come first, followed by one-hot `domain:<name>`,
 * `tag:<name>` and `skill:<name>` entries in registry order. Key insertion
 * order is significant: trainRiskModel derives `featureNames` from it.
 *
 * @param {Object} row - Feedback row. Fields read: `features`, `targetTags`/`tags`,
 *   `skill`, `domain`, `richContext.domain`, `context`, `rubric`,
 *   `filePathCount`, `errorType`.
 * @param {{domains: string[], topTags: string[], topSkills: string[]}} registry
 *   Registry as produced by buildFeatureRegistry.
 * @returns {Object<string, number>} Feature name to numeric value.
 */
function extractFeatureMap(row, registry) {
  const rowFeatures = row.features || {};
  const rewardSequence = toArray(rowFeatures.rewardSequence);
  const timeGaps = toArray(rowFeatures.timeGaps);
  const currentTags = toArray(row.targetTags || row.tags).map((tag) => String(tag).trim().toLowerCase());
  const currentSkill = String(row.skill || '').trim().toLowerCase();
  const domain = String(row.domain || (row.richContext && row.richContext.domain) || 'general').trim().toLowerCase();
  const context = String(row.context || '').toLowerCase();
  const rubric = row.rubric || {};
  const filePathCount = Number(row.filePathCount || 0);
  const hasErrorType = row.errorType ? 1 : 0;
  const failingCriteria = toArray(rubric.failingCriteria);
  const failingGuardrails = toArray(rubric.failingGuardrails);
  const judgeDisagreements = toArray(rubric.judgeDisagreements);

  // Number(null) is 0, so a rubric carrying `weightedScore: null` must not be
  // converted: it would read as a genuine score of 0 while `hasRubric` says
  // there is no score. Only convert when a score is actually present.
  const hasWeightedScore = rubric.weightedScore != null;
  const weightedScore = hasWeightedScore ? Number(rubric.weightedScore) : NaN;

  const features = {
    recentTrend: Number(rowFeatures.recentTrend || 0),
    sequenceLength: rewardSequence.length,
    recentNegativeCount: countNegatives(rewardSequence),
    recentPositiveCount: countPositives(rewardSequence),
    avgTimeGap: average(timeGaps),
    maxTimeGap: max(timeGaps),
    tagCount: currentTags.length,
    filePathCount,
    hasErrorType,
    hasRubric: hasWeightedScore ? 1 : 0,
    // 0.5 is the fallback when the score is absent or not a finite number.
    rubricWeightedScore: Number.isFinite(weightedScore) ? weightedScore : 0.5,
    failingCriteriaCount: failingCriteria.length,
    failingGuardrailsCount: failingGuardrails.length,
    judgeDisagreementCount: judgeDisagreements.length,
    actionNegativeRate: deriveActionNegativeRate(rowFeatures.actionPatterns),
    containsRiskWord: RISK_WORD_RE.test(context) ? 1 : 0,
    containsVerificationWord: VERIFY_WORD_RE.test(context) ? 1 : 0,
    containsSafetyWord: SAFETY_WORD_RE.test(context) ? 1 : 0,
    containsSuccessWord: SUCCESS_WORD_RE.test(context) ? 1 : 0,
  };

  // One-hot encodings; every registry entry gets a key even when it is 0 so
  // that all rows share the same feature set.
  registry.domains.forEach((knownDomain) => {
    features[`domain:${knownDomain}`] = domain === knownDomain ? 1 : 0;
  });
  registry.topTags.forEach((tag) => {
    features[`tag:${tag}`] = currentTags.includes(tag) ? 1 : 0;
  });
  registry.topSkills.forEach((skill) => {
    features[`skill:${skill}`] = currentSkill === skill ? 1 : 0;
  });

  return features;
}
|
|
168
|
+
|
|
169
|
+
/**
 * Propose split thresholds for one feature column.
 *
 * - No values: `[0]`.
 * - One distinct value: that value.
 * - Two to six distinct values: the midpoint between each adjacent pair.
 * - More than six: midpoints taken near the 20/40/60/80% positions of the
 *   sorted distinct values, de-duplicated.
 *
 * @param {Array<*>} values - Raw feature values; falsy entries count as 0.
 * @returns {number[]} Candidate thresholds.
 */
function candidateThresholds(values) {
  const distinct = Array.from(new Set(values.map((value) => Number(value || 0))));
  distinct.sort((a, b) => a - b);

  const count = distinct.length;
  if (count === 0) {
    return [0];
  }
  if (count === 1) {
    return [distinct[0]];
  }

  const midpointAfter = (index) => (distinct[index] + distinct[index + 1]) / 2;

  if (count <= 6) {
    const midpoints = [];
    for (let index = 0; index < count - 1; index += 1) {
      midpoints.push(midpointAfter(index));
    }
    return midpoints;
  }

  const picked = new Set();
  for (const pct of [0.2, 0.4, 0.6, 0.8]) {
    const rawPosition = Math.floor((count - 1) * pct);
    // Clamp so that `position + 1` is always a valid index.
    const position = Math.min(count - 2, Math.max(0, rawPosition));
    picked.add(midpointAfter(position));
  }
  return [...picked];
}
|
|
182
|
+
|
|
183
|
+
/**
 * Evaluate a decision stump on a single feature value.
 *
 * @param {*} value - Feature value; falsy values count as 0.
 * @param {number} threshold - Split point; the comparison is strictly greater-than.
 * @param {number} polarity - +1 or -1; flips which side of the split votes positive.
 * @returns {number} `polarity` when the value exceeds the threshold, `-polarity` otherwise.
 */
function stumpPredict(value, threshold, polarity) {
  const numeric = Number(value || 0);
  if (numeric > threshold) {
    return 1 * polarity;
  }
  return -1 * polarity;
}
|
|
187
|
+
|
|
188
|
+
/**
 * Exhaustively search for the decision stump with the lowest weighted error.
 *
 * Every feature, every candidate threshold for that feature and both
 * polarities are tried. The first stump reaching the lowest error wins
 * (strict `<` comparison), so feature order breaks ties.
 *
 * @param {Array<{label: number, features: Object<string, number>}>} examples
 *   Training examples with labels of +1 / -1.
 * @param {number[]} weights - Per-example weights, aligned with `examples`.
 * @param {string[]} featureNames - Features to consider, in priority order.
 * @returns {{feature: string, threshold: number, polarity: number, error: number,
 *   predictions: number[]}|null} Best stump, or null when nothing was evaluated.
 */
function findBestWeakLearner(examples, weights, featureNames) {
  let best = null;

  for (const feature of featureNames) {
    const column = examples.map((example) => example.features[feature]);

    for (const threshold of candidateThresholds(column)) {
      for (const polarity of [-1, 1]) {
        const predictions = column.map((value) => stumpPredict(value, threshold, polarity));

        // Weighted error: total weight of the examples this stump gets wrong.
        let error = 0;
        for (let index = 0; index < examples.length; index += 1) {
          if (predictions[index] !== examples[index].label) {
            error += weights[index];
          }
        }

        if (best === null || error < best.error) {
          best = { feature, threshold, polarity, error, predictions };
        }
      }
    }
  }

  return best;
}
|
|
221
|
+
|
|
222
|
+
/**
 * Scale weights so that they sum to 1.
 *
 * When the weights sum to zero the divisor falls back to 1, which leaves the
 * weights unchanged instead of dividing by zero.
 *
 * @param {number[]} weights - Weights to normalize.
 * @returns {number[]} A new array of scaled weights.
 */
function normalizeWeights(weights) {
  const sum = weights.reduce((running, weight) => running + weight, 0);
  const divisor = sum || 1;
  return weights.map((weight) => weight / divisor);
}
|
|
226
|
+
|
|
227
|
+
/**
 * Fraction of training examples whose predicted label matches the target.
 *
 * @param {Object} model - Model passed through to predictRisk.
 * @param {Array<{row: Object, label: number}>} examples - Examples with labels
 *   of +1 (high risk) or anything else (low risk).
 * @returns {number} Accuracy between 0 and 1; 0 when there are no examples.
 */
function trainingAccuracy(model, examples) {
  const total = examples.length;
  if (total === 0) {
    return 0;
  }

  let hits = 0;
  examples.forEach((example) => {
    const expected = example.label === 1 ? 'high-risk' : 'low-risk';
    const predicted = predictRisk(model, example.row).label;
    if (predicted === expected) {
      hits += 1;
    }
  });
  return hits / total;
}
|
|
235
|
+
|
|
236
|
+
/**
 * Summarize which tags, domains and skills are most associated with risk.
 *
 * For each dimension, rows are grouped by normalized value; groups seen fewer
 * than twice are dropped. The remaining groups are ordered by risk rate
 * (descending), then by size (descending), then alphabetically, and the top
 * five are returned.
 *
 * @param {Array<Object>} rows - Feedback rows.
 * @returns {{tags: Array<Object>, domains: Array<Object>, skills: Array<Object>}}
 *   Each entry has `key`, `total`, `highRisk` and `riskRate` (rounded to 3 decimals).
 */
function buildPatternSummary(rows) {
  const compareBuckets = (a, b) => (
    b.riskRate - a.riskRate
    || b.total - a.total
    || a.key.localeCompare(b.key)
  );

  const rankBy = (valuesFn) => {
    const byKey = new Map();

    rows.forEach((row) => {
      valuesFn(row).forEach((rawValue) => {
        const key = String(rawValue || '').trim().toLowerCase();
        if (!key) {
          return;
        }
        let bucket = byKey.get(key);
        if (!bucket) {
          bucket = { key, total: 0, highRisk: 0 };
          byKey.set(key, bucket);
        }
        bucket.total += 1;
        bucket.highRisk += deriveTargetRisk(row);
      });
    });

    const ranked = [];
    for (const bucket of byKey.values()) {
      if (bucket.total >= 2) {
        ranked.push({
          ...bucket,
          riskRate: Math.round((bucket.highRisk / bucket.total) * 1000) / 1000,
        });
      }
    }
    ranked.sort(compareBuckets);
    return ranked.slice(0, 5);
  };

  return {
    tags: rankBy((row) => toArray(row.targetTags || row.tags)),
    domains: rankBy((row) => [row.domain || row.richContext && row.richContext.domain || 'general']),
    skills: rankBy((row) => (row.skill ? [row.skill] : [])),
  };
}
|
|
268
|
+
|
|
269
|
+
/**
 * Train a risk classifier from feedback rows using boosted decision stumps.
 *
 * The model stays in "baseline" mode (no learners) when there are fewer than
 * six examples or when every example has the same label. Otherwise up to
 * `options.rounds` boosting rounds are run (default 8, clamped to 1..12),
 * stopping early when no stump beats a weighted error of 0.5.
 *
 * @param {Array<Object>} rows - Feedback rows.
 * @param {Object} [options]
 * @param {number} [options.rounds] - Requested number of boosting rounds.
 * @param {number} [options.maxTags] - Passed through to buildFeatureRegistry.
 * @param {number} [options.maxSkills] - Passed through to buildFeatureRegistry.
 * @returns {Object} Model with metadata, `featureRegistry`, `featureNames`,
 *   `learners`, `patterns` and `metrics`.
 */
function trainRiskModel(rows, options = {}) {
  const registry = buildFeatureRegistry(rows, options);
  const examples = rows.map((row) => {
    const label = deriveTargetRisk(row) === 1 ? 1 : -1;
    const features = extractFeatureMap(row, registry);
    return { row, label, features };
  });

  const exampleCount = examples.length;
  const highRiskExamples = examples.filter((example) => example.label === 1).length;

  const model = {
    version: 1,
    algorithm: 'adaboost-stumps',
    trainedAt: new Date().toISOString(),
    exampleCount,
    highRiskExamples,
    baseRate: exampleCount > 0 ? highRiskExamples / exampleCount : 0,
    featureRegistry: registry,
    featureNames: examples[0] ? Object.keys(examples[0].features) : [],
    learners: [],
    patterns: buildPatternSummary(rows),
    metrics: {
      trainingAccuracy: 0,
      rounds: 0,
      mode: 'baseline',
    },
  };

  // Boosting needs enough data and both classes present; otherwise the
  // model keeps predicting from the base rate alone.
  const singleClass = highRiskExamples === 0 || highRiskExamples === exampleCount;
  if (exampleCount < 6 || singleClass) {
    model.metrics.trainingAccuracy = trainingAccuracy(model, examples);
    return model;
  }

  const rounds = Math.max(1, Math.min(12, Number(options.rounds || 8)));
  let weights = normalizeWeights(Array.from({ length: exampleCount }, () => 1));

  let round = 0;
  while (round < rounds) {
    const learner = findBestWeakLearner(examples, weights, model.featureNames);
    if (!learner) {
      break;
    }

    // Clip away from 0 and 1 so the log below stays finite.
    const clippedError = Math.min(Math.max(learner.error, 1e-6), 1 - 1e-6);
    if (clippedError >= 0.5) {
      break;
    }

    const alpha = 0.5 * Math.log((1 - clippedError) / clippedError);
    const { feature, threshold, polarity, predictions } = learner;
    // The stored alpha is rounded; the reweighting below uses the exact value.
    model.learners.push({
      feature,
      threshold,
      polarity,
      alpha: Math.round(alpha * 1000) / 1000,
    });

    // Raise the weight of misclassified examples and lower the rest.
    const reweighted = weights.map((weight, index) => (
      weight * Math.exp(-alpha * examples[index].label * predictions[index])
    ));
    weights = normalizeWeights(reweighted);

    round += 1;
  }

  const learnerCount = model.learners.length;
  model.metrics.rounds = learnerCount;
  model.metrics.mode = learnerCount > 0 ? 'boosted' : 'baseline';
  model.metrics.trainingAccuracy = trainingAccuracy(model, examples);
  return model;
}
|
|
330
|
+
|
|
331
|
+
/**
 * Compute the un-squashed score of a row under a trained risk model.
 *
 * - No model, or a model without a feature registry: 0.
 * - Model without learners: the base rate mapped linearly from [0, 1] to
 *   [-1, 1]. A missing or non-finite base rate counts as 0.5, giving 0.
 * - Otherwise: the alpha-weighted sum of the stump predictions.
 *
 * @param {Object|null} model - Model as produced by trainRiskModel.
 * @param {Object} row - Row to score.
 * @returns {number} Raw score.
 */
function rawScore(model, row) {
  if (!model || !model.featureRegistry) {
    return 0;
  }

  if (!model.learners || model.learners.length === 0) {
    // A base rate of exactly 0 is a valid value and must not be replaced by the
    // 0.5 default; only absent or non-finite values fall back.
    const parsedBase = model.baseRate == null ? NaN : Number(model.baseRate);
    const baseRate = Number.isFinite(parsedBase) ? parsedBase : 0.5;
    return (baseRate - 0.5) * 2;
  }

  const features = extractFeatureMap(row, model.featureRegistry);
  return model.learners.reduce((sum, learner) => (
    sum + learner.alpha * stumpPredict(features[learner.feature], learner.threshold, learner.polarity)
  ), 0);
}
|
|
346
|
+
|
|
347
|
+
/**
 * Predict the risk of a row.
 *
 * With fitted learners the probability is the logistic transform
 * 1 / (1 + exp(-2 * score)) of the raw score. Without learners it is the
 * model's base rate, or 0 when the model or its base rate is missing.
 *
 * @param {Object|null} model - Model as produced by trainRiskModel.
 * @param {Object} row - Row to score.
 * @returns {{ score: number, probability: number, label: string }} Score and
 *   probability rounded to 3 decimals; label is 'high-risk' when the unrounded
 *   probability is at least 0.5, otherwise 'low-risk'.
 */
function predictRisk(model, row) {
  const score = rawScore(model, row);
  // rawScore accepts a missing model, so guard here too instead of throwing on
  // `model.learners`.
  const hasLearners = Boolean(model && model.learners && model.learners.length > 0);
  const probability = hasLearners
    ? 1 / (1 + Math.exp(-2 * score))
    : Number((model && model.baseRate) || 0);
  return {
    score: Math.round(score * 1000) / 1000,
    probability: Math.round(probability * 1000) / 1000,
    label: probability >= 0.5 ? 'high-risk' : 'low-risk',
  };
}
|
|
358
|
+
|
|
359
|
+
/**
 * Assemble a candidate row for risk prediction from the current request
 * parameters and the recent feedback history.
 *
 * @param {Object} [params] - Current request fields (context, tags, skill,
 *   domain, filePathCount, errorType, rubric).
 * @param {Array<Object>} [historyRows] - Earlier rows; only the last 10 feed
 *   the reward sequence and the time gaps.
 * @returns {Object} Candidate row with a nested `features` object.
 */
function buildRiskCandidate(params = {}, historyRows = []) {
  const targetTags = toArray(params.tags)
    .map((tag) => String(tag).trim())
    .filter((tag) => tag.length > 0);

  const recentRows = historyRows.slice(-10);
  const rewardSequence = recentRows
    .map((row) => Number(row.targetReward || 0))
    .filter((value) => Number.isFinite(value));

  // Minutes between consecutive rows, for rows inside the last-10 window.
  // Starting at index 1 at the earliest skips the first row, which has no predecessor.
  const timeGaps = [];
  const firstIndex = Math.max(1, historyRows.length - 10);
  for (let position = firstIndex; position < historyRows.length; position += 1) {
    const earlier = Date.parse(historyRows[position - 1].timestamp || '');
    const later = Date.parse(historyRows[position].timestamp || '');
    if (!Number.isFinite(earlier) || !Number.isFinite(later)) continue;
    timeGaps.push((later - earlier) / 1000 / 60);
  }

  let recentTrend = 0;
  if (rewardSequence.length > 0) {
    recentTrend = average(rewardSequence.slice(-5));
  }

  return {
    context: params.context || '',
    targetTags,
    skill: params.skill || null,
    domain: params.domain || 'general',
    filePathCount: Number(params.filePathCount || 0),
    errorType: params.errorType || null,
    rubric: params.rubric || null,
    features: {
      rewardSequence,
      recentTrend,
      timeGaps,
      actionPatterns: {},
    },
  };
}
|
|
390
|
+
|
|
391
|
+
/**
 * Location of the risk model file inside the resolved feedback directory.
 *
 * @param {string} [feedbackDir] - Passed through resolveFeedbackDir.
 * @returns {string} Path ending in 'risk-model.json'.
 */
function modelPathFor(feedbackDir) {
  const baseDir = resolveFeedbackDir(feedbackDir);
  return path.join(baseDir, 'risk-model.json');
}
|
|
394
|
+
|
|
395
|
+
/**
 * Location of the feedback sequence log inside the resolved feedback directory.
 *
 * @param {string} [feedbackDir] - Passed through resolveFeedbackDir.
 * @returns {string} Path ending in 'feedback-sequences.jsonl'.
 */
function sequencePathFor(feedbackDir) {
  const baseDir = resolveFeedbackDir(feedbackDir);
  return path.join(baseDir, 'feedback-sequences.jsonl');
}
|
|
398
|
+
|
|
399
|
+
/**
 * Write a model to disk as pretty-printed JSON followed by a newline.
 * The parent directory is created first if it does not exist.
 *
 * @param {Object} model - Model to serialize.
 * @param {string} [feedbackDir] - Feedback directory, resolved by modelPathFor.
 * @returns {string} Path the model was written to.
 */
function saveRiskModel(model, feedbackDir) {
  const destination = modelPathFor(feedbackDir);
  const parentDir = path.dirname(destination);
  fs.mkdirSync(parentDir, { recursive: true });

  const serialized = JSON.stringify(model, null, 2);
  fs.writeFileSync(destination, `${serialized}\n`);
  return destination;
}
|
|
405
|
+
|
|
406
|
+
/**
 * Read a previously saved model from disk.
 *
 * @param {string} [feedbackDir] - Feedback directory, resolved by modelPathFor.
 * @returns {Object|null} Parsed model, or null when the model file does not exist.
 * @throws {SyntaxError} When the file exists but does not contain valid JSON.
 */
function loadRiskModel(feedbackDir) {
  const source = modelPathFor(feedbackDir);
  if (fs.existsSync(source)) {
    const raw = fs.readFileSync(source, 'utf8');
    return JSON.parse(raw);
  }
  return null;
}
|
|
411
|
+
|
|
412
|
+
/**
 * Train a model from the feedback sequence log and save it next to that log.
 *
 * @param {string} [feedbackDir] - Feedback directory, passed through resolveFeedbackDir.
 * @param {Object} [options] - Forwarded to trainRiskModel.
 * @returns {{ model: Object, modelPath: string, rows: Array<Object> }} The
 *   trained model, where it was written, and the rows it was trained on.
 */
function trainAndPersistRiskModel(feedbackDir, options = {}) {
  const resolvedDir = resolveFeedbackDir(feedbackDir);
  const sequenceFile = sequencePathFor(resolvedDir);
  const rows = readJSONL(sequenceFile);
  const model = trainRiskModel(rows, options);
  return {
    model,
    modelPath: saveRiskModel(model, resolvedDir),
    rows,
  };
}
|
|
419
|
+
|
|
420
|
+
/**
 * Summarize the risk model for a feedback directory.
 *
 * Uses the model saved on disk when there is one; otherwise trains a model in
 * memory from the sequence rows (without saving it).
 *
 * @param {string} [feedbackDir] - Feedback directory, passed through resolveFeedbackDir.
 * @returns {Object|null} Summary fields, or null when the sequence log has no rows.
 */
function getRiskSummary(feedbackDir) {
  const resolvedDir = resolveFeedbackDir(feedbackDir);
  const rows = readJSONL(sequencePathFor(resolvedDir));
  if (rows.length === 0) {
    return null;
  }

  let model = loadRiskModel(resolvedDir);
  if (!model) {
    model = trainRiskModel(rows);
  }

  // Round to 3 decimals, treating a missing value as 0.
  const toThousandths = (value) => Math.round((value || 0) * 1000) / 1000;
  const { metrics, patterns } = model;

  return {
    exampleCount: model.exampleCount,
    baseRate: toThousandths(model.baseRate),
    mode: metrics.mode,
    trainingAccuracy: toThousandths(metrics.trainingAccuracy),
    highRiskTags: patterns.tags,
    highRiskDomains: patterns.domains,
    highRiskSkills: patterns.skills,
  };
}
|
|
436
|
+
|
|
437
|
+
module.exports = {
|
|
438
|
+
DEFAULT_MODEL_PATH,
|
|
439
|
+
DEFAULT_SEQUENCE_PATH,
|
|
440
|
+
buildFeatureRegistry,
|
|
441
|
+
buildRiskCandidate,
|
|
442
|
+
deriveTargetRisk,
|
|
443
|
+
extractFeatureMap,
|
|
444
|
+
loadRiskModel,
|
|
445
|
+
modelPathFor,
|
|
446
|
+
predictRisk,
|
|
447
|
+
readJSONL,
|
|
448
|
+
saveRiskModel,
|
|
449
|
+
sequencePathFor,
|
|
450
|
+
trainAndPersistRiskModel,
|
|
451
|
+
trainRiskModel,
|
|
452
|
+
getRiskSummary,
|
|
453
|
+
};
|
|
454
|
+
|
|
455
|
+
if (require.main === module) {
|
|
456
|
+
const { model, modelPath } = trainAndPersistRiskModel();
|
|
457
|
+
process.stdout.write(`${JSON.stringify({ modelPath, model }, null, 2)}\n`);
|
|
458
|
+
}
|
|
@@ -0,0 +1,129 @@
|
|
|
1
|
+
'use strict';
|
|
2
|
+
/**
|
|
3
|
+
* RLAIF Self-Audit Module (DPO-01)
|
|
4
|
+
*
|
|
5
|
+
* Heuristic self-scoring of feedback events against CLAUDE.md constraints.
|
|
6
|
+
* NO API calls — pure synchronous evaluation of event fields.
|
|
7
|
+
*
|
|
8
|
+
* Exports: selfAudit, selfAuditAndLog, CONSTRAINTS
|
|
9
|
+
*/
|
|
10
|
+
|
|
11
|
+
const fs = require('fs');
|
|
12
|
+
const path = require('path');
|
|
13
|
+
const { assessFeedbackActionability } = require('./feedback-quality');
|
|
14
|
+
|
|
15
|
+
// ---------------------------------------------------------------------------
|
|
16
|
+
// CLAUDE.md Constraint Definitions (weight sum = 1.0)
|
|
17
|
+
// ---------------------------------------------------------------------------
|
|
18
|
+
|
|
19
|
+
// Each entry has an `id`, a `weight` (the weights sum to 1.0) and a `check`
// predicate that receives the feedback event.
const CONSTRAINTS = [
  {
    // Context must be a string of at least 20 characters.
    id: 'has_context',
    weight: 0.20,
    check(event) {
      if (typeof event.context !== 'string') return false;
      return event.context.length >= 20;
    },
  },
  {
    // Positive events need `whatWorked`; all others need both
    // `whatWentWrong` and `whatToChange`.
    id: 'has_actionable_detail',
    weight: 0.25,
    check(event) {
      return event.signal === 'positive'
        ? Boolean(event.whatWorked)
        : Boolean(event.whatWentWrong) && Boolean(event.whatToChange);
    },
  },
  {
    // Signal is 'positive' or 'negative' and there is at least one tag.
    id: 'schema_valid',
    weight: 0.15,
    check(event) {
      const signalKnown = event.signal === 'positive' || event.signal === 'negative';
      return signalKnown && Array.isArray(event.tags) && event.tags.length > 0;
    },
  },
  {
    // A rubric is attached and carries a `promotionEligible` value.
    id: 'rubric_evaluated',
    weight: 0.20,
    check(event) {
      if (event.rubric == null) return false;
      return event.rubric.promotionEligible != null;
    },
  },
  {
    // Passes unless the rubric lists 'budgetCompliant' among its failing guardrails.
    id: 'budget_compliant',
    weight: 0.10,
    check(event) {
      const failing = event.rubric && event.rubric.failingGuardrails;
      if (!failing) return true;
      return !failing.includes('budgetCompliant');
    },
  },
  {
    // Delegates to assessFeedbackActionability and uses its `promotable` field.
    id: 'no_vague_signal',
    weight: 0.10,
    check(event) {
      const { signal, context, whatWentWrong, whatWorked } = event;
      return assessFeedbackActionability({ signal, context, whatWentWrong, whatWorked }).promotable;
    },
  },
];
|
|
65
|
+
|
|
66
|
+
// ---------------------------------------------------------------------------
|
|
67
|
+
// selfAudit — pure function, no I/O, no API calls
|
|
68
|
+
// ---------------------------------------------------------------------------
|
|
69
|
+
|
|
70
|
+
/**
 * Score a feedback event by running every entry of CONSTRAINTS against it.
 *
 * @param {Object} feedbackEvent - Feedback event; a falsy value is treated as {}.
 * @returns {{ score: number, constraints: Array, timestamp: string }}
 *   score: sum of the weights of the passed constraints, rounded to 3 decimals
 *   constraints: one { constraint, passed, weight } entry per constraint
 *   timestamp: ISO 8601 string taken at evaluation time
 */
function selfAudit(feedbackEvent) {
  const event = feedbackEvent || {};
  const constraints = [];
  let total = 0;

  for (const rule of CONSTRAINTS) {
    const passed = Boolean(rule.check(event));
    if (passed) {
      total += rule.weight;
    }
    constraints.push({ constraint: rule.id, passed, weight: rule.weight });
  }

  return {
    score: Math.round(total * 1000) / 1000,
    constraints,
    timestamp: new Date().toISOString(),
  };
}
|
|
93
|
+
|
|
94
|
+
// ---------------------------------------------------------------------------
|
|
95
|
+
// selfAuditAndLog — evaluates and appends to self-score-log.jsonl (sync)
|
|
96
|
+
// ---------------------------------------------------------------------------
|
|
97
|
+
|
|
98
|
+
/**
 * Run selfAudit on a feedback event and append the outcome as one JSON line
 * to self-score-log.jsonl in the feedback directory.
 *
 * Logging is best-effort: nothing is written when no directory is supplied,
 * and any error raised while logging is swallowed so the score is still returned.
 *
 * @param {Object} feedbackEvent - The feedback event to score
 * @param {Object} mlPaths - Paths object; `FEEDBACK_DIR` is used when set,
 *   otherwise `feedbackDir`
 * @returns {{ score: number, constraints: Array, timestamp: string }}
 */
function selfAuditAndLog(feedbackEvent, mlPaths) {
  const result = selfAudit(feedbackEvent);

  try {
    const paths = mlPaths || {};
    const feedbackDir = paths.FEEDBACK_DIR || paths.feedbackDir;
    if (feedbackDir) {
      const feedbackId = (feedbackEvent && feedbackEvent.id) || null;
      const line = JSON.stringify(Object.assign({ feedbackId }, result));
      fs.appendFileSync(path.join(feedbackDir, 'self-score-log.jsonl'), `${line}\n`);
    }
  } catch (_err) {
    // Deliberately ignored: the log is a non-critical side effect.
  }

  return result;
}
|
|
124
|
+
|
|
125
|
+
// ---------------------------------------------------------------------------
|
|
126
|
+
// Exports
|
|
127
|
+
// ---------------------------------------------------------------------------
|
|
128
|
+
|
|
129
|
+
module.exports = { selfAudit, selfAuditAndLog, CONSTRAINTS };
|