npm - rlhf-feedback-loop - Versions diffs - 0.5.0 - Mend

rlhf-feedback-loop 0.5.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (73) hide show

package/CHANGELOG.md +26 -0
package/LICENSE +21 -0
package/README.md +308 -0
package/adapters/README.md +8 -0
package/adapters/amp/skills/rlhf-feedback/SKILL.md +20 -0
package/adapters/chatgpt/INSTALL.md +80 -0
package/adapters/chatgpt/openapi.yaml +292 -0
package/adapters/claude/.mcp.json +8 -0
package/adapters/codex/config.toml +4 -0
package/adapters/gemini/function-declarations.json +95 -0
package/adapters/mcp/server-stdio.js +444 -0
package/bin/cli.js +167 -0
package/config/mcp-allowlists.json +29 -0
package/config/policy-bundles/constrained-v1.json +53 -0
package/config/policy-bundles/default-v1.json +80 -0
package/config/rubrics/default-v1.json +52 -0
package/config/subagent-profiles.json +32 -0
package/openapi/openapi.yaml +292 -0
package/package.json +91 -0
package/plugins/amp-skill/INSTALL.md +52 -0
package/plugins/amp-skill/SKILL.md +31 -0
package/plugins/claude-skill/INSTALL.md +55 -0
package/plugins/claude-skill/SKILL.md +46 -0
package/plugins/codex-profile/AGENTS.md +20 -0
package/plugins/codex-profile/INSTALL.md +57 -0
package/plugins/gemini-extension/INSTALL.md +74 -0
package/plugins/gemini-extension/gemini_prompt.txt +10 -0
package/plugins/gemini-extension/tool_contract.json +28 -0
package/scripts/billing.js +471 -0
package/scripts/budget-guard.js +173 -0
package/scripts/code-reasoning.js +307 -0
package/scripts/context-engine.js +547 -0
package/scripts/contextfs.js +513 -0
package/scripts/contract-audit.js +198 -0
package/scripts/dpo-optimizer.js +208 -0
package/scripts/export-dpo-pairs.js +316 -0
package/scripts/export-training.js +448 -0
package/scripts/feedback-attribution.js +313 -0
package/scripts/feedback-inbox-read.js +162 -0
package/scripts/feedback-loop.js +838 -0
package/scripts/feedback-schema.js +300 -0
package/scripts/feedback-to-memory.js +165 -0
package/scripts/feedback-to-rules.js +109 -0
package/scripts/generate-paperbanana-diagrams.sh +99 -0
package/scripts/hybrid-feedback-context.js +676 -0
package/scripts/intent-router.js +164 -0
package/scripts/mcp-policy.js +92 -0
package/scripts/meta-policy.js +194 -0
package/scripts/plan-gate.js +154 -0
package/scripts/prove-adapters.js +364 -0
package/scripts/prove-attribution.js +364 -0
package/scripts/prove-automation.js +393 -0
package/scripts/prove-data-quality.js +219 -0
package/scripts/prove-intelligence.js +256 -0
package/scripts/prove-lancedb.js +370 -0
package/scripts/prove-loop-closure.js +255 -0
package/scripts/prove-rlaif.js +404 -0
package/scripts/prove-subway-upgrades.js +250 -0
package/scripts/prove-training-export.js +324 -0
package/scripts/prove-v2-milestone.js +273 -0
package/scripts/prove-v3-milestone.js +381 -0
package/scripts/rlaif-self-audit.js +123 -0
package/scripts/rubric-engine.js +230 -0
package/scripts/self-heal.js +127 -0
package/scripts/self-healing-check.js +111 -0
package/scripts/skill-quality-tracker.js +284 -0
package/scripts/subagent-profiles.js +79 -0
package/scripts/sync-gh-secrets-from-env.sh +29 -0
package/scripts/thompson-sampling.js +331 -0
package/scripts/train_from_feedback.py +914 -0
package/scripts/validate-feedback.js +580 -0
package/scripts/vector-store.js +100 -0
package/src/api/server.js +497 -0

package/scripts/skill-quality-tracker.js ADDED Viewed

@@ -0,0 +1,284 @@
+#!/usr/bin/env node
+/**
+ * Skill Quality Tracker
+ *
+ * Correlates tool call metrics to feedback signals by timestamp proximity.
+ * After a sequence of tool calls and feedback captures, produces a per-skill
+ * quality score derived from timestamp-proximity correlation.
+ *
+ * Ported from Subway_RN_Demo/.claude/scripts/feedback/skill-quality-tracker.js
+ * PATH: default data paths are built from path.join(__dirname, '..') — 1 level up from scripts/
+ */
+'use strict';
+const fs = require('fs');
+const readline = require('readline');
+const path = require('path');
+const FEEDBACK_DIR = process.env.RLHF_FEEDBACK_DIR // a non-empty env value replaces the default directory
+  || path.join(__dirname, '..', '.claude', 'memory', 'feedback');
+const METRICS_PATH = process.env.METRICS_PATH // tool-call metrics log (JSONL); defaults to a file inside FEEDBACK_DIR
+  || path.join(FEEDBACK_DIR, 'tool-metrics.jsonl');
+const FEEDBACK_PATH = process.env.FEEDBACK_PATH // feedback log (JSONL); defaults to a file inside FEEDBACK_DIR
+  || path.join(FEEDBACK_DIR, 'feedback-log.jsonl');
+// Correlation window (ms): feedback within 60 seconds before or after a tool call is considered correlated
+const CORRELATION_WINDOW_MS = 60_000;
+/**
+ * Safely parse a single JSON line.
+ *
+ * @param {string} line
+ * @returns {object|null}
+ */
+function parseLine(line) {
+  try {
+    return JSON.parse(line);
+  } catch {
+    return null;
+  }
+}
+/**
+ * Load feedback entries from JSONL file.
+ * Each entry needs: timestamp, feedback (signal).
+ *
+ * @param {string} filePath
+ * @returns {Promise<Array<{ ts: number, feedback: string, tool: string|null }>>}
+ */
+async function loadFeedback(filePath) {
+  const entries = [];
+  if (!fs.existsSync(filePath)) return entries;
+  const rl = readline.createInterface({
+    input: fs.createReadStream(filePath),
+    crlfDelay: Infinity,
+  });
+  for await (const line of rl) {
+    const obj = parseLine(line);
+    if (obj && obj.timestamp) {
+      // Support both 'feedback' (Subway) and 'signal' (rlhf) field names
+      const feedbackVal = obj.feedback || obj.signal;
+      if (feedbackVal) {
+        // Normalize to 'positive'/'negative' regardless of source schema
+        let normalized = feedbackVal;
+        if (feedbackVal === 'up') normalized = 'positive';
+        else if (feedbackVal === 'down') normalized = 'negative';
+        entries.push({
+          ts: new Date(obj.timestamp).getTime(),
+          feedback: normalized,
+          tool: obj.tool_name || null,
+        });
+      }
+    }
+  }
+  entries.sort((a, b) => a.ts - b.ts);
+  return entries;
+}
+/**
+ * Find correlated feedback for a tool call by timestamp proximity.
+ *
+ * Searches feedback entries within CORRELATION_WINDOW_MS of the metric timestamp.
+ * If the feedback entry has a tool_name, it must match the metric's tool name.
+ *
+ * @param {number} metricTs - Timestamp of the tool call (ms)
+ * @param {string} metricTool - Tool name
+ * @param {Array<{ ts: number, feedback: string, tool: string|null }>} feedbackEntries
+ * @returns {string|null} 'positive', 'negative', or null if no correlation found
+ */
+function correlateFeedback(metricTs, metricTool, feedbackEntries) {
+  for (const fb of feedbackEntries) {
+    if (Math.abs(fb.ts - metricTs) <= CORRELATION_WINDOW_MS) {
+      // If feedback has a tool name, it must match; otherwise correlate by time alone
+      if (!fb.tool || fb.tool === metricTool) {
+        return fb.feedback;
+      }
+    }
+  }
+  return null;
+}
+/**
+ * Process tool metrics JSONL and correlate with feedback.
+ *
+ * @param {string} metricsPath
+ * @param {Array<{ ts: number, feedback: string, tool: string|null }>} feedbackEntries
+ * @returns {Promise<{ totalToolUses: number, breakdown: object }>}
+ */
+async function processMetrics(metricsPath, feedbackEntries) {
+  const breakdown = {};
+  let totalToolUses = 0;
+  if (!fs.existsSync(metricsPath)) return { totalToolUses, breakdown };
+  const rl = readline.createInterface({
+    input: fs.createReadStream(metricsPath),
+    crlfDelay: Infinity,
+  });
+  for await (const line of rl) {
+    const obj = parseLine(line);
+    if (!obj || !obj.tool_name) continue;
+    totalToolUses++;
+    const name = obj.tool_name;
+    if (!breakdown[name]) {
+      breakdown[name] = { uses: 0, correlatedPositive: 0, correlatedNegative: 0 };
+    }
+    breakdown[name].uses++;
+    const ts = new Date(obj.timestamp).getTime();
+    if (!isNaN(ts)) {
+      const signal = correlateFeedback(ts, name, feedbackEntries);
+      if (signal === 'positive') breakdown[name].correlatedPositive++;
+      else if (signal === 'negative') breakdown[name].correlatedNegative++;
+    }
+  }
+  return { totalToolUses, breakdown };
+}
+/**
+ * Compute per-tool success rates from correlation counts.
+ * Mutates the breakdown object in place.
+ *
+ * @param {object} breakdown - { toolName: { uses, correlatedPositive, correlatedNegative } }
+ */
+function computeSuccessRates(breakdown) {
+  for (const tool of Object.values(breakdown)) {
+    const correlated = tool.correlatedPositive + tool.correlatedNegative;
+    tool.successRate = correlated > 0
+      ? +(tool.correlatedPositive / correlated).toFixed(4)
+      : null;
+  }
+}
+/**
+ * Return top-performing tools sorted by success rate.
+ *
+ * @param {object} breakdown
+ * @param {number} [min=10] - Minimum uses threshold
+ * @param {number} [limit=5] - Maximum entries to return
+ * @returns {Array<{ tool: string, successRate: number, uses: number }>}
+ */
+function topPerformers(breakdown, min = 10, limit = 5) {
+  return Object.entries(breakdown)
+    .filter(([, v]) => v.uses >= min && v.successRate !== null)
+    .sort((a, b) => b[1].successRate - a[1].successRate || b[1].uses - a[1].uses)
+    .slice(0, limit)
+    .map(([name, v]) => ({ tool: name, successRate: v.successRate, uses: v.uses }));
+}
+/**
+ * Return tools with high negative correlation (potential trouble spots).
+ * Threshold: >30% negative rate among correlated feedback.
+ *
+ * @param {object} breakdown
+ * @returns {Array<{ tool: string, negativeRate: number, uses: number }>}
+ */
+function troubleSpots(breakdown) {
+  return Object.entries(breakdown)
+    .filter(([, v]) => {
+      const total = v.correlatedPositive + v.correlatedNegative;
+      return total > 0 && v.correlatedNegative / total > 0.3;
+    })
+    .map(([name, v]) => {
+      const total = v.correlatedPositive + v.correlatedNegative;
+      return {
+        tool: name,
+        negativeRate: +(v.correlatedNegative / total).toFixed(4),
+        uses: v.uses,
+      };
+    })
+    .sort((a, b) => b.negativeRate - a.negativeRate);
+}
+/**
+ * Generate actionable recommendations from top performers and trouble spots.
+ *
+ * @param {Array} top - topPerformers result
+ * @param {Array} trouble - troubleSpots result
+ * @param {object} breakdown - full breakdown
+ * @returns {string[]}
+ */
+function generateRecommendations(top, trouble, breakdown) {
+  const recs = [];
+  for (const t of trouble) {
+    recs.push(
+      `Investigate "${t.tool}" — ${(t.negativeRate * 100).toFixed(1)}% negative correlation across ${t.uses} uses.`
+    );
+  }
+  if (top.length > 0) {
+    recs.push(
+      `"${top[0].tool}" is the top performer (${(top[0].successRate * 100).toFixed(1)}% success). Consider expanding its usage patterns.`
+    );
+  }
+  const uncorrelated = Object.entries(breakdown).filter(
+    ([, v]) => v.uses >= 10 && v.successRate === null
+  );
+  if (uncorrelated.length > 0) {
+    recs.push(
+      `${uncorrelated.length} tool(s) with 10+ uses have no correlated feedback — consider adding coverage.`
+    );
+  }
+  if (recs.length === 0) recs.push('No actionable recommendations at this time.');
+  return recs;
+}
+/**
+ * Main entry point: load data, correlate, produce report.
+ *
+ * @returns {Promise<object>} Full skill quality report
+ */
+async function run() {
+  const feedbackEntries = await loadFeedback(FEEDBACK_PATH);
+  const { totalToolUses, breakdown } = await processMetrics(METRICS_PATH, feedbackEntries);
+  computeSuccessRates(breakdown);
+  const top = topPerformers(breakdown);
+  const trouble = troubleSpots(breakdown);
+  const recommendations = generateRecommendations(top, trouble, breakdown);
+  const report = {
+    generatedAt: new Date().toISOString(),
+    totalToolUses,
+    toolBreakdown: breakdown,
+    topPerformers: top,
+    troubleSpots: trouble,
+    recommendations,
+  };
+  console.log(JSON.stringify(report, null, 2));
+  return report;
+}
+if (require.main === module) {
+  run().catch(() => {}).finally(() => process.exit(0));
+}
+module.exports = {
+  parseLine,
+  correlateFeedback,
+  computeSuccessRates,
+  topPerformers,
+  troubleSpots,
+  generateRecommendations,
+  loadFeedback,
+  processMetrics,
+  run,
+  CORRELATION_WINDOW_MS,
+};

package/scripts/subagent-profiles.js ADDED Viewed

@@ -0,0 +1,79 @@
+#!/usr/bin/env node
+const fs = require('fs');
+const path = require('path');
+const { loadMcpPolicy } = require('./mcp-policy');
+const PROJECT_ROOT = path.join(__dirname, '..');
+const DEFAULT_SUBAGENT_PROFILE_PATH = path.join(PROJECT_ROOT, 'config', 'subagent-profiles.json');
+function getSubagentProfilePath() {
+  return process.env.RLHF_SUBAGENT_PROFILE_PATH || DEFAULT_SUBAGENT_PROFILE_PATH;
+}
+function loadSubagentProfiles() {
+  const raw = fs.readFileSync(getSubagentProfilePath(), 'utf-8');
+  const parsed = JSON.parse(raw);
+  if (!parsed.profiles || typeof parsed.profiles !== 'object') {
+    throw new Error('Invalid subagent profile config: missing profiles object');
+  }
+  return parsed;
+}
+function listSubagentProfiles() {
+  const parsed = loadSubagentProfiles();
+  return Object.keys(parsed.profiles);
+}
+function getSubagentProfile(name) {
+  const parsed = loadSubagentProfiles();
+  const profile = parsed.profiles[name];
+  if (!profile) {
+    throw new Error(`Unknown subagent profile: ${name}`);
+  }
+  return profile;
+}
+function validateSubagentProfiles() {
+  const parsed = loadSubagentProfiles();
+  const policy = loadMcpPolicy();
+  const issues = [];
+  for (const [name, profile] of Object.entries(parsed.profiles)) {
+    if (!profile.mcpProfile) {
+      issues.push(`${name}: missing mcpProfile`);
+    } else if (!policy.profiles[profile.mcpProfile]) {
+      issues.push(`${name}: unknown mcpProfile '${profile.mcpProfile}'`);
+    }
+    if (!profile.context || typeof profile.context !== 'object') {
+      issues.push(`${name}: missing context settings`);
+    } else {
+      if (!Number.isFinite(profile.context.maxItems) || profile.context.maxItems <= 0) {
+        issues.push(`${name}: invalid context.maxItems`);
+      }
+      if (!Number.isFinite(profile.context.maxChars) || profile.context.maxChars <= 0) {
+        issues.push(`${name}: invalid context.maxChars`);
+      }
+    }
+  }
+  return {
+    valid: issues.length === 0,
+    issues,
+  };
+}
+module.exports = {
+  DEFAULT_SUBAGENT_PROFILE_PATH,
+  getSubagentProfilePath,
+  loadSubagentProfiles,
+  listSubagentProfiles,
+  getSubagentProfile,
+  validateSubagentProfiles,
+};
+if (require.main === module) {
+  const result = validateSubagentProfiles();
+  console.log(JSON.stringify({ profiles: listSubagentProfiles(), ...result }, null, 2));
+  process.exit(result.valid ? 0 : 1);
+}

package/scripts/sync-gh-secrets-from-env.sh ADDED Viewed

@@ -0,0 +1,29 @@
+#!/usr/bin/env bash
+# Copy selected secrets from the current environment into a GitHub repository
+# using the `gh` CLI.
+#
+# Usage: sync-gh-secrets-from-env.sh [owner/repo]
+#   The repository defaults to IgorGanapolsky/rlhf-feedback-loop.
+#   Keys that are unset or empty in the environment are skipped.
+set -euo pipefail
+REPO="${1:-IgorGanapolsky/rlhf-feedback-loop}"
+# Minimal secret set for autonomous PR merge + optional LLM routing.
+SECRET_KEYS=(
+  GH_PAT
+  SENTRY_DSN
+  SENTRY_AUTH_TOKEN
+  LLM_GATEWAY_BASE_URL
+  LLM_GATEWAY_API_KEY
+  TETRATE_API_KEY
+)
+echo "Syncing secrets to $REPO (only keys present in current environment)..."
+for name in "${SECRET_KEYS[@]}"; do
+  # Indirect expansion: read the variable whose name is held in $name.
+  secret="${!name:-}"
+  if [[ -n "$secret" ]]; then
+    # The value is piped on stdin rather than passed as an argument.
+    printf '%s' "$secret" | gh secret set "$name" -R "$REPO"
+    echo "- set $name"
+  else
+    echo "- skip $name (not set)"
+  fi
+done
+echo "Done."