npm - rlhf-feedback-loop - Versions diffs - 0.6.2 → 0.6.3 - Mend

rlhf-feedback-loop 0.6.2 → 0.6.3

This diff shows the content of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (5)

package/README.md +2 -0
package/bin/cli.js +33 -13
package/package.json +1 -1
package/scripts/hook-auto-capture.sh +69 -0
package/src/api/server.js +12 -5

package/README.md CHANGED Viewed

@@ -23,6 +23,8 @@ One command. Pick your platform:
 | **Claude** | `claude mcp add rlhf -- npx -y rlhf-feedback-loop serve` |
 | **Codex** | `codex mcp add rlhf -- npx -y rlhf-feedback-loop serve` |
 | **Gemini** | `gemini mcp add rlhf -- npx -y rlhf-feedback-loop serve` |
+| **Amp** | `cp node_modules/rlhf-feedback-loop/plugins/amp-skill/SKILL.md .amp/skills/rlhf-feedback/SKILL.md` |
+| **Cursor** | `cursor mcp add rlhf -- npx -y rlhf-feedback-loop serve` |
 | **All at once** | `npx add-mcp rlhf-feedback-loop` |
 That's it. Your agent can now capture feedback, recall past learnings mid-conversation, and block repeated mistakes.

package/bin/cli.js CHANGED Viewed

@@ -210,19 +210,39 @@ function capture() {
     return;
   }
-  // Normalize signal with fuzzy matching (uses the full engine's normalize)
-  const captureScript = require(path.join(PKG_ROOT, '.claude', 'scripts', 'feedback', 'capture-feedback.js'));
-  // The capture-feedback.js runs as main when required directly, so we call via subprocess
-  const scriptArgs = process.argv.slice(3).join(' ');
-  try {
-    const output = execSync(
-      `node "${path.join(PKG_ROOT, '.claude', 'scripts', 'feedback', 'capture-feedback.js')}" ${scriptArgs}`,
-      { encoding: 'utf8', stdio: 'pipe', cwd: CWD }
-    );
-    process.stdout.write(output);
-  } catch (err) {
-    process.stderr.write(err.stderr || err.stdout || err.message);
-    process.exit(err.status || 1);
+  const signal = (args.feedback || '').toLowerCase();
+  const normalized = ['up', 'thumbsup', 'thumbs_up', 'positive'].some(v => signal.includes(v)) ? 'up'
+    : ['down', 'thumbsdown', 'thumbs_down', 'negative'].some(v => signal.includes(v)) ? 'down'
+    : signal;
+  if (normalized !== 'up' && normalized !== 'down') {
+    console.error('Missing or unrecognized --feedback=up|down');
+    process.exit(1);
+  }
+  const result = captureFeedback({
+    signal: normalized,
+    context: args.context || '',
+    whatWentWrong: args['what-went-wrong'],
+    whatToChange: args['what-to-change'],
+    whatWorked: args['what-worked'],
+    tags: args.tags,
+  });
+  if (result.accepted) {
+    const ev = result.feedbackEvent;
+    const mem = result.memoryRecord;
+    console.log(`\nRLHF Feedback Captured [${normalized.toUpperCase()}]`);
+    console.log('─'.repeat(50));
+    console.log(`  Feedback ID : ${ev.id}`);
+    console.log(`  Signal      : ${ev.signal} (${ev.actionType})`);
+    console.log(`  Memory ID   : ${mem.id}`);
+    console.log(`  Storage     : JSONL log + LanceDB vector index\n`);
+  } else {
+    console.log(`\nRLHF Feedback Recorded [${normalized.toUpperCase()}] — not promoted`);
+    console.log('─'.repeat(50));
+    console.log(`  Reason      : ${result.reason}\n`);
+    process.exit(2);
   }
 }

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "rlhf-feedback-loop",
-  "version": "0.6.2",
+  "version": "0.6.3",
   "description": "Make your AI agent learn from mistakes. Capture thumbs up/down feedback, block repeated failures, export DPO training data. Works with ChatGPT, Claude, Codex, Gemini, Amp.",
   "homepage": "https://github.com/IgorGanapolsky/rlhf-feedback-loop#readme",
   "repository": {

package/scripts/hook-auto-capture.sh ADDED Viewed

@@ -0,0 +1,69 @@
+#!/bin/bash
+# Claude Code UserPromptSubmit hook — auto-captures thumbs up/down feedback
+# Triggered on every user message. Only acts on feedback signals.
+# Shows full verbose output with storage paths, memory IDs, and stats.
+PROMPT="$CLAUDE_USER_PROMPT"
+SCRIPT_DIR="$(cd "$(dirname "$0")" && pwd)"
+CAPTURE="$SCRIPT_DIR/../.claude/scripts/feedback/capture-feedback.js"
+FEEDBACK_LOG="$SCRIPT_DIR/../.claude/memory/feedback/feedback-log.jsonl"
+MEMORY_LOG="$SCRIPT_DIR/../.claude/memory/feedback/memory-log.jsonl"
+# Normalize to lowercase for matching
+LOWER=$(echo "$PROMPT" | tr '[:upper:]' '[:lower:]')
+capture_and_report() {
+  local SIGNAL="$1"
+  # Capture feedback (verbose output already shows IDs, signal, storage)
+  node "$CAPTURE" --feedback="$SIGNAL" --context="$PROMPT" --tags="auto-capture,hook"
+  # Show storage proof
+  echo ""
+  echo "Storage Proof:"
+  echo "  Feedback log : $FEEDBACK_LOG ($(wc -l < "$FEEDBACK_LOG" 2>/dev/null || echo 0) entries)"
+  echo "  Memory log   : $MEMORY_LOG ($(wc -l < "$MEMORY_LOG" 2>/dev/null || echo 0) entries)"
+  echo "  LanceDB      : $SCRIPT_DIR/../.claude/memory/feedback/lancedb/"
+  echo ""
+  # Show last entry written
+  echo "Last Entry Written:"
+  tail -1 "$FEEDBACK_LOG" 2>/dev/null | node -e "
+    const d = JSON.parse(require('fs').readFileSync('/dev/stdin','utf8'));
+    console.log('  ID        :', d.id);
+    console.log('  Signal    :', d.signal, '(' + d.actionType + ')');
+    console.log('  Context   :', (d.context||'').slice(0,80));
+    console.log('  Tags      :', (d.tags||[]).join(', '));
+    console.log('  Timestamp :', d.timestamp);
+    console.log('  Domain    :', (d.richContext||{}).domain || 'general');
+  " 2>/dev/null
+  # Show cumulative stats
+  echo ""
+  echo "Cumulative Stats:"
+  node -e "
+    const fs = require('fs');
+    const lines = fs.readFileSync('$FEEDBACK_LOG','utf8').trim().split('\n').filter(Boolean);
+    const entries = lines.map(l => { try { return JSON.parse(l); } catch(e) { return null; } }).filter(Boolean);
+    const pos = entries.filter(e => e.signal === 'positive').length;
+    const neg = entries.filter(e => e.signal === 'negative').length;
+    const promoted = entries.filter(e => e.actionType === 'store-learning' || e.actionType === 'store-mistake').length;
+    console.log('  Total feedback  :', entries.length);
+    console.log('  Positive (up)   :', pos);
+    console.log('  Negative (down) :', neg);
+    console.log('  Promoted to mem :', promoted);
+    console.log('  Ratio           :', pos > 0 ? (pos/(pos+neg)*100).toFixed(0) + '% positive' : 'n/a');
+  " 2>/dev/null
+}
+# Check for thumbs up signals
+if echo "$LOWER" | grep -qE '(thumbs? ?up|that worked|looks good|nice work|perfect|good job)'; then
+  capture_and_report "up"
+  exit 0
+fi
+# Check for thumbs down signals
+if echo "$LOWER" | grep -qE '(thumbs? ?down|that failed|that was wrong|fix this)'; then
+  capture_and_report "down"
+  exit 0
+fi

package/src/api/server.js CHANGED Viewed

@@ -183,7 +183,18 @@ function createApiServer() {
     const parsed = new URL(req.url, 'http://localhost');
     const pathname = parsed.pathname;
-    // Health check is unauthenticated — required for Railway/load-balancer probes
+    // Public endpoints — no auth required
+    if (req.method === 'GET' && pathname === '/') {
+      sendJson(res, 200, {
+        name: 'rlhf-feedback-loop',
+        version: pkg.version,
+        status: 'ok',
+        docs: 'https://github.com/IgorGanapolsky/rlhf-feedback-loop',
+        endpoints: ['/health', '/v1/feedback/capture', '/v1/feedback/stats', '/v1/dpo/export'],
+      });
+      return;
+    }
     if (req.method === 'GET' && pathname === '/health') {
       sendJson(res, 200, {
         status: 'ok',
@@ -409,10 +420,6 @@ function createApiServer() {
         return;
       }
-      if (req.method === 'GET' && pathname === '/') {
-        sendText(res, 200, 'RLHF Feedback Loop API is running.');
-        return;
-      }
       // ----------------------------------------------------------------
       // Billing routes