npm - rlhf-feedback-loop - Versions diffs - 0.5.0 - Mend

rlhf-feedback-loop 0.5.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (73)

package/CHANGELOG.md +26 -0
package/LICENSE +21 -0
package/README.md +308 -0
package/adapters/README.md +8 -0
package/adapters/amp/skills/rlhf-feedback/SKILL.md +20 -0
package/adapters/chatgpt/INSTALL.md +80 -0
package/adapters/chatgpt/openapi.yaml +292 -0
package/adapters/claude/.mcp.json +8 -0
package/adapters/codex/config.toml +4 -0
package/adapters/gemini/function-declarations.json +95 -0
package/adapters/mcp/server-stdio.js +444 -0
package/bin/cli.js +167 -0
package/config/mcp-allowlists.json +29 -0
package/config/policy-bundles/constrained-v1.json +53 -0
package/config/policy-bundles/default-v1.json +80 -0
package/config/rubrics/default-v1.json +52 -0
package/config/subagent-profiles.json +32 -0
package/openapi/openapi.yaml +292 -0
package/package.json +91 -0
package/plugins/amp-skill/INSTALL.md +52 -0
package/plugins/amp-skill/SKILL.md +31 -0
package/plugins/claude-skill/INSTALL.md +55 -0
package/plugins/claude-skill/SKILL.md +46 -0
package/plugins/codex-profile/AGENTS.md +20 -0
package/plugins/codex-profile/INSTALL.md +57 -0
package/plugins/gemini-extension/INSTALL.md +74 -0
package/plugins/gemini-extension/gemini_prompt.txt +10 -0
package/plugins/gemini-extension/tool_contract.json +28 -0
package/scripts/billing.js +471 -0
package/scripts/budget-guard.js +173 -0
package/scripts/code-reasoning.js +307 -0
package/scripts/context-engine.js +547 -0
package/scripts/contextfs.js +513 -0
package/scripts/contract-audit.js +198 -0
package/scripts/dpo-optimizer.js +208 -0
package/scripts/export-dpo-pairs.js +316 -0
package/scripts/export-training.js +448 -0
package/scripts/feedback-attribution.js +313 -0
package/scripts/feedback-inbox-read.js +162 -0
package/scripts/feedback-loop.js +838 -0
package/scripts/feedback-schema.js +300 -0
package/scripts/feedback-to-memory.js +165 -0
package/scripts/feedback-to-rules.js +109 -0
package/scripts/generate-paperbanana-diagrams.sh +99 -0
package/scripts/hybrid-feedback-context.js +676 -0
package/scripts/intent-router.js +164 -0
package/scripts/mcp-policy.js +92 -0
package/scripts/meta-policy.js +194 -0
package/scripts/plan-gate.js +154 -0
package/scripts/prove-adapters.js +364 -0
package/scripts/prove-attribution.js +364 -0
package/scripts/prove-automation.js +393 -0
package/scripts/prove-data-quality.js +219 -0
package/scripts/prove-intelligence.js +256 -0
package/scripts/prove-lancedb.js +370 -0
package/scripts/prove-loop-closure.js +255 -0
package/scripts/prove-rlaif.js +404 -0
package/scripts/prove-subway-upgrades.js +250 -0
package/scripts/prove-training-export.js +324 -0
package/scripts/prove-v2-milestone.js +273 -0
package/scripts/prove-v3-milestone.js +381 -0
package/scripts/rlaif-self-audit.js +123 -0
package/scripts/rubric-engine.js +230 -0
package/scripts/self-heal.js +127 -0
package/scripts/self-healing-check.js +111 -0
package/scripts/skill-quality-tracker.js +284 -0
package/scripts/subagent-profiles.js +79 -0
package/scripts/sync-gh-secrets-from-env.sh +29 -0
package/scripts/thompson-sampling.js +331 -0
package/scripts/train_from_feedback.py +914 -0
package/scripts/validate-feedback.js +580 -0
package/scripts/vector-store.js +100 -0
package/src/api/server.js +497 -0

package/adapters/chatgpt/openapi.yaml ADDED Viewed

@@ -0,0 +1,292 @@
+openapi: 3.1.0
+info:
+  title: RLHF Feedback Loop API
+  version: 1.1.0
+  description: |
+    Production API for feedback capture, schema-validated memory promotion,
+    prevention rule generation, and DPO export.
+servers:
+  - url: http://localhost:8787
+security:
+  - bearerAuth: []
+components:
+  securitySchemes:
+    bearerAuth:
+      type: http
+      scheme: bearer
+      bearerFormat: API Key
+  schemas:
+    RubricScore:
+      type: object
+      required: [criterion, score]
+      properties:
+        criterion:
+          type: string
+        score:
+          type: number
+          minimum: 1
+          maximum: 5
+        evidence:
+          type: string
+        judge:
+          type: string
+    CaptureFeedbackRequest:
+      type: object
+      required: [signal, context]
+      properties:
+        signal:
+          type: string
+          enum: [up, down, positive, negative]
+        context:
+          type: string
+        whatWentWrong:
+          type: string
+        whatToChange:
+          type: string
+        whatWorked:
+          type: string
+        rubricScores:
+          type: array
+          items:
+            $ref: '#/components/schemas/RubricScore'
+        guardrails:
+          type: object
+          properties:
+            testsPassed:
+              type: boolean
+            pathSafety:
+              type: boolean
+            budgetCompliant:
+              type: boolean
+        tags:
+          oneOf:
+            - type: array
+              items:
+                type: string
+            - type: string
+        skill:
+          type: string
+    IntentPlanRequest:
+      type: object
+      required: [intentId]
+      properties:
+        intentId:
+          type: string
+        context:
+          type: string
+        mcpProfile:
+          type: string
+        bundleId:
+          type: string
+        approved:
+          type: boolean
+paths:
+  /healthz:
+    get:
+      operationId: healthz
+      responses:
+        '200':
+          description: Service health
+        '401':
+          description: Unauthorized
+  /v1/feedback/capture:
+    post:
+      operationId: captureFeedback
+      requestBody:
+        required: true
+        content:
+          application/json:
+            schema:
+              $ref: '#/components/schemas/CaptureFeedbackRequest'
+      responses:
+        '200':
+          description: Feedback accepted and promoted to memory
+        '422':
+          description: Feedback recorded but rejected for memory promotion
+        '401':
+          description: Unauthorized
+  /v1/feedback/stats:
+    get:
+      operationId: getFeedbackStats
+      responses:
+        '200':
+          description: Aggregated feedback statistics
+        '401':
+          description: Unauthorized
+  /v1/intents/catalog:
+    get:
+      operationId: listIntentCatalog
+      parameters:
+        - in: query
+          name: mcpProfile
+          schema:
+            type: string
+        - in: query
+          name: bundleId
+          schema:
+            type: string
+      responses:
+        '200':
+          description: Intent catalog with risk and checkpoint metadata
+        '401':
+          description: Unauthorized
+  /v1/intents/plan:
+    post:
+      operationId: planIntent
+      requestBody:
+        required: true
+        content:
+          application/json:
+            schema:
+              $ref: '#/components/schemas/IntentPlanRequest'
+      responses:
+        '200':
+          description: Policy-scoped intent execution plan
+        '400':
+          description: Invalid intent request
+        '401':
+          description: Unauthorized
+  /v1/feedback/summary:
+    get:
+      operationId: getFeedbackSummary
+      parameters:
+        - in: query
+          name: recent
+          schema:
+            type: integer
+            default: 20
+      responses:
+        '200':
+          description: Feedback summary text
+        '401':
+          description: Unauthorized
+  /v1/feedback/rules:
+    post:
+      operationId: generatePreventionRules
+      requestBody:
+        required: false
+        content:
+          application/json:
+            schema:
+              type: object
+              properties:
+                minOccurrences:
+                  type: integer
+                  default: 2
+                outputPath:
+                  type: string
+      responses:
+        '200':
+          description: Prevention rules generated
+        '401':
+          description: Unauthorized
+  /v1/dpo/export:
+    post:
+      operationId: exportDpoPairs
+      requestBody:
+        required: false
+        content:
+          application/json:
+            schema:
+              type: object
+              properties:
+                inputPath:
+                  type: string
+                memoryLogPath:
+                  type: string
+                outputPath:
+                  type: string
+      responses:
+        '200':
+          description: DPO export completed
+        '401':
+          description: Unauthorized
+  /v1/context/construct:
+    post:
+      operationId: constructContextPack
+      requestBody:
+        required: false
+        content:
+          application/json:
+            schema:
+              type: object
+              properties:
+                query:
+                  type: string
+                maxItems:
+                  type: integer
+                  default: 8
+                maxChars:
+                  type: integer
+                  default: 6000
+                namespaces:
+                  type: array
+                  items:
+                    type: string
+                    enum:
+                      - raw_history
+                      - memory/error
+                      - memory/learning
+                      - rules
+                      - tools
+                      - provenance
+      responses:
+        '200':
+          description: Context pack created
+        '400':
+          description: Invalid namespace selection
+        '401':
+          description: Unauthorized
+  /v1/context/evaluate:
+    post:
+      operationId: evaluateContextPack
+      requestBody:
+        required: true
+        content:
+          application/json:
+            schema:
+              type: object
+              required: [packId, outcome]
+              properties:
+                packId:
+                  type: string
+                outcome:
+                  type: string
+                signal:
+                  type: string
+                notes:
+                  type: string
+                rubricScores:
+                  type: array
+                  items:
+                    $ref: '#/components/schemas/RubricScore'
+                guardrails:
+                  type: object
+                  properties:
+                    testsPassed:
+                      type: boolean
+                    pathSafety:
+                      type: boolean
+                    budgetCompliant:
+                      type: boolean
+      responses:
+        '200':
+          description: Evaluation recorded
+        '400':
+          description: Invalid rubric payload
+        '401':
+          description: Unauthorized
+  /v1/context/provenance:
+    get:
+      operationId: getContextProvenance
+      parameters:
+        - in: query
+          name: limit
+          schema:
+            type: integer
+            default: 50
+      responses:
+        '200':
+          description: Recent provenance events
+        '401':
+          description: Unauthorized

package/adapters/claude/.mcp.json ADDED Viewed

@@ -0,0 +1,8 @@
+{
+  "mcpServers": {
+    "rlhf-feedback-loop": {
+      "command": "node",
+      "args": ["adapters/mcp/server-stdio.js"]
+    }
+  }
+}

package/adapters/codex/config.toml ADDED Viewed

@@ -0,0 +1,4 @@
+# Codex MCP profile (copy into ~/.codex/config.toml or merge section)
+[mcp_servers.rlhf_feedback_loop]
+command = "node"
+args = ["adapters/mcp/server-stdio.js"]

package/adapters/gemini/function-declarations.json ADDED Viewed

@@ -0,0 +1,95 @@
+{
+  "tools": [
+    {
+      "name": "capture_feedback",
+      "description": "Capture thumbs-up/down feedback and promote actionable memories",
+      "parameters": {
+        "type": "object",
+        "properties": {
+          "signal": { "type": "string", "enum": ["up", "down"] },
+          "context": { "type": "string" },
+          "whatWentWrong": { "type": "string" },
+          "whatToChange": { "type": "string" },
+          "whatWorked": { "type": "string" },
+          "rubricScores": {
+            "type": "array",
+            "items": {
+              "type": "object",
+              "properties": {
+                "criterion": { "type": "string" },
+                "score": { "type": "number" },
+                "evidence": { "type": "string" },
+                "judge": { "type": "string" }
+              }
+            }
+          },
+          "guardrails": {
+            "type": "object",
+            "properties": {
+              "testsPassed": { "type": "boolean" },
+              "pathSafety": { "type": "boolean" },
+              "budgetCompliant": { "type": "boolean" }
+            }
+          },
+          "tags": {
+            "type": "array",
+            "items": { "type": "string" }
+          },
+          "skill": { "type": "string" }
+        },
+        "required": ["signal", "context"]
+      },
+      "http": {
+        "method": "POST",
+        "path": "/v1/feedback/capture"
+      }
+    },
+    {
+      "name": "feedback_summary",
+      "description": "Get a compact summary of recent feedback performance",
+      "parameters": {
+        "type": "object",
+        "properties": {
+          "recent": { "type": "integer" }
+        }
+      },
+      "http": {
+        "method": "GET",
+        "path": "/v1/feedback/summary"
+      }
+    },
+    {
+      "name": "prevention_rules",
+      "description": "Generate prevention rules from repeated mistakes",
+      "parameters": {
+        "type": "object",
+        "properties": {
+          "minOccurrences": { "type": "integer" }
+        }
+      },
+      "http": {
+        "method": "POST",
+        "path": "/v1/feedback/rules"
+      }
+    },
+    {
+      "name": "plan_intent",
+      "description": "Generate a policy-aware execution plan with checkpoint requirements",
+      "parameters": {
+        "type": "object",
+        "properties": {
+          "intentId": { "type": "string" },
+          "context": { "type": "string" },
+          "mcpProfile": { "type": "string" },
+          "bundleId": { "type": "string" },
+          "approved": { "type": "boolean" }
+        },
+        "required": ["intentId"]
+      },
+      "http": {
+        "method": "POST",
+        "path": "/v1/intents/plan"
+      }
+    }
+  ]
+}