npm - @caupulican/pi-adaptative - Versions diffs - 0.80.61 → 0.80.62 - Mend

@caupulican/pi-adaptative 0.80.61 → 0.80.62

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (18) hide show

package/CHANGELOG.md +6 -0
package/dist/core/agent-session.d.ts +2 -0
package/dist/core/agent-session.d.ts.map +1 -1
package/dist/core/agent-session.js +27 -1
package/dist/core/agent-session.js.map +1 -1
package/dist/core/memory/effectiveness-tracker.d.ts +31 -0
package/dist/core/memory/effectiveness-tracker.d.ts.map +1 -0
package/dist/core/memory/effectiveness-tracker.js +54 -0
package/dist/core/memory/effectiveness-tracker.js.map +1 -0
package/examples/extensions/custom-provider-anthropic/package-lock.json +2 -2
package/examples/extensions/custom-provider-anthropic/package.json +1 -1
package/examples/extensions/custom-provider-gitlab-duo/package.json +1 -1
package/examples/extensions/sandbox/package-lock.json +2 -2
package/examples/extensions/sandbox/package.json +1 -1
package/examples/extensions/with-deps/package-lock.json +2 -2
package/examples/extensions/with-deps/package.json +1 -1
package/npm-shrinkwrap.json +12 -12
package/package.json +4 -4

package/dist/core/memory/effectiveness-tracker.d.ts ADDED Viewed

@@ -0,0 +1,31 @@
+/**
+ * EffectivenessTracker — the closed adaptive loop (adaptive-agent design R4, leapfrog #9).
+ *
+ * Recall (R3) injects a `<memory_context>` page; this tracks whether the agent actually USED it, so the
+ * recall gate can adapt — recall more when it's paying off, back off when it isn't. "Used" = the
+ * fraction of the recall page's DISTINCTIVE tokens (those not already in the user's query) that reappear
+ * in the assistant's response. We isolate distinctive tokens so we measure recall's own contribution,
+ * not the baseline overlap every response shares with the query.
+ *
+ * The score is an exponential moving average ("useful lately") in [0,1], starting at a neutral prior so
+ * recall is given a fair chance before the loop adapts.
+ */
+export declare class EffectivenessTracker {
+    private ema; // exponential moving average backing usefulLately()
+    private samples; // number of outcomes recorded so far
+    /**
+     * Record the outcome of a turn that received a recall page: how much of the recall's distinctive
+     * content the assistant's response actually drew on. Folds that fraction into the moving average.
+     */
+    recordRecallOutcome(recallText: string, queryText: string, responseText: string): void;
+    /** Rolling "useful lately" score in [0,1]: the raw EMA — the neutral prior before any outcome is recorded; no minimum-sample gate is applied here. */
+    usefulLately(): number;
+    /** Number of recorded recall outcomes. */
+    get sampleCount(): number;
+}
+/**
+ * Fraction of the recall page's distinctive tokens (present in recall but NOT in the query) that appear
+ * in the response, as a number in [0,1]. 0 when recall added nothing the query didn't already carry.
+ */
+export declare function distinctiveRecallUsage(recallText: string, queryText: string, responseText: string): number;
+//# sourceMappingURL=effectiveness-tracker.d.ts.map

package/dist/core/memory/effectiveness-tracker.d.ts.map ADDED Viewed

@@ -0,0 +1 @@

+ {"version":3,"file":"effectiveness-tracker.d.ts","sourceRoot":"","sources":["../../../src/core/memory/effectiveness-tracker.ts"],"names":[],"mappings":"AAAA;;;;;;;;;;;GAWG;AAOH,qBAAa,oBAAoB;IAChC,OAAO,CAAC,GAAG,CAAiB;IAC5B,OAAO,CAAC,OAAO,CAAK;IAEpB;;;OAGG;IACH,mBAAmB,CAAC,UAAU,EAAE,MAAM,EAAE,SAAS,EAAE,MAAM,EAAE,YAAY,EAAE,MAAM,GAAG,IAAI,CAIrF;IAED,uFAAuF;IACvF,YAAY,IAAI,MAAM,CAErB;IAED,0CAA0C;IAC1C,IAAI,WAAW,IAAI,MAAM,CAExB;CACD;AAED;;;GAGG;AACH,wBAAgB,sBAAsB,CAAC,UAAU,EAAE,MAAM,EAAE,SAAS,EAAE,MAAM,EAAE,YAAY,EAAE,MAAM,GAAG,MAAM,CAU1G","sourcesContent":["/**\n * EffectivenessTracker — the closed adaptive loop (adaptive-agent design R4, leapfrog #9).\n *\n * Recall (R3) injects a `<memory_context>` page; this tracks whether the agent actually USED it, so the\n * recall gate can adapt — recall more when it's paying off, back off when it isn't. \"Used\" = the\n * fraction of the recall page's DISTINCTIVE tokens (those not already in the user's query) that reappear\n * in the assistant's response. 
We isolate distinctive tokens so we measure recall's own contribution,\n * not the baseline overlap every response shares with the query.\n *\n * The score is an exponential moving average (\"useful lately\") in [0,1], starting at a neutral prior so\n * recall is given a fair chance before the loop adapts.\n */\n\nimport { tokenize } from \"../tools/skill-audit.ts\";\n\nconst NEUTRAL_PRIOR = 0.5;\nconst ALPHA = 0.3; // EMA weight on the newest outcome\n\nexport class EffectivenessTracker {\n\tprivate ema = NEUTRAL_PRIOR;\n\tprivate samples = 0;\n\n\t/**\n\t * Record the outcome of a turn that received a recall page: how much of the recall's distinctive\n\t * content the assistant's response actually drew on.\n\t */\n\trecordRecallOutcome(recallText: string, queryText: string, responseText: string): void {\n\t\tconst used = distinctiveRecallUsage(recallText, queryText, responseText);\n\t\tthis.ema = ALPHA * used + (1 - ALPHA) * this.ema;\n\t\tthis.samples += 1;\n\t}\n\n\t/** Rolling \"useful lately\" score in [0,1]. Neutral until enough samples accumulate. */\n\tusefulLately(): number {\n\t\treturn this.ema;\n\t}\n\n\t/** Number of recorded recall outcomes. */\n\tget sampleCount(): number {\n\t\treturn this.samples;\n\t}\n}\n\n/**\n * Fraction of the recall page's distinctive tokens (present in recall but NOT in the query) that appear\n * in the response. 0 when recall added nothing the query didn't already carry.\n */\nexport function distinctiveRecallUsage(recallText: string, queryText: string, responseText: string): number {\n\tconst queryTokens = new Set(tokenize(queryText));\n\tconst distinctive = tokenize(recallText).filter((t) => !queryTokens.has(t));\n\tif (distinctive.length === 0) return 0;\n\tconst responseTokens = new Set(tokenize(responseText));\n\tlet hits = 0;\n\tfor (const token of distinctive) {\n\t\tif (responseTokens.has(token)) hits++;\n\t}\n\treturn hits / distinctive.length;\n}\n"]}

package/dist/core/memory/effectiveness-tracker.js ADDED Viewed

@@ -0,0 +1,54 @@
+/**
+ * EffectivenessTracker — the closed adaptive loop (adaptive-agent design R4, leapfrog #9).
+ *
+ * Recall (R3) injects a `<memory_context>` page; this tracks whether the agent actually USED it, so the
+ * recall gate can adapt — recall more when it's paying off, back off when it isn't. "Used" = the
+ * fraction of the recall page's DISTINCTIVE tokens (those not already in the user's query) that reappear
+ * in the assistant's response. We isolate distinctive tokens so we measure recall's own contribution,
+ * not the baseline overlap every response shares with the query.
+ *
+ * The score is an exponential moving average ("useful lately") in [0,1], starting at a neutral prior so
+ * recall is given a fair chance before the loop adapts.
+ */
+import { tokenize } from "../tools/skill-audit.js";
+const NEUTRAL_PRIOR = 0.5;
+const ALPHA = 0.3; // EMA weight on the newest outcome
+export class EffectivenessTracker {
+    ema = NEUTRAL_PRIOR; // current moving average; starts at the neutral prior
+    samples = 0; // number of recordRecallOutcome() calls so far
+    /**
+     * Record the outcome of a turn that received a recall page: how much of the recall's distinctive
+     * content the assistant's response actually drew on. Updates the EMA and increments the sample count.
+     */
+    recordRecallOutcome(recallText, queryText, responseText) {
+        const used = distinctiveRecallUsage(recallText, queryText, responseText); // fraction in [0,1]
+        this.ema = ALPHA * used + (1 - ALPHA) * this.ema; // newest outcome weighted by ALPHA, history by 1 - ALPHA
+        this.samples += 1;
+    }
+    /** Rolling "useful lately" score in [0,1]: the raw EMA — the neutral prior before any outcome is recorded; no minimum-sample gate is applied here. */
+    usefulLately() {
+        return this.ema;
+    }
+    /** Number of recorded recall outcomes. */
+    get sampleCount() {
+        return this.samples;
+    }
+}
+/**
+ * Fraction of the recall page's distinctive tokens (present in recall but NOT in the query) that appear
+ * in the response, as a number in [0,1]. 0 when recall added nothing the query didn't already carry.
+ */
+export function distinctiveRecallUsage(recallText, queryText, responseText) {
+    const queryTokens = new Set(tokenize(queryText));
+    const distinctive = tokenize(recallText).filter((t) => !queryTokens.has(t)); // not de-duplicated here; repeats count separately if tokenize() emits them — TODO confirm
+    if (distinctive.length === 0) // nothing distinctive: return early rather than divide by zero
+        return 0;
+    const responseTokens = new Set(tokenize(responseText)); // Set for constant-time membership checks below
+    let hits = 0;
+    for (const token of distinctive) {
+        if (responseTokens.has(token))
+            hits++;
+    }
+    return hits / distinctive.length; // hits never exceeds distinctive.length, so the result stays in [0,1]
+}
+//# sourceMappingURL=effectiveness-tracker.js.map

package/dist/core/memory/effectiveness-tracker.js.map ADDED Viewed

@@ -0,0 +1 @@

+ {"version":3,"file":"effectiveness-tracker.js","sourceRoot":"","sources":["../../../src/core/memory/effectiveness-tracker.ts"],"names":[],"mappings":"AAAA;;;;;;;;;;;GAWG;AAEH,OAAO,EAAE,QAAQ,EAAE,MAAM,yBAAyB,CAAC;AAEnD,MAAM,aAAa,GAAG,GAAG,CAAC;AAC1B,MAAM,KAAK,GAAG,GAAG,CAAC,CAAC,mCAAmC;AAEtD,MAAM,OAAO,oBAAoB;IACxB,GAAG,GAAG,aAAa,CAAC;IACpB,OAAO,GAAG,CAAC,CAAC;IAEpB;;;OAGG;IACH,mBAAmB,CAAC,UAAkB,EAAE,SAAiB,EAAE,YAAoB,EAAQ;QACtF,MAAM,IAAI,GAAG,sBAAsB,CAAC,UAAU,EAAE,SAAS,EAAE,YAAY,CAAC,CAAC;QACzE,IAAI,CAAC,GAAG,GAAG,KAAK,GAAG,IAAI,GAAG,CAAC,CAAC,GAAG,KAAK,CAAC,GAAG,IAAI,CAAC,GAAG,CAAC;QACjD,IAAI,CAAC,OAAO,IAAI,CAAC,CAAC;IAAA,CAClB;IAED,uFAAuF;IACvF,YAAY,GAAW;QACtB,OAAO,IAAI,CAAC,GAAG,CAAC;IAAA,CAChB;IAED,0CAA0C;IAC1C,IAAI,WAAW,GAAW;QACzB,OAAO,IAAI,CAAC,OAAO,CAAC;IAAA,CACpB;CACD;AAED;;;GAGG;AACH,MAAM,UAAU,sBAAsB,CAAC,UAAkB,EAAE,SAAiB,EAAE,YAAoB,EAAU;IAC3G,MAAM,WAAW,GAAG,IAAI,GAAG,CAAC,QAAQ,CAAC,SAAS,CAAC,CAAC,CAAC;IACjD,MAAM,WAAW,GAAG,QAAQ,CAAC,UAAU,CAAC,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC,WAAW,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC,CAAC;IAC5E,IAAI,WAAW,CAAC,MAAM,KAAK,CAAC;QAAE,OAAO,CAAC,CAAC;IACvC,MAAM,cAAc,GAAG,IAAI,GAAG,CAAC,QAAQ,CAAC,YAAY,CAAC,CAAC,CAAC;IACvD,IAAI,IAAI,GAAG,CAAC,CAAC;IACb,KAAK,MAAM,KAAK,IAAI,WAAW,EAAE,CAAC;QACjC,IAAI,cAAc,CAAC,GAAG,CAAC,KAAK,CAAC;YAAE,IAAI,EAAE,CAAC;IACvC,CAAC;IACD,OAAO,IAAI,GAAG,WAAW,CAAC,MAAM,CAAC;AAAA,CACjC","sourcesContent":["/**\n * EffectivenessTracker — the closed adaptive loop (adaptive-agent design R4, leapfrog #9).\n *\n * Recall (R3) injects a `<memory_context>` page; this tracks whether the agent actually USED it, so the\n * recall gate can adapt — recall more when it's paying off, back off when it isn't. \"Used\" = the\n * fraction of the recall page's DISTINCTIVE tokens (those not already in the user's query) that reappear\n * in the assistant's response. 
We isolate distinctive tokens so we measure recall's own contribution,\n * not the baseline overlap every response shares with the query.\n *\n * The score is an exponential moving average (\"useful lately\") in [0,1], starting at a neutral prior so\n * recall is given a fair chance before the loop adapts.\n */\n\nimport { tokenize } from \"../tools/skill-audit.ts\";\n\nconst NEUTRAL_PRIOR = 0.5;\nconst ALPHA = 0.3; // EMA weight on the newest outcome\n\nexport class EffectivenessTracker {\n\tprivate ema = NEUTRAL_PRIOR;\n\tprivate samples = 0;\n\n\t/**\n\t * Record the outcome of a turn that received a recall page: how much of the recall's distinctive\n\t * content the assistant's response actually drew on.\n\t */\n\trecordRecallOutcome(recallText: string, queryText: string, responseText: string): void {\n\t\tconst used = distinctiveRecallUsage(recallText, queryText, responseText);\n\t\tthis.ema = ALPHA * used + (1 - ALPHA) * this.ema;\n\t\tthis.samples += 1;\n\t}\n\n\t/** Rolling \"useful lately\" score in [0,1]. Neutral until enough samples accumulate. */\n\tusefulLately(): number {\n\t\treturn this.ema;\n\t}\n\n\t/** Number of recorded recall outcomes. */\n\tget sampleCount(): number {\n\t\treturn this.samples;\n\t}\n}\n\n/**\n * Fraction of the recall page's distinctive tokens (present in recall but NOT in the query) that appear\n * in the response. 0 when recall added nothing the query didn't already carry.\n */\nexport function distinctiveRecallUsage(recallText: string, queryText: string, responseText: string): number {\n\tconst queryTokens = new Set(tokenize(queryText));\n\tconst distinctive = tokenize(recallText).filter((t) => !queryTokens.has(t));\n\tif (distinctive.length === 0) return 0;\n\tconst responseTokens = new Set(tokenize(responseText));\n\tlet hits = 0;\n\tfor (const token of distinctive) {\n\t\tif (responseTokens.has(token)) hits++;\n\t}\n\treturn hits / distinctive.length;\n}\n"]}

package/examples/extensions/custom-provider-anthropic/package-lock.json CHANGED Viewed

@@ -1,12 +1,12 @@
 {
   "name": "pi-extension-custom-provider",
-  "version": "0.80.58",
+  "version": "0.80.59",
   "lockfileVersion": 3,
   "requires": true,
   "packages": {
     "": {
       "name": "pi-extension-custom-provider",
-      "version": "0.80.58",
+      "version": "0.80.59",
       "dependencies": {
         "@anthropic-ai/sdk": "^0.52.0"
       }

package/examples/extensions/custom-provider-anthropic/package.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
   "name": "pi-extension-custom-provider-anthropic",
   "private": true,
-  "version": "0.80.58",
+  "version": "0.80.59",
   "type": "module",
   "scripts": {
     "clean": "echo 'nothing to clean'",

package/examples/extensions/custom-provider-gitlab-duo/package.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
   "name": "pi-extension-custom-provider-gitlab-duo",
   "private": true,
-  "version": "0.80.58",
+  "version": "0.80.59",
   "type": "module",
   "scripts": {
     "clean": "echo 'nothing to clean'",

package/examples/extensions/sandbox/package-lock.json CHANGED Viewed

@@ -1,12 +1,12 @@
 {
 	"name": "pi-extension-sandbox",
-	"version": "0.80.58",
+	"version": "0.80.59",
 	"lockfileVersion": 3,
 	"requires": true,
 	"packages": {
 		"": {
 			"name": "pi-extension-sandbox",
-			"version": "0.80.58",
+			"version": "0.80.59",
 			"dependencies": {
 				"@anthropic-ai/sandbox-runtime": "^0.0.26"
 			}

package/examples/extensions/sandbox/package.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
 	"name": "pi-extension-sandbox",
 	"private": true,
-	"version": "0.80.58",
+	"version": "0.80.59",
 	"type": "module",
 	"scripts": {
 		"clean": "echo 'nothing to clean'",

package/examples/extensions/with-deps/package-lock.json CHANGED Viewed

@@ -1,12 +1,12 @@
 {
   "name": "pi-extension-with-deps",
-  "version": "0.80.58",
+  "version": "0.80.59",
   "lockfileVersion": 3,
   "requires": true,
   "packages": {
     "": {
       "name": "pi-extension-with-deps",
-      "version": "0.80.58",
+      "version": "0.80.59",
       "dependencies": {
         "ms": "^2.1.3"
       },

package/examples/extensions/with-deps/package.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
   "name": "pi-extension-with-deps",
   "private": true,
-  "version": "0.80.58",
+  "version": "0.80.59",
   "type": "module",
   "scripts": {
     "clean": "echo 'nothing to clean'",

package/npm-shrinkwrap.json CHANGED Viewed

@@ -1,17 +1,17 @@
 {
 	"name": "@caupulican/pi-adaptative",
-	"version": "0.80.61",
+	"version": "0.80.62",
 	"lockfileVersion": 3,
 	"requires": true,
 	"packages": {
 		"": {
 			"name": "@caupulican/pi-adaptative",
-			"version": "0.80.61",
+			"version": "0.80.62",
 			"license": "MIT",
 			"dependencies": {
-				"@caupulican/pi-agent-core": "^0.80.61",
-				"@caupulican/pi-ai": "^0.80.61",
-				"@caupulican/pi-tui": "^0.80.61",
+				"@caupulican/pi-agent-core": "^0.80.62",
+				"@caupulican/pi-ai": "^0.80.62",
+				"@caupulican/pi-tui": "^0.80.62",
 				"@silvia-odwyer/photon-node": "0.3.4",
 				"chalk": "5.6.2",
 				"cross-spawn": "7.0.6",
@@ -474,11 +474,11 @@
 			}
 		},
 		"node_modules/@caupulican/pi-agent-core": {
-			"version": "0.80.61",
-			"resolved": "https://registry.npmjs.org/@caupulican/pi-agent-core/-/pi-agent-core-0.80.61.tgz",
+			"version": "0.80.62",
+			"resolved": "https://registry.npmjs.org/@caupulican/pi-agent-core/-/pi-agent-core-0.80.62.tgz",
 			"license": "MIT",
 			"dependencies": {
-				"@caupulican/pi-ai": "^0.80.61",
+				"@caupulican/pi-ai": "^0.80.62",
 				"ignore": "7.0.5",
 				"typebox": "1.1.38",
 				"yaml": "2.9.0"
@@ -488,8 +488,8 @@
 			}
 		},
 		"node_modules/@caupulican/pi-ai": {
-			"version": "0.80.61",
-			"resolved": "https://registry.npmjs.org/@caupulican/pi-ai/-/pi-ai-0.80.61.tgz",
+			"version": "0.80.62",
+			"resolved": "https://registry.npmjs.org/@caupulican/pi-ai/-/pi-ai-0.80.62.tgz",
 			"license": "MIT",
 			"dependencies": {
 				"@anthropic-ai/sdk": "0.91.1",
@@ -511,8 +511,8 @@
 			}
 		},
 		"node_modules/@caupulican/pi-tui": {
-			"version": "0.80.61",
-			"resolved": "https://registry.npmjs.org/@caupulican/pi-tui/-/pi-tui-0.80.61.tgz",
+			"version": "0.80.62",
+			"resolved": "https://registry.npmjs.org/@caupulican/pi-tui/-/pi-tui-0.80.62.tgz",
 			"license": "MIT",
 			"dependencies": {
 				"get-east-asian-width": "1.6.0",

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
 	"name": "@caupulican/pi-adaptative",
-	"version": "0.80.61",
+	"version": "0.80.62",
 	"description": "Adaptive fork of Pi coding agent for self-evolving agent harness experiments",
 	"type": "module",
 	"piConfig": {
@@ -41,9 +41,9 @@
 		"prepublishOnly": "npm run clean && npm run build && npm run shrinkwrap"
 	},
 	"dependencies": {
-		"@caupulican/pi-agent-core": "^0.80.61",
-		"@caupulican/pi-ai": "^0.80.61",
-		"@caupulican/pi-tui": "^0.80.61",
+		"@caupulican/pi-agent-core": "^0.80.62",
+		"@caupulican/pi-ai": "^0.80.62",
+		"@caupulican/pi-tui": "^0.80.62",
 		"@silvia-odwyer/photon-node": "0.3.4",
 		"chalk": "5.6.2",
 		"cross-spawn": "7.0.6",