npm - @caupulican/pi-adaptative - Versions diffs - 0.80.30 → 0.80.34 - Mend

@caupulican/pi-adaptative 0.80.30 → 0.80.34

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (23) hide show

package/CHANGELOG.md +26 -0
package/dist/core/agent-session.d.ts +3 -0
package/dist/core/agent-session.d.ts.map +1 -1
package/dist/core/agent-session.js +17 -2
package/dist/core/agent-session.js.map +1 -1
package/dist/core/context-gc.d.ts.map +1 -1
package/dist/core/context-gc.js +1 -1
package/dist/core/context-gc.js.map +1 -1
package/dist/core/sdk.d.ts.map +1 -1
package/dist/core/sdk.js +1 -0
package/dist/core/sdk.js.map +1 -1
package/dist/modes/interactive/interactive-mode.d.ts.map +1 -1
package/dist/modes/interactive/interactive-mode.js +35 -8
package/dist/modes/interactive/interactive-mode.js.map +1 -1
package/examples/extensions/custom-provider-anthropic/package-lock.json +2 -2
package/examples/extensions/custom-provider-anthropic/package.json +1 -1
package/examples/extensions/custom-provider-gitlab-duo/package.json +1 -1
package/examples/extensions/sandbox/package-lock.json +2 -2
package/examples/extensions/sandbox/package.json +1 -1
package/examples/extensions/with-deps/package-lock.json +2 -2
package/examples/extensions/with-deps/package.json +1 -1
package/npm-shrinkwrap.json +12 -12
package/package.json +4 -4

package/dist/modes/interactive/interactive-mode.js CHANGED Viewed

@@ -102,7 +102,7 @@ const AUTO_LEARN_DEFAULTS = {
     maxConcurrentLearners: 1,
     applyHighConfidence: false,
     reflectionReview: true,
-    reflectionMinToolCalls: 8,
+    reflectionMinToolCalls: 5,
     reflectionCooldownMinutes: 24 * 60,
 };
 const AUTONOMY_AUTO_LEARN_PRESETS = {
@@ -117,7 +117,7 @@ const AUTONOMY_AUTO_LEARN_PRESETS = {
         maxConcurrentLearners: 1,
         applyHighConfidence: false,
         reflectionReview: true,
-        reflectionMinToolCalls: 8,
+        reflectionMinToolCalls: 5,
         reflectionCooldownMinutes: 24 * 60,
     },
     balanced: {
@@ -130,7 +130,7 @@ const AUTONOMY_AUTO_LEARN_PRESETS = {
         maxConcurrentLearners: 1,
         applyHighConfidence: false,
         reflectionReview: true,
-        reflectionMinToolCalls: 8,
+        reflectionMinToolCalls: 5,
         reflectionCooldownMinutes: 24 * 60,
     },
     full: {
@@ -143,13 +143,14 @@ const AUTONOMY_AUTO_LEARN_PRESETS = {
         maxConcurrentLearners: 1,
         applyHighConfidence: true,
         reflectionReview: true,
-        reflectionMinToolCalls: 8,
+        reflectionMinToolCalls: 5,
         reflectionCooldownMinutes: 24 * 60,
     },
 };
 const AUTONOMY_MODES = ["off", "safe", "balanced", "full"];
 const AUTO_LEARN_RESERVATION_MS = 2 * 60 * 1000;
 const AUTO_LEARN_THINKING_LEVEL = "xhigh";
+const AUTO_LEARN_COMPLEX_TASK_TOOL_CALLS = 5;
 export const AUTO_LEARN_HISTORY_RETENTION_MS = 7 * 24 * 60 * 60 * 1000;
 function definedStringSet(values) {
     const set = new Set();
@@ -4020,16 +4021,16 @@ export class InteractiveMode {
             ? `\n\nLatest completed turn digest (bounded; use only as current-session evidence, not as longitudinal proof):\n<turn_digest>\n${options.turnDigest}\n</turn_digest>`
             : "";
         const objective = options.kind === "reflection"
-            ? "review the latest completed turn for durable memory, skill, validation, and tooling-improvement cues, then run one bounded continuous-learning pass if the learning tools are available"
+            ? "review the latest completed turn for durable memory, skill, validation, tooling, and code-baked self-improvement cues, then run one bounded continuous-learning pass if the learning tools are available"
             : "run one bounded continuous-learning pass for this Pi tenant";
-        return `You are Pi Auto Learn running as a background learner.\n\nObjective: ${objective}.\nTrigger: ${reason}.\n\n${authorityBlock}\n\nRequired workflow:\n1. Query existing durable memory/rules first when tools allow it. Memory confrontation is mandatory before accepting, merging, upgrading, or rejecting learning candidates.\n2. Run the available Auto Learn tooling, preferably learning_run_auto, with applyHighConfidence=${settings.applyHighConfidence}. Process candidate validation in vectorized chunks/batches; avoid scalar per-candidate memory queries except for final selected writes.\n3. Apply the learning validation tree to each candidate chunk: (a) Why is this good for the user? (b) Is it unique, or similar to existing memory/skills/agents so it should merge or upgrade existing knowledge? (c) Will this make Pi a better agent? Candidates that cannot answer all three are noise.\n4. Treat the latest-turn digest as current-session evidence only; do not auto-commit one-off cues unless deterministic tooling and memory confrontation corroborate them.\n5. In mode=full, apply safe memory/skill/user-extension/authorized-source improvements under the standing grant above; otherwise keep them proposal-gated.\n6. Never cross hard-stop boundaries from the authority policy.\n7. If the learning tools are unavailable, report BLOCKED with the missing tool names and do not improvise.\n8. Finish with PASS, BLOCKED, or FAIL and concise evidence, including chunk counts, merge/upgrade decisions, and cleanup/purge status.${reflectionBlock}`;
+        return `You are Pi Auto Learn running as a background learner.\n\nObjective: ${objective}.\nTrigger: ${reason}.\n\n${authorityBlock}\n\nRequired workflow:\n1. Query existing durable memory/rules first when tools allow it. Memory confrontation is mandatory before accepting, merging, upgrading, or rejecting learning candidates.\n2. Run the available Auto Learn tooling, preferably learning_run_auto, with applyHighConfidence=${settings.applyHighConfidence}. Process candidate validation in vectorized chunks/batches; avoid scalar per-candidate memory queries except for final selected writes.\n3. Apply the learning validation tree to each candidate chunk: (a) Why is this good for the user? (b) Is it unique, or similar to existing memory/skills/agents so it should merge or upgrade existing knowledge? (c) Will this make Pi a better agent? Candidates that cannot answer all three are noise.\n4. Hermes-style learning cycle: after a complex task (${AUTO_LEARN_COMPLEX_TASK_TOOL_CALLS}+ tool calls), user correction, repeated steering pattern, non-trivial fix/workaround/debugging path, loaded-skill defect, trigger gap, tool gap, or harness workflow defect, actively create or update durable learning artifacts. Memory stores compact facts/preferences/state; skills/prompts/agents/extensions/source store procedural behavior. When a lesson changes how Pi should act on a future class of task, memory alone is not completion.\n5. Skill update preference order: (1) patch the currently loaded or consulted skill that governed the task; (2) patch an existing class-level umbrella skill/agent/prompt; (3) add a support file under references/, templates/, or scripts/ and add a SKILL.md pointer; (4) create a new class-level umbrella skill only when no existing artifact fits. Never create one-off PR/error/codename/session skills.\n6. Behavioral self-improvement is code-baked by default: prefer the lowest durable executable layer that fixes the behavior — patch an existing skill/prompt/agent/extension/tool, tune an approved setting, or edit the authorized Pi source when source authority is available. Use Automata only for concise facts/evidence pointers that support the baked change.\n7. Do not harden transient or environment-dependent failures into durable behavior: missing binaries, fresh-install package gaps, credentials not configured, path mismatches, one-off task narratives, or negative tool-broken claims should become setup/troubleshooting fixes only when the fix itself is reusable.\n8. Treat the latest-turn digest as current-session evidence only; do not auto-commit one-off cues unless deterministic tooling and memory confrontation corroborate them.\n9. In mode=full, apply safe memory/skill/user-extension/authorized-source improvements under the standing grant above; otherwise keep them proposal-gated.\n10. Never cross hard-stop boundaries from the authority policy.\n11. If the learning tools are unavailable, report BLOCKED with the missing tool names and do not improvise.\n12. Finish with PASS, BLOCKED, or FAIL and concise evidence, including chunk counts, merge/upgrade/code-bake decisions, changed paths/settings, validation, and cleanup/purge status.${reflectionBlock}`;
     }
     reserveAutoLearnRun(params) {
         return this.withAutoLearnStateLock((current) => {
             const now = Date.now();
             const state = this.pruneAutoLearnHistoryFromState(current, now);
             const tenant = this.getAutoLearnTenantKey();
-            if (params.cooldownKind === "reflection") {
+            if (params.cooldownKind === "reflection" && !params.bypassReflectionCooldown) {
                 const lastReflection = state.lastReflectionByTenant?.[tenant] ?? 0;
                 const cooldownMs = params.settings.reflectionCooldownMinutes * 60 * 1000;
                 if (Math.max(0, lastReflection + cooldownMs - now) > 0) {
@@ -4168,6 +4169,7 @@ export class InteractiveMode {
             settings,
             force,
             cooldownKind: options.cooldownKind,
+            bypassReflectionCooldown: options.bypassReflectionCooldown,
             runId,
             modelPattern,
             reason,
@@ -4332,6 +4334,10 @@ export class InteractiveMode {
             .map((message) => this.getAgentMessagePlainText(message))
             .join("\n");
         const correctionSignal = /\b(next time|for future|from now on|remember this|don't|do not|avoid|instead|you should|should have|you forgot|you missed|not what i asked|wrong again)\b/i.test(userText);
+        const behavioralSelfImprovementSignal = /\b(harness|pi|agent|autonomy|autonomous|self[- ]?improv(?:e|ement|ing)?|steer(?:ing)?|trigger(?:s)?|skill(?:s)?|code[- ]?bak(?:e|ed)|bake(?:d)? into code|not (?:automata|memory)|reference agent|hermes)\b/i.test(userText) &&
+            /\b(improve|automatic(?:ally)?|autonomous|trigger|fire|skill|steer|self[- ]?improv(?:e|ement|ing)?|code[- ]?bak(?:e|ed)|bake(?:d)?|too much|less)\b/i.test(userText);
+        const complexTaskSignal = toolCalls >= AUTO_LEARN_COMPLEX_TASK_TOOL_CALLS;
+        const bypassCooldown = correctionSignal || behavioralSelfImprovementSignal || complexTaskSignal;
         const base = { messageCount, contextPercent, cooldownRemainingMs, runningCount, toolCalls };
         if (!settings.enabled)
             return { ...base, shouldRun: false, reason: "disabled" };
@@ -4344,14 +4350,34 @@ export class InteractiveMode {
                 reason: `max tenant learners running (${runningCount}/${settings.maxConcurrentLearners})`,
             };
         }
-        if (cooldownRemainingMs > 0)
+        if (cooldownRemainingMs > 0 && !bypassCooldown) {
             return { ...base, shouldRun: false, reason: "reflection cooldown" };
+        }
+        if (behavioralSelfImprovementSignal) {
+            return {
+                ...base,
+                shouldRun: true,
+                reason: "reflection behavioral self-improvement signal",
+                digest: this.buildAutonomyReviewDigest(messages),
+                bypassCooldown: true,
+            };
+        }
         if (correctionSignal) {
             return {
                 ...base,
                 shouldRun: true,
                 reason: "reflection correction signal",
                 digest: this.buildAutonomyReviewDigest(messages),
+                bypassCooldown: true,
+            };
+        }
+        if (complexTaskSignal) {
+            return {
+                ...base,
+                shouldRun: true,
+                reason: `reflection complex task learning signal (${toolCalls}/${AUTO_LEARN_COMPLEX_TASK_TOOL_CALLS} tool calls)`,
+                digest: this.buildAutonomyReviewDigest(messages),
+                bypassCooldown: true,
             };
         }
         if (autonomy.mode === "full") {
@@ -4395,6 +4421,7 @@ export class InteractiveMode {
             cooldownKind: "reflection",
             promptKind: "reflection",
             turnDigest: decision.digest,
+            bypassReflectionCooldown: decision.bypassCooldown,
         });
         if (!message.startsWith("Auto Learn started"))
             this.showStatus(message);