npm - open-agents-ai - Versions diffs - 0.187.27 → 0.187.29 - Mend

open-agents-ai 0.187.27 → 0.187.29

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (2) hide show

package/dist/index.js +42 -0
package/package.json +1 -1

package/dist/index.js CHANGED Viewed

@@ -260551,6 +260551,39 @@ Briefly assess your situation and choose ONE action:
 Respond with your assessment, then take action.`;
       }
+      /**
+       * WO-RL-02: Best-of-N execution — run up to N sequential attempts of the same
+       * task via `run(task, context)` and return the highest-scoring result.
+       * Research: SWE-RM (2512.21919) +7-10 pts, MCTSr (2406.07394) 8B→GPT-4 level.
+       * Research: Test-Time Compute Scaling (2408.03314) small + compute = 14x larger.
+       *
+       * Attempt count: `n2`, else `this.options.bestOfN`, else 1, capped at 5.
+       * A count of 1 or less delegates straight to `run(task, context)`.
+       *
+       * Turn budget: each attempt runs with `this.options.maxTurns` temporarily set to
+       * max(5, floor((maxTurns ?? 25) / count)); the previous value is restored after
+       * every attempt, including when `run` throws (the error then propagates to the caller).
+       *
+       * Early exit: the loop stops at the first attempt whose result is `completed`,
+       * so fewer than N attempts may actually run.
+       *
+       * Scoring: +10 if completed, +2 if the summary is longer than 50 characters,
+       * plus max(0, 5 - 0.3 * turns). For non-negative turn counts an incomplete
+       * attempt scores at most 7, so a completed attempt always ranks first.
+       * Candidates run sequentially to avoid overloading the backend.
+       *
+       * NOTE(review): every attempt reuses this same instance; whether attempts are
+       * truly independent depends on what `run` resets — confirm.
+       * NOTE(review): if the resolved count is NaN (e.g. a non-numeric `n2`), neither the
+       * single-run shortcut nor the loop executes and `scored[0]` is undefined — confirm
+       * that callers always pass a number.
+       *
+       * @param {*} task - forwarded unchanged to `run`.
+       * @param {*} context - forwarded unchanged to `run`.
+       * @param {number} [n2] - requested number of attempts; overrides `this.options.bestOfN`.
+       * @returns {Promise<*>} the result object produced by `run` for the best-scoring attempt.
+       */
+      async runBestOfN(task, context, n2) {
+        const count = Math.min(n2 ?? this.options.bestOfN ?? 1, 5); // hard cap of 5 attempts
+        if (count <= 1)
+          return this.run(task, context); // nothing to compare: plain single run
+        const candidates = [];
+        const perCandidateTurns = Math.max(5, Math.floor((this.options.maxTurns ?? 25) / count)); // split the turn budget, never below 5 per attempt
+        for (let i2 = 0; i2 < count; i2++) {
+          const savedMaxTurns = this.options.maxTurns; // remembered so the override below can be undone
+          this.options.maxTurns = perCandidateTurns; // run() reads its limit from this.options, so override it in place
+          try {
+            const result = await this.run(task, context);
+            candidates.push(result);
+            if (result.completed)
+              break; // a completed attempt ends the search early
+          } finally {
+            this.options.maxTurns = savedMaxTurns; // restore the caller's limit even if run() threw
+          }
+        }
+        const scored = candidates.map((r2) => ({
+          result: r2,
+          score: (r2.completed ? 10 : 0) + (r2.summary && r2.summary.length > 50 ? 2 : 0) + Math.max(0, 5 - r2.turns * 0.3) // completion dominates; summary and low turn count break ties
+        }));
+        scored.sort((a2, b) => b.score - a2.score); // highest score first
+        return scored[0].result;
+      }
       /** Run a task through the agentic loop */
       async run(task, context) {
         this.aborted = false;
@@ -261342,6 +261375,15 @@ If you're stuck, try a completely different approach. Do NOT repeat what failed
               }
               if (!result.success && tc.name !== "task_complete") {
                 const failDesc = `${tc.name}(${filePath || "..."}): ${(result.error || "").slice(0, 100)}`;
+                const consecutiveSameTool = this._taskState.failedApproaches.slice(-2).filter((f2) => f2.startsWith(`${tc.name}(`)).length;
+                if (consecutiveSameTool >= 2 && (this.options.modelTier === "small" || this.options.modelTier === "medium")) {
+                  this.pendingUserMessages.push(`[PIVOT REQUIRED] You have failed ${consecutiveSameTool + 1} times in a row with ${tc.name}. Your current approach is not working. You MUST try something fundamentally different:
+- If file_edit keeps failing: re-read the file first, then use the EXACT text from the file
+- If shell keeps failing: try a different command or check prerequisites
+- If grep_search finds nothing: try broader patterns or list_directory
+- Consider using a completely different tool or strategy
+Do NOT retry ${tc.name} with similar arguments.`);
+                }
                 if (!this._taskState.failedApproaches.includes(failDesc)) {
                   this._taskState.failedApproaches.push(failDesc);
                   if (this._taskState.failedApproaches.length > 10) {

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "open-agents-ai",
-  "version": "0.187.27",
+  "version": "0.187.29",
   "description": "AI coding agent powered by open-source models (Ollama/vLLM) — interactive TUI with agentic tool-calling loop",
   "type": "module",
   "main": "./dist/index.js",