npm - @kognai/orchestrator-core - Versions diffs - 0.2.5 → 0.2.7 - Mend

@kognai/orchestrator-core 0.2.5 → 0.2.7

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (3)

package/dist/lib/engine-coding-agent.js +31 -14
package/dist/lib/sprint-runner-engine.js +78 -0
package/package.json +1 -1

package/dist/lib/engine-coding-agent.js CHANGED Viewed

@@ -320,35 +320,52 @@ Write ONLY the content for "${filepath}". Rules:
                         fileContent = await this.fixJsonWithOllama(fileContent, filepath);
                     }
                 }
-                // TRUNCATION PRE-CHECK: Detect if MiniMax cut off output mid-function
-                // If code ends inside an open block (unclosed braces) or with an incomplete statement,
-                // retry once with a "continue" prompt before sending to supervisor review.
-                const truncationDetected = this.detectTruncation(fileContent);
-                if (truncationDetected && (provider === 'clawrouter' || provider === 'ollama')) {
-                    (0, orchestrate_engine_1.log)(orchestrate_engine_1.c.yellow, `  ! TRUNCATION detected in ${filepath} — retrying with continuation prompt...`);
-                    const continuationPrompt = `The previous response for "${filepath}" was TRUNCATED — it ended mid-function or with an incomplete block. Here is what was generated so far:
+                // TICKET-349: multi-pass chunked generation. The OpenClaw gateway clamps
+                // output to ~4096 tokens regardless of the requested max_tokens, so a file
+                // larger than one chunk gets cut mid-statement → [TRUNCATION] reject, no
+                // matter how capable the model is (deepseek AND sonnet truncate at the
+                // same length). Decompose the GENERATION: keep issuing continuation passes
+                // and appending until the file is complete (no truncation) or we hit the
+                // chunk cap. Works for ALL providers (previously clawrouter/ollama-only).
+                // Bounded by KOGNAI_MAX_CONTINUATION_CHUNKS (default 5 → ~5×4k≈20k output)
+                // and a no-progress guard so it can never loop forever.
+                const MAX_CONTINUATION_CHUNKS = parseInt(process.env.KOGNAI_MAX_CONTINUATION_CHUNKS ?? '5', 10);
+                let chunk = 0;
+                while (this.detectTruncation(fileContent) && chunk < MAX_CONTINUATION_CHUNKS) {
+                    chunk++;
+                    (0, orchestrate_engine_1.log)(orchestrate_engine_1.c.yellow, `  ! TRUNCATION in ${filepath} — continuation pass ${chunk}/${MAX_CONTINUATION_CHUNKS} (gateway ~4k output cap)...`);
+                    const continuationPrompt = `The previous response for "${filepath}" was TRUNCATED — it ended mid-function or with an incomplete block. Here is the tail of what exists so far:
 \`\`\`typescript
 ${fileContent.substring(fileContent.length - 1500)}
 \`\`\`
-Continue from where it left off and output ONLY the remaining code (no duplicated content). Output a COMPLETE, valid TypeScript/JavaScript file ending with the final closing brace.`;
+Continue EXACTLY from where it left off and output ONLY the remaining code (no duplicated content, no preamble, no markdown fences). End the file with its final closing brace.`;
+                    let grew = false;
                     try {
-                        const contResponse = await (0, orchestrate_engine_1.callLLM)(provider, model, this.systemPrompt, continuationPrompt, 120000, this.name, `${task.id}_continuation`);
+                        const contResponse = await (0, orchestrate_engine_1.callLLM)(provider, model, this.systemPrompt, continuationPrompt, 120000, this.name, `${task.id}_continuation_${chunk}`);
                         let contContent = contResponse.choices?.[0]?.message?.content || '';
                         contContent = contContent.replace(/<think>[\s\S]*?<\/think>/g, '').trim();
                         const contBlocks = this.extractCodeBlocks(contContent);
                         const continuation = contBlocks.length > 0 ? contBlocks[0] : this.stripResidualFences(contContent);
                         if (continuation.length > 50) {
-                            // Merge: use the original up to the last complete line, then append continuation
-                            fileContent = fileContent + '\n' + continuation;
-                            fileContent = this.stripResidualFences(fileContent);
-                            (0, orchestrate_engine_1.log)(orchestrate_engine_1.c.green, `  ✓ Continuation merged for ${filepath} (+${continuation.length} chars)`);
+                            fileContent = this.stripResidualFences(fileContent + '\n' + continuation);
+                            grew = true;
+                            (0, orchestrate_engine_1.log)(orchestrate_engine_1.c.green, `  ✓ Pass ${chunk} merged for ${filepath} (+${continuation.length} chars, total ${fileContent.length})`);
                         }
                     }
                     catch (contErr) {
-                        (0, orchestrate_engine_1.log)(orchestrate_engine_1.c.yellow, `  ! Continuation failed: ${contErr.message}`);
+                        (0, orchestrate_engine_1.log)(orchestrate_engine_1.c.yellow, `  ! Continuation pass ${chunk} failed: ${contErr.message}`);
                     }
+                    // No-progress guard: if a pass added nothing usable, stop — further
+                    // passes won't help and would just burn budget.
+                    if (!grew) {
+                        (0, orchestrate_engine_1.log)(orchestrate_engine_1.c.yellow, `  ! Continuation made no progress — stopping at pass ${chunk}`);
+                        break;
+                    }
+                }
+                if (chunk > 0 && !this.detectTruncation(fileContent)) {
+                    (0, orchestrate_engine_1.log)(orchestrate_engine_1.c.green, `  ✓ ${filepath} assembled complete over ${chunk + 1} pass(es)`);
                 }
                 createdFiles.push({ path: filepath, content: fileContent });
             }

package/dist/lib/sprint-runner-engine.js CHANGED Viewed

@@ -79,6 +79,13 @@ const MAX_HOURS = 6; // kill orchestrator if it runs longer than this
 // Rate limiter: minimum gap between sprint executions (prevents burning Claude 5h limit)
 // Default: 30 min. Override via SPRINT_COOLDOWN_MINUTES env var.
 const COOLDOWN_MINUTES = parseInt(process.env.SPRINT_COOLDOWN_MINUTES ?? '30', 10);
+// TICKET-348 sprint-level backoff: a sprint whose run makes NO forward progress
+// (no pending task reached a terminal/done state) this many times IN A ROW is
+// auto-skipped as 'loop-stuck', so a permanently-failing sprint (e.g. one whose
+// files keep truncating) stops monopolising the runner and the selector advances
+// to other queued work. State lives in .swarm-state/sprint-backoff.json.
+const SPRINT_BACKOFF = (0, path_1.join)(ROOT, '.swarm-state', 'sprint-backoff.json');
+const SPRINT_BACKOFF_THRESHOLD = parseInt(process.env.SPRINT_BACKOFF_THRESHOLD ?? '2', 10);
 // Daily cap: max sprints per calendar day. Default: 100.
 const DAILY_SPRINT_CAP = parseInt(process.env.DAILY_SPRINT_CAP ?? '100', 10);
 // Rolling window cap: max sprints within the last N hours. Default: 20 per 5h.
@@ -354,6 +361,63 @@ function extractSprintNumber(filename) {
 // (Multi-session safety: prevents another Claude session reverting a local file
 // from causing the runner to re-execute paused/done work.)
 const NOTION_OVERRIDE_STATUSES = new Set(['skipped', 'blocked', 'done', 'done-manual', 'loop-stuck', 'rejected']);
+/**
+ * Load the sprint backoff ledger stored at SPRINT_BACKOFF.
+ *
+ * @returns {Object} The parsed ledger, keyed by sprint id. An empty object is
+ *   returned when the file cannot be read, is not valid JSON, or holds valid
+ *   JSON that is not a plain object.
+ */
+function readBackoff() {
+    try {
+        const parsed = JSON.parse((0, fs_1.readFileSync)(SPRINT_BACKOFF, 'utf8'));
+        // Valid JSON is not necessarily a ledger: `null` would make callers'
+        // `ledger[sprintId]` lookups throw, and an array or scalar cannot hold
+        // per-sprint entries that survive a JSON round-trip. Treat all of those
+        // as "no ledger yet" so backoff bookkeeping stays best-effort.
+        const isLedger = parsed !== null && typeof parsed === 'object' && !Array.isArray(parsed);
+        return isLedger ? parsed : {};
+    }
+    catch {
+        // Missing, unreadable, or malformed file: start from an empty ledger.
+        return {};
+    }
+}
+/**
+ * Persist the backoff ledger to SPRINT_BACKOFF.
+ *
+ * The payload is written to a per-process temp file next to the target and
+ * then renamed over it. Every failure is swallowed on purpose: backoff
+ * bookkeeping is best-effort and must never block a run.
+ *
+ * @param {Object} data - Ledger to serialise as pretty-printed JSON.
+ */
+function writeBackoff(data) {
+    try {
+        const stateDir = (0, path_1.join)(ROOT, '.swarm-state');
+        const stateDirMissing = !(0, fs_1.existsSync)(stateDir);
+        if (stateDirMissing) {
+            (0, fs_1.mkdirSync)(stateDir, { recursive: true });
+        }
+        // The pid suffix keeps each process on its own scratch file name.
+        const scratchFile = `${SPRINT_BACKOFF}.tmp.${process.pid}`;
+        const payload = JSON.stringify(data, null, 2);
+        (0, fs_1.writeFileSync)(scratchFile, payload);
+        (0, fs_1.renameSync)(scratchFile, SPRINT_BACKOFF);
+    }
+    catch {
+        /* backoff bookkeeping is best-effort — never block a run */
+    }
+}
+/**
+ * Count the tasks whose status is 'pending' in a sprint's MERGED view
+ * (as returned by loadSprintMerged for the given path).
+ *
+ * @param {string} sprintPath - Path of the sprint file to inspect.
+ * @returns {number} Number of pending tasks; 0 when the sprint has no task
+ *   list or when loading/inspecting it throws.
+ */
+function countPendingTasks(sprintPath) {
+    try {
+        const merged = (0, sprint_state_1.loadSprintMerged)(sprintPath);
+        const taskList = merged.tasks ?? [];
+        const stillPending = taskList.filter(({ status }) => status === 'pending');
+        return stillPending.length;
+    }
+    catch {
+        // Any failure is reported as "nothing pending".
+        return 0;
+    }
+}
+/**
+ * Report whether a sprint is currently backed off, so the selector skips it.
+ *
+ * @param {string} sprintId - Ledger key of the sprint.
+ * @returns {boolean} True when the ledger entry is flagged loop_stuck or its
+ *   no_progress count has reached SPRINT_BACKOFF_THRESHOLD; false otherwise,
+ *   including when the sprint has no ledger entry.
+ */
+function isBackedOff(sprintId) {
+    const ledger = readBackoff();
+    const entry = ledger[sprintId];
+    if (!entry) {
+        return false;
+    }
+    if (entry.loop_stuck === true) {
+        return true;
+    }
+    return entry.no_progress >= SPRINT_BACKOFF_THRESHOLD;
+}
+/**
+ * Post-run bookkeeping for sprint backoff.
+ *
+ * Progress means the pending count dropped during the run. On progress the
+ * sprint's ledger entry (if any) is removed. Otherwise the consecutive
+ * no-progress counter is incremented and, once it reaches
+ * SPRINT_BACKOFF_THRESHOLD, the entry is flagged loop_stuck.
+ *
+ * @param {string} sprintId - Ledger key of the sprint that just ran.
+ * @param {number} pendingBefore - Pending task count snapshotted before the run.
+ * @param {number} pendingAfter - Pending task count after the run.
+ */
+function recordSprintProgress(sprintId, pendingBefore, pendingAfter) {
+    const ledger = readBackoff();
+    const madeProgress = pendingAfter < pendingBefore;
+    if (madeProgress) {
+        // Only touch the file when there is a stale entry to clear.
+        if (!ledger[sprintId]) {
+            return;
+        }
+        delete ledger[sprintId];
+        writeBackoff(ledger);
+        return;
+    }
+    const streak = (ledger[sprintId]?.no_progress ?? 0) + 1;
+    const stuck = streak >= SPRINT_BACKOFF_THRESHOLD;
+    ledger[sprintId] = {
+        no_progress: streak,
+        last: new Date().toISOString(),
+        loop_stuck: stuck,
+    };
+    writeBackoff(ledger);
+    if (!stuck) {
+        log(`Backoff: ${sprintId} no progress this run (${streak}/${SPRINT_BACKOFF_THRESHOLD} before auto-skip).`);
+        return;
+    }
+    log(`⛔ Backoff: ${sprintId} made no progress ${streak}× in a row — marked loop-stuck (auto-skipped). Clear .swarm-state/sprint-backoff.json or fix the sprint to re-enable.`);
+}
 async function findPendingSprint() {
     if (!(0, fs_1.existsSync)(SPRINTS))
         return null;
@@ -404,6 +468,12 @@ async function findPendingSprint() {
                 log(`Skipped ${file}: Notion source-of-truth says '${notionStatus}' (overrides local pending)`);
                 continue;
             }
+            // TICKET-348: local backoff — skip a sprint that has made no forward
+            // progress N runs in a row (loop-stuck), so it can't monopolise the runner.
+            if (isBackedOff(sprintId)) {
+                log(`Skipped ${file}: backoff — no forward progress ${SPRINT_BACKOFF_THRESHOLD}× in a row (loop-stuck, auto-skipped)`);
+                continue;
+            }
             // Dependency check: respect depends_on_sprint — if the upstream sprint
             // has any non-terminal task, skip this one. Founder directive 2026-05-26:
             // swarm must never deadlock on a sprint whose prereqs haven't shipped.
@@ -828,6 +898,10 @@ async function runSprintCycle(opts) {
         return;
     }
     log(`Found pending sprint: ${sprintPath}`);
+    // TICKET-348: snapshot pending count before the run so we can detect whether
+    // this run made any forward progress (and apply backoff if it didn't).
+    const backoffSprintId = (0, path_1.basename)(sprintPath).replace(/\.json$/, '');
+    const pendingBefore = countPendingTasks(sprintPath);
     // TICKET-210: build the ACTIVE sprint from the MERGED view (source definition
     // + .swarm-state status), NOT raw source. The source file holds every task at
     // its authored status (usually 'pending'); reading it directly meant a sprint
@@ -1067,6 +1141,10 @@ async function runSprintCycle(opts) {
     catch {
         // non-fatal
     }
+    // TICKET-348: update sprint backoff. State is fully synced by now (ACTIVE→
+    // .swarm-state + forensic git-log recovery), so countPendingTasks reflects the
+    // post-run truth. No drop in pending = no progress = step toward loop-stuck.
+    recordSprintProgress(backoffSprintId, pendingBefore, countPendingTasks(sprintPath));
     // TICKET-201: post-sprint hook (e.g. dispatch-approved-proposals).
     // Supplied by the product entry so core stays product-agnostic.
     try {

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@kognai/orchestrator-core",
-  "version": "0.2.5",
+  "version": "0.2.7",
   "description": "Kognai sovereign orchestrator — core engine (template-agnostic). Shared by all products (Kognai/coding, Voxight/market-intel, Invoica/fin-compliance); each supplies only its template. Replaces per-repo forks of orchestrate-agents-v2 / sprint-runner / lib.",
   "license": "MIT",
   "author": "SkinGem",