npm - majlis - Versions diffs - 0.4.2 → 0.4.4 - Mend

majlis 0.4.2 → 0.4.4

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package versions as they appear in their respective public registries.

Files changed (2)

package/dist/cli.js +128 -41
package/package.json +1 -1

package/dist/cli.js CHANGED Viewed

@@ -2054,7 +2054,8 @@ var init_types = __esm({
     TRANSITIONS = {
       ["classified" /* CLASSIFIED */]: ["reframed" /* REFRAMED */, "building" /* BUILDING */],
       ["reframed" /* REFRAMED */]: ["building" /* BUILDING */],
-      ["building" /* BUILDING */]: ["built" /* BUILT */],
+      ["building" /* BUILDING */]: ["built" /* BUILT */, "building" /* BUILDING */],
+      // self-loop for retry after truncation
       ["built" /* BUILT */]: ["challenged" /* CHALLENGED */, "doubted" /* DOUBTED */],
       ["challenged" /* CHALLENGED */]: ["doubted" /* DOUBTED */, "verifying" /* VERIFYING */],
       ["doubted" /* DOUBTED */]: ["challenged" /* CHALLENGED */, "scouted" /* SCOUTED */, "verifying" /* VERIFYING */],
@@ -2305,22 +2306,23 @@ ${contextJson}
 ${taskPrompt}`;
   const turns = ROLE_MAX_TURNS[role] ?? 15;
-  console.log(`[majlis] Spawning ${role} agent (model: ${agentDef.model}, maxTurns: ${turns})...`);
-  const { text: markdown, costUsd } = await runQuery({
+  console.log(`[${role}] Spawning (model: ${agentDef.model}, maxTurns: ${turns})...`);
+  const { text: markdown, costUsd, truncated } = await runQuery({
     prompt,
     model: agentDef.model,
     tools: agentDef.tools,
     systemPrompt: agentDef.systemPrompt,
     cwd: root,
-    maxTurns: turns
+    maxTurns: turns,
+    label: role
   });
-  console.log(`[majlis] ${role} agent complete (cost: $${costUsd.toFixed(4)})`);
+  console.log(`[${role}] Complete (cost: $${costUsd.toFixed(4)}${truncated ? ", TRUNCATED" : ""})`);
   const artifactPath = writeArtifact(role, context, markdown, root);
   if (artifactPath) {
-    console.log(`[majlis] ${role} artifact written to ${artifactPath}`);
+    console.log(`[${role}] Artifact written to ${artifactPath}`);
   }
   const structured = await extractStructuredData(role, markdown);
-  return { output: markdown, structured };
+  return { output: markdown, structured, truncated };
 }
 async function spawnSynthesiser(context, projectRoot) {
   const root = projectRoot ?? findProjectRoot() ?? process.cwd();
@@ -2334,20 +2336,70 @@ ${contextJson}
 ${taskPrompt}`;
   const systemPrompt = 'You are a Synthesis Agent. Be concrete: which decisions failed, which assumptions broke, what constraints must the next approach satisfy. CRITICAL: Your LAST line of output MUST be a <!-- majlis-json --> block. The framework parses this programmatically \u2014 if you omit it, the pipeline breaks. Format: <!-- majlis-json {"guidance": "your guidance here"} -->';
-  console.log(`[majlis] Spawning synthesiser micro-agent...`);
-  const { text: markdown, costUsd } = await runQuery({
+  console.log(`[synthesiser] Spawning (maxTurns: 5)...`);
+  const { text: markdown, costUsd, truncated } = await runQuery({
     prompt,
     model: "opus",
     tools: ["Read", "Glob", "Grep"],
     systemPrompt,
     cwd: root,
-    maxTurns: 5
+    maxTurns: 5,
+    label: "synthesiser"
   });
-  console.log(`[majlis] Synthesiser complete (cost: $${costUsd.toFixed(4)})`);
-  const structured = await extractStructuredData("synthesiser", markdown);
-  return { output: markdown, structured };
+  console.log(`[synthesiser] Complete (cost: $${costUsd.toFixed(4)})`);
+  return { output: markdown, structured: { guidance: markdown }, truncated };
+}
+async function spawnRecovery(role, partialOutput, context, projectRoot) {
+  const root = projectRoot ?? findProjectRoot() ?? process.cwd();
+  const expSlug = context.experiment?.slug ?? "unknown";
+  console.log(`[recovery] Cleaning up after truncated ${role} for ${expSlug}...`);
+  const expDocPath = path7.join(
+    root,
+    "docs",
+    "experiments",
+    `${String(context.experiment?.id ?? 0).padStart(3, "0")}-${expSlug}.md`
+  );
+  const templatePath = path7.join(root, "docs", "experiments", "_TEMPLATE.md");
+  const template = fs7.existsSync(templatePath) ? fs7.readFileSync(templatePath, "utf-8") : "";
+  const currentDoc = fs7.existsSync(expDocPath) ? fs7.readFileSync(expDocPath, "utf-8") : "";
+  const prompt = `The ${role} agent was truncated (hit max turns) while working on experiment "${expSlug}".
+Here is the partial agent output (reasoning + tool calls):
+<partial_output>
+${partialOutput.slice(-3e3)}
+</partial_output>
+Here is the current experiment doc:
+<current_doc>
+${currentDoc}
+</current_doc>
+Here is the template that the experiment doc should follow:
+<template>
+${template}
+</template>
+Your job: Write a CLEAN experiment doc to ${expDocPath} using the Write tool.
+- Keep any valid content from the current doc
+- Fill in what you can infer from the partial output
+- Mark incomplete sections with "[TRUNCATED \u2014 ${role} did not finish]"
+- The doc MUST have the <!-- majlis-json --> block, even if decisions are empty
+- Do NOT include agent reasoning or thinking \u2014 only structured experiment content
+- Be concise. This is cleanup, not new work.`;
+  const { text: _markdown } = await runQuery({
+    prompt,
+    model: "haiku",
+    tools: ["Read", "Write"],
+    systemPrompt: `You are a Recovery Agent. You clean up experiment docs after truncated agent runs. Write clean, structured docs. Never include agent reasoning or monologue.`,
+    cwd: root,
+    maxTurns: 5,
+    label: "recovery"
+  });
+  console.log(`[recovery] Cleanup complete for ${expSlug}.`);
 }
 async function runQuery(opts) {
+  let truncated = false;
+  const tag = opts.label ?? "majlis";
   const conversation = (0, import_claude_agent_sdk2.query)({
     prompt: opts.prompt,
     options: {
@@ -2381,36 +2433,37 @@ async function runQuery(opts) {
           const toolName = block.name ?? "tool";
           const input = block.input ?? {};
           const detail = formatToolDetail(toolName, input);
-          process.stderr.write(`${DIM2}[majlis]   ${CYAN2}${toolName}${RESET2}${DIM2}${detail}${RESET2}
+          process.stderr.write(`${DIM2}[${tag}]   ${CYAN2}${toolName}${RESET2}${DIM2}${detail}${RESET2}
 `);
         }
       }
       if (hasText) {
         const preview = textParts[textParts.length - 1].slice(0, 120).replace(/\n/g, " ").trim();
         if (preview) {
-          process.stderr.write(`${DIM2}[majlis]   writing: ${preview}${preview.length >= 120 ? "..." : ""}${RESET2}
+          process.stderr.write(`${DIM2}[${tag}]   writing: ${preview}${preview.length >= 120 ? "..." : ""}${RESET2}
 `);
         }
       }
     } else if (message.type === "tool_progress") {
       const elapsed = Math.round(message.elapsed_time_seconds);
       if (elapsed > 0 && elapsed % 5 === 0) {
-        process.stderr.write(`${DIM2}[majlis]   ${message.tool_name} running (${elapsed}s)...${RESET2}
+        process.stderr.write(`${DIM2}[${tag}]   ${message.tool_name} running (${elapsed}s)...${RESET2}
 `);
       }
     } else if (message.type === "result") {
       if (message.subtype === "success") {
         costUsd = message.total_cost_usd;
       } else if (message.subtype === "error_max_turns") {
+        truncated = true;
         costUsd = "total_cost_usd" in message ? message.total_cost_usd : 0;
-        console.warn(`[majlis] Agent hit max turns (${turnCount}). Returning partial output.`);
+        console.warn(`[${tag}] Hit max turns (${turnCount}). Returning partial output.`);
       } else {
         const errors = "errors" in message ? message.errors?.join("; ") ?? "Unknown error" : "Unknown error";
         throw new Error(`Agent query failed (${message.subtype}): ${errors}`);
       }
     }
   }
-  return { text: textParts.join("\n\n"), costUsd };
+  return { text: textParts.join("\n\n"), costUsd, truncated };
 }
 function formatToolDetail(toolName, input) {
   switch (toolName) {
@@ -2444,19 +2497,14 @@ function writeArtifact(role, context, markdown, projectRoot) {
   };
   const dir = dirMap[role];
   if (!dir) return null;
+  if (role === "builder" || role === "compressor") return null;
   const fullDir = path7.join(projectRoot, dir);
   if (!fs7.existsSync(fullDir)) {
     fs7.mkdirSync(fullDir, { recursive: true });
   }
-  if (role === "compressor") {
-    const target2 = path7.join(fullDir, "current.md");
-    fs7.writeFileSync(target2, markdown);
-    return target2;
-  }
   const expSlug = context.experiment?.slug ?? "general";
-  const existing = fs7.readdirSync(fullDir).filter((f) => f.endsWith(".md") && !f.startsWith("_"));
-  const nextNum = String(existing.length + 1).padStart(3, "0");
-  const filename = role === "builder" ? `${nextNum}-${expSlug}.md` : `${nextNum}-${role}-${expSlug}.md`;
+  const nextNum = String(context.experiment?.id ?? 1).padStart(3, "0");
+  const filename = `${nextNum}-${role}-${expSlug}.md`;
   const target = path7.join(fullDir, filename);
   fs7.writeFileSync(target, markdown);
   return target;
@@ -2472,12 +2520,12 @@ var init_spawn = __esm({
     init_connection();
     ROLE_MAX_TURNS = {
       builder: 50,
-      critic: 12,
-      adversary: 12,
-      verifier: 15,
-      compressor: 15,
-      reframer: 12,
-      scout: 12
+      critic: 30,
+      adversary: 30,
+      verifier: 50,
+      compressor: 30,
+      reframer: 20,
+      scout: 20
     };
     DIM2 = "\x1B[2m";
     RESET2 = "\x1B[0m";
@@ -2493,9 +2541,19 @@ function worstGrade(grades) {
   return "sound";
 }
 async function resolve(db, exp, projectRoot) {
-  const grades = getVerificationsByExperiment(db, exp.id);
+  let grades = getVerificationsByExperiment(db, exp.id);
   if (grades.length === 0) {
-    throw new Error(`No verifications found for experiment ${exp.slug}. Run verify first.`);
+    warn(`No verification records for ${exp.slug}. Defaulting to weak.`);
+    insertVerification(
+      db,
+      exp.id,
+      "auto-default",
+      "weak",
+      null,
+      null,
+      "No structured verification output. Auto-defaulted to weak."
+    );
+    grades = getVerificationsByExperiment(db, exp.id);
   }
   const overallGrade = worstGrade(grades);
   switch (overallGrade) {
@@ -2678,8 +2736,16 @@ ${builderGuidance}
 Build the experiment: ${exp.hypothesis}` : `Build the experiment: ${exp.hypothesis}`
   }, root);
   ingestStructuredOutput(db, exp.id, result.structured);
-  updateExperimentStatus(db, exp.id, "built");
-  success(`Build complete for ${exp.slug}. Run \`majlis doubt\` or \`majlis challenge\` next.`);
+  if (result.truncated && !result.structured) {
+    warn(`Builder was truncated (hit max turns) without producing structured output.`);
+    await spawnRecovery("builder", result.output, {
+      experiment: { id: exp.id, slug: exp.slug, hypothesis: exp.hypothesis, status: "building", sub_type: exp.sub_type, builder_guidance: null }
+    }, root);
+    warn(`Experiment stays at 'building'. Run \`majlis build\` to retry or \`majlis revert\` to abandon.`);
+  } else {
+    updateExperimentStatus(db, exp.id, "built");
+    success(`Build complete for ${exp.slug}. Run \`majlis doubt\` or \`majlis challenge\` next.`);
+  }
 }
 async function doChallenge(db, exp, root) {
   transition(exp.status, "challenged" /* CHALLENGED */);
@@ -2695,8 +2761,12 @@ async function doChallenge(db, exp, root) {
     taskPrompt: `Construct adversarial test cases for experiment ${exp.slug}: ${exp.hypothesis}`
   }, root);
   ingestStructuredOutput(db, exp.id, result.structured);
-  updateExperimentStatus(db, exp.id, "challenged");
-  success(`Challenge complete for ${exp.slug}. Run \`majlis doubt\` or \`majlis verify\` next.`);
+  if (result.truncated && !result.structured) {
+    warn(`Adversary was truncated without structured output. Experiment stays at current status.`);
+  } else {
+    updateExperimentStatus(db, exp.id, "challenged");
+    success(`Challenge complete for ${exp.slug}. Run \`majlis doubt\` or \`majlis verify\` next.`);
+  }
 }
 async function doDoubt(db, exp, root) {
   transition(exp.status, "doubted" /* DOUBTED */);
@@ -2713,8 +2783,12 @@ async function doDoubt(db, exp, root) {
     taskPrompt: `Doubt the work in experiment ${exp.slug}: ${exp.hypothesis}. Produce a doubt document with evidence for each doubt.`
   }, root);
   ingestStructuredOutput(db, exp.id, result.structured);
-  updateExperimentStatus(db, exp.id, "doubted");
-  success(`Doubt pass complete for ${exp.slug}. Run \`majlis challenge\` or \`majlis verify\` next.`);
+  if (result.truncated && !result.structured) {
+    warn(`Critic was truncated without structured output. Experiment stays at current status.`);
+  } else {
+    updateExperimentStatus(db, exp.id, "doubted");
+    success(`Doubt pass complete for ${exp.slug}. Run \`majlis challenge\` or \`majlis verify\` next.`);
+  }
 }
 async function doScout(db, exp, root) {
   transition(exp.status, "scouted" /* SCOUTED */);
@@ -2762,6 +2836,10 @@ async function doVerify(db, exp, root) {
     taskPrompt: `Verify experiment ${exp.slug}: ${exp.hypothesis}. Check provenance and content. Test the ${doubts.length} doubt(s) and any adversarial challenges.`
   }, root);
   ingestStructuredOutput(db, exp.id, result.structured);
+  if (result.truncated && !result.structured) {
+    warn(`Verifier was truncated without structured output. Experiment stays at 'verifying'.`);
+    return;
+  }
   if (result.structured?.doubt_resolutions) {
     for (const dr of result.structured.doubt_resolutions) {
       if (dr.doubt_id && dr.resolution) {
@@ -3241,7 +3319,16 @@ async function run(args) {
       continue;
     }
     info(`[Step ${stepCount}] ${exp.slug}: ${exp.status}`);
-    await next([exp.slug], false);
+    try {
+      await next([exp.slug], false);
+    } catch (err) {
+      const message = err instanceof Error ? err.message : String(err);
+      warn(`Step failed for ${exp.slug}: ${message}`);
+      try {
+        updateExperimentStatus(db, exp.id, "dead_end");
+      } catch {
+      }
+    }
   }
   if (stepCount >= MAX_STEPS) {
     warn(`Reached max steps (${MAX_STEPS}). Stopping autonomous mode.`);

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "majlis",
-  "version": "0.4.2",
+  "version": "0.4.4",
   "description": "Multi-agent workflow CLI for structured doubt, independent verification, and compressed knowledge",
   "bin": {
     "majlis": "./dist/cli.js"