npm - chainlesschain - Versions diffs - 0.45.81 → 0.46.0 - Mend

chainlesschain 0.45.81 → 0.46.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (25) hide show

package/bin/chainlesschain.js +0 -0
package/package.json +1 -1
package/src/assets/web-panel/.build-hash +1 -1
package/src/assets/web-panel/assets/{AppLayout-YdvJBMHH.js → AppLayout-BnvARObz.js} +1 -1
package/src/assets/web-panel/assets/Cowork-B8ZDdRm4.js +7 -0
package/src/assets/web-panel/assets/Cowork-CXuhlHew.css +1 -0
package/src/assets/web-panel/assets/Dashboard-CKeMmCoT.css +1 -0
package/src/assets/web-panel/assets/{Dashboard-HPh9FcPt.js → Dashboard-jt6XPIjB.js} +2 -2
package/src/assets/web-panel/assets/{index-ByUk2Wmr.js → index-C1SPm_5l.js} +2 -2
package/src/assets/web-panel/index.html +1 -1
package/src/commands/cowork.js +695 -0
package/src/gateways/ws/action-protocol.js +42 -2
package/src/lib/cowork-cron.js +474 -0
package/src/lib/cowork-learning.js +438 -0
package/src/lib/cowork-mcp-tools.js +182 -0
package/src/lib/cowork-share.js +218 -0
package/src/lib/cowork-task-runner.js +317 -3
package/src/lib/cowork-task-templates.js +101 -13
package/src/lib/cowork-template-marketplace.js +205 -0
package/src/lib/cowork-workflow.js +571 -0
package/src/lib/sub-agent-context.js +40 -0
package/src/lib/workflow-expr.js +318 -0
package/src/assets/web-panel/assets/Cowork-BnrHWwZw.js +0 -7
package/src/assets/web-panel/assets/Cowork-CcSoS3eX.css +0 -1
package/src/assets/web-panel/assets/Dashboard-BS-tzGNj.css +0 -1

package/src/lib/cowork-learning.js ADDED Viewed

@@ -0,0 +1,438 @@
+/**
+ * Cowork Learning Engine — analyze historical runs to optimize template
+ * selection, surface failure patterns, and recommend templates for new
+ * prompts based on past outcomes.
+ *
+ * Reads `.chainlesschain/cowork/history.jsonl` produced by the runner.
+ * Records have shape:
+ *   { taskId, status, templateId, templateName, result, userMessage, timestamp }
+ * where result = { summary, tokenCount, toolsUsed, iterationCount, artifacts }.
+ *
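+ * The analysis functions are pure and synchronous over the in-memory record
+ * list. The few functions that touch disk (loading history, reading and
+ * writing user templates) go through the injectable `_deps` object, so the
+ * module is trivially testable with a stubbed fs.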
+ *
+ * @module cowork-learning
+ */
+import {
+  existsSync,
+  readFileSync,
+  writeFileSync,
+  mkdirSync,
+  appendFileSync,
+} from "node:fs";
+import { join } from "node:path";
/**
 * Injectable side-effect seams. The filesystem calls and clock reads made by
 * this module go through this object so tests can substitute stubs.
 */
export const _deps = {
  existsSync,
  readFileSync,
  writeFileSync,
  mkdirSync,
  appendFileSync,
  now() {
    return new Date();
  },
};

/** A template needs at least this many recorded runs before a patch is suggested. */
export const MIN_RUNS_FOR_PATCH = 10;

/** A template needs at least this many recorded failures before a patch is suggested. */
export const MIN_FAILURES_FOR_PATCH = 3;
+// ─── Loading ─────────────────────────────────────────────────────────────────
/**
 * Read `.chainlesschain/cowork/history.jsonl` under `cwd` and return its
 * records as an array.
 *
 * Returns [] when the file is missing. Blank lines and lines that are not
 * valid JSON are skipped. Lines that parse to something other than a plain
 * object (`null`, numbers, strings, arrays) are skipped too, because every
 * consumer dereferences record fields such as `rec.templateId`.
 *
 * @param {string} cwd - Project root containing the `.chainlesschain` folder
 * @returns {Array<object>}
 */
export function loadHistory(cwd) {
  const file = join(cwd, ".chainlesschain", "cowork", "history.jsonl");
  if (!_deps.existsSync(file)) return [];
  const raw = _deps.readFileSync(file, "utf-8");
  const records = [];
  for (const line of raw.split("\n")) {
    // trim() also strips the "\r" left behind by CRLF line endings
    const trimmed = line.trim();
    if (!trimmed) continue;
    let parsed;
    try {
      parsed = JSON.parse(trimmed);
    } catch (_e) {
      // Malformed line — best-effort loader, keep going
      continue;
    }
    const isRecord =
      parsed !== null && typeof parsed === "object" && !Array.isArray(parsed);
    if (isRecord) records.push(parsed);
  }
  return records;
}
+// ─── Stats ───────────────────────────────────────────────────────────────────
/**
 * Aggregate per-template stats across all runs.
 *
 * Records are grouped by `templateId` (falling back to "unknown"). A run
 * counts as a success only when `status === "completed"`; every other status
 * counts as a failure. Entries that are not objects are ignored, and
 * `tokenCount` / `iterationCount` values that are not finite numbers
 * contribute 0 so one bad record cannot turn the averages into NaN.
 * `toolsUsed` is only counted when it is an array.
 *
 * The result is sorted by `runs` descending, then `successRate` descending.
 *
 * @param {Iterable<object>|null|undefined} history
 * @returns {Array<{
 *   templateId: string,
 *   templateName: string,
 *   runs: number,
 *   successes: number,
 *   failures: number,
 *   successRate: number,  // 0..1
 *   avgTokens: number,
 *   avgIterations: number,
 *   topTools: Array<{ tool: string, count: number }>,
 *   lastRunAt: string|null,
 * }>}
 */
export function computeTemplateStats(history) {
  const toFinite = (value) => {
    const n = Number(value);
    return Number.isFinite(n) ? n : 0;
  };
  const groups = new Map();
  for (const rec of history ?? []) {
    if (rec === null || typeof rec !== "object") continue;
    const id = rec.templateId || "unknown";
    let g = groups.get(id);
    if (!g) {
      g = {
        templateId: id,
        templateName: rec.templateName || id,
        runs: 0,
        successes: 0,
        failures: 0,
        totalTokens: 0,
        totalIterations: 0,
        toolCounts: new Map(),
        lastRunAt: null,
      };
      groups.set(id, g);
    }
    g.runs += 1;
    if (rec.status === "completed") g.successes += 1;
    else g.failures += 1;
    const r = rec.result || {};
    g.totalTokens += toFinite(r.tokenCount);
    g.totalIterations += toFinite(r.iterationCount);
    if (Array.isArray(r.toolsUsed)) {
      for (const t of r.toolsUsed) {
        g.toolCounts.set(t, (g.toolCounts.get(t) || 0) + 1);
      }
    }
    // Timestamps are compared as given (lexicographic for ISO-8601 strings)
    if (rec.timestamp && (!g.lastRunAt || rec.timestamp > g.lastRunAt)) {
      g.lastRunAt = rec.timestamp;
    }
  }
  const result = [];
  for (const g of groups.values()) {
    const topTools = [...g.toolCounts.entries()]
      .sort((a, b) => b[1] - a[1])
      .slice(0, 5)
      .map(([tool, count]) => ({ tool, count }));
    result.push({
      templateId: g.templateId,
      templateName: g.templateName,
      runs: g.runs,
      successes: g.successes,
      failures: g.failures,
      successRate: g.runs > 0 ? g.successes / g.runs : 0,
      avgTokens: g.runs > 0 ? Math.round(g.totalTokens / g.runs) : 0,
      avgIterations: g.runs > 0 ? +(g.totalIterations / g.runs).toFixed(1) : 0,
      topTools,
      lastRunAt: g.lastRunAt,
    });
  }
  // Sort by runs desc, then successRate desc
  result.sort((a, b) => b.runs - a.runs || b.successRate - a.successRate);
  return result;
}
+// ─── Recommendation ──────────────────────────────────────────────────────────
/**
 * Break a string into lowercased tokens.
 *
 * The text is lowercased and split on every run of characters that are
 * neither Unicode letters (`\p{L}`) nor Unicode numbers (`\p{N}`); empty
 * fragments are dropped. Non-string or empty input yields [].
 */
function tokenize(text) {
  if (typeof text !== "string" || text === "") return [];
  const fragments = text.toLowerCase().split(/[^\p{L}\p{N}]+/u);
  return fragments.filter((fragment) => fragment.length > 0);
}
/**
 * Recommend the best template for a new user message based on history.
 *
 * Scoring: for each historical record of a successful run, count how many of
 * its userMessage tokens also occur in the query, and sum those counts per
 * template. A template's score is
 * `cumulativeOverlap * (0.5 + successRate / 2)`; the highest score wins and
 * the first template seen wins ties.
 *
 * Candidates are compared on the unrounded score. The returned `score` is
 * rounded to two decimals for display only — comparing against the rounded
 * value could let a lower-scoring template replace a higher-scoring one.
 *
 * @param {string} userMessage
 * @param {Array<object>} history
 * @param {object} [options]
 * @param {number} [options.minRuns] - Only consider templates with at least this many runs
 * @returns {{ templateId: string, score: number, confidence: number, reasons: string[] } | null}
 *   null when the query has no tokens or no qualifying template overlaps it.
 */
export function recommendTemplate(userMessage, history, options = {}) {
  const { minRuns = 1 } = options ?? {};
  const queryTokens = new Set(tokenize(userMessage));
  if (queryTokens.size === 0) return null;
  const stats = computeTemplateStats(history);
  const statsById = new Map(stats.map((s) => [s.templateId, s]));
  const scores = new Map(); // templateId -> cumulative overlap
  for (const rec of history) {
    if (rec.status !== "completed") continue;
    const id = rec.templateId || "unknown";
    const histTokens = tokenize(rec.userMessage || "");
    let overlap = 0;
    for (const t of histTokens) {
      if (queryTokens.has(t)) overlap += 1;
    }
    if (overlap > 0) {
      scores.set(id, (scores.get(id) || 0) + overlap);
    }
  }
  let best = null;
  let bestRawScore = -Infinity;
  for (const [templateId, overlap] of scores) {
    const s = statsById.get(templateId);
    if (!s || s.runs < minRuns) continue;
    const rawScore = overlap * (0.5 + s.successRate / 2);
    // Strict comparison keeps the earliest template on ties
    if (rawScore <= bestRawScore) continue;
    bestRawScore = rawScore;
    best = {
      templateId,
      score: +rawScore.toFixed(2),
      confidence: +s.successRate.toFixed(2),
      reasons: [
        `${overlap} overlapping token(s) with past runs`,
        `${s.successes}/${s.runs} past successes (${Math.round(s.successRate * 100)}%)`,
      ],
    };
  }
  return best;
}
+// ─── Failure analysis ────────────────────────────────────────────────────────
/**
 * Group failures by template and surface the most common failure summaries.
 *
 * Every record whose status is not "completed" counts as a failure. Entries
 * that are not objects are ignored. Summaries and user messages are coerced
 * to strings and clipped to 200 characters, so a non-string value in a
 * history record cannot throw. Empty summaries are not tallied in
 * `commonSummaries`. Results are sorted by `failureCount` descending.
 *
 * @param {Iterable<object>|null|undefined} history
 * @param {object} [options]
 * @param {number} [options.limit] - Max examples per template (default 3)
 * @returns {Array<{
 *   templateId: string,
 *   templateName: string,
 *   failureCount: number,
 *   commonSummaries: Array<{ summary: string, count: number }>,
 *   examples: Array<{ taskId: string, userMessage: string, summary: string, timestamp: string }>,
 * }>}
 */
export function summarizeFailures(history, options = {}) {
  const { limit = 3 } = options ?? {};
  // Falsy values become "", everything else is stringified before clipping
  const clip = (value) => (value ? String(value).slice(0, 200) : "");
  const groups = new Map();
  for (const rec of history ?? []) {
    if (rec === null || typeof rec !== "object") continue;
    if (rec.status === "completed") continue;
    const id = rec.templateId || "unknown";
    let g = groups.get(id);
    if (!g) {
      g = {
        templateId: id,
        templateName: rec.templateName || id,
        failureCount: 0,
        summaryCounts: new Map(),
        examples: [],
      };
      groups.set(id, g);
    }
    g.failureCount += 1;
    const summary = clip(rec.result?.summary);
    if (summary) {
      g.summaryCounts.set(summary, (g.summaryCounts.get(summary) || 0) + 1);
    }
    if (g.examples.length < limit) {
      g.examples.push({
        taskId: rec.taskId,
        userMessage: clip(rec.userMessage),
        summary,
        timestamp: rec.timestamp || "",
      });
    }
  }
  const out = [];
  for (const g of groups.values()) {
    const commonSummaries = [...g.summaryCounts.entries()]
      .sort((a, b) => b[1] - a[1])
      .slice(0, 5)
      .map(([summary, count]) => ({ summary, count }));
    out.push({
      templateId: g.templateId,
      templateName: g.templateName,
      failureCount: g.failureCount,
      commonSummaries,
      examples: g.examples,
    });
  }
  out.sort((a, b) => b.failureCount - a.failureCount);
  return out;
}
+// ─── N2: Feedback loop — suggest + apply prompt patches ──────────────────────
/**
 * Map a template's sample size and failure rate to a confidence label.
 *
 * Tiers are checked from strictest to loosest:
 *   - "high":   at least 30 runs and a failure rate of at least 40%
 *   - "medium": at least 20 runs and a failure rate of at least 25%
 *   - "low":    everything else
 * The original comment states that these thresholds mirror the design doc
 * 87-cowork-evolution-n1-n7.md.
 */
function _classifyConfidence(runs, failures) {
  const failureRate = runs > 0 ? failures / runs : 0;
  const tiers = [
    { label: "high", minRuns: 30, minRate: 0.4 },
    { label: "medium", minRuns: 20, minRate: 0.25 },
  ];
  const matched = tiers.find(
    (tier) => runs >= tier.minRuns && failureRate >= tier.minRate,
  );
  return matched ? matched.label : "low";
}
/**
 * Pick the most frequent words out of a batch of failure summaries — a cheap
 * heuristic that needs no LLM.
 *
 * Each summary is lowercased and split on non-letter/non-number characters.
 * Words shorter than 4 characters are ignored. Every remaining word is
 * weighted by the summary's `count` (1 when absent or zero). The `maxHints`
 * heaviest words are returned; words with equal weight keep first-seen order.
 *
 * @param {Array<{ summary?: string, count?: number }|null>} summaries
 * @param {number} [maxHints]
 * @returns {string[]}
 */
function _extractHintPhrases(summaries, maxHints = 3) {
  const weightByWord = new Map();
  for (const entry of summaries) {
    const text = (entry?.summary || "").toLowerCase();
    if (text === "") continue;
    const weight = entry.count || 1;
    const words = text.split(/[^\p{L}\p{N}]+/u).filter((w) => w.length >= 4);
    words.forEach((w) => {
      weightByWord.set(w, (weightByWord.get(w) || 0) + weight);
    });
  }
  const ranked = Array.from(weightByWord);
  ranked.sort((left, right) => right[1] - left[1]);
  return ranked.slice(0, maxHints).map((pair) => pair[0]);
}
/**
 * Compose a prompt patch for a single template from its stats entry and its
 * failure-analysis entry.
 *
 * Returns null when either entry is missing, when the template has fewer
 * than MIN_RUNS_FOR_PATCH runs, or fewer than MIN_FAILURES_FOR_PATCH
 * failures. Otherwise the patch text states the failure ratio and, when hint
 * words could be extracted from the common summaries, lists them.
 *
 * @param {object} statsEntry - One element of `computeTemplateStats` output
 * @param {object} failureEntry - One element of `summarizeFailures` output
 * @returns {object|null}
 */
export function buildPatchForTemplate(statsEntry, failureEntry) {
  const belowThreshold =
    !statsEntry ||
    !failureEntry ||
    statsEntry.runs < MIN_RUNS_FOR_PATCH ||
    failureEntry.failureCount < MIN_FAILURES_FOR_PATCH;
  if (belowThreshold) return null;

  const { templateId, templateName, runs } = statsEntry;
  const { failureCount, commonSummaries } = failureEntry;
  const hints = _extractHintPhrases(commonSummaries);
  const confidence = _classifyConfidence(runs, failureCount);

  const sentences = [
    `Historical failure pattern detected (${failureCount}/${runs} runs failed).`,
  ];
  if (hints.length > 0) {
    sentences.push(
      `Common terms in failures: ${hints.join(", ")}. When relevant, double-check assumptions around these areas before proceeding.`,
    );
  }

  return {
    templateId,
    templateName,
    runs,
    failures: failureCount,
    failureRate: +(failureCount / runs).toFixed(2),
    confidence,
    patch: sentences.join(" "),
    hints,
    sampleSummaries: commonSummaries.slice(0, 3),
  };
}
/**
 * Walk the history and produce at most one suggested patch per template.
 *
 * Templates without any recorded failure, and templates for which
 * `buildPatchForTemplate` returns nothing, are left out. The list is ordered
 * by confidence (high, medium, low) and then by failure count, largest first.
 * This function does not write anything itself; persisting a suggestion is
 * done by `applyPromptPatch`.
 *
 * @param {Array<object>} history
 * @returns {Array<{
 *   templateId, templateName, runs, failures, failureRate,
 *   confidence, patch, hints, sampleSummaries,
 * }>}
 */
export function suggestPromptPatch(history) {
  const stats = computeTemplateStats(history);
  const failureIndex = new Map();
  for (const entry of summarizeFailures(history)) {
    failureIndex.set(entry.templateId, entry);
  }

  const suggestions = stats.flatMap((statsEntry) => {
    const failureEntry = failureIndex.get(statsEntry.templateId);
    if (!failureEntry) return [];
    const candidate = buildPatchForTemplate(statsEntry, failureEntry);
    return candidate ? [candidate] : [];
  });

  const rank = { high: 3, medium: 2, low: 1 };
  suggestions.sort((left, right) => {
    const byConfidence = rank[right.confidence] - rank[left.confidence];
    return byConfidence || right.failures - left.failures;
  });
  return suggestions;
}
/** Path of the directory that holds user-override template JSON files under `cwd`. */
function _userTemplatesDir(cwd) {
  const segments = [".chainlesschain", "cowork", "user-templates"];
  return join(cwd, ...segments);
}
/** Path of the JSONL file that records applied learning patches under `cwd`. */
function _patchesLogFile(cwd) {
  const segments = [".chainlesschain", "cowork", "learning-patches.jsonl"];
  return join(cwd, ...segments);
}
/**
 * Load an existing user-override template JSON.
 *
 * Returns null when the file does not exist, cannot be read or parsed, or
 * when `templateId` contains a path separator. The id is interpolated into a
 * file name, so an id such as "../../x" would otherwise resolve outside the
 * user-templates directory.
 *
 * @param {string} cwd
 * @param {string} templateId
 * @returns {object|null}
 */
export function loadUserTemplate(cwd, templateId) {
  // Refuse ids that could escape the user-templates directory
  if (/[\\/]/.test(String(templateId))) return null;
  const file = join(_userTemplatesDir(cwd), `${templateId}.json`);
  if (!_deps.existsSync(file)) return null;
  try {
    return JSON.parse(_deps.readFileSync(file, "utf-8"));
  } catch (_e) {
    // Unreadable or corrupt override — treated the same as "no override"
    return null;
  }
}
/**
 * Persist a patch to the user-templates layer and append an audit record.
 *
 * Writes `<user-templates>/<templateId>.json` and appends one JSON line to
 * the learning-patches log; it does not write anywhere else. Always
 * additive — when an override already exists, the new patch text is appended
 * to its `systemPromptExtension` after a blank line so earlier patches are
 * preserved.
 *
 * The template file's `updatedAt` and the audit record's `appliedAt` share a
 * single timestamp so the two can be correlated.
 *
 * @param {string} cwd
 * @param {object} patch - output from `suggestPromptPatch`
 * @returns {{ templateId, file, systemPromptExtension }}
 * @throws {Error} when `patch.templateId` is missing or contains a path
 *   separator, or when `patch.patch` is not a non-empty string
 */
export function applyPromptPatch(cwd, patch) {
  if (!patch || !patch.templateId) {
    throw new Error("patch must include templateId");
  }
  // The id becomes a file name; a separator would let it escape the directory
  if (/[\\/]/.test(String(patch.templateId))) {
    throw new Error("patch.templateId must not contain path separators");
  }
  // Without this, a missing body would be persisted as the text "undefined"
  if (typeof patch.patch !== "string" || patch.patch.trim() === "") {
    throw new Error("patch must include non-empty patch text");
  }
  const dir = _userTemplatesDir(cwd);
  _deps.mkdirSync(dir, { recursive: true });
  const existing = loadUserTemplate(cwd, patch.templateId);
  const prev = existing?.systemPromptExtension || "";
  const extended = prev ? `${prev}\n\n${patch.patch}` : patch.patch;
  const appliedAt = _deps.now().toISOString();
  const doc = {
    templateId: patch.templateId,
    templateName: patch.templateName,
    systemPromptExtension: extended,
    updatedAt: appliedAt,
  };
  const file = join(dir, `${patch.templateId}.json`);
  _deps.writeFileSync(file, JSON.stringify(doc, null, 2), "utf-8");
  // Audit trail — never pruned automatically
  _deps.appendFileSync(
    _patchesLogFile(cwd),
    `${JSON.stringify({
      appliedAt,
      templateId: patch.templateId,
      confidence: patch.confidence,
      runs: patch.runs,
      failures: patch.failures,
      patch: patch.patch,
    })}\n`,
    "utf-8",
  );
  return {
    templateId: patch.templateId,
    file,
    systemPromptExtension: extended,
  };
}

package/src/lib/cowork-mcp-tools.js ADDED Viewed

@@ -0,0 +1,182 @@
+/**
+ * Cowork Template MCP Tools — mount a template's declared MCP servers and
+ * expose their tools to the sub-agent's LLM.
+ *
+ * A template can declare `mcpServers: [{ name, command, args, env, cwd }]`
+ * (same shape accepted by skill-mcp's validateMcpServerConfig). At task
+ * start we spawn an MCPClient, connect each server, list their tools, and
+ * build three parallel maps the agent-core runtime already consumes:
+ *
+ *  - `extraToolDefinitions`    — OpenAI-style function definitions appended
+ *    to the tool list the LLM sees.
+ *  - `externalToolDescriptors` — descriptor metadata keyed by tool name.
+ *  - `externalToolExecutors`   — { kind: "mcp", serverName, toolName } routing
+ *    handles that agent-core's default-case switch dispatches through
+ *    `mcpClient.callTool(serverName, toolName, args)`.
+ *
+ * Tool names are prefixed `mcp__<serverName>__<toolName>` to avoid collisions
+ * across servers and with built-in AGENT_TOOLS.
+ *
+ * @module cowork-mcp-tools
+ */
+import { validateMcpServerConfig } from "./skill-mcp.js";
/**
 * Injectable dependencies. `importMcpClient` loads the MCP client module on
 * demand with a dynamic import and resolves to its `MCPClient` export.
 */
export const _deps = {
  async importMcpClient() {
    const { MCPClient } = await import("../harness/mcp-client.js");
    return MCPClient;
  },
};
/**
 * Compose the namespaced wire name for an MCP tool:
 * `mcp__<serverName>__<toolName>`.
 */
export function buildToolName(serverName, toolName) {
  const prefix = "mcp";
  const separator = "__";
  return `${prefix}${separator}${serverName}${separator}${toolName}`;
}
/**
 * Translate one MCP tool (an entry of a tools/list result) into the three
 * shapes that are registered for it: a function definition, a descriptor and
 * an executor routing handle.
 *
 * The definition and descriptor carry the namespaced wire name; the executor
 * keeps the original server and tool names. A missing description falls back
 * to a generated sentence, and a missing input schema falls back to an
 * object schema with no properties.
 *
 * @param {string} serverName
 * @param {{ name: string, description?: string, inputSchema?: object }} tool
 * @returns {{ definition: object, descriptor: object, executor: object }}
 */
export function toAgentTool(serverName, tool) {
  const { name: originalName, description, inputSchema } = tool;
  const wireName = buildToolName(serverName, originalName);

  const definition = {
    type: "function",
    function: {
      name: wireName,
      description:
        description || `MCP tool "${originalName}" from server "${serverName}"`,
      parameters: inputSchema || { type: "object", properties: {} },
    },
  };
  const descriptor = {
    name: wireName,
    kind: "mcp",
    category: "mcp",
    source: "cowork-template-mcp",
    serverName,
    originalName,
  };
  const executor = { kind: "mcp", serverName, toolName: originalName };

  return { definition, descriptor, executor };
}
/**
 * Mount a template's MCP servers and expose their tools. Returns maps ready
 * to hand to SubAgentContext + a cleanup() that disconnects all servers.
 *
 * When the template declares no servers, or none of the declared entries
 * pass `validateMcpServerConfig`, an empty result with `mcpClient: null` is
 * returned and no client is created.
 *
 * Failures on individual servers are tolerated: a server whose connect or
 * tool listing fails is reported in `skipped` with the error message (and
 * through `opts.onWarn` when provided). A server only appears in `mounted`
 * once all of its tools have been registered, so a failure part-way through
 * never leaves it half-registered or listed in both arrays. Errors from
 * loading or constructing the MCP client are not caught and reject the
 * returned promise.
 *
 * `listTools` is awaited, so both synchronous and promise-returning clients
 * work.
 *
 * @param {{ mcpServers?: Array<object> }} template
 * @param {object} [opts]
 * @param {(msg: string, err?: Error) => void} [opts.onWarn]
 * @returns {Promise<{
 *   mcpClient: object|null,
 *   mounted: string[],
 *   skipped: Array<{ name: string, error: string }>,
 *   extraToolDefinitions: Array<object>,
 *   externalToolDescriptors: Record<string, object>,
 *   externalToolExecutors: Record<string, object>,
 *   cleanup: () => Promise<void>,
 * }>}
 */
export async function mountTemplateMcpTools(template, opts = {}) {
  const empty = {
    mcpClient: null,
    mounted: [],
    skipped: [],
    extraToolDefinitions: [],
    externalToolDescriptors: {},
    externalToolExecutors: {},
    cleanup: async () => {},
  };
  const declared = Array.isArray(template?.mcpServers)
    ? template.mcpServers
    : [];
  if (declared.length === 0) return empty;
  const validated = declared
    .map((entry) => validateMcpServerConfig(entry))
    .filter(Boolean);
  if (validated.length === 0) return empty;
  const MCPClient = await _deps.importMcpClient();
  const mcpClient = new MCPClient();
  const mounted = [];
  // Every server whose connect() succeeded, including ones later skipped
  // because listing tools failed — cleanup must still disconnect those.
  const connected = [];
  const skipped = [];
  const extraToolDefinitions = [];
  const externalToolDescriptors = {};
  const externalToolExecutors = {};
  for (const server of validated) {
    try {
      await mcpClient.connect(server.name, server);
      connected.push(server.name);
      const tools = await mcpClient.listTools(server.name);
      // Convert everything first so a bad tool cannot leave partial state
      const converted = [];
      for (const tool of tools) {
        converted.push(toAgentTool(server.name, tool));
      }
      for (const { definition, descriptor, executor } of converted) {
        extraToolDefinitions.push(definition);
        externalToolDescriptors[definition.function.name] = descriptor;
        externalToolExecutors[definition.function.name] = executor;
      }
      mounted.push(server.name);
    } catch (err) {
      const message = err?.message || String(err);
      skipped.push({ name: server.name, error: message });
      if (typeof opts?.onWarn === "function") {
        opts.onWarn(
          `[cowork-mcp] Failed to mount "${server.name}": ${message}`,
          err,
        );
      }
    }
  }
  const cleanup = async () => {
    if (typeof mcpClient.disconnectAll === "function") {
      try {
        await mcpClient.disconnectAll();
        return;
      } catch (_e) {
        // fall through to per-server disconnect
      }
    }
    for (const name of connected) {
      try {
        if (typeof mcpClient.disconnect === "function") {
          await mcpClient.disconnect(name);
        }
      } catch (_e) {
        // swallow — cleanup must not fail the task
      }
    }
  };
  return {
    mcpClient,
    mounted,
    skipped,
    extraToolDefinitions,
    externalToolDescriptors,
    externalToolExecutors,
    cleanup,
  };
}