npm - @bastani/atomic - Versions diffs - 0.5.3-1 → 0.5.4-0 - Mend

@bastani/atomic 0.5.3-1 → 0.5.4-0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (48) hide show

package/README.md +110 -11
package/dist/{chunk-mn870nrv.js → chunk-xkxndz5g.js} +213 -154
package/dist/sdk/components/workflow-picker-panel.d.ts +120 -0
package/dist/sdk/define-workflow.d.ts +1 -1
package/dist/sdk/index.js +1 -1
package/dist/sdk/runtime/discovery.d.ts +57 -3
package/dist/sdk/runtime/executor.d.ts +15 -2
package/dist/sdk/runtime/tmux.d.ts +9 -0
package/dist/sdk/types.d.ts +63 -4
package/dist/sdk/workflows/builtin/deep-research-codebase/claude/index.d.ts +61 -0
package/dist/sdk/workflows/builtin/deep-research-codebase/copilot/index.d.ts +48 -0
package/dist/sdk/workflows/builtin/deep-research-codebase/helpers/heuristic.d.ts +25 -0
package/dist/sdk/workflows/builtin/deep-research-codebase/helpers/prompts.d.ts +91 -0
package/dist/sdk/workflows/builtin/deep-research-codebase/helpers/scout.d.ts +56 -0
package/dist/sdk/workflows/builtin/deep-research-codebase/opencode/index.d.ts +48 -0
package/dist/sdk/workflows/builtin/ralph/claude/index.js +6 -5
package/dist/sdk/workflows/builtin/ralph/copilot/index.js +6 -5
package/dist/sdk/workflows/builtin/ralph/opencode/index.js +6 -5
package/dist/sdk/workflows/index.d.ts +4 -4
package/dist/sdk/workflows/index.js +7 -1
package/package.json +1 -1
package/src/cli.ts +25 -3
package/src/commands/cli/chat/index.ts +5 -5
package/src/commands/cli/init/index.ts +79 -77
package/src/commands/cli/workflow-command.test.ts +757 -0
package/src/commands/cli/workflow.test.ts +310 -0
package/src/commands/cli/workflow.ts +445 -105
package/src/sdk/components/workflow-picker-panel.tsx +1462 -0
package/src/sdk/define-workflow.test.ts +101 -0
package/src/sdk/define-workflow.ts +62 -2
package/src/sdk/runtime/discovery.ts +111 -8
package/src/sdk/runtime/executor.ts +89 -32
package/src/sdk/runtime/tmux.conf +55 -0
package/src/sdk/runtime/tmux.ts +34 -10
package/src/sdk/types.ts +67 -4
package/src/sdk/workflows/builtin/deep-research-codebase/claude/index.ts +294 -0
package/src/sdk/workflows/builtin/deep-research-codebase/copilot/index.ts +276 -0
package/src/sdk/workflows/builtin/deep-research-codebase/helpers/heuristic.ts +38 -0
package/src/sdk/workflows/builtin/deep-research-codebase/helpers/prompts.ts +816 -0
package/src/sdk/workflows/builtin/deep-research-codebase/helpers/scout.ts +334 -0
package/src/sdk/workflows/builtin/deep-research-codebase/opencode/index.ts +284 -0
package/src/sdk/workflows/builtin/ralph/claude/index.ts +8 -4
package/src/sdk/workflows/builtin/ralph/copilot/index.ts +10 -4
package/src/sdk/workflows/builtin/ralph/opencode/index.ts +8 -4
package/src/sdk/workflows/index.ts +9 -1
package/src/services/system/auto-sync.ts +1 -1
package/src/services/system/install-ui.ts +109 -39
package/src/theme/colors.ts +65 -1

package/src/sdk/workflows/builtin/deep-research-codebase/copilot/index.ts ADDED Viewed

@@ -0,0 +1,276 @@
+/**
+ * deep-research-codebase / copilot
+ *
+ * Copilot replica of the Claude deep-research-codebase workflow. The Claude
+ * version dispatches specialist sub-agents (codebase-locator, codebase-
+ * analyzer, etc.) inside a single explorer session via `@"name (agent)"`
+ * syntax — a Claude-specific feature. Copilot sessions are bound to a single
+ * agent for their entire lifetime, so we keep the SAME graph topology
+ * (scout ∥ history → explorer-1..N → aggregator) but drive each explorer
+ * through the locate → analyze → patterns → synthesize sequence inline using
+ * the default agent's built-in file tools.
+ *
+ * Topology (identical to Claude version):
+ *
+ *           ┌─→ codebase-scout
+ *   parent ─┤
+ *           └─→ research-history
+ *                     │
+ *                     ▼
+ *   ┌──────────────────────────────────────────────────┐
+ *   │  explorer-1   explorer-2   ...   explorer-N      │   (Promise.all)
+ *   └──────────────────────────────────────────────────┘
+ *                     │
+ *                     ▼
+ *                aggregator
+ *
+ * Copilot-specific concerns baked in:
+ *
+ *  • F10 — every `sendAndWait` passes an explicit per-stage timeout (15–45 min,
+ *    see the `*_TIMEOUT_MS` constants). The SDK default is 60 seconds; a timeout
+ *    THROWS and aborts the entire stage. Large partitions easily exceed 60s.
+ *
+ *  • F5 — every `ctx.stage()` call is a FRESH session with no memory of prior
+ *    stages. We forward the scout overview, history overview, and partition
+ *    assignment explicitly into each explorer's first prompt. The aggregator
+ *    gets the same plus the explorer scratch file paths.
+ *
+ *  • F9 — `s.save()` receives `SessionEvent[]` via `s.session.getMessages()`
+ *    (Copilot's correct shape). Passing anything else breaks downstream
+ *    `transcript()` reads.
+ *
+ *  • F6 — every prompt explicitly requires trailing prose AFTER any tool
+ *    call, so `transcript()` is never empty. A Copilot turn whose final
+ *    message is a tool call produces an empty assistant.message terminator
+ *    (F1); trailing prose is our insurance.
+ */
+import { defineWorkflow } from "../../../index.ts";
+import { mkdir } from "node:fs/promises";
+import path from "node:path";
+import {
+  getCodebaseRoot,
+  partitionUnits,
+  scoutCodebase,
+} from "../helpers/scout.ts";
+import {
+  calculateExplorerCount,
+  explainHeuristic,
+} from "../helpers/heuristic.ts";
+import {
+  buildAggregatorPrompt,
+  buildExplorerPromptGeneric,
+  buildHistoryPromptGeneric,
+  buildScoutPrompt,
+  slugifyPrompt,
+} from "../helpers/prompts.ts";
+// ── Timeouts (milliseconds) ─────────────────────────────────────────────────
+// Each stage passes its constant as the 2nd `sendAndWait` argument, so nothing
+// relies on the 60-second default (F10). Values are generous; a hung session
+// still surfaces as a clear error rather than silently breaking later stages.
+const SCOUT_TIMEOUT_MS = 15 * 60 * 1000; // 15 min — codebase-scout: short orientation call
+const HISTORY_TIMEOUT_MS = 20 * 60 * 1000; // 20 min — research-history: reads research/ docs
+const EXPLORER_TIMEOUT_MS = 45 * 60 * 1000; // 45 min — each explorer: multi-step locate/analyze
+const AGGREGATOR_TIMEOUT_MS = 45 * 60 * 1000; // 45 min — aggregator: reads N explorer reports
+export default defineWorkflow<"copilot">({
+    name: "deep-research-codebase",
+    description:
+      "Deterministic deep codebase research: scout → LOC-driven parallel explorers → aggregator",
+  })
+  .run(async (ctx) => {
+    // Free-form workflows receive their positional prompt under
+    // `inputs.prompt`; read it once so every stage below can close over a
+    // bare `prompt` string without re-reaching into ctx.inputs.
+    const prompt = ctx.inputs.prompt ?? ""; // "" when inputs.prompt is null/undefined
+    const root = getCodebaseRoot();
+    const startedAt = new Date(); // feeds both the scratch-dir timestamp and isoDate
+    const isoDate = startedAt.toISOString().slice(0, 10); // YYYY-MM-DD (UTC)
+    const slug = slugifyPrompt(prompt); // used in the final report's filename
+    // ── Stages 1a + 1b: codebase-scout ∥ research-history (run concurrently) ─
+    const [scout, history] = await Promise.all([
+      ctx.stage(
+        {
+          name: "codebase-scout",
+          description: "Map codebase, count LOC, partition for parallel explorers",
+        },
+        {},
+        {},
+        async (s) => {
+          // 1. Deterministic scouting (pure TypeScript — no LLM).
+          const data = scoutCodebase(root);
+          if (data.units.length === 0) {
+            throw new Error(
+              `deep-research-codebase: scout found no source files under ${root}. ` +
+                `Run from inside a code repository or check the CODE_EXTENSIONS list.`,
+            );
+          }
+          // 2. Heuristic picks a target; partitionUnits may return fewer (capped by units).
+          const targetCount = calculateExplorerCount(data.totalLoc);
+          const partitions = partitionUnits(data.units, targetCount);
+          const actualCount = partitions.length; // the count every later stage uses
+          // 3. Scratch directory for explorer outputs (timestamped to avoid
+          //    collisions across runs).
+          const scratchDir = path.join(
+            root,
+            "research",
+            "docs",
+            `.deep-research-${startedAt.getTime()}`,
+          );
+          await mkdir(scratchDir, { recursive: true });
+          // 4. Short LLM call: architectural orientation for downstream
+          //    explorers. The prompt forbids the agent from answering the
+          //    research question — its only job here is to orient.
+          await s.session.sendAndWait(
+            {
+              prompt: buildScoutPrompt({
+                question: prompt,
+                tree: data.tree,
+                totalLoc: data.totalLoc,
+                totalFiles: data.totalFiles,
+                explorerCount: actualCount,
+                partitionPreview: partitions,
+              }),
+            },
+            SCOUT_TIMEOUT_MS,
+          );
+          // F9: Copilot takes SessionEvent[], not a session ID.
+          s.save(await s.session.getMessages());
+          return {
+            root,
+            totalLoc: data.totalLoc,
+            totalFiles: data.totalFiles,
+            tree: data.tree,
+            partitions,
+            explorerCount: actualCount,
+            scratchDir,
+            heuristicNote: explainHeuristic(data.totalLoc, actualCount),
+          };
+        },
+      ),
+      ctx.stage(
+        {
+          name: "research-history",
+          description: "Surface prior research from research/ directory",
+        },
+        {},
+        {},
+        async (s) => {
+          // The generic history prompt drives a single default-agent session
+          // through locate → analyze → synthesize inline, instead of Claude's
+          // sub-agent dispatch.
+          await s.session.sendAndWait(
+            { prompt: buildHistoryPromptGeneric({ question: prompt, root }) },
+            HISTORY_TIMEOUT_MS,
+          );
+          s.save(await s.session.getMessages());
+        },
+      ),
+    ]);
+    const {
+      partitions,
+      explorerCount,
+      scratchDir,
+      totalLoc,
+      totalFiles,
+    } = scout.result;
+    // Pull the scout and history transcripts ONCE at the workflow level so
+    // every explorer + the aggregator can embed them in their prompts (F5).
+    // Both stages have completed here (we're past Promise.all), so these
+    // reads are safe (F13).
+    const scoutOverview = (await ctx.transcript(scout)).content;
+    const historyOverview = (await ctx.transcript(history)).content;
+    // ── Stage 2: parallel explorers ────────────────────────────────────────
+    // Each explorer is a separate Copilot session, running concurrently via
+    // Promise.all. Because the session is fresh (F5), every piece of context
+    // it needs — question, architectural orientation, historical context,
+    // partition assignment, scratch path — is injected into the first prompt
+    // via buildExplorerPromptGeneric.
+    const explorerHandles = await Promise.all(
+      partitions.map((partition, idx) => {
+        const i = idx + 1; // 1-based explorer number used in stage names and file names
+        const scratchPath = path.join(scratchDir, `explorer-${i}.md`);
+        return ctx.stage(
+          {
+            name: `explorer-${i}`,
+            description: `Explore ${partition
+              .map((u) => u.path)
+              .join(", ")} (${partition.reduce((s, u) => s + u.fileCount, 0)} files)`,
+          },
+          {},
+          {},
+          async (s) => {
+            await s.session.sendAndWait(
+              {
+                prompt: buildExplorerPromptGeneric({
+                  question: prompt,
+                  index: i,
+                  total: explorerCount,
+                  partition,
+                  scoutOverview,
+                  historyOverview,
+                  scratchPath,
+                  root,
+                }),
+              },
+              EXPLORER_TIMEOUT_MS,
+            );
+            s.save(await s.session.getMessages());
+            // Returning structured metadata lets the aggregator stage reach
+            // each explorer's scratch path without re-parsing transcripts.
+            return { index: i, scratchPath, partition };
+          },
+        );
+      }),
+    );
+    // ── Stage 3: aggregator ────────────────────────────────────────────────
+    // Reads explorer findings via FILE PATHS (filesystem-context skill) to
+    // keep the aggregator's own context lean — we deliberately do NOT inline
+    // N transcripts into the prompt. Token cost stays roughly constant in N.
+    const finalPath = path.join(
+      root,
+      "research",
+      "docs",
+      `${isoDate}-${slug}.md`,
+    );
+    await ctx.stage(
+      {
+        name: "aggregator",
+        description: "Synthesize explorer findings + history into final research doc",
+      },
+      {},
+      {},
+      async (s) => {
+        await s.session.sendAndWait(
+          {
+            prompt: buildAggregatorPrompt({
+              question: prompt,
+              totalLoc,
+              totalFiles,
+              explorerCount,
+              explorerFiles: explorerHandles.map((h) => h.result), // { index, scratchPath, partition } per explorer
+              finalPath,
+              scoutOverview,
+              historyOverview,
+            }),
+          },
+          AGGREGATOR_TIMEOUT_MS,
+        );
+        s.save(await s.session.getMessages());
+      },
+    );
+  })
+  .compile();

package/src/sdk/workflows/builtin/deep-research-codebase/helpers/heuristic.ts ADDED Viewed

@@ -0,0 +1,38 @@
+/**
+ * Determine how many parallel explorer sub-agents to spawn for the
+ * deep-research-codebase workflow, based on lines of code in the codebase.
+ *
+ * The heuristic balances coverage against coordination overhead:
+ *   - Too few explorers leave parts of the codebase under-investigated.
+ *   - Too many explorers flood the aggregator with redundant findings,
+ *     burn tokens on coordination, and exhaust tmux/process budgets.
+ *
+ * Tiers (exclusive upper bounds), anchored to rough sizes of common project shapes:
+ *   <    5,000 LOC →  2 explorers   scripts, single-purpose tools
+ *   <   25,000 LOC →  3 explorers   small libraries, CLI utilities
+ *   <  100,000 LOC →  5 explorers   medium applications
+ *   <  500,000 LOC →  7 explorers   large applications, small monorepos
+ *   <2,000,000 LOC →  9 explorers   large monorepos
+ *   ≥2,000,000 LOC → 12 explorers   massive monorepos (hard cap)
+ *
+ * The hard cap of 12 prevents runaway parallelism: each explorer is a tmux pane plus an LLM
+ * session, so cost grows linearly in tokens, processes, walltime, and aggregator context.
+ * @param loc Total lines of code; NaN, ±Infinity, zero, and negatives map to the smallest tier.
+ * @returns The explorer count for the matching tier: 2, 3, 5, 7, 9, or 12.
+ */
+export function calculateExplorerCount(loc: number): number {
+  if (!Number.isFinite(loc) || loc <= 0) return 2; // invalid or empty input → smallest tier
+  if (loc < 5_000) return 2;
+  if (loc < 25_000) return 3;
+  if (loc < 100_000) return 5;
+  if (loc < 500_000) return 7;
+  if (loc < 2_000_000) return 9;
+  return 12; // hard cap: everything at or above 2,000,000 LOC
+}
+/** Human-readable one-line rationale for the heuristic decision (LOC → explorer count) — surfaced in logs/prompts. */
+export function explainHeuristic(loc: number, count: number): string {
+  return `Codebase: ${loc.toLocaleString()} LOC → spawning ${count} parallel explorer${
+    count === 1 ? "" : "s"
+  }.`; // `loc` is grouped per the runtime's default locale; the plural "s" is dropped only when count === 1
+}