npm - @bastani/atomic - Versions diffs - 0.5.3 → 0.5.4-0 - Mend

@bastani/atomic 0.5.3 → 0.5.4-0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (48)

package/README.md +110 -11
package/dist/{chunk-mn870nrv.js → chunk-xkxndz5g.js} +213 -154
package/dist/sdk/components/workflow-picker-panel.d.ts +120 -0
package/dist/sdk/define-workflow.d.ts +1 -1
package/dist/sdk/index.js +1 -1
package/dist/sdk/runtime/discovery.d.ts +57 -3
package/dist/sdk/runtime/executor.d.ts +15 -2
package/dist/sdk/runtime/tmux.d.ts +9 -0
package/dist/sdk/types.d.ts +63 -4
package/dist/sdk/workflows/builtin/deep-research-codebase/claude/index.d.ts +61 -0
package/dist/sdk/workflows/builtin/deep-research-codebase/copilot/index.d.ts +48 -0
package/dist/sdk/workflows/builtin/deep-research-codebase/helpers/heuristic.d.ts +25 -0
package/dist/sdk/workflows/builtin/deep-research-codebase/helpers/prompts.d.ts +91 -0
package/dist/sdk/workflows/builtin/deep-research-codebase/helpers/scout.d.ts +56 -0
package/dist/sdk/workflows/builtin/deep-research-codebase/opencode/index.d.ts +48 -0
package/dist/sdk/workflows/builtin/ralph/claude/index.js +6 -5
package/dist/sdk/workflows/builtin/ralph/copilot/index.js +6 -5
package/dist/sdk/workflows/builtin/ralph/opencode/index.js +6 -5
package/dist/sdk/workflows/index.d.ts +4 -4
package/dist/sdk/workflows/index.js +7 -1
package/package.json +1 -1
package/src/cli.ts +25 -3
package/src/commands/cli/chat/index.ts +5 -5
package/src/commands/cli/init/index.ts +79 -77
package/src/commands/cli/workflow-command.test.ts +757 -0
package/src/commands/cli/workflow.test.ts +310 -0
package/src/commands/cli/workflow.ts +445 -105
package/src/sdk/components/workflow-picker-panel.tsx +1462 -0
package/src/sdk/define-workflow.test.ts +101 -0
package/src/sdk/define-workflow.ts +62 -2
package/src/sdk/runtime/discovery.ts +111 -8
package/src/sdk/runtime/executor.ts +89 -32
package/src/sdk/runtime/tmux.conf +55 -0
package/src/sdk/runtime/tmux.ts +34 -10
package/src/sdk/types.ts +67 -4
package/src/sdk/workflows/builtin/deep-research-codebase/claude/index.ts +294 -0
package/src/sdk/workflows/builtin/deep-research-codebase/copilot/index.ts +276 -0
package/src/sdk/workflows/builtin/deep-research-codebase/helpers/heuristic.ts +38 -0
package/src/sdk/workflows/builtin/deep-research-codebase/helpers/prompts.ts +816 -0
package/src/sdk/workflows/builtin/deep-research-codebase/helpers/scout.ts +334 -0
package/src/sdk/workflows/builtin/deep-research-codebase/opencode/index.ts +284 -0
package/src/sdk/workflows/builtin/ralph/claude/index.ts +8 -4
package/src/sdk/workflows/builtin/ralph/copilot/index.ts +10 -4
package/src/sdk/workflows/builtin/ralph/opencode/index.ts +8 -4
package/src/sdk/workflows/index.ts +9 -1
package/src/services/system/auto-sync.ts +1 -1
package/src/services/system/install-ui.ts +109 -39
package/src/theme/colors.ts +65 -1

package/src/sdk/runtime/tmux.ts CHANGED Viewed

@@ -6,6 +6,19 @@
  * sending keystrokes, and pane state detection.
  */
+import { join } from "path";
+import type { Subprocess } from "bun";
+// ---------------------------------------------------------------------------
+// Constants
+// ---------------------------------------------------------------------------
+/**
+ * Dedicated tmux socket name — isolates Atomic sessions from the user's default server.
+ * Passed to the multiplexer binary as `-L <name>` by `tmuxRun`, `attachSession`,
+ * and `spawnMuxAttach`.
+ */
+export const SOCKET_NAME = "atomic";
+/**
+ * Path to the bundled tmux config (shared by tmux and psmux).
+ * Resolved against this module's own directory (`import.meta.dir`), so
+ * `tmux.conf` is expected to sit next to this file. Passed to the binary as
+ * `-f <path>` alongside the socket name.
+ */
+const CONFIG_PATH = join(import.meta.dir, "tmux.conf");
 // ---------------------------------------------------------------------------
 // Core tmux primitives
 // ---------------------------------------------------------------------------
@@ -73,8 +86,9 @@ export function tmuxRun(args: string[]): { ok: true; stdout: string } | { ok: fa
   if (!binary) {
     return { ok: false, stderr: "No terminal multiplexer (tmux/psmux) found on PATH" };
   }
+  const fullArgs = ["-f", CONFIG_PATH, "-L", SOCKET_NAME, ...args];
   const result = Bun.spawnSync({
-    cmd: [binary, ...args],
+    cmd: [binary, ...fullArgs],
     stdout: "pipe",
     stderr: "pipe",
   });
@@ -318,14 +332,8 @@ export function killWindow(sessionName: string, windowName: string): void {
  * Check if a tmux session exists.
  */
 export function sessionExists(sessionName: string): boolean {
-  const binary = getMuxBinary();
-  if (!binary) return false;
-  const result = Bun.spawnSync({
-    cmd: [binary, "has-session", "-t", sessionName],
-    stdout: "pipe",
-    stderr: "pipe",
-  });
-  return result.success;
+  const result = tmuxRun(["has-session", "-t", sessionName]);
+  return result.ok;
 }
 /**
@@ -337,7 +345,7 @@ export function attachSession(sessionName: string): void {
     throw new Error("No terminal multiplexer (tmux/psmux) found on PATH");
   }
   const proc = Bun.spawnSync({
-    cmd: [binary, "attach-session", "-t", sessionName],
+    cmd: [binary, "-f", CONFIG_PATH, "-L", SOCKET_NAME, "attach-session", "-t", sessionName],
     stdin: "inherit",
     stdout: "inherit",
     stderr: "pipe",
@@ -348,6 +356,22 @@ export function attachSession(sessionName: string): void {
   }
 }
+/**
+ * Spawn an interactive attach-session process.
+ * Encapsulates binary resolution, config injection, and socket isolation.
+ * Used by all async attach call sites (executor, chat).
+ *
+ * The child inherits stdin, stdout, and stderr from the current process.
+ * The handle is returned as soon as the process is spawned; this function
+ * does not wait for the attach to end.
+ *
+ * @param sessionName - Target session, passed to `attach-session -t`.
+ * @returns The `Subprocess` handle produced by `Bun.spawn`.
+ * @throws Error when `getMuxBinary()` returns no tmux/psmux binary.
+ */
+export function spawnMuxAttach(sessionName: string): Subprocess {
+  const binary = getMuxBinary();
+  if (!binary) {
+    throw new Error("No terminal multiplexer (tmux/psmux) found on PATH");
+  }
+  return Bun.spawn(
+    [binary, "-f", CONFIG_PATH, "-L", SOCKET_NAME, "attach-session", "-t", sessionName],
+    { stdio: ["inherit", "inherit", "inherit"] },
+  );
+}
 /**
  * Switch the current tmux client to a different session.
  * Use this instead of `attachSession` when already inside tmux to avoid

package/src/sdk/types.ts CHANGED Viewed

@@ -95,6 +95,44 @@ export type {
   ClaudeQueryDefaults,
 };
+// ─── Workflow input schemas ─────────────────────────────────────────────────
+/**
+ * Supported field types for a workflow's declared inputs.
+ *
+ * - `"string"` — single-line free-form input (short values, identifiers, paths)
+ * - `"text"`   — multi-line free-form input (long prose, prompts, specs)
+ * - `"enum"`   — one of a fixed list of allowed `values`
+ *
+ * Whatever the kind, the value reaches the workflow as a string: the
+ * contexts expose inputs as `Record<string, string>`.
+ */
+export type WorkflowInputType = "string" | "text" | "enum";
+/**
+ * A declared input for a workflow. When a workflow provides an `inputs`
+ * array, the CLI materialises one `--<name>` flag per input (and the
+ * interactive picker renders one field per input) so users can pass
+ * structured values rather than a single free-form prompt.
+ *
+ * Leaving `inputs` unset (or empty) signals that the workflow consumes a
+ * single free-form prompt instead — the legacy
+ * `atomic workflow -n <name> -a <agent> "prompt"` form.
+ *
+ * @example
+ * const depth: WorkflowInput = {
+ *   name: "depth",
+ *   type: "enum",
+ *   values: ["shallow", "deep"],
+ *   default: "shallow",
+ * };
+ */
+export interface WorkflowInput {
+  /** Field name — also the CLI flag (`--<name>`) and form field identifier. */
+  name: string;
+  /** Input kind — see {@link WorkflowInputType}. */
+  type: WorkflowInputType;
+  /** Whether the field must be non-empty before the workflow can run. */
+  required?: boolean;
+  /** Short human description shown as the field caption. */
+  description?: string;
+  /** Placeholder text shown when the field is empty. */
+  placeholder?: string;
+  /** Default value pre-filled into the field. Enums use this to pick their initial value. */
+  default?: string;
+  /**
+   * Allowed values — required when `type` is `"enum"`.
+   * NOTE(review): the property is optional at the type level, so this
+   * requirement is not enforced by the interface itself — confirm where
+   * it is validated.
+   */
+  values?: string[];
+}
 // ─── Core types ─────────────────────────────────────────────────────────────
 /**
@@ -169,8 +207,16 @@ export interface SessionContext<A extends AgentType = AgentType> {
   client: ProviderClient<A>;
   /** Provider-specific session (auto-created by runtime) */
   session: ProviderSession<A>;
-  /** The original user prompt from the CLI invocation */
-  userPrompt: string;
+  /**
+   * Structured inputs for this workflow run. Populated from CLI flags
+   * (`--<name>=<value>`) or the interactive picker.
+   *
+   * Free-form workflows (no declared `inputs` schema) receive their
+   * single positional prompt under the `prompt` key — so
+   * `s.inputs.prompt` is the canonical way to read the user's prompt
+   * regardless of whether the workflow is structured or free-form.
+   */
+  inputs: Record<string, string>;
   /** Which agent is running */
   agent: A;
   /**
@@ -212,8 +258,16 @@ export interface SessionContext<A extends AgentType = AgentType> {
  * Does not have session-specific fields (paneId, save, etc.).
  */
 export interface WorkflowContext<A extends AgentType = AgentType> {
-  /** The original user prompt from the CLI invocation */
-  userPrompt: string;
+  /**
+   * Structured inputs for this workflow run. Populated from CLI flags
+   * (`--<name>=<value>`) or the interactive picker.
+   *
+   * Free-form workflows (no declared `inputs` schema) receive their
+   * single positional prompt under the `prompt` key — so
+   * `ctx.inputs.prompt` is the canonical way to read the user's prompt
+   * regardless of whether the workflow is structured or free-form.
+   */
+  inputs: Record<string, string>;
   /** Which agent is running */
   agent: A;
   /**
@@ -248,6 +302,13 @@ export interface WorkflowOptions {
   name: string;
   /** Human-readable description */
   description?: string;
+  /**
+   * Optional declared inputs. When provided, the CLI materialises one
+   * `--<name>` flag per entry and the interactive picker renders one form
+   * field per entry. Leave unset to keep the workflow free-form (a single
+   * positional prompt argument).
+   */
+  inputs?: WorkflowInput[];
 }
 /**
@@ -257,6 +318,8 @@ export interface WorkflowDefinition<A extends AgentType = AgentType> {
   readonly __brand: "WorkflowDefinition";
   readonly name: string;
   readonly description: string;
+  /** Declared input schema — empty array for free-form workflows. */
+  readonly inputs: readonly WorkflowInput[];
   /** The workflow's entry point. Called by the executor with a WorkflowContext. */
   readonly run: (ctx: WorkflowContext<A>) => Promise<void>;
 }

package/src/sdk/workflows/builtin/deep-research-codebase/claude/index.ts ADDED Viewed

@@ -0,0 +1,294 @@
+/**
+ * deep-research-codebase / claude
+ *
+ * A deterministically-orchestrated, distributed version of the
+ * `research-codebase` skill. The research-codebase skill spawns
+ * codebase-locator / codebase-analyzer / codebase-pattern-finder /
+ * codebase-research-locator / codebase-research-analyzer /
+ * codebase-online-researcher sub-agents on the fly via LLM judgment;
+ * this workflow spawns the same agents on a deterministic schedule
+ * driven by the codebase's lines of code.
+ *
+ * Topology:
+ *
+ *           ┌─→ codebase-scout
+ *   parent ─┤
+ *           └─→ research-history
+ *                     │
+ *                     ▼
+ *   ┌──────────────────────────────────────────────────┐
+ *   │  explorer-1   explorer-2   ...   explorer-N      │   (Promise.all)
+ *   └──────────────────────────────────────────────────┘
+ *                     │
+ *                     ▼
+ *                aggregator
+ *
+ * Stage 1a — codebase-scout
+ *   Pure-TypeScript: lists files (git ls-files), counts LOC (batched wc -l),
+ *   renders a depth-bounded ASCII tree, and bin-packs directories into N
+ *   partitions where N is determined by the LOC heuristic. Then makes one
+ *   short LLM call to produce an architectural orientation that primes the
+ *   downstream explorers. Returns structured data via `handle.result` and
+ *   the agent's prose via `ctx.transcript(handle)`.
+ *
+ * Stage 1b — research-history (parallel sibling of scout)
+ *   Dispatches the codebase-research-locator and codebase-research-analyzer
+ *   sub-agents over the project's existing research/ directory to surface
+ *   prior decisions, completed investigations, and unresolved questions.
+ *   Output is consumed via session transcript (≤400 words) and feeds into
+ *   the aggregator as supplementary context.
+ *
+ * Stage 2 — explorer-1..N (parallel; depends on scout + history)
+ *   Each explorer is a coordinator that dispatches specialized sub-agents
+ *   over its assigned partition (single LOC-balanced slice of the codebase):
+ *     - codebase-locator       → finds relevant files in the partition
+ *     - codebase-analyzer      → documents how the most relevant files work
+ *     - codebase-pattern-finder → finds existing pattern examples
+ *     - codebase-online-researcher → (conditional) external library docs
+ *   The explorer never reads files directly — it orchestrates specialists
+ *   and writes a synthesized findings document to a known scratch path.
+ *
+ * Stage 3 — aggregator
+ *   Reads each explorer's scratch file by path (file-based handoff to keep
+ *   the aggregator's own context lean — we deliberately do NOT inline N
+ *   transcripts into the prompt). Folds in the research-history overview
+ *   as supplementary context. Synthesizes a single research document at
+ *   research/docs/YYYY-MM-DD-<slug>.md.
+ *
+ * Context-engineering decisions are documented at each stage below.
+ */
+import { defineWorkflow } from "../../../index.ts";
+import { mkdir } from "node:fs/promises";
+import path from "node:path";
+import {
+  getCodebaseRoot,
+  partitionUnits,
+  scoutCodebase,
+} from "../helpers/scout.ts";
+import {
+  calculateExplorerCount,
+  explainHeuristic,
+} from "../helpers/heuristic.ts";
+import {
+  buildAggregatorPrompt,
+  buildExplorerPrompt,
+  buildHistoryPrompt,
+  buildScoutPrompt,
+  slugifyPrompt,
+} from "../helpers/prompts.ts";
+export default defineWorkflow<"claude">({
+    name: "deep-research-codebase",
+    description:
+      "Deterministic deep codebase research: scout → LOC-driven parallel explorers → aggregator",
+  })
+  .run(async (ctx) => {
+    // Free-form workflows receive their positional prompt under
+    // `inputs.prompt`; read it once (defaulting to "") so every stage below
+    // can close over a bare `prompt` string without re-reaching into ctx.inputs.
+    const prompt = ctx.inputs.prompt ?? "";
+    const root = getCodebaseRoot();
+    const startedAt = new Date();
+    const isoDate = startedAt.toISOString().slice(0, 10);
+    const slug = slugifyPrompt(prompt);
+    // ── Stages 1a + 1b: codebase-scout ∥ research-history ──────────────────
+    // Run the codebase scout (deterministic compute + brief LLM orientation)
+    // in parallel with the research-history scout (sub-agent dispatch over
+    // the project's prior research docs). Both must complete before any
+    // explorer starts, since:
+    //   - explorers depend on `scout.result.partitions`
+    //   - aggregator depends on the history transcript
+    // Promise.all gives us the cleanest auto-inferred graph topology:
+    // parent → [scout, history] → [explorer-1..N] → aggregator.
+    const [scout, history] = await Promise.all([
+      ctx.stage(
+        {
+          name: "codebase-scout",
+          description: "Map codebase, count LOC, partition for parallel explorers",
+        },
+        {},
+        {},
+        async (s) => {
+          // 1. Deterministic scouting.
+          const data = scoutCodebase(root);
+          if (data.units.length === 0) {
+            throw new Error(
+              `deep-research-codebase: scout found no source files under ${root}. ` +
+                `Run from inside a code repository or check the CODE_EXTENSIONS list.`,
+            );
+          }
+          // 2. Heuristic decides explorer count (capped by available units).
+          const targetCount = calculateExplorerCount(data.totalLoc);
+          const partitions = partitionUnits(data.units, targetCount);
+          const actualCount = partitions.length;
+          // 3. Scratch directory for explorer outputs (timestamped to avoid
+          //    collisions across runs).
+          const scratchDir = path.join(
+            root,
+            "research",
+            "docs",
+            `.deep-research-${startedAt.getTime()}`,
+          );
+          await mkdir(scratchDir, { recursive: true });
+          // 4. Short LLM call: architectural orientation for downstream
+          //    explorers. The prompt explicitly forbids the agent from
+          //    answering the research question — its only job here is to
+          //    orient.
+          await s.session.query(
+            buildScoutPrompt({
+              question: prompt,
+              tree: data.tree,
+              totalLoc: data.totalLoc,
+              totalFiles: data.totalFiles,
+              explorerCount: actualCount,
+              partitionPreview: partitions,
+            }),
+          );
+          s.save(s.sessionId);
+          return {
+            root,
+            totalLoc: data.totalLoc,
+            totalFiles: data.totalFiles,
+            tree: data.tree,
+            partitions,
+            explorerCount: actualCount,
+            scratchDir,
+            heuristicNote: explainHeuristic(data.totalLoc, actualCount),
+          };
+        },
+      ),
+      ctx.stage(
+        {
+          name: "research-history",
+          description: "Surface prior research via research-locator + research-analyzer",
+        },
+        {},
+        {},
+        async (s) => {
+          // Dispatches codebase-research-locator → codebase-research-analyzer
+          // over the project's research/ directory and outputs a ≤400-word
+          // synthesis as prose (no file write — consumed via transcript).
+          await s.session.query(
+            buildHistoryPrompt({ question: prompt, root }),
+          );
+          s.save(s.sessionId);
+        },
+      ),
+    ]);
+    const {
+      partitions,
+      explorerCount,
+      scratchDir,
+      totalLoc,
+      totalFiles,
+    } = scout.result;
+    // Pull the scout + history transcripts ONCE at the workflow level:
+    // explorers embed the scout overview, the aggregator embeds both. Both
+    // stages have already completed by this point (we're past Promise.all),
+    // so these reads are safe (F13).
+    const scoutOverview = (await ctx.transcript(scout)).content;
+    const historyOverview = (await ctx.transcript(history)).content;
+    // ── Stage 2: parallel explorers ────────────────────────────────────────
+    // Each explorer is a separate tmux pane / Claude session, running
+    // concurrently via Promise.all. Each one receives:
+    //   - the original research question (top + bottom of prompt)
+    //   - the scout's architectural overview
+    //   - its OWN partition (never the full file list)
+    //   - the absolute path to its scratch file
+    //
+    // Information flow choices:
+    //   • We deliberately do not pass other explorers' work — they run in
+    //     parallel and forward-only data flow is enforced by the runtime
+    //     (F13). Cross-cutting happens in the aggregator.
+    //   • We pass the partition via closure capture, not by parsing
+    //     scout transcripts — strongly typed and lossless.
+    const explorerHandles = await Promise.all(
+      partitions.map((partition, idx) => {
+        const i = idx + 1;
+        const scratchPath = path.join(scratchDir, `explorer-${i}.md`);
+        return ctx.stage(
+          {
+            name: `explorer-${i}`,
+            description: `Explore ${partition
+              .map((u) => u.path)
+              .join(", ")} (${partition.reduce((s, u) => s + u.fileCount, 0)} files)`,
+          },
+          {},
+          {},
+          async (s) => {
+            await s.session.query(
+              buildExplorerPrompt({
+                question: prompt,
+                index: i,
+                total: explorerCount,
+                partition,
+                scoutOverview,
+                scratchPath,
+                root,
+              }),
+            );
+            s.save(s.sessionId);
+            // Returning structured metadata lets the aggregator stage reach
+            // each explorer's scratch path without re-parsing transcripts.
+            return { index: i, scratchPath, partition };
+          },
+        );
+      }),
+    );
+    // ── Stage 3: aggregator ────────────────────────────────────────────────
+    // Synthesizes explorer findings into the final research document at
+    // research/docs/YYYY-MM-DD-<slug>.md.
+    //
+    // Information flow choice:
+    //   • The aggregator reads explorer findings via FILE PATHS, not by
+    //     embedding all N transcripts in its prompt. This keeps its
+    //     context lean (filesystem-context skill) and lets the agent
+    //     selectively re-read source files when explorers contradict
+    //     each other.
+    //   • The aggregator only sees the scout + history overviews (short)
+    //     plus a manifest of explorer scratch paths — token cost stays
+    //     roughly constant in N rather than growing linearly.
+    const finalPath = path.join(
+      root,
+      "research",
+      "docs",
+      `${isoDate}-${slug}.md`,
+    );
+    await ctx.stage(
+      {
+        name: "aggregator",
+        description: "Synthesize explorer findings + history into final research doc",
+      },
+      {},
+      {},
+      async (s) => {
+        await s.session.query(
+          buildAggregatorPrompt({
+            question: prompt,
+            totalLoc,
+            totalFiles,
+            explorerCount,
+            explorerFiles: explorerHandles.map((h) => h.result),
+            finalPath,
+            scoutOverview,
+            historyOverview,
+          }),
+        );
+        s.save(s.sessionId);
+      },
+    );
+  })
+  .compile();