npm - gsd-pi - Versions diffs - 2.41.0-dev.cac69f9 → 2.42.0-dev.97e9e30 - Mend

gsd-pi 2.41.0-dev.cac69f9 → 2.42.0-dev.97e9e30

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (115) hide show

package/src/resources/extensions/gsd/custom-workflow-engine.ts ADDED Viewed

@@ -0,0 +1,216 @@
+/**
+ * custom-workflow-engine.ts — WorkflowEngine implementation for custom workflows.
+ *
+ * Drives the auto-loop using GRAPH.yaml step state from a run directory.
+ * Each iteration: deriveState reads the graph, resolveDispatch picks the
+ * next eligible step, reconcile marks it complete and persists.
+ *
+ * Observability:
+ * - All state reads/writes go through graph.ts YAML I/O — inspectable on disk.
+ * - `resolveDispatch` returns unitType "custom-step" with unitId "<name>/<stepId>".
+ * - `getDisplayMetadata` provides step N/M progress for dashboard rendering.
+ * - Phase transitions are derivable from GRAPH.yaml step statuses.
+ */
+import type { WorkflowEngine } from "./workflow-engine.js";
+import type {
+  EngineState,
+  EngineDispatchAction,
+  CompletedStep,
+  ReconcileResult,
+  DisplayMetadata,
+} from "./engine-types.js";
+import { readFileSync } from "node:fs";
+import { join } from "node:path";
+import { parse } from "yaml";
+import {
+  readGraph,
+  writeGraph,
+  getNextPendingStep,
+  markStepComplete,
+  expandIteration,
+  type WorkflowGraph,
+} from "./graph.js";
+import { injectContext } from "./context-injector.js";
+import type { WorkflowDefinition, StepDefinition } from "./definition-loader.js";
/**
 * Read and parse the frozen DEFINITION.yaml from a run directory.
 *
 * The document is parsed with the YAML "core" schema. Only the top-level
 * shape is checked here (an object carrying a `steps` array); individual
 * steps are not validated.
 *
 * @param runDir — run directory that contains DEFINITION.yaml
 * @returns The parsed definition
 * @throws Error if the file cannot be read, the YAML is malformed, or the
 *   parsed document is not an object with a `steps` array
 */
export function readFrozenDefinition(runDir: string): WorkflowDefinition {
  const defPath = join(runDir, "DEFINITION.yaml");
  const raw = readFileSync(defPath, "utf-8");
  const parsed: unknown = parse(raw, { schema: "core" });
  // An empty or truncated file parses to null/scalar; fail here with the path
  // instead of letting callers hit a TypeError on `def.steps`.
  if (
    parsed === null ||
    typeof parsed !== "object" ||
    !Array.isArray((parsed as { steps?: unknown }).steps)
  ) {
    throw new Error(
      `Frozen definition at ${defPath} is not a workflow definition (expected an object with a "steps" array)`,
    );
  }
  return parsed as WorkflowDefinition;
}
/**
 * WorkflowEngine implementation for custom workflows.
 *
 * All state lives in the run directory: GRAPH.yaml (step statuses, read and
 * written through graph.ts) and the frozen DEFINITION.yaml (read-only here).
 */
export class CustomWorkflowEngine implements WorkflowEngine {
  readonly engineId = "custom";
  private readonly runDir: string;

  /** @param runDir — run directory holding GRAPH.yaml and DEFINITION.yaml */
  constructor(runDir: string) {
    this.runDir = runDir;
  }

  /** True when every step is either "complete" or "expanded". */
  private static allStepsDone(graph: WorkflowGraph): boolean {
    return graph.steps.every(
      (s) => s.status === "complete" || s.status === "expanded",
    );
  }

  /**
   * Collect capture group 1 of every match of `pattern` (flags "gm") in `content`.
   *
   * Uses `matchAll`, which steps past zero-length matches; a manual
   * `regex.exec` loop would stay on the same index forever for a pattern
   * that can match the empty string.
   *
   * The elapsed-time guard is evaluated between matches only: it bounds a
   * scan that yields very many matches, but it cannot interrupt a single
   * pathological match attempt.
   *
   * @throws Error if the scan runs longer than 5 seconds
   */
  private static extractIterateItems(
    content: string,
    pattern: string,
    stepId: string,
  ): string[] {
    const regex = new RegExp(pattern, "gm");
    const items: string[] = [];
    const startedAt = Date.now();
    for (const match of content.matchAll(regex)) {
      const item = match[1];
      if (item !== undefined) items.push(item);
      if (Date.now() - startedAt > 5_000) {
        throw new Error(
          `Iterate pattern "${pattern}" exceeded 5s timeout on step "${stepId}" — possible ReDoS`,
        );
      }
    }
    return items;
  }

  /**
   * Derive engine state from GRAPH.yaml on disk.
   *
   * Phase is "complete" when all steps are complete or expanded,
   * "running" otherwise. The parsed graph is returned as `raw`.
   */
  async deriveState(_basePath: string): Promise<EngineState> {
    const graph = readGraph(this.runDir);
    const allDone = CustomWorkflowEngine.allStepsDone(graph);
    return {
      phase: allDone ? "complete" : "running",
      currentMilestoneId: null,
      activeSliceId: null,
      activeTaskId: null,
      isComplete: allDone,
      raw: graph,
    };
  }

  /**
   * Resolve the next dispatch action from graph state.
   *
   * Takes the step returned by getNextPendingStep. If that step has an
   * `iterate` config in the frozen DEFINITION.yaml, the source artifact is
   * read, items are extracted with the configured pattern, the graph is
   * expanded via expandIteration and written to disk, and the next pending
   * step is queried again from the expanded graph.
   *
   * Returns a dispatch with unitType "custom-step" and unitId in
   * "<workflowName>/<stepId>" format, or a stop action (level "info") when
   * no pending step is available before or after expansion.
   *
   * Observability:
   * - Missing source artifacts throw with the full resolved path for diagnosis.
   * - Expanded GRAPH.yaml is written to disk before dispatch — inspectable on disk.
   * - NOTE(review): this method itself writes nothing to stderr; confirm
   *   whether expandIteration logs the expansion.
   * - NOTE(review): only the first pending step is checked for `iterate`;
   *   the step found after re-querying is dispatched as-is.
   *
   * @throws Error if the iterate source cannot be read or the pattern scan
   *   exceeds its time budget
   */
  async resolveDispatch(
    state: EngineState,
    _context: { basePath: string },
  ): Promise<EngineDispatchAction> {
    let graph = state.raw as WorkflowGraph;
    let next = getNextPendingStep(graph);
    if (!next) {
      return {
        action: "stop",
        reason: "All steps complete",
        level: "info",
      };
    }

    // Check frozen DEFINITION.yaml for iterate config on this step
    const pendingId = next.id;
    const def = readFrozenDefinition(this.runDir);
    const stepDef = def.steps.find((s: StepDefinition) => s.id === pendingId);

    if (stepDef?.iterate) {
      const iterate = stepDef.iterate;

      // Read source artifact
      const sourcePath = join(this.runDir, iterate.source);
      let sourceContent: string;
      try {
        sourceContent = readFileSync(sourcePath, "utf-8");
      } catch {
        throw new Error(
          `Iterate source artifact not found: ${sourcePath} (step "${pendingId}", source: "${iterate.source}")`,
        );
      }

      const items = CustomWorkflowEngine.extractIterateItems(
        sourceContent,
        iterate.pattern,
        pendingId,
      );

      // Expand the graph and persist it before dispatching anything
      const expandedGraph = expandIteration(graph, pendingId, items, next.prompt);
      writeGraph(this.runDir, expandedGraph);
      graph = expandedGraph;

      // Re-query for first instance step
      next = getNextPendingStep(expandedGraph);
      if (!next) {
        return {
          action: "stop",
          reason: "Iterate expansion produced no instances",
          level: "info",
        };
      }
    }

    // Enrich prompt with context from prior step artifacts
    const enrichedPrompt = injectContext(this.runDir, next.id, next.prompt);
    return {
      action: "dispatch",
      step: {
        unitType: "custom-step",
        unitId: `${graph.metadata.name}/${next.id}`,
        prompt: enrichedPrompt,
      },
    };
  }

  /**
   * Reconcile state after a step completes.
   *
   * Recovers the stepId from the completed unit's id, marks it complete in
   * the graph, and writes the updated GRAPH.yaml to disk.
   *
   * Returns "milestone-complete" when all steps are now done, "continue" otherwise.
   */
  async reconcile(
    state: EngineState,
    completedStep: CompletedStep,
  ): Promise<ReconcileResult> {
    const graph = state.raw as WorkflowGraph;

    // resolveDispatch builds unit ids as "<workflowName>/<stepId>". Strip that
    // exact prefix so step ids containing "/" survive; otherwise fall back to
    // the segment after the last "/".
    const unitId = completedStep.unitId;
    const prefix = `${graph.metadata.name}/`;
    const stepId = unitId.startsWith(prefix)
      ? unitId.slice(prefix.length)
      : unitId.slice(unitId.lastIndexOf("/") + 1);

    const updatedGraph = markStepComplete(graph, stepId);
    writeGraph(this.runDir, updatedGraph);

    return {
      outcome: CustomWorkflowEngine.allStepsDone(updatedGraph)
        ? "milestone-complete"
        : "continue",
    };
  }

  /**
   * Return UI-facing metadata for progress display.
   *
   * Shows "Step N/M" where N is the number of "complete" steps and M is the
   * number of steps that are not "expanded". Expanded steps are left out of
   * M so that N reaches M exactly when deriveState reports the workflow
   * complete (assumes an expanded step keeps that status — TODO confirm
   * against graph.ts).
   */
  getDisplayMetadata(state: EngineState): DisplayMetadata {
    const graph = state.raw as WorkflowGraph;
    const countable = graph.steps.filter((s) => s.status !== "expanded");
    const total = countable.length;
    const completed = countable.filter((s) => s.status === "complete").length;
    return {
      engineLabel: "WORKFLOW",
      currentPhase: state.phase,
      progressSummary: `Step ${completed}/${total}`,
      stepCount: { completed, total },
    };
  }
}

package/src/resources/extensions/gsd/dashboard-overlay.ts CHANGED Viewed

@@ -38,6 +38,7 @@ function unitLabel(type: string): string {
     case "triage-captures": return "Triage";
     case "quick-task": return "Quick Task";
     case "replan-slice": return "Replan";
+    case "custom-step": return "Workflow Step";
     default: return type;
   }
 }

package/src/resources/extensions/gsd/definition-loader.ts ADDED Viewed

@@ -0,0 +1,462 @@
+/**
+ * definition-loader.ts — Parse and validate V1 YAML workflow definitions.
+ *
+ * Loads definition YAML files from `.gsd/workflow-defs/`, validates the
+ * V1 schema shape, and returns typed TypeScript objects. Pure functions
+ * with no engine or runtime dependencies — just `yaml` and `node:fs`.
+ *
+ * YAML uses snake_case (`depends_on`, `context_from`) per project convention (P005).
+ * TypeScript uses camelCase (`dependsOn`, `contextFrom`).
+ *
+ * Observability: All validation errors are collected into a string[] — callers
+ * can log, surface in dashboards, or return to agents for self-repair.
+ * substituteParams errors include the offending key name for traceability.
+ */
+import { parse } from "yaml";
+import { readFileSync, existsSync } from "node:fs";
+import { join } from "node:path";
+// ─── Public TypeScript Types (camelCase) ─────────────────────────────────
/**
 * Verification policy for a step, discriminated by `policy`.
 *
 * validateDefinition requires a non-empty `command` for "shell-command" and
 * a non-empty `prompt` for "prompt-verify"; the optional "content-heuristic"
 * fields are not checked at load time.
 */
export type VerifyPolicy =
  | { policy: "content-heuristic"; minSize?: number; pattern?: string }
  | { policy: "shell-command"; command: string }
  | { policy: "prompt-verify"; prompt: string }
  | { policy: "human-review" };

/** Fan-out config: one instance step is created per item matched in `source`. */
export interface IterateConfig {
  /** Artifact path (relative to run dir) to read and match against. Must not contain "..". */
  source: string;
  /**
   * Regex pattern string. Must contain at least one capture group.
   * The engine compiles it with the global and multiline flags ("gm"), so
   * `^` and `$` match at line boundaries, and uses capture group 1 of each
   * match as the item.
   */
  pattern: string;
}

/** One step of a workflow, in camelCase TypeScript form. */
export interface StepDefinition {
  /** Unique step identifier within the workflow. */
  id: string;
  /** Human-readable step name. */
  name: string;
  /** The prompt to dispatch for this step. */
  prompt: string;
  /**
   * IDs of steps that must complete before this step can run.
   * Loaded from the YAML `requires` key, or `depends_on` when `requires` is absent.
   */
  requires: string[];
  /** Artifact paths produced by this step (relative to run dir). */
  produces: string[];
  /** Step IDs whose artifacts to include as context (S05 — accepted, not processed). */
  contextFrom?: string[];
  /** Verification policy for this step (S05 — typed + validated). */
  verify?: VerifyPolicy;
  /** Iteration config for this step (S06 — typed + validated). */
  iterate?: IterateConfig;
}

/** A complete V1 workflow definition. */
export interface WorkflowDefinition {
  /** Schema version — must be 1. */
  version: number;
  /** Workflow name. */
  name: string;
  /** Optional description. */
  description?: string;
  /** Optional parameter map for template substitution (S07). */
  params?: Record<string, string>;
  /** Ordered list of steps. */
  steps: StepDefinition[];
}
+// ─── Internal YAML Types (snake_case) ────────────────────────────────────
/** Raw step as it appears in YAML (snake_case keys, nothing validated yet). */
interface YamlStepDef {
  id?: unknown;
  name?: unknown;
  prompt?: unknown;
  requires?: unknown;
  depends_on?: unknown;
  produces?: unknown;
  context_from?: unknown;
  verify?: unknown;
  iterate?: unknown;
  [key: string]: unknown; // Forward-compat: unknown fields accepted silently
}

/** Raw workflow document as it appears in YAML (nothing validated yet). */
interface YamlWorkflowDef {
  version?: unknown;
  name?: unknown;
  description?: unknown;
  params?: unknown;
  steps?: unknown;
  [key: string]: unknown; // Forward-compat: unknown fields accepted silently
}

// ─── Validation ──────────────────────────────────────────────────────────

/** Policy names accepted in `verify.policy`. */
const VALID_VERIFY_POLICIES: readonly string[] = [
  "content-heuristic",
  "shell-command",
  "prompt-verify",
  "human-review",
];

/** Label used in per-step messages: the step id when it is a string, else its index. */
function stepLabel(step: YamlStepDef, index: number): string {
  return typeof step.id === "string" ? step.id : `index ${index}`;
}

/**
 * Count the capture groups of a regex source, or return null if it does not compile.
 *
 * Appending an empty alternative makes the probe regex match the empty
 * string; the match array then has one slot per capture group (numbered or
 * named) after slot 0. Escaped parens, character classes, lookarounds and
 * non-capturing groups contribute no slot.
 */
function countCaptureGroups(pattern: string): number | null {
  try {
    new RegExp(pattern); // validate the pattern exactly as written
    const probe = new RegExp(`${pattern}|`).exec("");
    return probe === null ? 0 : probe.length - 1;
  } catch {
    return null;
  }
}

/** Validate a step's `iterate` value against the IterateConfig shape. */
function validateIterateConfig(it: unknown, sid: string, errors: string[]): void {
  if (it == null || typeof it !== "object" || Array.isArray(it)) {
    errors.push(`Step "${sid}" iterate must be an object with "source" and "pattern" fields`);
    return;
  }
  const { source, pattern } = it as Record<string, unknown>;

  if (typeof source !== "string" || source.trim() === "") {
    errors.push(`Step "${sid}" iterate.source must be a non-empty string`);
  } else if (source.includes("..")) {
    errors.push(`Step "${sid}" iterate.source contains disallowed '..' path traversal`);
  }

  if (typeof pattern !== "string" || pattern.trim() === "") {
    errors.push(`Step "${sid}" iterate.pattern must be a non-empty string`);
    return;
  }
  const groups = countCaptureGroups(pattern);
  if (groups === null) {
    errors.push(`Step "${sid}" iterate.pattern is not a valid regex: ${pattern}`);
  } else if (groups === 0) {
    errors.push(`Step "${sid}" iterate.pattern must contain at least one capture group`);
  }
}

/** Validate a step's `verify` value against the VerifyPolicy shape. */
function validateVerifyPolicy(v: unknown, sid: string, errors: string[]): void {
  if (v == null || typeof v !== "object" || Array.isArray(v)) {
    errors.push(`Step "${sid}" verify must be an object with a "policy" field`);
    return;
  }
  const { policy, command, prompt } = v as Record<string, unknown>;
  if (typeof policy !== "string" || !VALID_VERIFY_POLICIES.includes(policy)) {
    errors.push(`Step "${sid}" verify.policy must be one of: ${VALID_VERIFY_POLICIES.join(", ")}`);
    return;
  }
  // Policy-specific required field checks
  if (policy === "shell-command" && (typeof command !== "string" || command.trim() === "")) {
    errors.push(`Step "${sid}" verify policy "shell-command" requires a non-empty "command" field`);
  }
  if (policy === "prompt-verify" && (typeof prompt !== "string" || prompt.trim() === "")) {
    errors.push(`Step "${sid}" verify policy "prompt-verify" requires a non-empty "prompt" field`);
  }
}

/**
 * Run the per-step field checks.
 *
 * @returns true when the step has a usable (non-empty string) id
 */
function validateStepFields(step: YamlStepDef, index: number, errors: string[]): boolean {
  let idValid = true;
  if (typeof step.id !== "string" || step.id.trim() === "") {
    errors.push(`Step at index ${index} missing required field: id`);
    idValid = false;
  }
  if (typeof step.name !== "string" || step.name.trim() === "") {
    errors.push(`Step at index ${index} missing required field: name`);
  }
  if (typeof step.prompt !== "string" || step.prompt.trim() === "") {
    errors.push(`Step at index ${index} missing required field: prompt`);
  }

  const sid = stepLabel(step, index);

  // produces: path traversal guard
  if (Array.isArray(step.produces)) {
    for (const p of step.produces as unknown[]) {
      if (typeof p === "string" && p.includes("..")) {
        errors.push(`Step "${sid}" produces path contains disallowed '..': ${p}`);
      }
    }
  }
  // iterate / verify: optional, but if present must conform to their shapes
  if (step.iterate !== undefined) validateIterateConfig(step.iterate, sid, errors);
  if (step.verify !== undefined) validateVerifyPolicy(step.verify, sid, errors);

  return idValid;
}

/** Dependencies of a raw step: `requires` when it is an array, else `depends_on`, else none. */
function stepDependencies(step: YamlStepDef): unknown[] {
  if (Array.isArray(step.requires)) return step.requires as unknown[];
  if (Array.isArray(step.depends_on)) return step.depends_on as unknown[];
  return [];
}

/**
 * Depth-first search for a dependency cycle.
 *
 * @param adj — step id → ids it depends on; every listed id must also be a key
 * @returns The first cycle found as a closed path (first id repeated last), or null
 */
function findDependencyCycle(adj: Map<string, string[]>): string[] | null {
  const finished = new Set<string>();
  const onPath = new Set<string>();
  const path: string[] = [];

  const visit = (node: string): string[] | null => {
    onPath.add(node);
    path.push(node);
    for (const dep of adj.get(node) ?? []) {
      if (onPath.has(dep)) {
        // Back edge: the cycle is the current path from `dep` onward, closed with `dep`.
        return [...path.slice(path.indexOf(dep)), dep];
      }
      if (!finished.has(dep)) {
        const cycle = visit(dep);
        if (cycle) return cycle;
      }
    }
    path.pop();
    onPath.delete(node);
    finished.add(node);
    return null;
  };

  for (const id of adj.keys()) {
    if (!finished.has(id)) {
      const cycle = visit(id);
      if (cycle) return cycle;
    }
  }
  return null;
}

/** Graph-level checks; callers guarantee every step id is a non-empty string. */
function validateStepGraph(steps: YamlStepDef[], errors: string[]): void {
  // 1. Duplicate step ID check
  const idCounts = new Map<string, number>();
  for (const step of steps) {
    const id = step.id as string;
    idCounts.set(id, (idCounts.get(id) ?? 0) + 1);
  }
  let hasDuplicates = false;
  for (const [id, count] of idCounts) {
    if (count > 1) {
      hasDuplicates = true;
      errors.push(`Duplicate step id: ${id}`);
    }
  }

  const validIds = new Set(idCounts.keys());

  // 2. Dangling dependency check + 3. Self-referencing dependency check
  for (const step of steps) {
    const sid = step.id as string;
    for (const depId of stepDependencies(step)) {
      if (depId === sid) {
        errors.push(`Step '${sid}' depends on itself`);
      } else if (typeof depId !== "string" || !validIds.has(depId)) {
        errors.push(`Step '${sid}' requires unknown step '${depId}'`);
      }
    }
  }

  // 4. Cycle detection (DFS) — only when no duplicate IDs
  if (hasDuplicates) return;
  const adj = new Map<string, string[]>();
  for (const step of steps) {
    const sid = step.id as string;
    adj.set(
      sid,
      stepDependencies(step).filter(
        (d): d is string => typeof d === "string" && validIds.has(d) && d !== sid,
      ),
    );
  }
  const cycle = findDependencyCycle(adj);
  if (cycle) {
    errors.push(`Cycle detected: ${cycle.join(" → ")}`); // One cycle error is enough
  }
}

/**
 * Validate a parsed (but untyped) YAML object against the V1 workflow schema.
 *
 * Collects all errors (does not short-circuit) so a single call reveals
 * every problem with the definition. Graph-level checks (duplicate ids,
 * dangling or self dependencies, cycles) run only when every step has a
 * valid id.
 *
 * Unknown fields are silently accepted for forward compatibility.
 *
 * @param parsed — result of parsing the definition YAML
 * @returns `valid` is true exactly when `errors` is empty
 */
export function validateDefinition(parsed: unknown): { valid: boolean; errors: string[] } {
  const errors: string[] = [];
  if (parsed == null || typeof parsed !== "object") {
    return { valid: false, errors: ["Definition must be a non-null object"] };
  }
  const def = parsed as YamlWorkflowDef;

  // version: must be 1 (number)
  if (def.version === undefined || def.version === null) {
    errors.push("Missing required field: version");
  } else if (def.version !== 1) {
    errors.push(`Unsupported version: ${def.version} (expected 1)`);
  }

  // name: must be a non-empty string
  if (typeof def.name !== "string" || def.name.trim() === "") {
    errors.push("Missing or empty required field: name");
  }

  // steps: must be a non-empty array
  if (!Array.isArray(def.steps)) {
    errors.push("Missing required field: steps (must be an array)");
  } else if (def.steps.length === 0) {
    errors.push("steps must contain at least one step");
  } else {
    const rawSteps: unknown[] = def.steps;
    const steps: YamlStepDef[] = [];
    let allStepIdsValid = true;
    for (const [i, raw] of rawSteps.entries()) {
      if (raw == null || typeof raw !== "object") {
        errors.push(`Step at index ${i} is not an object`);
        allStepIdsValid = false;
        continue;
      }
      const step = raw as YamlStepDef;
      if (!validateStepFields(step, i, errors)) allStepIdsValid = false;
      steps.push(step);
    }
    if (allStepIdsValid) validateStepGraph(steps, errors);
  }

  return { valid: errors.length === 0, errors };
}
+// ─── Loading ─────────────────────────────────────────────────────────────
/**
 * Load and validate a YAML workflow definition from the filesystem.
 *
 * Reads `<defsDir>/<name>.yaml`, parses YAML, validates the V1 schema,
 * and converts snake_case YAML keys to camelCase TypeScript types.
 *
 * `params` values are stringified with `String()`, so numbers and booleans
 * become their text form. A `params` list, or a param whose value is a
 * nested list/map, is rejected: stringifying those would silently produce
 * index keys or "[object Object]". A non-object `params` value is ignored.
 *
 * `verify` and `iterate` are passed through as parsed; their nested keys are
 * not renamed.
 *
 * @param defsDir — directory containing definition YAML files
 * @param name — definition filename without extension
 * @returns Parsed and validated WorkflowDefinition
 * @throws Error if file is missing, YAML is malformed, or schema is invalid
 */
export function loadDefinition(defsDir: string, name: string): WorkflowDefinition {
  const filePath = join(defsDir, `${name}.yaml`);
  if (!existsSync(filePath)) {
    throw new Error(`Definition file not found: ${filePath}`);
  }
  const raw = readFileSync(filePath, "utf-8");

  let parsed: unknown;
  try {
    parsed = parse(raw);
  } catch (e) {
    const msg = e instanceof Error ? e.message : String(e);
    throw new Error(`Failed to parse YAML in ${filePath}: ${msg}`);
  }

  const { valid, errors } = validateDefinition(parsed);
  if (!valid) {
    throw new Error(`Invalid workflow definition in ${filePath}:\n  - ${errors.join("\n  - ")}`);
  }

  // Convert snake_case YAML → camelCase TypeScript
  const yamlDef = parsed as YamlWorkflowDef;
  const yamlSteps = yamlDef.steps as YamlStepDef[];

  let params: Record<string, string> | undefined;
  const rawParams = yamlDef.params;
  if (rawParams != null && typeof rawParams === "object") {
    if (Array.isArray(rawParams)) {
      throw new Error(
        `Invalid workflow definition in ${filePath}:\n  - params must be a map of names to scalar values, not a list`,
      );
    }
    params = Object.fromEntries(
      Object.entries(rawParams as Record<string, unknown>).map(([key, value]) => {
        if (value !== null && typeof value === "object") {
          throw new Error(
            `Invalid workflow definition in ${filePath}:\n  - params.${key} must be a scalar value`,
          );
        }
        return [key, String(value)];
      }),
    );
  }

  return {
    version: yamlDef.version as number,
    name: yamlDef.name as string,
    description: typeof yamlDef.description === "string" ? yamlDef.description : undefined,
    params,
    steps: yamlSteps.map((s) => ({
      id: s.id as string,
      name: s.name as string,
      prompt: s.prompt as string,
      // `requires` wins over the `depends_on` alias when both are present
      requires: Array.isArray(s.requires)
        ? (s.requires as string[])
        : Array.isArray(s.depends_on)
          ? (s.depends_on as string[])
          : [],
      produces: Array.isArray(s.produces) ? (s.produces as string[]) : [],
      contextFrom: Array.isArray(s.context_from) ? (s.context_from as string[]) : undefined,
      verify: s.verify as VerifyPolicy | undefined,
      iterate: (s.iterate != null && typeof s.iterate === "object")
        ? s.iterate as IterateConfig
        : undefined,
    })),
  };
}
+// ─── Parameter Substitution ──────────────────────────────────────────────
/** Regex matching `{{key}}` placeholders — captures the key name. */
const PARAM_PATTERN = /\{\{(\w+)\}\}/g;

/**
 * Replace `{{key}}` placeholders in a single prompt string.
 *
 * Exported for use by the engine on iteration-instance prompts that live
 * in GRAPH.yaml (outside the definition's step list).
 *
 * Only own properties of `merged` are used, so placeholders that happen to
 * be named after inherited object members (`{{constructor}}`,
 * `{{toString}}`, `{{__proto__}}`) are left untouched like any other
 * unknown key. Placeholders with no value are left in place verbatim.
 *
 * This function never throws and does not inspect param values; the `..`
 * path-traversal guard lives in substituteParams.
 *
 * @param prompt — text containing zero or more `{{key}}` placeholders
 * @param merged — param name → replacement value
 * @returns The prompt with every known placeholder replaced
 */
export function substitutePromptString(
  prompt: string,
  merged: Record<string, string>,
): string {
  return prompt.replace(PARAM_PATTERN, (match, key: string) => {
    const value = Object.prototype.hasOwnProperty.call(merged, key)
      ? merged[key]
      : undefined;
    return value !== undefined ? value : match;
  });
}
/**
 * Replace `{{key}}` placeholders in all step prompts with param values.
 *
 * Merge order: `definition.params` (defaults) ← `overrides` (CLI wins).
 * Returns a **new** WorkflowDefinition — the input is never mutated.
 *
 * The merged map is created without a prototype, so a placeholder named
 * after an inherited object member (e.g. `{{constructor}}`) has no value
 * and is reported as unresolved instead of being substituted.
 *
 * @param definition — definition whose step prompts are substituted
 * @param overrides — values that take precedence over `definition.params`
 * @throws Error if any param value contains `..` (path-traversal guard)
 * @throws Error if any `{{key}}` remains unresolved after substitution
 */
export function substituteParams(
  definition: WorkflowDefinition,
  overrides?: Record<string, string>,
): WorkflowDefinition {
  const merged: Record<string, string> = Object.assign(
    Object.create(null) as Record<string, string>,
    definition.params ?? {},
    overrides ?? {},
  );

  // Path-traversal guard: reject any value containing ".."
  for (const [key, value] of Object.entries(merged)) {
    if (value.includes("..")) {
      throw new Error(
        `Parameter "${key}" contains disallowed '..' (path traversal): ${value}`,
      );
    }
  }

  // Substitute in each step prompt
  const substitutedSteps = definition.steps.map((step) => ({
    ...step,
    prompt: substitutePromptString(step.prompt, merged),
  }));

  // Check for unresolved placeholders; matchAll works on a copy of the
  // shared global regex, so its lastIndex is never disturbed.
  const unresolved = new Set<string>();
  for (const step of substitutedSteps) {
    for (const m of step.prompt.matchAll(PARAM_PATTERN)) {
      const key = m[1];
      if (key !== undefined) unresolved.add(key);
    }
  }
  if (unresolved.size > 0) {
    const keys = [...unresolved].sort().join(", ");
    throw new Error(`Unresolved parameter(s) in step prompts: ${keys}`);
  }

  return {
    ...definition,
    steps: substitutedSteps,
  };
}