npm - keystone-cli - Versions diffs - 2.0.0 → 2.1.0 - Mend

keystone-cli 2.0.0 → 2.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (57) hide show

package/README.md +43 -4
package/package.json +4 -1
package/src/cli.ts +1 -0
package/src/commands/event.ts +9 -0
package/src/commands/run.ts +17 -0
package/src/db/dynamic-state-manager.ts +12 -9
package/src/db/memory-db.test.ts +19 -1
package/src/db/memory-db.ts +101 -22
package/src/db/workflow-db.ts +181 -9
package/src/expression/evaluator.ts +4 -1
package/src/parser/config-schema.ts +6 -0
package/src/parser/schema.ts +1 -0
package/src/runner/__test__/llm-test-setup.ts +43 -11
package/src/runner/durable-timers.test.ts +1 -1
package/src/runner/executors/dynamic-executor.ts +125 -88
package/src/runner/executors/engine-executor.ts +10 -39
package/src/runner/executors/file-executor.ts +67 -0
package/src/runner/executors/foreach-executor.ts +170 -17
package/src/runner/executors/human-executor.ts +18 -0
package/src/runner/executors/llm/stream-handler.ts +103 -0
package/src/runner/executors/llm/tool-manager.ts +360 -0
package/src/runner/executors/llm-executor.ts +288 -555
package/src/runner/executors/memory-executor.ts +41 -34
package/src/runner/executors/shell-executor.ts +96 -52
package/src/runner/executors/subworkflow-executor.ts +16 -0
package/src/runner/executors/types.ts +3 -1
package/src/runner/executors/verification_fixes.test.ts +46 -0
package/src/runner/join-scheduling.test.ts +2 -1
package/src/runner/llm-adapter.integration.test.ts +10 -5
package/src/runner/llm-adapter.ts +57 -18
package/src/runner/llm-clarification.test.ts +4 -1
package/src/runner/llm-executor.test.ts +21 -7
package/src/runner/mcp-client.ts +36 -2
package/src/runner/mcp-server.ts +65 -36
package/src/runner/recovery-security.test.ts +5 -2
package/src/runner/reflexion.test.ts +6 -3
package/src/runner/services/context-builder.ts +13 -4
package/src/runner/services/workflow-validator.ts +2 -1
package/src/runner/standard-tools-ast.test.ts +4 -2
package/src/runner/standard-tools-execution.test.ts +14 -1
package/src/runner/standard-tools-integration.test.ts +6 -0
package/src/runner/standard-tools.ts +13 -10
package/src/runner/step-executor.ts +2 -2
package/src/runner/tool-integration.test.ts +4 -1
package/src/runner/workflow-runner.test.ts +23 -12
package/src/runner/workflow-runner.ts +172 -79
package/src/runner/workflow-state.ts +181 -111
package/src/ui/dashboard.tsx +17 -3
package/src/utils/config-loader.ts +4 -0
package/src/utils/constants.ts +4 -0
package/src/utils/context-injector.test.ts +27 -27
package/src/utils/context-injector.ts +68 -26
package/src/utils/process-sandbox.ts +138 -148
package/src/utils/redactor.ts +39 -9
package/src/utils/resource-loader.ts +24 -19
package/src/utils/sandbox.ts +6 -0
package/src/utils/stream-utils.ts +58 -0

package/src/db/workflow-db.ts CHANGED Viewed

@@ -38,6 +38,7 @@ export interface StepExecution {
   completed_at: string | null;
   retry_count: number;
   usage: string | null; // JSON
+  metadata: string | null; // JSON
 }
 export interface IdempotencyRecord {
@@ -84,6 +85,19 @@ export interface ThoughtEvent {
   created_at: string;
 }
+export interface StepBatchUpdate { // One queued step write applied by WorkflowDb.batchUpdateSteps
+  type: 'start' | 'complete'; // 'start' runs the start-step UPDATE, 'complete' runs the complete-step UPDATE
+  id: string; // id of the step_executions row to update
+  data: {
+    status?: StepStatusType; // defaults to 'running' for 'start' and 'success' for 'complete'
+    output?: unknown; // 'complete' only; JSON-stringified, falsy values (0, '', false) are stored as NULL
+    error?: string; // 'complete' only; a missing or empty string is stored as NULL
+    usage?: unknown; // 'complete' only; JSON-stringified, falsy values are stored as NULL
+    startedAt?: string; // 'start' only; defaults to the current time as an ISO string
+    completedAt?: string; // 'complete' only; defaults to the current time as an ISO string
+  };
+}
 /**
  * Base error class for database operations
  */
@@ -117,10 +131,13 @@ export class WorkflowDb {
   private createStepStmt!: Statement;
   private startStepStmt!: Statement;
   private completeStepStmt!: Statement;
+  private updateStepMetadataStmt!: Statement;
   private incrementRetryStmt!: Statement;
   private getStepByIterationStmt!: Statement;
   private getMainStepStmt!: Statement;
   private getStepIterationsStmt!: Statement;
+  private getStepIterationsMetadataStmt!: Statement;
+  private countStepIterationsStmt!: Statement;
   private getStepsByRunStmt!: Statement;
   private getSuccessfulRunsStmt!: Statement;
   private getLastRunStmt!: Statement;
@@ -159,6 +176,7 @@ export class WorkflowDb {
   private clearTimersByRunStmt!: Statement;
   private clearAllTimersStmt!: Statement;
   private clearAllStepCacheStmt!: Statement;
+  private getSuspendedStepsForEventStmt!: Statement;
   private isClosed = false;
   constructor(public readonly dbPath = PathResolver.resolveDbPath()) {
@@ -206,8 +224,8 @@ export class WorkflowDb {
       AND status IN ('success', 'failed', 'canceled')
     `);
     this.createStepStmt = this.db.prepare(`
-      INSERT INTO step_executions (id, run_id, step_id, iteration_index, status, retry_count)
-      VALUES (?, ?, ?, ?, ?, ?)
+      INSERT INTO step_executions (id, run_id, step_id, iteration_index, status, retry_count, metadata)
+      VALUES (?, ?, ?, ?, ?, ?, ?)
     `);
     this.startStepStmt = this.db.prepare(`
       UPDATE step_executions
@@ -219,6 +237,11 @@ export class WorkflowDb {
       SET status = ?, output = ?, error = ?, completed_at = ?, usage = ?
       WHERE id = ?
     `);
+    this.updateStepMetadataStmt = this.db.prepare(`
+      UPDATE step_executions
+      SET metadata = ?
+      WHERE id = ?
+    `);
     this.incrementRetryStmt = this.db.prepare(`
       UPDATE step_executions
       SET retry_count = retry_count + 1
@@ -241,6 +264,16 @@ export class WorkflowDb {
       WHERE run_id = ? AND step_id = ? AND iteration_index IS NOT NULL
       ORDER BY iteration_index ASC
     `);
+    this.getStepIterationsMetadataStmt = this.db.prepare(`
+      SELECT id, run_id, step_id, status, error, usage, started_at, completed_at, iteration_index, CASE WHEN output IS NOT NULL THEN '{"truncated":true}' ELSE NULL END as output
+      FROM step_executions
+      WHERE run_id = ? AND step_id = ? AND iteration_index IS NOT NULL
+      ORDER BY iteration_index ASC
+    `);
+    this.countStepIterationsStmt = this.db.prepare(`
+      SELECT count(*) as count FROM step_executions
+      WHERE run_id = ? AND step_id = ? AND iteration_index IS NOT NULL
+    `);
     this.getStepsByRunStmt = this.db.prepare(`
       SELECT * FROM step_executions
       WHERE run_id = ?
@@ -405,6 +438,14 @@ export class WorkflowDb {
     this.clearTimersByRunStmt = this.db.prepare('DELETE FROM durable_timers WHERE run_id = ?');
     this.clearAllTimersStmt = this.db.prepare('DELETE FROM durable_timers');
     this.clearAllStepCacheStmt = this.db.prepare('DELETE FROM step_cache');
+    // PERFORMANCE NOTE: This uses a LIKE query on the 'output' column, which is not indexed for text search.
+    // If the number of suspended steps grows very large, this will become a performance bottleneck.
+    // Consider adding a dedicated 'wait_event' column if this becomes a scalability issue.
+    this.getSuspendedStepsForEventStmt = this.db.prepare(`
+      SELECT run_id FROM step_executions
+      WHERE status = 'suspended'
+      AND output LIKE ?
+    `);
   }
   /**
@@ -420,13 +461,57 @@ export class WorkflowDb {
    * Batch create multiple step executions in a single transaction.
    */
   public async batchCreateSteps(
-    steps: Array<{ id: string; runId: string; stepId: string; iterationIndex: number | null }>
+    steps: Array<{
+      id: string;
+      runId: string;
+      stepId: string;
+      iterationIndex: number | null;
+      metadata?: Record<string, unknown>;
+    }>
   ): Promise<void> {
     if (steps.length === 0) return;
     await this.withRetry(() => {
       this.db.transaction(() => {
         for (const s of steps) {
-          this.createStepStmt.run(s.id, s.runId, s.stepId, s.iterationIndex, 'pending', 0);
+          this.createStepStmt.run(
+            s.id,
+            s.runId,
+            s.stepId,
+            s.iterationIndex,
+            'pending',
+            0,
+            s.metadata ? JSON.stringify(s.metadata) : null
+          );
+        }
+      })();
+    });
+  }
+  /**
+   * Batch update step status (start or complete) in a single transaction.
+   * This reduces database contention for high-concurrency scenarios.
+   */
+  public async batchUpdateSteps(updates: StepBatchUpdate[]): Promise<void> {
+    if (updates.length === 0) return;
+    await this.withRetry(() => {
+      this.db.transaction(() => {
+        for (const update of updates) {
+          if (update.type === 'start') {
+            this.startStepStmt.run(
+              update.data.status || 'running',
+              update.data.startedAt || new Date().toISOString(),
+              update.id
+            );
+          } else if (update.type === 'complete') {
+            this.completeStepStmt.run(
+              update.data.status || 'success',
+              update.data.output ? JSON.stringify(update.data.output) : null,
+              update.data.error || null,
+              update.data.completedAt || new Date().toISOString(),
+              update.data.usage ? JSON.stringify(update.data.usage) : null,
+              update.id
+            );
+          }
         }
       })();
     });
@@ -620,6 +705,28 @@ export class WorkflowDb {
         PRAGMA user_version = 6;
       `);
     }
+    // Version 7: Add composite index for step retrieval optimization
+    if (version < 7) {
+      this.db.exec(`
+        CREATE INDEX IF NOT EXISTS idx_steps_run_ordered ON step_executions(run_id, started_at, iteration_index);
+        PRAGMA user_version = 7;
+      `);
+    }
+    // Version 8: Add metadata column to step_executions
+    if (version < 8) {
+      const hasMetadata = this.db
+        .query(
+          "SELECT count(*) as count FROM pragma_table_info('step_executions') WHERE name='metadata'"
+        )
+        .get() as { count: number };
+      if (hasMetadata.count === 0) {
+        this.db.exec('ALTER TABLE step_executions ADD COLUMN metadata TEXT;');
+      }
+      this.db.exec('PRAGMA user_version = 8;');
+    }
   }
   private initSchema(): void {
@@ -656,6 +763,7 @@ export class WorkflowDb {
       CREATE INDEX IF NOT EXISTS idx_steps_run ON step_executions(run_id);
       CREATE INDEX IF NOT EXISTS idx_steps_status ON step_executions(status);
       CREATE INDEX IF NOT EXISTS idx_steps_iteration ON step_executions(run_id, step_id, iteration_index);
+      CREATE INDEX IF NOT EXISTS idx_steps_run_ordered ON step_executions(run_id, started_at, iteration_index);
       CREATE TABLE IF NOT EXISTS idempotency_records (
         idempotency_key TEXT PRIMARY KEY,
@@ -791,10 +899,32 @@ export class WorkflowDb {
       const cutoffDate = new Date();
       cutoffDate.setDate(cutoffDate.getDate() - days);
       const cutoffIso = cutoffDate.toISOString();
+      let totalDeleted = 0;
+      const BATCH_SIZE = 1000;
-      const result = this.pruneRunsStmt.run(cutoffIso);
+      // Prepare ad-hoc statement for batched deletion
+      // We use IN (SELECT ... LIMIT) because strict DELETE LIMIT is not standard SQL
+      const stmt = this.db.prepare(`
+        DELETE FROM workflow_runs
+        WHERE id IN (
+          SELECT id FROM workflow_runs
+          WHERE started_at < ?
+          AND status IN ('success', 'failed', 'canceled')
+          LIMIT ?
+        )
+      `);
-      return result.changes;
+      try {
+        while (true) {
+          const result = stmt.run(cutoffIso, BATCH_SIZE);
+          if (result.changes === 0) break;
+          totalDeleted += result.changes;
+        }
+      } finally {
+        stmt.finalize();
+      }
+      return totalDeleted;
     });
   }
@@ -810,10 +940,19 @@ export class WorkflowDb {
     id: string,
     runId: string,
     stepId: string,
-    iterationIndex: number | null = null
+    iterationIndex: number | null = null,
+    metadata?: Record<string, unknown>
   ): Promise<void> {
     await this.withRetry(() => {
-      this.createStepStmt.run(id, runId, stepId, iterationIndex, 'pending', 0);
+      this.createStepStmt.run(
+        id,
+        runId,
+        stepId,
+        iterationIndex,
+        'pending',
+        0,
+        metadata ? JSON.stringify(metadata) : null
+      );
     });
   }
@@ -823,6 +962,12 @@ export class WorkflowDb {
     });
   }
+  /**
+   * Overwrite the stored metadata of a single step execution.
+   *
+   * @param id - id of the step_executions row to update
+   * @param metadata - object serialized with JSON.stringify and written to the metadata column
+   */
+  async updateStepMetadata(id: string, metadata: Record<string, unknown>): Promise<void> {
+    // Serialization stays inside the retried callback, as in the direct-call form.
+    const writeMetadata = (): void => {
+      this.updateStepMetadataStmt.run(JSON.stringify(metadata), id);
+    };
+    await this.withRetry(writeMetadata);
+  }
   async completeStep(
     id: string,
     status: StepStatus,
@@ -874,12 +1019,29 @@ export class WorkflowDb {
   /**
    * Get all iterations for a step
    */
-  public async getStepIterations(runId: string, stepId: string): Promise<StepExecution[]> {
+  public async getStepIterations(
+    runId: string,
+    stepId: string,
+    options?: { includeOutput?: boolean } // only an explicit `includeOutput: false` selects the lightweight query
+  ): Promise<StepExecution[]> {
     return this.withRetry(() => {
+      if (options?.includeOutput === false) { // lightweight path: non-null output comes back as '{"truncated":true}'; retry_count and metadata are not selected
+        return this.getStepIterationsMetadataStmt.all(runId, stepId) as StepExecution[];
+      }
       return this.getStepIterationsStmt.all(runId, stepId) as StepExecution[];
     });
   }
+  /**
+   * Count the iteration rows recorded for a step.
+   *
+   * @param runId - workflow run to look in
+   * @param stepId - step whose iteration rows (non-null iteration_index) are counted
+   * @returns the row count, or 0 when the query yields no row
+   */
+  public async countStepIterations(runId: string, stepId: string): Promise<number> {
+    return this.withRetry(() => {
+      const row = this.countStepIterationsStmt.get(runId, stepId) as { count: number };
+      if (!row) return 0;
+      return row.count || 0;
+    });
+  }
   /**
    * Get all step executions for a workflow run
    * @note Synchronous method - wrapped in sync retry logic
@@ -1486,4 +1648,14 @@ export class WorkflowDb {
       return this.listThoughtEventsStmt.all(limit) as ThoughtEvent[];
     });
   }
+  /**
+   * Find the runs that have a suspended step waiting on the given event.
+   *
+   * Matches suspended rows whose `output` text contains `"event":<eventName encoded as a JSON string>`.
+   * This is a plain text containment check, so it assumes `output` was written by
+   * JSON.stringify without indentation (as batchUpdateSteps does).
+   *
+   * @param eventName - name of the event to look for
+   * @returns the run_id of every matching suspended step row, one entry per row
+   */
+  async getSuspendedStepsForEvent(eventName: string): Promise<string[]> {
+    return this.withRetry(() => {
+      // Encode the name the same way JSON.stringify encodes it inside `output`, so names
+      // containing quotes, backslashes or control characters still match their stored form.
+      // For names without such characters the pattern is unchanged.
+      const pattern = `%"event":${JSON.stringify(eventName)}%`;
+      // NOTE(review): `%` and `_` inside eventName still act as LIKE wildcards; closing that
+      // gap needs an ESCAPE clause on the prepared statement, which is defined elsewhere.
+      const results = this.getSuspendedStepsForEventStmt.all(pattern) as { run_id: string }[];
+      return results.map((r) => r.run_id);
+    });
+  }
 }

package/src/expression/evaluator.ts CHANGED Viewed

@@ -552,7 +552,10 @@ export class ExpressionEvaluator {
           case '+':
             // Support both string concatenation and numeric addition
             if (typeof left === 'string' || typeof right === 'string') {
-              return String(left ?? '') + String(right ?? '');
+              // Handle null/undefined as empty strings for concatenation to match template behavior
+              const leftStr = left === null || left === undefined ? '' : String(left);
+              const rightStr = right === null || right === undefined ? '' : String(right);
+              return leftStr + rightStr;
             }
             return Number(left) + Number(right);
           case '-':

package/src/parser/config-schema.ts CHANGED Viewed

@@ -116,6 +116,12 @@ export const ConfigSchema = z.object({
         .optional(),
     })
     .optional(),
+  logging: z
+    .object({
+      suppress_security_warning: z.boolean().default(false),
+      suppress_ai_sdk_warnings: z.boolean().default(false),
+    })
+    .default({}),
 });
 export type Config = z.infer<typeof ConfigSchema>;

package/src/parser/schema.ts CHANGED Viewed

@@ -140,6 +140,7 @@ export const BaseStepSchema = z.object({
   outputRetries: z.number().int().min(0).optional(), // Max retries for output validation failures
   repairStrategy: z.enum(['reask', 'repair', 'hybrid']).optional(), // Strategy for output repair
   compensate: z.lazy(() => StepSchema).optional(), // Compensation step to run on rollback
+  failFast: z.boolean().optional(), // Stop iteration on first failure (default true)
 });
 // ===== Step Type Schemas =====

package/src/runner/__test__/llm-test-setup.ts CHANGED Viewed

@@ -5,8 +5,12 @@
  * tests to opt-in to mocking rather than having it applied globally.
  */
 import { mock, spyOn } from 'bun:test';
+import { ConfigLoader } from '../../utils/config-loader';
 import * as llmAdapter from '../llm-adapter';
+// Disable AI SDK warnings for cleaner test output
+(global as any).AI_SDK_LOG_WARNINGS = false;
 // Create singleton mock functions that all test files share
 export const mockGetModel = mock();
 export const mockGetEmbeddingModel = mock();
@@ -98,7 +102,7 @@ export function createUnifiedMockModel() {
       }));
       const finalToolCalls = toolCalls && toolCalls.length > 0 ? toolCalls : undefined;
-      const text = response.message.content || ' ';
+      const text = response.message.content || '';
       // Internal AI SDK v6.0.3+ seems to expect 'content' on the result object
       // during generateText processing, even if not in the official v2 spec.
@@ -112,9 +116,8 @@ export function createUnifiedMockModel() {
             type: 'tool-call',
             toolCallId: tc.toolCallId,
             toolName: tc.toolName,
-            args: tc.args,
-            input: JSON.stringify(tc.args), // Add required input field
-          });
+            input: tc.args || (tc as any).input || {},
+          } as any);
         }
       }
@@ -174,28 +177,34 @@ export function createUnifiedMockModel() {
       const stream = new ReadableStream({
         async start(controller) {
-          if (response.message.content) {
+          if (response.message.content !== undefined && response.message.content !== null) {
             controller.enqueue({
               type: 'text-delta',
+              index: 0,
+              textDelta: response.message.content,
               delta: response.message.content,
-              text: response.message.content,
-            });
+            } as any);
           }
           const toolCalls = response.message.tool_calls?.map((tc: any) => ({
-            type: 'tool-call' as const,
+            type: 'tool-call',
             toolCallId: tc.id,
             toolName: tc.function.name,
             args:
               typeof tc.function.arguments === 'string'
                 ? JSON.parse(tc.function.arguments)
                 : tc.function.arguments,
+            input:
+              typeof tc.function.arguments === 'string'
+                ? JSON.parse(tc.function.arguments)
+                : tc.function.arguments,
             id: tc.id,
             name: tc.function.name,
-            input:
+            delta: JSON.stringify(
               typeof tc.function.arguments === 'string'
-                ? tc.function.arguments
-                : JSON.stringify(tc.function.arguments),
+                ? JSON.parse(tc.function.arguments)
+                : tc.function.arguments
+            ),
           }));
           if (toolCalls?.length) {
@@ -204,6 +213,7 @@ export function createUnifiedMockModel() {
             }
           }
+          // Finish event
           controller.enqueue({
             type: 'finish',
             finishReason: toolCalls?.length ? 'tool-calls' : 'stop',
@@ -235,6 +245,28 @@ import { resetProviderRegistry } from '../llm-adapter';
 export function setupLlmMocks() {
   resetProviderRegistry(); // Clear cache to ensure new mock is used
+  // Set a default mock configuration for tests to avoid interference from local config.yaml
+  ConfigLoader.setConfig({
+    default_provider: 'openai',
+    providers: {
+      openai: {
+        type: 'openai',
+        package: '@ai-sdk/openai',
+      },
+      anthropic: {
+        type: 'anthropic',
+        package: '@ai-sdk/anthropic',
+      },
+    },
+    model_mappings: {
+      'claude-*': 'anthropic',
+    },
+    engines: {
+      allowlist: {},
+      denylist: [],
+    },
+  } as any);
   // Provider factory (e.g. createOpenAI) returns a Provider Instance function
   const mockProviderInstance = (modelId: string) => createUnifiedMockModel();
   const mockProviderFactory = (options?: any) => mockProviderInstance;

package/src/runner/durable-timers.test.ts CHANGED Viewed

@@ -7,7 +7,7 @@ import { WorkflowSuspendedError, WorkflowWaitingError } from './step-executor';
 import { WorkflowRunner } from './workflow-runner';
 describe('Durable Timers Integration', () => {
-  const dbPath = 'test-timers.db';
+  const dbPath = `test-timers-${randomUUID()}.db`;
   let db: WorkflowDb;
   beforeAll(() => {