npm - keystone-cli - Versions diffs - 0.8.0 → 1.0.0 - Mend

keystone-cli 0.8.0 → 1.0.0

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package versions as they appear in their respective public registries.

Files changed (103)

package/README.md +486 -54
package/package.json +8 -2
package/src/__fixtures__/index.ts +100 -0
package/src/cli.ts +809 -90
package/src/db/memory-db.ts +35 -1
package/src/db/workflow-db.test.ts +24 -0
package/src/db/workflow-db.ts +469 -14
package/src/expression/evaluator.ts +68 -4
package/src/parser/agent-parser.ts +6 -3
package/src/parser/config-schema.ts +38 -2
package/src/parser/schema.ts +192 -7
package/src/parser/test-schema.ts +29 -0
package/src/parser/workflow-parser.test.ts +54 -0
package/src/parser/workflow-parser.ts +153 -7
package/src/runner/aggregate-error.test.ts +57 -0
package/src/runner/aggregate-error.ts +46 -0
package/src/runner/audit-verification.test.ts +2 -2
package/src/runner/auto-heal.test.ts +1 -1
package/src/runner/blueprint-executor.test.ts +63 -0
package/src/runner/blueprint-executor.ts +157 -0
package/src/runner/concurrency-limit.test.ts +82 -0
package/src/runner/debug-repl.ts +18 -3
package/src/runner/durable-timers.test.ts +200 -0
package/src/runner/engine-executor.test.ts +464 -0
package/src/runner/engine-executor.ts +491 -0
package/src/runner/foreach-executor.ts +30 -12
package/src/runner/llm-adapter.test.ts +282 -5
package/src/runner/llm-adapter.ts +581 -8
package/src/runner/llm-clarification.test.ts +79 -21
package/src/runner/llm-errors.ts +83 -0
package/src/runner/llm-executor.test.ts +258 -219
package/src/runner/llm-executor.ts +226 -29
package/src/runner/mcp-client.ts +70 -3
package/src/runner/mcp-manager.test.ts +52 -52
package/src/runner/mcp-manager.ts +12 -5
package/src/runner/mcp-server.test.ts +117 -78
package/src/runner/mcp-server.ts +13 -4
package/src/runner/optimization-runner.ts +48 -31
package/src/runner/reflexion.test.ts +1 -1
package/src/runner/resource-pool.test.ts +113 -0
package/src/runner/resource-pool.ts +164 -0
package/src/runner/shell-executor.ts +130 -32
package/src/runner/standard-tools-integration.test.ts +36 -36
package/src/runner/standard-tools.test.ts +18 -0
package/src/runner/standard-tools.ts +110 -37
package/src/runner/step-executor.test.ts +176 -16
package/src/runner/step-executor.ts +530 -86
package/src/runner/stream-utils.test.ts +14 -0
package/src/runner/subflow-outputs.test.ts +103 -0
package/src/runner/test-harness.ts +161 -0
package/src/runner/tool-integration.test.ts +73 -79
package/src/runner/workflow-runner.test.ts +492 -15
package/src/runner/workflow-runner.ts +1438 -79
package/src/runner/workflow-subflows.test.ts +255 -0
package/src/templates/agents/keystone-architect.md +17 -12
package/src/templates/agents/tester.md +21 -0
package/src/templates/child-rollback.yaml +11 -0
package/src/templates/decompose-implement.yaml +53 -0
package/src/templates/decompose-problem.yaml +159 -0
package/src/templates/decompose-research.yaml +52 -0
package/src/templates/decompose-review.yaml +51 -0
package/src/templates/dev.yaml +134 -0
package/src/templates/engine-example.yaml +33 -0
package/src/templates/fan-out-fan-in.yaml +61 -0
package/src/templates/memory-service.yaml +1 -1
package/src/templates/parent-rollback.yaml +16 -0
package/src/templates/robust-automation.yaml +1 -1
package/src/templates/scaffold-feature.yaml +29 -27
package/src/templates/scaffold-generate.yaml +41 -0
package/src/templates/scaffold-plan.yaml +53 -0
package/src/types/status.ts +3 -0
package/src/ui/dashboard.tsx +4 -3
package/src/utils/assets.macro.ts +36 -0
package/src/utils/auth-manager.ts +585 -8
package/src/utils/blueprint-utils.test.ts +49 -0
package/src/utils/blueprint-utils.ts +80 -0
package/src/utils/circuit-breaker.test.ts +177 -0
package/src/utils/circuit-breaker.ts +160 -0
package/src/utils/config-loader.test.ts +100 -13
package/src/utils/config-loader.ts +44 -17
package/src/utils/constants.ts +62 -0
package/src/utils/error-renderer.test.ts +267 -0
package/src/utils/error-renderer.ts +320 -0
package/src/utils/json-parser.test.ts +4 -0
package/src/utils/json-parser.ts +18 -1
package/src/utils/mermaid.ts +4 -0
package/src/utils/paths.test.ts +46 -0
package/src/utils/paths.ts +70 -0
package/src/utils/process-sandbox.test.ts +128 -0
package/src/utils/process-sandbox.ts +293 -0
package/src/utils/rate-limiter.test.ts +143 -0
package/src/utils/rate-limiter.ts +221 -0
package/src/utils/redactor.test.ts +23 -15
package/src/utils/redactor.ts +65 -25
package/src/utils/resource-loader.test.ts +54 -0
package/src/utils/resource-loader.ts +158 -0
package/src/utils/sandbox.test.ts +69 -4
package/src/utils/sandbox.ts +69 -6
package/src/utils/schema-validator.ts +65 -0
package/src/utils/workflow-registry.test.ts +57 -0
package/src/utils/workflow-registry.ts +45 -25
/package/src/expression/{evaluator.audit.test.ts → evaluator-audit.test.ts} +0 -0
/package/src/runner/{mcp-client.audit.test.ts → mcp-client-audit.test.ts} +0 -0

package/src/runner/step-executor.test.ts CHANGED Viewed

@@ -13,9 +13,11 @@ import * as dns from 'node:dns/promises';
 import { mkdirSync, rmSync } from 'node:fs';
 import { tmpdir } from 'node:os';
 import { join } from 'node:path';
+import * as readlinePromises from 'node:readline/promises';
 import type { MemoryDb } from '../db/memory-db';
 import type { ExpressionContext } from '../expression/evaluator';
 import type {
+  EngineStep,
   FileStep,
   HumanStep,
   RequestStep,
@@ -23,18 +25,12 @@ import type {
   SleepStep,
   WorkflowStep,
 } from '../parser/schema';
+import { ConfigLoader } from '../utils/config-loader';
 import type { SafeSandbox } from '../utils/sandbox';
 import type { getAdapter } from './llm-adapter';
+import type { executeLlmStep } from './llm-executor';
 import { executeStep } from './step-executor';
-// Mock executeLlmStep
-mock.module('./llm-executor', () => ({
-  // @ts-ignore
-  executeLlmStep: mock((_step, _context, _callback) => {
-    return Promise.resolve({ status: 'success', output: 'llm-output' });
-  }),
-}));
 interface StepOutput {
   stdout: string;
   stderr: string;
@@ -46,16 +42,11 @@ interface RequestOutput {
   data: unknown;
 }
-// Mock node:readline/promises
 const mockRl = {
   question: mock(() => Promise.resolve('')),
   close: mock(() => {}),
 };
-mock.module('node:readline/promises', () => ({
-  createInterface: mock(() => mockRl),
-}));
 describe('step-executor', () => {
   let context: ExpressionContext;
@@ -84,6 +75,10 @@ describe('step-executor', () => {
     };
   });
+  afterEach(() => {
+    ConfigLoader.clear();
+  });
   describe('shell', () => {
     it('should execute shell command', async () => {
       const step: ShellStep = {
@@ -313,6 +308,97 @@ describe('step-executor', () => {
       expect(result.status).toBe('failed');
       expect(result.error).toBe('Script failed');
     });
+    it('should pass logger to sandbox execution', async () => {
+      const logger = { log: mock(() => {}) };
+      // @ts-ignore
+      const step = {
+        id: 's1',
+        type: 'script',
+        run: 'return 1',
+        allowInsecure: true,
+      };
+      const mockSandbox = {
+        execute: async (
+          _code: string,
+          _context: Record<string, unknown>,
+          options?: { logger?: unknown }
+        ) => {
+          expect(options?.logger).toBe(logger);
+          return 'ok';
+        },
+      };
+      const result = await executeStep(
+        step,
+        context,
+        logger as unknown as Parameters<typeof executeStep>[2],
+        {
+          sandbox: mockSandbox as unknown as Parameters<typeof executeStep>[3]['sandbox'],
+        }
+      );
+      expect(result.status).toBe('success');
+    });
+  });
+  describe('engine', () => {
+    const artifactRoot = join(tempDir, 'engine-artifacts');
+    const setEngineConfig = (
+      allowlist: Record<string, { command: string; version: string; versionArgs?: string[] }>
+    ) => {
+      ConfigLoader.setConfig({
+        default_provider: 'openai',
+        providers: {},
+        model_mappings: {},
+        storage: { retention_days: 30, redact_secrets_at_rest: true },
+        mcp_servers: {},
+        engines: { allowlist, denylist: [] },
+        concurrency: { default: 10, pools: { llm: 2, shell: 5, http: 10, engine: 2 } },
+      });
+    };
+    it('should execute engine command and parse summary', async () => {
+      const version = (Bun.version || process.versions?.bun || '') as string;
+      setEngineConfig({ bun: { command: 'bun', version } });
+      const step: EngineStep = {
+        id: 'e1',
+        type: 'engine',
+        command: 'bun',
+        args: ['-e', 'console.log(JSON.stringify({ ok: true }))'],
+        env: { PATH: process.env.PATH || '' },
+        cwd: process.cwd(),
+      };
+      const result = await executeStep(step, context, undefined, { artifactRoot });
+      expect(result.status).toBe('success');
+      const output = result.output as { summary: { ok: boolean }; artifactPath?: string };
+      expect(output.summary).toEqual({ ok: true });
+      expect(output.artifactPath).toBeTruthy();
+      const artifactText = await Bun.file(output.artifactPath as string).text();
+      expect(artifactText).toContain('"ok": true');
+    });
+    it('should fail when engine command is not allowlisted', async () => {
+      setEngineConfig({});
+      const step: EngineStep = {
+        id: 'e1',
+        type: 'engine',
+        command: 'bun',
+        args: ['-e', 'console.log(JSON.stringify({ ok: true }))'],
+        env: { PATH: process.env.PATH || '' },
+        cwd: process.cwd(),
+      };
+      const result = await executeStep(step, context, undefined, { artifactRoot });
+      expect(result.status).toBe('failed');
+      expect(result.error).toContain('allowlist');
+    });
   });
   describe('memory', () => {
@@ -322,7 +408,7 @@ describe('step-executor', () => {
     };
     const mockGetAdapter = mock((model) => {
-      if (model === 'no-embed') return { adapter: {}, resolvedModel: model };
+      if (model === 'local:no-embed') return { adapter: {}, resolvedModel: model };
       return {
         adapter: {
           embed: mock((text) => Promise.resolve([0.1, 0.2, 0.3])),
@@ -343,7 +429,13 @@ describe('step-executor', () => {
     it('should fail if adapter does not support embedding', async () => {
       // @ts-ignore
-      const step = { id: 'm1', type: 'memory', op: 'store', text: 'foo', model: 'no-embed' };
+      const step = {
+        id: 'm1',
+        type: 'memory',
+        op: 'store',
+        text: 'foo',
+        model: 'local:no-embed',
+      };
       // @ts-ignore
       const result = await executeStep(step, context, undefined, {
         memoryDb: mockMemoryDb as unknown as MemoryDb,
@@ -353,6 +445,18 @@ describe('step-executor', () => {
       expect(result.error).toContain('does not support embeddings');
     });
+    it('should fail for non-local embedding models', async () => {
+      // @ts-ignore
+      const step = { id: 'm1', type: 'memory', op: 'store', text: 'foo', model: 'openai' };
+      // @ts-ignore
+      const result = await executeStep(step, context, undefined, {
+        memoryDb: mockMemoryDb as unknown as MemoryDb,
+        getAdapter: mockGetAdapter as unknown as typeof getAdapter,
+      });
+      expect(result.status).toBe('failed');
+      expect(result.error).toContain('only support local embeddings');
+    });
     it('should store memory', async () => {
       // @ts-ignore
       const step = {
@@ -585,17 +689,67 @@ describe('step-executor', () => {
       expect(result.error).toContain('HTTP 400: Bad Request');
       expect(result.error).toContain('Response Body: {"error": "bad request details"}');
     });
+    it('should drop auth headers on cross-origin redirects', async () => {
+      // @ts-ignore
+      global.fetch
+        .mockResolvedValueOnce(
+          new Response('', {
+            status: 302,
+            headers: { Location: 'https://other.example.com/next' },
+          })
+        )
+        .mockResolvedValueOnce(new Response('ok'));
+      const step: RequestStep = {
+        id: 'req-redirect',
+        type: 'request',
+        needs: [],
+        url: 'https://api.example.com/start',
+        method: 'GET',
+        headers: { Authorization: 'Bearer token' },
+      };
+      const result = await executeStep(step, context);
+      expect(result.status).toBe('success');
+      // @ts-ignore
+      const secondCall = global.fetch.mock.calls[1][1];
+      expect(secondCall.headers.Authorization).toBeUndefined();
+    });
+    it('should allow insecure request when allowInsecure is true', async () => {
+      // @ts-ignore
+      global.fetch.mockResolvedValue(new Response('ok'));
+      const step: RequestStep = {
+        id: 'req-insecure',
+        type: 'request',
+        needs: [],
+        url: 'http://localhost/test',
+        method: 'GET',
+        allowInsecure: true,
+      };
+      const result = await executeStep(step, context);
+      expect(result.status).toBe('success');
+    });
   });
   describe('human', () => {
     const originalIsTTY = process.stdin.isTTY;
+    let createInterfaceSpy: ReturnType<typeof spyOn>;
     beforeEach(() => {
       process.stdin.isTTY = true;
+      createInterfaceSpy = spyOn(readlinePromises, 'createInterface').mockReturnValue(
+        mockRl as unknown as ReturnType<typeof readlinePromises.createInterface>
+      );
     });
     afterEach(() => {
       process.stdin.isTTY = originalIsTTY;
+      createInterfaceSpy.mockRestore();
     });
     it('should handle human confirmation', async () => {
@@ -737,7 +891,13 @@ describe('step-executor', () => {
         type: 'llm',
         prompt: 'hello',
       };
-      const result = await executeStep(step, context);
+      const executeLlmStepMock = mock(async () => ({
+        status: 'success',
+        output: 'llm-output',
+      })) as unknown as typeof executeLlmStep;
+      const result = await executeStep(step, context, undefined, {
+        executeLlmStep: executeLlmStepMock,
+      });
       expect(result.status).toBe('success');
       expect(result.output).toBe('llm-output');
     });