npm - keystone-cli - Versions diffs - 0.2.0 → 0.3.1 - Mend

keystone-cli 0.2.0 → 0.3.1

This diff shows the differences between the contents of two publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those versions as they appear in their respective public registries.

Files changed (29)

package/README.md +30 -12
package/package.json +20 -4
package/src/cli.ts +171 -27
package/src/expression/evaluator.test.ts +4 -0
package/src/expression/evaluator.ts +9 -1
package/src/parser/agent-parser.ts +11 -4
package/src/parser/config-schema.ts +11 -0
package/src/parser/schema.ts +20 -10
package/src/parser/workflow-parser.ts +5 -4
package/src/runner/llm-executor.test.ts +174 -81
package/src/runner/llm-executor.ts +8 -3
package/src/runner/mcp-client.test.ts +85 -47
package/src/runner/mcp-client.ts +235 -42
package/src/runner/mcp-manager.ts +42 -2
package/src/runner/mcp-server.test.ts +22 -15
package/src/runner/mcp-server.ts +21 -4
package/src/runner/step-executor.test.ts +51 -8
package/src/runner/step-executor.ts +69 -7
package/src/runner/workflow-runner.ts +65 -24
package/src/utils/auth-manager.test.ts +86 -0
package/src/utils/auth-manager.ts +89 -0
package/src/utils/config-loader.test.ts +30 -0
package/src/utils/config-loader.ts +11 -1
package/src/utils/mermaid.test.ts +18 -18
package/src/utils/mermaid.ts +154 -20
package/src/utils/redactor.test.ts +6 -0
package/src/utils/redactor.ts +10 -1
package/src/utils/sandbox.test.ts +29 -0
package/src/utils/sandbox.ts +61 -0

package/src/runner/llm-executor.test.ts CHANGED Viewed

@@ -1,6 +1,19 @@
-import { afterAll, beforeAll, describe, expect, it, mock, spyOn } from 'bun:test';
+import {
+  afterAll,
+  afterEach,
+  beforeAll,
+  beforeEach,
+  describe,
+  expect,
+  it,
+  mock,
+  spyOn,
+} from 'bun:test';
+import * as child_process from 'node:child_process';
+import { EventEmitter } from 'node:events';
 import { mkdirSync, writeFileSync } from 'node:fs';
 import { join } from 'node:path';
+import { Readable, Writable } from 'node:stream';
 import type { ExpressionContext } from '../expression/evaluator';
 import type { LlmStep, Step } from '../parser/schema';
 import { ConfigLoader } from '../utils/config-loader';
@@ -24,8 +37,113 @@ const originalAnthropicChat = AnthropicAdapter.prototype.chat;
 describe('llm-executor', () => {
   const agentsDir = join(process.cwd(), '.keystone', 'workflows', 'agents');
+  let spawnSpy: ReturnType<typeof spyOn>;
+  let initSpy: ReturnType<typeof spyOn>;
+  let listToolsSpy: ReturnType<typeof spyOn>;
+  let stopSpy: ReturnType<typeof spyOn>;
+  const mockChat = async (messages: unknown[], _options?: unknown) => {
+    const msgs = messages as LLMMessage[];
+    const lastMessage = msgs[msgs.length - 1];
+    const systemMessage = msgs.find((m) => m.role === 'system');
+    // If there's any tool message, just respond with final message
+    if (msgs.some((m) => m.role === 'tool')) {
+      return {
+        message: { role: 'assistant', content: 'LLM Response' },
+      };
+    }
+    if (systemMessage?.content?.includes('IMPORTANT: You must output valid JSON')) {
+      return {
+        message: { role: 'assistant', content: '```json\n{"foo": "bar"}\n```' },
+      };
+    }
+    if (lastMessage.role === 'user' && lastMessage.content?.includes('trigger tool')) {
+      return {
+        message: {
+          role: 'assistant',
+          content: null,
+          tool_calls: [
+            {
+              id: 'call-1',
+              type: 'function',
+              function: { name: 'test-tool', arguments: '{"val": 123}' },
+            },
+          ],
+        },
+      };
+    }
+    if (lastMessage.role === 'user' && lastMessage.content?.includes('trigger adhoc tool')) {
+      return {
+        message: {
+          role: 'assistant',
+          content: null,
+          tool_calls: [
+            {
+              id: 'call-adhoc',
+              type: 'function',
+              function: { name: 'adhoc-tool', arguments: '{}' },
+            },
+          ],
+        },
+      };
+    }
+    if (lastMessage.role === 'user' && lastMessage.content?.includes('trigger unknown tool')) {
+      return {
+        message: {
+          role: 'assistant',
+          content: null,
+          tool_calls: [
+            {
+              id: 'call-unknown',
+              type: 'function',
+              function: { name: 'unknown-tool', arguments: '{}' },
+            },
+          ],
+        },
+      };
+    }
+    if (lastMessage.role === 'user' && lastMessage.content?.includes('trigger mcp tool')) {
+      return {
+        message: {
+          role: 'assistant',
+          content: null,
+          tool_calls: [
+            {
+              id: 'call-mcp',
+              type: 'function',
+              function: { name: 'mcp-tool', arguments: '{}' },
+            },
+          ],
+        },
+      };
+    }
+    return {
+      message: { role: 'assistant', content: 'LLM Response' },
+    };
+  };
   beforeAll(() => {
+    // Mock spawn to avoid actual process creation
+    const mockProcess = Object.assign(new EventEmitter(), {
+      stdout: new Readable({ read() {} }),
+      stdin: new Writable({
+        write(_chunk, _encoding, cb: (error?: Error | null) => void) {
+          cb();
+        },
+      }),
+      kill: mock(() => {}),
+    });
+    spawnSpy = spyOn(child_process, 'spawn').mockReturnValue(
+      mockProcess as unknown as child_process.ChildProcess
+    );
     try {
       mkdirSync(agentsDir, { recursive: true });
     } catch (e) {}
@@ -40,68 +158,35 @@ tools:
 ---
 You are a test agent.`;
     writeFileSync(join(agentsDir, 'test-agent.md'), agentContent);
+  });
-    const mockChat = async (messages: unknown[], _options?: unknown) => {
-      const lastMessage = messages[messages.length - 1] as { content?: string };
-      const systemMessage = messages.find(
-        (m) =>
-          typeof m === 'object' &&
-          m !== null &&
-          'role' in m &&
-          (m as { role: string }).role === 'system'
-      ) as { content?: string } | undefined;
-      if (systemMessage?.content?.includes('IMPORTANT: You must output valid JSON')) {
-        return {
-          message: { role: 'assistant', content: '```json\n{"foo": "bar"}\n```' },
-        };
-      }
-      if (lastMessage?.content?.includes('trigger tool')) {
-        return {
-          message: {
-            role: 'assistant',
-            content: null,
-            tool_calls: [
-              {
-                id: 'call-1',
-                type: 'function',
-                function: { name: 'test-tool', arguments: '{"val": 123}' },
-              },
-            ],
-          },
-        };
-      }
-      if (lastMessage?.content?.includes('trigger adhoc tool')) {
-        return {
-          message: {
-            role: 'assistant',
-            content: null,
-            tool_calls: [
-              {
-                id: 'call-adhoc',
-                type: 'function',
-                function: { name: 'adhoc-tool', arguments: '{}' },
-              },
-            ],
-          },
-        };
-      }
-      return {
-        message: { role: 'assistant', content: 'LLM Response' },
-      };
-    };
+  beforeEach(() => {
+    // Global MCP mocks to avoid hangs
+    initSpy = spyOn(MCPClient.prototype, 'initialize').mockResolvedValue({
+      jsonrpc: '2.0',
+      id: 0,
+      result: { protocolVersion: '2024-11-05' },
+    } as MCPResponse);
+    listToolsSpy = spyOn(MCPClient.prototype, 'listTools').mockResolvedValue([]);
+    stopSpy = spyOn(MCPClient.prototype, 'stop').mockReturnValue(undefined);
+    // Set adapters to global mock
     OpenAIAdapter.prototype.chat = mock(mockChat) as unknown as typeof originalOpenAIChat;
     CopilotAdapter.prototype.chat = mock(mockChat) as unknown as typeof originalCopilotChat;
     AnthropicAdapter.prototype.chat = mock(mockChat) as unknown as typeof originalAnthropicChat;
   });
+  afterEach(() => {
+    initSpy.mockRestore();
+    listToolsSpy.mockRestore();
+    stopSpy.mockRestore();
+  });
   afterAll(() => {
     OpenAIAdapter.prototype.chat = originalOpenAIChat;
     CopilotAdapter.prototype.chat = originalCopilotChat;
     AnthropicAdapter.prototype.chat = originalAnthropicChat;
+    spawnSpy.mockRestore();
   });
   it('should execute a simple LLM step', async () => {
@@ -279,9 +364,12 @@ You are a test agent.`;
     const context: ExpressionContext = { inputs: {}, steps: {} };
     const executeStepFn = mock(async () => ({ status: 'success' as const, output: 'ok' }));
-    const spy = spyOn(MCPClient.prototype, 'initialize').mockRejectedValue(
-      new Error('Connect failed')
-    );
+    const createLocalSpy = spyOn(MCPClient, 'createLocal').mockImplementation(async () => {
+      const client = Object.create(MCPClient.prototype);
+      spyOn(client, 'initialize').mockRejectedValue(new Error('Connect failed'));
+      spyOn(client, 'stop').mockReturnValue(undefined);
+      return client;
+    });
     const consoleSpy = spyOn(console, 'error').mockImplementation(() => {});
     await executeLlmStep(
@@ -293,7 +381,7 @@ You are a test agent.`;
     expect(consoleSpy).toHaveBeenCalledWith(
       expect.stringContaining('Failed to connect to MCP server fail-mcp')
     );
-    spy.mockRestore();
+    createLocalSpy.mockRestore();
     consoleSpy.mockRestore();
   });
@@ -309,13 +397,14 @@ You are a test agent.`;
     const context: ExpressionContext = { inputs: {}, steps: {} };
     const executeStepFn = mock(async () => ({ status: 'success' as const, output: 'ok' }));
-    const initSpy = spyOn(MCPClient.prototype, 'initialize').mockResolvedValue({} as MCPResponse);
-    const listSpy = spyOn(MCPClient.prototype, 'listTools').mockResolvedValue([
-      { name: 'mcp-tool', inputSchema: {} },
-    ]);
-    const callSpy = spyOn(MCPClient.prototype, 'callTool').mockRejectedValue(
-      new Error('Tool failed')
-    );
+    const createLocalSpy = spyOn(MCPClient, 'createLocal').mockImplementation(async () => {
+      const client = Object.create(MCPClient.prototype);
+      spyOn(client, 'initialize').mockResolvedValue({} as MCPResponse);
+      spyOn(client, 'listTools').mockResolvedValue([{ name: 'mcp-tool', inputSchema: {} }]);
+      spyOn(client, 'callTool').mockRejectedValue(new Error('Tool failed'));
+      spyOn(client, 'stop').mockReturnValue(undefined);
+      return client;
+    });
     const originalOpenAIChatInner = OpenAIAdapter.prototype.chat;
     const originalCopilotChatInner = CopilotAdapter.prototype.chat;
@@ -351,11 +440,7 @@ You are a test agent.`;
     expect(toolErrorCaptured).toBe(true);
     OpenAIAdapter.prototype.chat = originalOpenAIChatInner;
-    CopilotAdapter.prototype.chat = originalCopilotChatInner;
-    AnthropicAdapter.prototype.chat = originalAnthropicChatInner;
-    initSpy.mockRestore();
-    listSpy.mockRestore();
-    callSpy.mockRestore();
+    createLocalSpy.mockRestore();
   });
   it('should use global MCP servers when useGlobalMcp is true', async () => {
@@ -382,10 +467,15 @@ You are a test agent.`;
     const context: ExpressionContext = { inputs: {}, steps: {} };
     const executeStepFn = mock(async () => ({ status: 'success' as const, output: 'ok' }));
-    const initSpy = spyOn(MCPClient.prototype, 'initialize').mockResolvedValue({} as MCPResponse);
-    const listSpy = spyOn(MCPClient.prototype, 'listTools').mockResolvedValue([
-      { name: 'global-tool', description: 'A global tool', inputSchema: {} },
-    ]);
+    const createLocalSpy = spyOn(MCPClient, 'createLocal').mockImplementation(async () => {
+      const client = Object.create(MCPClient.prototype);
+      spyOn(client, 'initialize').mockResolvedValue({} as MCPResponse);
+      spyOn(client, 'listTools').mockResolvedValue([
+        { name: 'global-tool', description: 'A global tool', inputSchema: {} },
+      ]);
+      spyOn(client, 'stop').mockReturnValue(undefined);
+      return client;
+    });
     let toolFound = false;
     const originalOpenAIChatInner = OpenAIAdapter.prototype.chat;
@@ -409,8 +499,7 @@ You are a test agent.`;
     expect(toolFound).toBe(true);
     OpenAIAdapter.prototype.chat = originalOpenAIChatInner;
-    initSpy.mockRestore();
-    listSpy.mockRestore();
+    createLocalSpy.mockRestore();
     ConfigLoader.clear();
   });
@@ -502,8 +591,13 @@ You are a test agent.`;
     const context: ExpressionContext = { inputs: {}, steps: {} };
     const executeStepFn = mock(async () => ({ status: 'success' as const, output: 'ok' }));
-    const initSpy = spyOn(MCPClient.prototype, 'initialize').mockResolvedValue({} as MCPResponse);
-    const listSpy = spyOn(MCPClient.prototype, 'listTools').mockResolvedValue([]);
+    const createLocalSpy = spyOn(MCPClient, 'createLocal').mockImplementation(async () => {
+      const client = Object.create(MCPClient.prototype);
+      spyOn(client, 'initialize').mockResolvedValue({} as MCPResponse);
+      spyOn(client, 'listTools').mockResolvedValue([]);
+      spyOn(client, 'stop').mockReturnValue(undefined);
+      return client;
+    });
     const originalOpenAIChatInner = OpenAIAdapter.prototype.chat;
     const mockChat = mock(async () => ({
@@ -526,12 +620,11 @@ You are a test agent.`;
     // We can check this by seeing how many times initialize was called if they were different,
     // but here we just want to ensure it didn't push the global one again.
-    // Actually, initialize will be called for 'test-mcp' (explicitly listed)
-    expect(initSpy).toHaveBeenCalledTimes(1);
+    // Actually, createLocal will be called for 'test-mcp' (explicitly listed)
+    expect(createLocalSpy).toHaveBeenCalledTimes(1);
     OpenAIAdapter.prototype.chat = originalOpenAIChatInner;
-    initSpy.mockRestore();
-    listSpy.mockRestore();
+    createLocalSpy.mockRestore();
     managerSpy.mockRestore();
     ConfigLoader.clear();
   });

package/src/runner/llm-executor.ts CHANGED Viewed

@@ -23,9 +23,10 @@ export async function executeLlmStep(
   context: ExpressionContext,
   executeStepFn: (step: Step, context: ExpressionContext) => Promise<StepResult>,
   logger: Logger = console,
-  mcpManager?: MCPManager
+  mcpManager?: MCPManager,
+  workflowDir?: string
 ): Promise<StepResult> {
-  const agentPath = resolveAgentPath(step.agent);
+  const agentPath = resolveAgentPath(step.agent, workflowDir);
   const agent = parseAgent(agentPath);
   const provider = step.provider || agent.provider;
@@ -110,8 +111,12 @@ export async function executeLlmStep(
             continue;
           }
           logger.log(`  🔌 Connecting to MCP server: ${server.name}`);
-          client = new MCPClient(server.command, server.args, server.env);
           try {
+            client = await MCPClient.createLocal(
+              server.command,
+              server.args || [],
+              server.env || {}
+            );
             await client.initialize();
             localMcpClients.push(client);
           } catch (error) {

package/src/runner/mcp-client.test.ts CHANGED Viewed

@@ -124,77 +124,115 @@ describe('MCPClient', () => {
   describe('SSE Transport', () => {
     it('should connect and receive endpoint', async () => {
-      const mockEventSource = new EventEmitter();
-      // @ts-ignore
-      mockEventSource.addEventListener = mockEventSource.on;
-      // @ts-ignore
-      mockEventSource.close = mock(() => {});
-      // @ts-ignore
-      global.EventSource = mock(() => mockEventSource);
+      let controller: ReadableStreamDefaultController;
+      const stream = new ReadableStream({
+        start(c) {
+          controller = c;
+          controller.enqueue(new TextEncoder().encode('event: endpoint\ndata: /endpoint\n\n'));
+        },
+      });
-      const clientPromise = MCPClient.createRemote('http://localhost:8080/sse');
+      const fetchMock = spyOn(global, 'fetch').mockImplementation((url) => {
+        if (url === 'http://localhost:8080/sse') {
+          return Promise.resolve(new Response(stream));
+        }
+        return Promise.resolve(new Response(JSON.stringify({ ok: true })));
+      });
-      // Simulate endpoint event
-      mockEventSource.emit('endpoint', { data: '/endpoint' });
+      const clientPromise = MCPClient.createRemote('http://localhost:8080/sse');
       const client = await clientPromise;
       expect(client).toBeDefined();
-      // Test sending a message
-      const fetchMock = spyOn(global, 'fetch').mockImplementation(() =>
-        Promise.resolve(new Response(JSON.stringify({ ok: true })))
-      );
       const initPromise = client.initialize();
       // Simulate message event (response from server)
-      mockEventSource.emit('message', {
-        data: JSON.stringify({
-          jsonrpc: '2.0',
-          id: 0,
-          result: { protocolVersion: '2024-11-05' },
-        }),
-      });
+      if (controller) {
+        controller.enqueue(
+          new TextEncoder().encode(
+            `data: ${JSON.stringify({
+              jsonrpc: '2.0',
+              id: 0,
+              result: { protocolVersion: '2024-11-05' },
+            })}\n\n`
+          )
+        );
+      }
       const response = await initPromise;
       expect(response.result?.protocolVersion).toBe('2024-11-05');
       expect(fetchMock).toHaveBeenCalledWith('http://localhost:8080/endpoint', expect.any(Object));
       client.stop();
-      // @ts-ignore
-      expect(mockEventSource.close).toHaveBeenCalled();
+      fetchMock.mockRestore();
+    });
+    it('should handle SSE with multiple events and chunked data', async () => {
+      let controller: ReadableStreamDefaultController;
+      const stream = new ReadableStream({
+        start(c) {
+          controller = c;
+          // Send endpoint event
+          controller.enqueue(new TextEncoder().encode('event: endpoint\n'));
+          controller.enqueue(new TextEncoder().encode('data: /endpoint\n\n'));
+        },
+      });
+      const fetchMock = spyOn(global, 'fetch').mockImplementation((url) => {
+        if (url === 'http://localhost:8080/sse') {
+          return Promise.resolve(new Response(stream));
+        }
+        return Promise.resolve(new Response(JSON.stringify({ ok: true })));
+      });
+      const client = await MCPClient.createRemote('http://localhost:8080/sse');
+      // We can't easily hook into onMessage without reaching into internals
+      // Instead, we'll test that initialize resolves correctly when the response arrives
+      const initPromise = client.initialize();
+      // Enqueue data in chunks
+      if (controller) {
+        controller.enqueue(new TextEncoder().encode('data: {"jsonrpc":"2.0","id":0,'));
+        controller.enqueue(
+          new TextEncoder().encode('"result":{"protocolVersion":"2024-11-05"}}\n\n')
+        );
+        // Send another event (just to test dispatching doesn't crash)
+        controller.enqueue(
+          new TextEncoder().encode(
+            'event: message\ndata: {"jsonrpc":"2.0","id":99,"result":"ignored"}\n\n'
+          )
+        );
+        // Send empty line
+        controller.enqueue(new TextEncoder().encode('\n'));
+        controller.close();
+      }
+      const response = await initPromise;
+      expect(response.result?.protocolVersion).toBe('2024-11-05');
+      client.stop();
       fetchMock.mockRestore();
-      // @ts-ignore
-      global.EventSource = undefined;
     });
     it('should handle SSE connection failure', async () => {
-      const mockEventSource = {
-        addEventListener: mock((_event: string, callback: (arg: unknown) => void) => {
-          if (_event === 'error') {
-            // Store the callback to trigger it later
-            mockEventSource.onerror = callback;
-          }
-        }),
-        onerror: null as ((arg: unknown) => void) | null,
-        close: mock(() => {}),
-      };
-      // @ts-ignore
-      global.EventSource = mock(() => mockEventSource);
+      const fetchMock = spyOn(global, 'fetch').mockImplementation(() =>
+        Promise.resolve(
+          new Response(null, {
+            status: 500,
+            statusText: 'Internal Server Error',
+          })
+        )
+      );
       const clientPromise = MCPClient.createRemote('http://localhost:8080/sse');
-      // Trigger the onerror callback
-      if (mockEventSource.onerror) {
-        mockEventSource.onerror({ message: 'Connection failed' });
-      }
-      await expect(clientPromise).rejects.toThrow(/SSE connection failed/);
+      await expect(clientPromise).rejects.toThrow(/SSE connection failed: 500/);
-      // @ts-ignore
-      global.EventSource = undefined;
+      fetchMock.mockRestore();
     });
   });
 });