npm - keystone-cli - Versions diffs - 0.1.1 → 0.3.0 - Mend

keystone-cli 0.1.1 → 0.3.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (57)

package/README.md +69 -16
package/package.json +14 -3
package/src/cli.ts +183 -84
package/src/db/workflow-db.ts +0 -7
package/src/expression/evaluator.test.ts +46 -0
package/src/expression/evaluator.ts +36 -0
package/src/parser/agent-parser.test.ts +10 -0
package/src/parser/agent-parser.ts +13 -5
package/src/parser/config-schema.ts +24 -5
package/src/parser/schema.ts +1 -1
package/src/parser/workflow-parser.ts +5 -9
package/src/runner/llm-adapter.test.ts +0 -8
package/src/runner/llm-adapter.ts +33 -10
package/src/runner/llm-executor.test.ts +230 -96
package/src/runner/llm-executor.ts +9 -4
package/src/runner/mcp-client.test.ts +204 -88
package/src/runner/mcp-client.ts +349 -22
package/src/runner/mcp-manager.test.ts +73 -15
package/src/runner/mcp-manager.ts +84 -18
package/src/runner/mcp-server.test.ts +4 -1
package/src/runner/mcp-server.ts +25 -11
package/src/runner/shell-executor.ts +3 -3
package/src/runner/step-executor.test.ts +2 -2
package/src/runner/step-executor.ts +31 -16
package/src/runner/tool-integration.test.ts +21 -14
package/src/runner/workflow-runner.ts +34 -7
package/src/templates/agents/explore.md +54 -0
package/src/templates/agents/general.md +8 -0
package/src/templates/agents/keystone-architect.md +54 -0
package/src/templates/agents/my-agent.md +3 -0
package/src/templates/agents/summarizer.md +28 -0
package/src/templates/agents/test-agent.md +10 -0
package/src/templates/approval-process.yaml +36 -0
package/src/templates/basic-inputs.yaml +19 -0
package/src/templates/basic-shell.yaml +20 -0
package/src/templates/batch-processor.yaml +43 -0
package/src/templates/cleanup-finally.yaml +22 -0
package/src/templates/composition-child.yaml +13 -0
package/src/templates/composition-parent.yaml +14 -0
package/src/templates/data-pipeline.yaml +38 -0
package/src/templates/full-feature-demo.yaml +64 -0
package/src/templates/human-interaction.yaml +12 -0
package/src/templates/invalid.yaml +5 -0
package/src/templates/llm-agent.yaml +8 -0
package/src/templates/loop-parallel.yaml +37 -0
package/src/templates/retry-policy.yaml +36 -0
package/src/templates/scaffold-feature.yaml +48 -0
package/src/templates/state.db +0 -0
package/src/templates/state.db-shm +0 -0
package/src/templates/state.db-wal +0 -0
package/src/templates/stop-watch.yaml +17 -0
package/src/templates/workflow.db +0 -0
package/src/utils/auth-manager.test.ts +86 -0
package/src/utils/auth-manager.ts +89 -0
package/src/utils/config-loader.test.ts +32 -2
package/src/utils/config-loader.ts +11 -1
package/src/utils/mermaid.test.ts +27 -3

package/src/runner/llm-executor.test.ts CHANGED Viewed

@@ -1,13 +1,33 @@
-import { afterAll, beforeAll, describe, expect, it, mock, spyOn } from 'bun:test';
+import {
+  afterAll,
+  afterEach,
+  beforeAll,
+  beforeEach,
+  describe,
+  expect,
+  it,
+  mock,
+  spyOn,
+} from 'bun:test';
+import * as child_process from 'node:child_process';
+import { EventEmitter } from 'node:events';
 import { mkdirSync, writeFileSync } from 'node:fs';
 import { join } from 'node:path';
+import { Readable, Writable } from 'node:stream';
 import type { ExpressionContext } from '../expression/evaluator';
 import type { LlmStep, Step } from '../parser/schema';
-import { AnthropicAdapter, CopilotAdapter, OpenAIAdapter } from './llm-adapter';
-import { MCPClient } from './mcp-client';
+import { ConfigLoader } from '../utils/config-loader';
+import {
+  AnthropicAdapter,
+  CopilotAdapter,
+  type LLMMessage,
+  type LLMResponse,
+  type LLMTool,
+  OpenAIAdapter,
+} from './llm-adapter';
 import { executeLlmStep } from './llm-executor';
+import { MCPClient, type MCPResponse } from './mcp-client';
 import { MCPManager } from './mcp-manager';
-import { ConfigLoader } from '../utils/config-loader';
 import type { StepResult } from './step-executor';
 // Mock adapters
@@ -17,8 +37,113 @@ const originalAnthropicChat = AnthropicAdapter.prototype.chat;
 describe('llm-executor', () => {
   const agentsDir = join(process.cwd(), '.keystone', 'workflows', 'agents');
+  let spawnSpy: ReturnType<typeof spyOn>;
+  let initSpy: ReturnType<typeof spyOn>;
+  let listToolsSpy: ReturnType<typeof spyOn>;
+  let stopSpy: ReturnType<typeof spyOn>;
+  const mockChat = async (messages: unknown[], _options?: unknown) => {
+    const msgs = messages as LLMMessage[];
+    const lastMessage = msgs[msgs.length - 1];
+    const systemMessage = msgs.find((m) => m.role === 'system');
+    // If there's any tool message, just respond with final message
+    if (msgs.some((m) => m.role === 'tool')) {
+      return {
+        message: { role: 'assistant', content: 'LLM Response' },
+      };
+    }
+    if (systemMessage?.content?.includes('IMPORTANT: You must output valid JSON')) {
+      return {
+        message: { role: 'assistant', content: '```json\n{"foo": "bar"}\n```' },
+      };
+    }
+    if (lastMessage.role === 'user' && lastMessage.content?.includes('trigger tool')) {
+      return {
+        message: {
+          role: 'assistant',
+          content: null,
+          tool_calls: [
+            {
+              id: 'call-1',
+              type: 'function',
+              function: { name: 'test-tool', arguments: '{"val": 123}' },
+            },
+          ],
+        },
+      };
+    }
+    if (lastMessage.role === 'user' && lastMessage.content?.includes('trigger adhoc tool')) {
+      return {
+        message: {
+          role: 'assistant',
+          content: null,
+          tool_calls: [
+            {
+              id: 'call-adhoc',
+              type: 'function',
+              function: { name: 'adhoc-tool', arguments: '{}' },
+            },
+          ],
+        },
+      };
+    }
+    if (lastMessage.role === 'user' && lastMessage.content?.includes('trigger unknown tool')) {
+      return {
+        message: {
+          role: 'assistant',
+          content: null,
+          tool_calls: [
+            {
+              id: 'call-unknown',
+              type: 'function',
+              function: { name: 'unknown-tool', arguments: '{}' },
+            },
+          ],
+        },
+      };
+    }
+    if (lastMessage.role === 'user' && lastMessage.content?.includes('trigger mcp tool')) {
+      return {
+        message: {
+          role: 'assistant',
+          content: null,
+          tool_calls: [
+            {
+              id: 'call-mcp',
+              type: 'function',
+              function: { name: 'mcp-tool', arguments: '{}' },
+            },
+          ],
+        },
+      };
+    }
+    return {
+      message: { role: 'assistant', content: 'LLM Response' },
+    };
+  };
   beforeAll(() => {
+    // Mock spawn to avoid actual process creation
+    const mockProcess = Object.assign(new EventEmitter(), {
+      stdout: new Readable({ read() {} }),
+      stdin: new Writable({
+        write(_chunk, _encoding, cb: (error?: Error | null) => void) {
+          cb();
+        },
+      }),
+      kill: mock(() => {}),
+    });
+    spawnSpy = spyOn(child_process, 'spawn').mockReturnValue(
+      mockProcess as unknown as child_process.ChildProcess
+    );
     try {
       mkdirSync(agentsDir, { recursive: true });
     } catch (e) {}
@@ -33,68 +158,35 @@ tools:
 ---
 You are a test agent.`;
     writeFileSync(join(agentsDir, 'test-agent.md'), agentContent);
+  });
-    const mockChat = async (messages: unknown[], _options?: unknown) => {
-      const lastMessage = messages[messages.length - 1] as { content?: string };
-      const systemMessage = messages.find(
-        (m) =>
-          typeof m === 'object' &&
-          m !== null &&
-          'role' in m &&
-          (m as { role: string }).role === 'system'
-      ) as { content?: string } | undefined;
-      if (systemMessage?.content?.includes('IMPORTANT: You must output valid JSON')) {
-        return {
-          message: { role: 'assistant', content: '```json\n{"foo": "bar"}\n```' },
-        };
-      }
-      if (lastMessage?.content?.includes('trigger tool')) {
-        return {
-          message: {
-            role: 'assistant',
-            content: null,
-            tool_calls: [
-              {
-                id: 'call-1',
-                type: 'function',
-                function: { name: 'test-tool', arguments: '{"val": 123}' },
-              },
-            ],
-          },
-        };
-      }
-      if (lastMessage?.content?.includes('trigger adhoc tool')) {
-        return {
-          message: {
-            role: 'assistant',
-            content: null,
-            tool_calls: [
-              {
-                id: 'call-adhoc',
-                type: 'function',
-                function: { name: 'adhoc-tool', arguments: '{}' },
-              },
-            ],
-          },
-        };
-      }
-      return {
-        message: { role: 'assistant', content: 'LLM Response' },
-      };
-    };
+  beforeEach(() => {
+    // Global MCP mocks to avoid hangs
+    initSpy = spyOn(MCPClient.prototype, 'initialize').mockResolvedValue({
+      jsonrpc: '2.0',
+      id: 0,
+      result: { protocolVersion: '2024-11-05' },
+    } as MCPResponse);
+    listToolsSpy = spyOn(MCPClient.prototype, 'listTools').mockResolvedValue([]);
+    stopSpy = spyOn(MCPClient.prototype, 'stop').mockReturnValue(undefined);
+    // Set adapters to global mock
     OpenAIAdapter.prototype.chat = mock(mockChat) as unknown as typeof originalOpenAIChat;
     CopilotAdapter.prototype.chat = mock(mockChat) as unknown as typeof originalCopilotChat;
     AnthropicAdapter.prototype.chat = mock(mockChat) as unknown as typeof originalAnthropicChat;
   });
+  afterEach(() => {
+    initSpy.mockRestore();
+    listToolsSpy.mockRestore();
+    stopSpy.mockRestore();
+  });
   afterAll(() => {
     OpenAIAdapter.prototype.chat = originalOpenAIChat;
     CopilotAdapter.prototype.chat = originalCopilotChat;
     AnthropicAdapter.prototype.chat = originalAnthropicChat;
+    spawnSpy.mockRestore();
   });
   it('should execute a simple LLM step', async () => {
@@ -272,9 +364,12 @@ You are a test agent.`;
     const context: ExpressionContext = { inputs: {}, steps: {} };
     const executeStepFn = mock(async () => ({ status: 'success' as const, output: 'ok' }));
-    const spy = spyOn(MCPClient.prototype, 'initialize').mockRejectedValue(
-      new Error('Connect failed')
-    );
+    const createLocalSpy = spyOn(MCPClient, 'createLocal').mockImplementation(async () => {
+      const client = Object.create(MCPClient.prototype);
+      spyOn(client, 'initialize').mockRejectedValue(new Error('Connect failed'));
+      spyOn(client, 'stop').mockReturnValue(undefined);
+      return client;
+    });
     const consoleSpy = spyOn(console, 'error').mockImplementation(() => {});
     await executeLlmStep(
@@ -286,7 +381,7 @@ You are a test agent.`;
     expect(consoleSpy).toHaveBeenCalledWith(
       expect.stringContaining('Failed to connect to MCP server fail-mcp')
     );
-    spy.mockRestore();
+    createLocalSpy.mockRestore();
     consoleSpy.mockRestore();
   });
@@ -302,22 +397,21 @@ You are a test agent.`;
     const context: ExpressionContext = { inputs: {}, steps: {} };
     const executeStepFn = mock(async () => ({ status: 'success' as const, output: 'ok' }));
-    const initSpy = spyOn(MCPClient.prototype, 'initialize').mockResolvedValue(
-      {} as unknown as any
-    );
-    const listSpy = spyOn(MCPClient.prototype, 'listTools').mockResolvedValue([
-      { name: 'mcp-tool', inputSchema: {} },
-    ]);
-    const callSpy = spyOn(MCPClient.prototype, 'callTool').mockRejectedValue(
-      new Error('Tool failed')
-    );
+    const createLocalSpy = spyOn(MCPClient, 'createLocal').mockImplementation(async () => {
+      const client = Object.create(MCPClient.prototype);
+      spyOn(client, 'initialize').mockResolvedValue({} as MCPResponse);
+      spyOn(client, 'listTools').mockResolvedValue([{ name: 'mcp-tool', inputSchema: {} }]);
+      spyOn(client, 'callTool').mockRejectedValue(new Error('Tool failed'));
+      spyOn(client, 'stop').mockReturnValue(undefined);
+      return client;
+    });
     const originalOpenAIChatInner = OpenAIAdapter.prototype.chat;
     const originalCopilotChatInner = CopilotAdapter.prototype.chat;
     const originalAnthropicChatInner = AnthropicAdapter.prototype.chat;
     let toolErrorCaptured = false;
-    const mockChat = mock(async (messages: any[]) => {
+    const mockChat = mock(async (messages: LLMMessage[]) => {
       const toolResultMessage = messages.find((m) => m.role === 'tool');
       if (toolResultMessage?.content?.includes('Error: Tool failed')) {
         toolErrorCaptured = true;
@@ -331,7 +425,7 @@ You are a test agent.`;
           ],
         },
       };
-    }) as any;
+    }) as unknown as typeof originalOpenAIChat;
     OpenAIAdapter.prototype.chat = mockChat;
     CopilotAdapter.prototype.chat = mockChat;
@@ -346,11 +440,7 @@ You are a test agent.`;
     expect(toolErrorCaptured).toBe(true);
     OpenAIAdapter.prototype.chat = originalOpenAIChatInner;
-    CopilotAdapter.prototype.chat = originalCopilotChatInner;
-    AnthropicAdapter.prototype.chat = originalAnthropicChatInner;
-    initSpy.mockRestore();
-    listSpy.mockRestore();
-    callSpy.mockRestore();
+    createLocalSpy.mockRestore();
   });
   it('should use global MCP servers when useGlobalMcp is true', async () => {
@@ -377,21 +467,24 @@ You are a test agent.`;
     const context: ExpressionContext = { inputs: {}, steps: {} };
     const executeStepFn = mock(async () => ({ status: 'success' as const, output: 'ok' }));
-    const initSpy = spyOn(MCPClient.prototype, 'initialize').mockResolvedValue(
-      {} as unknown as any
-    );
-    const listSpy = spyOn(MCPClient.prototype, 'listTools').mockResolvedValue([
-      { name: 'global-tool', description: 'A global tool', inputSchema: {} },
-    ]);
+    const createLocalSpy = spyOn(MCPClient, 'createLocal').mockImplementation(async () => {
+      const client = Object.create(MCPClient.prototype);
+      spyOn(client, 'initialize').mockResolvedValue({} as MCPResponse);
+      spyOn(client, 'listTools').mockResolvedValue([
+        { name: 'global-tool', description: 'A global tool', inputSchema: {} },
+      ]);
+      spyOn(client, 'stop').mockReturnValue(undefined);
+      return client;
+    });
     let toolFound = false;
     const originalOpenAIChatInner = OpenAIAdapter.prototype.chat;
-    const mockChat = mock(async (_messages: any[], options: any) => {
-      if (options.tools?.some((t: any) => t.function.name === 'global-tool')) {
+    const mockChat = mock(async (_messages: LLMMessage[], options: { tools?: LLMTool[] }) => {
+      if (options.tools?.some((t: LLMTool) => t.function.name === 'global-tool')) {
         toolFound = true;
       }
       return { message: { role: 'assistant', content: 'hello' } };
-    }) as any;
+    }) as unknown as typeof originalOpenAIChat;
     OpenAIAdapter.prototype.chat = mockChat;
@@ -406,8 +499,7 @@ You are a test agent.`;
     expect(toolFound).toBe(true);
     OpenAIAdapter.prototype.chat = originalOpenAIChatInner;
-    initSpy.mockRestore();
-    listSpy.mockRestore();
+    createLocalSpy.mockRestore();
     ConfigLoader.clear();
   });
@@ -499,15 +591,18 @@ You are a test agent.`;
     const context: ExpressionContext = { inputs: {}, steps: {} };
     const executeStepFn = mock(async () => ({ status: 'success' as const, output: 'ok' }));
-    const initSpy = spyOn(MCPClient.prototype, 'initialize').mockResolvedValue(
-      {} as unknown as any
-    );
-    const listSpy = spyOn(MCPClient.prototype, 'listTools').mockResolvedValue([]);
+    const createLocalSpy = spyOn(MCPClient, 'createLocal').mockImplementation(async () => {
+      const client = Object.create(MCPClient.prototype);
+      spyOn(client, 'initialize').mockResolvedValue({} as MCPResponse);
+      spyOn(client, 'listTools').mockResolvedValue([]);
+      spyOn(client, 'stop').mockReturnValue(undefined);
+      return client;
+    });
     const originalOpenAIChatInner = OpenAIAdapter.prototype.chat;
     const mockChat = mock(async () => ({
       message: { role: 'assistant', content: 'hello' },
-    })) as any;
+    })) as unknown as typeof originalOpenAIChat;
     OpenAIAdapter.prototype.chat = mockChat;
     const managerSpy = spyOn(manager, 'getGlobalServers');
@@ -525,13 +620,52 @@ You are a test agent.`;
     // We can check this by seeing how many times initialize was called if they were different,
     // but here we just want to ensure it didn't push the global one again.
-    // Actually, initialize will be called for 'test-mcp' (explicitly listed)
-    expect(initSpy).toHaveBeenCalledTimes(1);
+    // Actually, createLocal will be called for 'test-mcp' (explicitly listed)
+    expect(createLocalSpy).toHaveBeenCalledTimes(1);
     OpenAIAdapter.prototype.chat = originalOpenAIChatInner;
-    initSpy.mockRestore();
-    listSpy.mockRestore();
+    createLocalSpy.mockRestore();
     managerSpy.mockRestore();
     ConfigLoader.clear();
   });
+  it('should handle object prompts by stringifying them', async () => {
+    const step: LlmStep = {
+      id: 'l1',
+      type: 'llm',
+      agent: 'test-agent',
+      prompt: '${{ steps.prev.output }}' as unknown as string,
+      needs: [],
+    };
+    const context: ExpressionContext = {
+      inputs: {},
+      steps: {
+        prev: { output: { key: 'value' }, status: 'success' },
+      },
+    };
+    let capturedPrompt = '';
+    const originalOpenAIChatInner = OpenAIAdapter.prototype.chat;
+    const mockChat = mock(async (messages: LLMMessage[]) => {
+      // console.log('MESSAGES:', JSON.stringify(messages, null, 2));
+      capturedPrompt = messages.find((m) => m.role === 'user')?.content || '';
+      return { message: { role: 'assistant', content: 'Response' } };
+    }) as unknown as typeof originalOpenAIChat;
+    OpenAIAdapter.prototype.chat = mockChat;
+    CopilotAdapter.prototype.chat = mockChat;
+    AnthropicAdapter.prototype.chat = mockChat;
+    const executeStepFn = mock(async () => ({ status: 'success' as const, output: 'ok' }));
+    await executeLlmStep(
+      step,
+      context,
+      executeStepFn as unknown as (step: Step, context: ExpressionContext) => Promise<StepResult>
+    );
+    expect(capturedPrompt).toContain('"key": "value"');
+    expect(capturedPrompt).not.toContain('[object Object]');
+    OpenAIAdapter.prototype.chat = originalOpenAIChatInner;
+  });
 });

package/src/runner/llm-executor.ts CHANGED Viewed

@@ -23,14 +23,15 @@ export async function executeLlmStep(
   context: ExpressionContext,
   executeStepFn: (step: Step, context: ExpressionContext) => Promise<StepResult>,
   logger: Logger = console,
-  mcpManager?: MCPManager
+  mcpManager?: MCPManager,
+  workflowDir?: string
 ): Promise<StepResult> {
-  const agentPath = resolveAgentPath(step.agent);
+  const agentPath = resolveAgentPath(step.agent, workflowDir);
   const agent = parseAgent(agentPath);
   const provider = step.provider || agent.provider;
   const model = step.model || agent.model || 'gpt-4o';
-  const prompt = ExpressionEvaluator.evaluate(step.prompt, context) as string;
+  const prompt = ExpressionEvaluator.evaluateString(step.prompt, context);
   const fullModelString = provider ? `${provider}:${model}` : model;
   const { adapter, resolvedModel } = getAdapter(fullModelString);
@@ -110,8 +111,12 @@ export async function executeLlmStep(
             continue;
           }
           logger.log(`  🔌 Connecting to MCP server: ${server.name}`);
-          client = new MCPClient(server.command, server.args, server.env);
           try {
+            client = await MCPClient.createLocal(
+              server.command,
+              server.args || [],
+              server.env || {}
+            );
             await client.initialize();
             localMcpClients.push(client);
           } catch (error) {