keystone-cli 0.5.0 → 0.6.0
This diff shows the changes between publicly released versions of the package as they appear in their public registry. It is provided for informational purposes only.
- package/README.md +55 -8
- package/package.json +5 -3
- package/src/cli.ts +33 -192
- package/src/db/memory-db.test.ts +54 -0
- package/src/db/memory-db.ts +122 -0
- package/src/db/sqlite-setup.ts +49 -0
- package/src/db/workflow-db.test.ts +41 -10
- package/src/db/workflow-db.ts +84 -28
- package/src/expression/evaluator.test.ts +19 -0
- package/src/expression/evaluator.ts +134 -39
- package/src/parser/schema.ts +41 -0
- package/src/runner/audit-verification.test.ts +23 -0
- package/src/runner/auto-heal.test.ts +64 -0
- package/src/runner/debug-repl.test.ts +74 -0
- package/src/runner/debug-repl.ts +225 -0
- package/src/runner/foreach-executor.ts +327 -0
- package/src/runner/llm-adapter.test.ts +27 -14
- package/src/runner/llm-adapter.ts +90 -112
- package/src/runner/llm-executor.test.ts +91 -6
- package/src/runner/llm-executor.ts +26 -6
- package/src/runner/mcp-client.audit.test.ts +69 -0
- package/src/runner/mcp-client.test.ts +12 -3
- package/src/runner/mcp-client.ts +199 -19
- package/src/runner/mcp-manager.ts +19 -8
- package/src/runner/mcp-server.test.ts +8 -5
- package/src/runner/mcp-server.ts +31 -17
- package/src/runner/optimization-runner.ts +305 -0
- package/src/runner/reflexion.test.ts +87 -0
- package/src/runner/shell-executor.test.ts +12 -0
- package/src/runner/shell-executor.ts +9 -6
- package/src/runner/step-executor.test.ts +46 -1
- package/src/runner/step-executor.ts +154 -60
- package/src/runner/stream-utils.test.ts +65 -0
- package/src/runner/stream-utils.ts +186 -0
- package/src/runner/workflow-runner.test.ts +4 -4
- package/src/runner/workflow-runner.ts +436 -251
- package/src/templates/agents/keystone-architect.md +6 -4
- package/src/templates/full-feature-demo.yaml +4 -4
- package/src/types/assets.d.ts +14 -0
- package/src/types/status.ts +1 -1
- package/src/ui/dashboard.tsx +38 -26
- package/src/utils/auth-manager.ts +3 -1
- package/src/utils/logger.test.ts +76 -0
- package/src/utils/logger.ts +39 -0
- package/src/utils/prompt.ts +75 -0
- package/src/utils/redactor.test.ts +86 -4
- package/src/utils/redactor.ts +48 -13
package/src/runner/llm-adapter.test.ts

```diff
@@ -272,33 +272,41 @@ describe('CopilotAdapter', () => {
 
 describe('getAdapter', () => {
   beforeEach(() => {
-
-
-
-      if (model.startsWith('copilot')) return 'copilot';
-      return 'openai';
-    });
-    // @ts-ignore
-    spyOn(ConfigLoader, 'load').mockReturnValue({
+    // Setup a clean config for each test
+    ConfigLoader.setConfig({
+      default_provider: 'openai',
       providers: {
         openai: { type: 'openai', api_key_env: 'OPENAI_API_KEY' },
         anthropic: { type: 'anthropic', api_key_env: 'ANTHROPIC_API_KEY' },
         copilot: { type: 'copilot' },
       },
+      model_mappings: {
+        'claude-*': 'anthropic',
+        'gpt-*': 'openai',
+        'copilot:*': 'copilot',
+      },
+      storage: { retention_days: 30 },
+      workflows_directory: 'workflows',
+      mcp_servers: {},
     });
   });
 
   afterEach(() => {
-
+    ConfigLoader.clear();
   });
 
   it('should return OpenAIAdapter for gpt models', () => {
+    // ConfigLoader.getProviderForModel logic will handle this
    const { adapter, resolvedModel } = getAdapter('gpt-4');
    expect(adapter).toBeInstanceOf(OpenAIAdapter);
    expect(resolvedModel).toBe('gpt-4');
  });
 
  it('should return AnthropicAdapter for claude models', () => {
+    // Explicit mapping in our mock config above covers this if ConfigLoader logic works
+    // Or we rely on model name prefix if ConfigLoader has that default logic
+    // Let's ensure the mapping exists if we removed the spy
+    // ConfigLoader.getProviderForModel uses: explicit mapping OR default provider
    const { adapter, resolvedModel } = getAdapter('claude-3');
    expect(adapter).toBeInstanceOf(AnthropicAdapter);
    expect(resolvedModel).toBe('claude-3');

@@ -311,11 +319,16 @@ describe('getAdapter', () => {
  });
 
  it('should throw error for unknown provider', () => {
-    //
-    ConfigLoader.
-
-
+    // Set config with empty providers to force error
+    ConfigLoader.setConfig({
+      default_provider: 'unknown',
+      providers: {}, // No providers configured
+      model_mappings: {},
+      storage: { retention_days: 30 },
+      workflows_directory: 'workflows',
+      mcp_servers: {},
+    });
 
-    expect(() => getAdapter('unknown-model')).toThrow(
+    expect(() => getAdapter('unknown-model')).toThrow();
  });
});
```
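The test setup above replaces `spyOn(ConfigLoader, 'load')` with the new `ConfigLoader.setConfig()` / `ConfigLoader.clear()` pair. The loader itself is not part of this diff, so the following is only a sketch of how a static test override plus glob-style `model_mappings` resolution could behave; the `KeystoneConfig` shape and the private field are assumptions, and only the method names appear in the changed tests.

```ts
// Sketch only: one way ConfigLoader.setConfig/clear could support test injection.
// The KeystoneConfig shape and the private field are assumptions; only the method
// names (load, setConfig, clear, getProviderForModel) are visible in the diff.
interface KeystoneConfig {
  default_provider: string;
  providers: Record<string, { type: string; api_key_env?: string }>;
  model_mappings: Record<string, string>;
  storage: { retention_days: number };
  workflows_directory: string;
  mcp_servers: Record<string, unknown>;
}

class ConfigLoaderSketch {
  private static override: KeystoneConfig | null = null;

  /** Inject a config directly (used by tests instead of spying on load()). */
  static setConfig(config: KeystoneConfig): void {
    ConfigLoaderSketch.override = config;
  }

  /** Drop the injected config so the next load() reads from disk again. */
  static clear(): void {
    ConfigLoaderSketch.override = null;
  }

  static load(): KeystoneConfig {
    if (ConfigLoaderSketch.override) return ConfigLoaderSketch.override;
    throw new Error('loading from the config file is not shown in this sketch');
  }

  /** Resolve a provider via explicit model_mappings, falling back to default_provider. */
  static getProviderForModel(model: string): string {
    const config = ConfigLoaderSketch.load();
    for (const [pattern, provider] of Object.entries(config.model_mappings)) {
      const matches = pattern.endsWith('*')
        ? model.startsWith(pattern.slice(0, -1))
        : model === pattern;
      if (matches) return provider;
    }
    return config.default_provider;
  }
}
```

With a config like the one set in `beforeEach` above, `getProviderForModel('claude-3')` matches the `'claude-*'` mapping, so `getAdapter('claude-3')` can return an `AnthropicAdapter` without any module spies.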
package/src/runner/llm-adapter.ts

```diff
@@ -1,5 +1,7 @@
+import { pipeline } from '@xenova/transformers';
 import { AuthManager, COPILOT_HEADERS } from '../utils/auth-manager';
 import { ConfigLoader } from '../utils/config-loader';
+import { processOpenAIStream } from './stream-utils';
 
 // Maximum response size to prevent memory exhaustion (1MB)
 const MAX_RESPONSE_SIZE = 1024 * 1024;

@@ -48,6 +50,7 @@ export interface LLMAdapter {
      onStream?: (chunk: string) => void;
    }
  ): Promise<LLMResponse>;
+  embed?(text: string, model?: string): Promise<number[]>;
 }
 
 export class OpenAIAdapter implements LLMAdapter {

@@ -94,72 +97,51 @@ export class OpenAIAdapter implements LLMAdapter {
 
    if (isStreaming) {
      if (!response.body) throw new Error('Response body is null');
-
-      const decoder = new TextDecoder();
-      let fullContent = '';
-      const toolCalls: LLMToolCall[] = [];
-
-      while (true) {
-        const { done, value } = await reader.read();
-        if (done) break;
-
-        const chunk = decoder.decode(value);
-        const lines = chunk.split('\n').filter((line) => line.trim() !== '');
-
-        for (const line of lines) {
-          if (line.includes('[DONE]')) continue;
-          if (!line.startsWith('data: ')) continue;
-
-          try {
-            const data = JSON.parse(line.slice(6));
-            const delta = data.choices[0].delta;
-
-            if (delta.content) {
-              if (fullContent.length + delta.content.length > MAX_RESPONSE_SIZE) {
-                throw new Error(`LLM response exceeds maximum size of ${MAX_RESPONSE_SIZE} bytes`);
-              }
-              fullContent += delta.content;
-              options.onStream?.(delta.content);
-            }
-
-            if (delta.tool_calls) {
-              for (const tc of delta.tool_calls) {
-                if (!toolCalls[tc.index]) {
-                  toolCalls[tc.index] = {
-                    id: tc.id,
-                    type: 'function',
-                    function: { name: '', arguments: '' },
-                  };
-                }
-                const existing = toolCalls[tc.index];
-                if (tc.function?.name) existing.function.name += tc.function.name;
-                if (tc.function?.arguments) existing.function.arguments += tc.function.arguments;
-              }
-            }
-          } catch (e) {
-            // Ignore parse errors for incomplete chunks
-          }
-        }
-      }
-
-      return {
-        message: {
-          role: 'assistant',
-          content: fullContent || null,
-          tool_calls: toolCalls.length > 0 ? toolCalls.filter(Boolean) : undefined,
-        },
-      };
+      return processOpenAIStream(response, options, 'OpenAI');
    }
 
    const data = (await response.json()) as {
      choices: { message: LLMMessage }[];
      usage?: { prompt_tokens: number; completion_tokens: number; total_tokens: number };
    };
+
+    // Validate response size to prevent memory exhaustion
+    const contentLength = data.choices[0]?.message?.content?.length ?? 0;
+    if (contentLength > MAX_RESPONSE_SIZE) {
+      throw new Error(`LLM response exceeds maximum size of ${MAX_RESPONSE_SIZE} bytes`);
+    }
+
    return {
      message: data.choices[0].message,
      usage: data.usage,
    };
  }
+
+  async embed(text: string, model = 'text-embedding-3-small'): Promise<number[]> {
+    const response = await fetch(`${this.baseUrl}/embeddings`, {
+      method: 'POST',
+      headers: {
+        'Content-Type': 'application/json',
+        Authorization: `Bearer ${this.apiKey}`,
+      },
+      body: JSON.stringify({
+        model,
+        input: text,
+      }),
+    });
+
+    if (!response.ok) {
+      const error = await response.text();
+      throw new Error(
+        `OpenAI Embeddings API error: ${response.status} ${response.statusText} - ${error}`
+      );
+    }
+
+    const data = (await response.json()) as {
+      data: { embedding: number[] }[];
+    };
+    return data.data[0].embedding;
+  }
 }
 
 export class AnthropicAdapter implements LLMAdapter {
```
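Both `OpenAIAdapter` and, further down, `CopilotAdapter` now hand their SSE handling to `processOpenAIStream` from the new `stream-utils.ts`. Only the call site appears in this diff, so the sketch below simply folds the removed inline loop into that shape; the parameter and return types are assumptions, and unlike the removed code it rethrows non-`SyntaxError` failures instead of swallowing them, mirroring the Anthropic change further down.

```ts
// Sketch: the removed inline SSE loop, refactored into the shape the diff calls
// (processOpenAIStream(response, options, providerLabel)). Types are trimmed to
// what the loop actually touches; the real stream-utils.ts may differ.
interface ToolCall {
  id: string;
  type: 'function';
  function: { name: string; arguments: string };
}
interface StreamOptions {
  onStream?: (chunk: string) => void;
}
const MAX_RESPONSE_SIZE = 1024 * 1024;

export async function processOpenAIStream(
  response: Response,
  options: StreamOptions,
  provider: string
) {
  if (!response.body) throw new Error(`${provider}: response body is null`);
  const reader = response.body.getReader();
  const decoder = new TextDecoder();
  let fullContent = '';
  const toolCalls: ToolCall[] = [];

  while (true) {
    const { done, value } = await reader.read();
    if (done) break;

    // OpenAI-style SSE: each non-empty line is "data: {json}" or "data: [DONE]"
    for (const line of decoder.decode(value).split('\n')) {
      if (!line.startsWith('data: ') || line.includes('[DONE]')) continue;
      try {
        const delta = JSON.parse(line.slice(6)).choices?.[0]?.delta;
        if (!delta) continue;
        if (delta.content) {
          if (fullContent.length + delta.content.length > MAX_RESPONSE_SIZE) {
            throw new Error(`LLM response exceeds maximum size of ${MAX_RESPONSE_SIZE} bytes`);
          }
          fullContent += delta.content;
          options.onStream?.(delta.content);
        }
        for (const tc of delta.tool_calls ?? []) {
          // Tool call fragments arrive incrementally; accumulate them by index
          toolCalls[tc.index] ??= { id: tc.id, type: 'function', function: { name: '', arguments: '' } };
          if (tc.function?.name) toolCalls[tc.index].function.name += tc.function.name;
          if (tc.function?.arguments) toolCalls[tc.index].function.arguments += tc.function.arguments;
        }
      } catch (e) {
        // Incomplete JSON chunks are expected mid-stream; rethrow real errors
        if (!(e instanceof SyntaxError)) throw e;
      }
    }
  }

  return {
    message: {
      role: 'assistant' as const,
      content: fullContent || null,
      tool_calls: toolCalls.length > 0 ? toolCalls.filter(Boolean) : undefined,
    },
  };
}
```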
package/src/runner/llm-adapter.ts

```diff
@@ -348,7 +330,15 @@ export class AnthropicAdapter implements LLMAdapter {
            }
          }
        } catch (e) {
-          //
+          // Log non-SyntaxError exceptions at warning level (they indicate real issues)
+          if (!(e instanceof SyntaxError)) {
+            console.warn(`[Anthropic Stream] Error processing chunk: ${e}`);
+          } else if (process.env.DEBUG || process.env.LLM_DEBUG) {
+            // SyntaxErrors are normal for incomplete chunks - only log in debug mode
+            process.stderr.write(
+              `[Anthropic Stream] Incomplete chunk parse: ${line.slice(0, 50)}...\n`
+            );
+          }
        }
      }
    }

@@ -383,6 +373,12 @@ export class AnthropicAdapter implements LLMAdapter {
    };
 
    const content = data.content.find((c) => c.type === 'text')?.text || null;
+
+    // Validate response size to prevent memory exhaustion
+    if (content && content.length > MAX_RESPONSE_SIZE) {
+      throw new Error(`LLM response exceeds maximum size of ${MAX_RESPONSE_SIZE} bytes`);
+    }
+
    const toolCalls = data.content
      .filter((c) => c.type === 'tool_use')
      .map((c) => ({

@@ -455,68 +451,20 @@ export class CopilotAdapter implements LLMAdapter {
    if (isStreaming) {
      // Use the same streaming logic as OpenAIAdapter since Copilot uses OpenAI API
      if (!response.body) throw new Error('Response body is null');
-
-      const decoder = new TextDecoder();
-      let fullContent = '';
-      const toolCalls: LLMToolCall[] = [];
-
-      while (true) {
-        const { done, value } = await reader.read();
-        if (done) break;
-
-        const chunk = decoder.decode(value);
-        const lines = chunk.split('\n').filter((line) => line.trim() !== '');
-
-        for (const line of lines) {
-          if (line.includes('[DONE]')) continue;
-          if (!line.startsWith('data: ')) continue;
-
-          try {
-            const data = JSON.parse(line.slice(6));
-            if (!data.choices?.[0]?.delta) continue;
-            const delta = data.choices[0].delta;
-
-            if (delta.content) {
-              if (fullContent.length + delta.content.length > MAX_RESPONSE_SIZE) {
-                throw new Error(`LLM response exceeds maximum size of ${MAX_RESPONSE_SIZE} bytes`);
-              }
-              fullContent += delta.content;
-              options.onStream?.(delta.content);
-            }
-
-            if (delta.tool_calls) {
-              for (const tc of delta.tool_calls) {
-                if (!toolCalls[tc.index]) {
-                  toolCalls[tc.index] = {
-                    id: tc.id,
-                    type: 'function',
-                    function: { name: '', arguments: '' },
-                  };
-                }
-                const existing = toolCalls[tc.index];
-                if (tc.function?.name) existing.function.name += tc.function.name;
-                if (tc.function?.arguments) existing.function.arguments += tc.function.arguments;
-              }
-            }
-          } catch (e) {
-            // Ignore parse errors
-          }
-        }
-      }
-
-      return {
-        message: {
-          role: 'assistant',
-          content: fullContent || null,
-          tool_calls: toolCalls.length > 0 ? toolCalls.filter(Boolean) : undefined,
-        },
-      };
+      return processOpenAIStream(response, options, 'Copilot');
    }
 
    const data = (await response.json()) as {
      choices: { message: LLMMessage }[];
      usage?: { prompt_tokens: number; completion_tokens: number; total_tokens: number };
    };
+
+    // Validate response size to prevent memory exhaustion
+    const contentLength = data.choices[0]?.message?.content?.length ?? 0;
+    if (contentLength > MAX_RESPONSE_SIZE) {
+      throw new Error(`LLM response exceeds maximum size of ${MAX_RESPONSE_SIZE} bytes`);
+    }
+
    return {
      message: data.choices[0].message,
      usage: data.usage,

@@ -524,7 +472,37 @@ export class CopilotAdapter implements LLMAdapter {
  }
 }
 
+export class LocalEmbeddingAdapter implements LLMAdapter {
+  // biome-ignore lint/suspicious/noExplicitAny: transformers pipeline type
+  private static extractor: any = null;
+
+  async chat(): Promise<LLMResponse> {
+    throw new Error(
+      'Local models in Keystone currently only support memory/embedding operations. ' +
+        'To use a local LLM for chat/generation, please use an OpenAI-compatible local server ' +
+        '(like Ollama, LM Studio, or LocalAI) and configure it as an OpenAI provider in your config.'
+    );
+  }
+
+  async embed(text: string, model = 'Xenova/all-MiniLM-L6-v2'): Promise<number[]> {
+    const modelToUse = model === 'local' ? 'Xenova/all-MiniLM-L6-v2' : model;
+    if (!LocalEmbeddingAdapter.extractor) {
+      LocalEmbeddingAdapter.extractor = await pipeline('feature-extraction', modelToUse);
+    }
+    const output = await LocalEmbeddingAdapter.extractor(text, {
+      pooling: 'mean',
+      normalize: true,
+    });
+    return Array.from(output.data);
+  }
+}
+
 export function getAdapter(model: string): { adapter: LLMAdapter; resolvedModel: string } {
+  if (model === 'local' || model.startsWith('local:')) {
+    const resolvedModel = model === 'local' ? 'Xenova/all-MiniLM-L6-v2' : model.substring(6);
+    return { adapter: new LocalEmbeddingAdapter(), resolvedModel };
+  }
+
  const providerName = ConfigLoader.getProviderForModel(model);
  const config = ConfigLoader.load();
  const providerConfig = config.providers[providerName];
```
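With the optional `embed?()` on the `LLMAdapter` interface and the `local` / `local:<model>` routing in `getAdapter`, embeddings can be computed without any remote provider. A hypothetical caller (not part of the package) might use it like this:

```ts
import { getAdapter } from './llm-adapter';

// Hypothetical caller: compare two memory entries with the local embedding model.
// 'local' resolves to Xenova/all-MiniLM-L6-v2 via LocalEmbeddingAdapter (see diff above);
// other adapters may or may not implement the optional embed() method, so check first.
async function similarity(a: string, b: string): Promise<number> {
  const { adapter, resolvedModel } = getAdapter('local');
  if (!adapter.embed) throw new Error('Selected adapter does not support embeddings');

  const [va, vb] = await Promise.all([
    adapter.embed(a, resolvedModel),
    adapter.embed(b, resolvedModel),
  ]);

  // The local pipeline normalizes its vectors, so the dot product is the cosine similarity.
  return va.reduce((sum, x, i) => sum + x * vb[i], 0);
}
```

Keeping `embed` optional means adapters that only implement `chat` still satisfy the interface, so callers have to check for it before use.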
package/src/runner/llm-executor.test.ts

```diff
@@ -28,7 +28,8 @@ import {
 import { executeLlmStep } from './llm-executor';
 import { MCPClient, type MCPResponse } from './mcp-client';
 import { MCPManager } from './mcp-manager';
-import type
+import { type StepResult, executeStep } from './step-executor';
+import type { Logger } from './workflow-runner';
 
 // Mock adapters
 const originalOpenAIChat = OpenAIAdapter.prototype.chat;

@@ -129,10 +130,12 @@ describe('llm-executor', () => {
    };
  };
 
-  beforeAll(() => {
+  beforeAll(async () => {
    // Mock spawn to avoid actual process creation
    const mockProcess = Object.assign(new EventEmitter(), {
-      stdout: new Readable({
+      stdout: new Readable({
+        read() {},
+      }),
      stdin: new Writable({
        write(_chunk, _encoding, cb: (error?: Error | null) => void) {
          cb();

@@ -239,6 +242,44 @@ You are a test agent.`;
    expect(result.output).toBe('LLM Response');
  });
 
+  it('should log tool call arguments', async () => {
+    const step: LlmStep = {
+      id: 'l1',
+      type: 'llm',
+      agent: 'test-agent',
+      prompt: 'trigger tool',
+      needs: [],
+      maxIterations: 10,
+    };
+    const context: ExpressionContext = { inputs: {}, steps: {} };
+
+    const executeStepFn = async (s: Step) => {
+      if (s.type === 'shell') {
+        return { status: 'success' as const, output: { stdout: 'tool result' } };
+      }
+      return { status: 'success' as const, output: 'ok' };
+    };
+
+    const logger: Logger = {
+      log: mock(() => {}),
+      error: mock(() => {}),
+      warn: mock(() => {}),
+    };
+
+    await executeLlmStep(
+      step,
+      context,
+      executeStepFn as unknown as (step: Step, context: ExpressionContext) => Promise<StepResult>,
+      logger
+    );
+
+    // Check if logger.log was called with arguments
+    // The tool call from mockChat is { name: 'test-tool', arguments: '{"val": 123}' }
+    expect(logger.log).toHaveBeenCalledWith(
+      expect.stringContaining('🛠️ Tool Call: test-tool {"val":123}')
+    );
+  });
+
  it('should support schema for JSON output', async () => {
    const step: LlmStep = {
      id: 'l1',

@@ -266,7 +307,7 @@ You are a test agent.`;
    expect(result.output).toEqual({ foo: 'bar' });
  });
 
-  it('should
+  it('should retry if LLM output fails schema validation', async () => {
    const step: LlmStep = {
      id: 'l1',
      type: 'llm',

@@ -279,7 +320,51 @@ You are a test agent.`;
    const context: ExpressionContext = { inputs: {}, steps: {} };
    const executeStepFn = mock(async () => ({ status: 'success' as const, output: 'ok' }));
 
-
+    const originalOpenAIChatInner = OpenAIAdapter.prototype.chat;
+    const originalCopilotChatInner = CopilotAdapter.prototype.chat;
+    const originalAnthropicChatInner = AnthropicAdapter.prototype.chat;
+
+    let attempt = 0;
+    const mockChat = mock(async () => {
+      attempt++;
+      if (attempt === 1) {
+        return { message: { role: 'assistant', content: 'Not JSON' } };
+      }
+      return { message: { role: 'assistant', content: '{"success": true}' } };
+    }) as unknown as typeof originalOpenAIChat;
+
+    OpenAIAdapter.prototype.chat = mockChat;
+    CopilotAdapter.prototype.chat = mockChat;
+    AnthropicAdapter.prototype.chat = mockChat;
+
+    const result = await executeLlmStep(
+      step,
+      context,
+      executeStepFn as unknown as (step: Step, context: ExpressionContext) => Promise<StepResult>
+    );
+
+    expect(result.status).toBe('success');
+    expect(result.output).toEqual({ success: true });
+    expect(attempt).toBe(2);
+
+    OpenAIAdapter.prototype.chat = originalOpenAIChatInner;
+    CopilotAdapter.prototype.chat = originalCopilotChatInner;
+    AnthropicAdapter.prototype.chat = originalAnthropicChatInner;
+  });
+
+  it('should fail after max iterations if JSON remains invalid', async () => {
+    const step: LlmStep = {
+      id: 'l1',
+      type: 'llm',
+      agent: 'test-agent',
+      prompt: 'give me invalid json',
+      needs: [],
+      maxIterations: 3,
+      schema: { type: 'object' },
+    };
+    const context: ExpressionContext = { inputs: {}, steps: {} };
+    const executeStepFn = mock(async () => ({ status: 'success' as const, output: 'ok' }));
+
    const originalOpenAIChatInner = OpenAIAdapter.prototype.chat;
    const originalCopilotChatInner = CopilotAdapter.prototype.chat;
    const originalAnthropicChatInner = AnthropicAdapter.prototype.chat;

@@ -298,7 +383,7 @@ You are a test agent.`;
      context,
      executeStepFn as unknown as (step: Step, context: ExpressionContext) => Promise<StepResult>
    )
-    ).rejects.toThrow(
+    ).rejects.toThrow('Max ReAct iterations reached');
 
    OpenAIAdapter.prototype.chat = originalOpenAIChatInner;
    CopilotAdapter.prototype.chat = originalCopilotChatInner;
```
package/src/runner/llm-executor.ts

```diff
@@ -4,12 +4,12 @@ import { ExpressionEvaluator } from '../expression/evaluator';
 import { parseAgent, resolveAgentPath } from '../parser/agent-parser';
 import type { AgentTool, LlmStep, Step } from '../parser/schema';
 import { extractJson } from '../utils/json-parser';
+import { ConsoleLogger, type Logger } from '../utils/logger.ts';
 import { RedactionBuffer, Redactor } from '../utils/redactor';
 import { type LLMMessage, getAdapter } from './llm-adapter';
 import { MCPClient } from './mcp-client';
 import type { MCPManager, MCPServerConfig } from './mcp-manager';
 import type { StepResult } from './step-executor';
-import type { Logger } from './workflow-runner';
 
 interface ToolDefinition {
   name: string;

@@ -24,7 +24,7 @@ export async function executeLlmStep(
  step: LlmStep,
  context: ExpressionContext,
  executeStepFn: (step: Step, context: ExpressionContext) => Promise<StepResult>,
-  logger: Logger =
+  logger: Logger = new ConsoleLogger(),
  mcpManager?: MCPManager,
  workflowDir?: string
): Promise<StepResult> {

@@ -249,9 +249,14 @@ export async function executeLlmStep(
      try {
        output = extractJson(output) as typeof output;
      } catch (e) {
-
-
-
+        const errorMessage = `Failed to parse LLM output as JSON matching schema: ${e instanceof Error ? e.message : String(e)}`;
+        logger.error(`  ⚠️ ${errorMessage}. Retrying...`);
+
+        messages.push({
+          role: 'user',
+          content: `Error: ${errorMessage}\n\nPlease correct your output to be valid JSON matching the schema.`,
+        });
+        continue;
      }
    }
 

@@ -264,7 +269,22 @@ export async function executeLlmStep(
 
      // Execute tools
      for (const toolCall of message.tool_calls) {
-
+        const argsStr = toolCall.function.arguments;
+        let displayArgs = '';
+        try {
+          const parsedArgs = JSON.parse(argsStr);
+          const keys = Object.keys(parsedArgs);
+          if (keys.length > 0) {
+            const formatted = JSON.stringify(parsedArgs);
+            displayArgs = formatted.length > 100 ? `${formatted.substring(0, 100)}...` : formatted;
+          }
+        } catch (e) {
+          displayArgs = argsStr.length > 100 ? `${argsStr.substring(0, 100)}...` : argsStr;
+        }
+
+        logger.log(
+          `  🛠️ Tool Call: ${toolCall.function.name}${displayArgs ? ` ${displayArgs}` : ''}`
+        );
        const toolInfo = allTools.find((t) => t.name === toolCall.function.name);
 
        if (!toolInfo) {
```
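`Logger` now comes from the new `src/utils/logger.ts` (with a `ConsoleLogger` default) instead of `workflow-runner.ts`. That file is not shown in this section; judging from the call sites here and in the tests (`log`, `warn`, `error`), a minimal version could look like the sketch below, though the real module (+39 lines, with its own tests) likely does more.

```ts
// Sketch of src/utils/logger.ts, inferred from call sites (logger.log / warn / error);
// the real file may add prefixes, levels, or redaction hooks.
export interface Logger {
  log(message: string): void;
  warn(message: string): void;
  error(message: string): void;
}

export class ConsoleLogger implements Logger {
  log(message: string): void {
    console.log(message);
  }

  warn(message: string): void {
    console.warn(message);
  }

  error(message: string): void {
    console.error(message);
  }
}
```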
package/src/runner/mcp-client.audit.test.ts

```diff
@@ -77,3 +77,72 @@ describe('MCPClient Audit Fixes', () => {
    }
  });
});
+
+describe('MCPClient SSRF Protection', () => {
+  it('should reject localhost URLs without allowInsecure', async () => {
+    // HTTP localhost is rejected for not using HTTPS
+    await expect(MCPClient.createRemote('http://localhost:8080/sse')).rejects.toThrow(
+      /SSRF Protection.*HTTPS/
+    );
+    // HTTPS localhost is rejected for being localhost
+    await expect(MCPClient.createRemote('https://localhost:8080/sse')).rejects.toThrow(
+      /SSRF Protection.*localhost/
+    );
+  });
+
+  it('should reject 127.0.0.1', async () => {
+    await expect(MCPClient.createRemote('https://127.0.0.1:8080/sse')).rejects.toThrow(
+      /SSRF Protection.*localhost/
+    );
+  });
+
+  it('should reject private IP ranges (10.x.x.x)', async () => {
+    await expect(MCPClient.createRemote('https://10.0.0.1:8080/sse')).rejects.toThrow(
+      /SSRF Protection.*private/
+    );
+  });
+
+  it('should reject private IP ranges (192.168.x.x)', async () => {
+    await expect(MCPClient.createRemote('https://192.168.1.1:8080/sse')).rejects.toThrow(
+      /SSRF Protection.*private/
+    );
+  });
+
+  it('should reject private IP ranges (172.16-31.x.x)', async () => {
+    await expect(MCPClient.createRemote('https://172.16.0.1:8080/sse')).rejects.toThrow(
+      /SSRF Protection.*private/
+    );
+    await expect(MCPClient.createRemote('https://172.31.255.1:8080/sse')).rejects.toThrow(
+      /SSRF Protection.*private/
+    );
+  });
+
+  it('should reject cloud metadata endpoints', async () => {
+    // 169.254.169.254 is caught by link-local IP range check
+    await expect(
+      MCPClient.createRemote('https://169.254.169.254/latest/meta-data/')
+    ).rejects.toThrow(/SSRF Protection.*private/);
+    // Also test the hostname-based metadata detection
+    await expect(MCPClient.createRemote('https://metadata.google.internal/sse')).rejects.toThrow(
+      /SSRF Protection.*metadata/
+    );
+  });
+
+  it('should require HTTPS by default', async () => {
+    await expect(MCPClient.createRemote('http://api.example.com/sse')).rejects.toThrow(
+      /SSRF Protection.*HTTPS/
+    );
+  });
+
+  it('should allow HTTP with allowInsecure option', async () => {
+    // This will fail due to network issues, not SSRF
+    const promise = MCPClient.createRemote(
+      'http://api.example.com/sse',
+      {},
+      100, // short timeout
+      { allowInsecure: true }
+    );
+    // Should NOT throw SSRF error, but will throw timeout/connection error
+    await expect(promise).rejects.not.toThrow(/SSRF Protection/);
+  });
+});
```
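The new `MCPClient SSRF Protection` suite pins down what `createRemote` must reject before opening an SSE connection: non-HTTPS URLs (unless `allowInsecure` is set), localhost, RFC 1918 and link-local ranges, and metadata hostnames. The real checks live in `mcp-client.ts` (+199 lines) and are not shown here; the following standalone function is only an illustration that would satisfy these tests.

```ts
// Illustrative validation matching the test expectations above; not the package's
// actual code. IPv6 hosts and DNS names that resolve to private IPs are not handled.
export function assertSafeRemoteUrl(rawUrl: string, allowInsecure = false): void {
  const url = new URL(rawUrl);
  const host = url.hostname.toLowerCase();

  if (!allowInsecure && url.protocol !== 'https:') {
    throw new Error('SSRF Protection: remote MCP servers must use HTTPS');
  }
  if (host === 'localhost' || host === '127.0.0.1') {
    throw new Error('SSRF Protection: localhost addresses are not allowed');
  }
  if (host === 'metadata.google.internal' || host.endsWith('.internal')) {
    throw new Error('SSRF Protection: cloud metadata endpoints are not allowed');
  }

  const octets = host.split('.').map(Number);
  if (octets.length === 4 && octets.every((o) => Number.isInteger(o) && o >= 0 && o <= 255)) {
    const [a, b] = octets;
    const isPrivate =
      a === 10 || // 10.0.0.0/8
      (a === 172 && b >= 16 && b <= 31) || // 172.16.0.0/12
      (a === 192 && b === 168) || // 192.168.0.0/16
      (a === 169 && b === 254) || // link-local, incl. 169.254.169.254 metadata
      a === 127; // loopback
    if (isPrivate) {
      throw new Error('SSRF Protection: private or link-local IP ranges are not allowed');
    }
  }
}
```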
package/src/runner/mcp-client.test.ts

```diff
@@ -139,7 +139,10 @@ describe('MCPClient', () => {
      return Promise.resolve(new Response(JSON.stringify({ ok: true })));
    });
 
-
+    // Use allowInsecure for testing with localhost (fetch is mocked anyway)
+    const clientPromise = MCPClient.createRemote('http://localhost:8080/sse', {}, 60000, {
+      allowInsecure: true,
+    });
 
    const client = await clientPromise;
    expect(client).toBeDefined();

@@ -185,7 +188,10 @@ describe('MCPClient', () => {
      return Promise.resolve(new Response(JSON.stringify({ ok: true })));
    });
 
-
+    // Use allowInsecure for testing with localhost (fetch is mocked anyway)
+    const client = await MCPClient.createRemote('http://localhost:8080/sse', {}, 60000, {
+      allowInsecure: true,
+    });
 
    // We can't easily hook into onMessage without reaching into internals
    // Instead, we'll test that initialize resolves correctly when the response arrives

@@ -228,7 +234,10 @@ describe('MCPClient', () => {
      )
    );
 
-
+    // Use allowInsecure for testing with localhost (fetch is mocked anyway)
+    const clientPromise = MCPClient.createRemote('http://localhost:8080/sse', {}, 60000, {
+      allowInsecure: true,
+    });
 
    await expect(clientPromise).rejects.toThrow(/SSE connection failed: 500/);
```