@mcpjam/sdk 0.1.4 → 0.8.0

package/README.md CHANGED
@@ -1,124 +1,372 @@
  # @mcpjam/sdk
 
- The official MCPJam SDK provides utilities for building, testing, and developing MCP clients and servers. Built on top of the [@modelcontextprotocol/sdk](https://github.com/modelcontextprotocol/sdk), it offers high-level abstractions and tools to accelerate MCP development.
+ Use the MCPJam SDK to write unit tests and evals for your MCP server.
 
- [![npm version](https://img.shields.io/npm/v/@mcpjam/sdk?style=for-the-badge&color=blue)](https://www.npmjs.com/package/@mcpjam/sdk)
- [![License: Apache 2.0](https://img.shields.io/badge/License-Apache%202.0-blue.svg?style=for-the-badge)](https://opensource.org/licenses/Apache-2.0)
-
- # Installation
+ ## Installation
 
  ```bash
  npm install @mcpjam/sdk
  ```
 
- # Key Features
+ Compatible with your favorite testing frameworks like [Jest](https://jestjs.io/) and [Vitest](https://vitest.dev/).
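+
+ For example, a minimal Vitest config (a sketch; the values are illustrative, not SDK requirements) enables the global `describe`/`test`/`expect` style used below and gives server startup and teardown enough time:
+
+ ```ts
+ // vitest.config.ts (a minimal sketch)
+ import { defineConfig } from "vitest/config";
+
+ export default defineConfig({
+   test: {
+     globals: true,       // use describe/test/expect without imports
+     testTimeout: 30_000, // spawning an MCP server over STDIO can take a few seconds
+     hookTimeout: 30_000, // beforeAll/afterAll also start and stop servers
+   },
+ });
+ ```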
 
- ## MCPClientManager
+ ## Quick Start
 
- The primary utility in the SDK is `MCPClientManager`, a powerful client manager for connecting to and interacting with MCP servers:
+ ### Unit Test
 
- - **Multi-server support** - Manage multiple MCP server connections simultaneously
- - **All transports** - STDIO, HTTP/SSE, and Streamable HTTP support
- - **Lifecycle management** - Automatic connection handling and cleanup
- - **Tools, resources, prompts** - Full MCP protocol support including elicitation
- - **Agent framework integration** - Built-in adapters for Vercel AI SDK and other popular libraries
- - **OAuth & authentication** - Bearer token and custom header support
+ Test the individual parts and request/response flow of your MCP server. MCP unit tests are deterministic.
 
- ### Use Cases
+ ```ts
+ import { MCPClientManager } from "@mcpjam/sdk";
 
- The SDK is designed for:
+ describe("Everything MCP example", () => {
+   let manager: MCPClientManager;
+
+   beforeAll(async () => {
+     manager = new MCPClientManager();
+     await manager.connectToServer("everything", {
+       command: "npx",
+       args: ["-y", "@modelcontextprotocol/server-everything"],
+     });
+   });
+
+   afterAll(async () => {
+     await manager.disconnectServer("everything");
+   });
+
+   test("server has expected tools", async () => {
+     const tools = await manager.listTools("everything");
+     expect(tools.tools.map((t) => t.name)).toContain("get-sum");
+   });
+
+   test("get-sum tool returns correct result", async () => {
+     const result = await manager.executeTool("everything", "get-sum", { a: 2, b: 3 });
+     expect(result.content[0].text).toBe("5");
+   });
+ });
+ ```
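+
+ The same pattern covers the other MCP primitives exposed by `MCPClientManager` (see the API reference below). A sketch, to be placed inside the same `describe` block; what a server actually exposes depends on the server under test:
+
+ ```ts
+ // Sketch: additional unit tests using the same connected manager
+ test("server exposes resources", async () => {
+   const resources = await manager.listResources("everything");
+   expect(resources.resources.length).toBeGreaterThan(0);
+ });
+
+ test("server exposes prompts", async () => {
+   const prompts = await manager.listPrompts("everything");
+   expect(prompts.prompts.length).toBeGreaterThan(0);
+ });
+ ```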
 
- - **Building AI agents** - Connect agents to MCP servers for tool access
- - **Creating MCP clients** - Build custom clients with full protocol support
- - **Testing MCP servers** - Write unit tests and E2E tests for your servers
- - **LLM applications** - Add MCP support to chat applications and AI workflows
+ ### MCP Evals
 
- ### Quick Start
+ Test that an LLM correctly understands how to use your MCP server. Evals are non-deterministic, so multiple runs are needed.
 
  ```ts
- import { MCPClientManager } from "@mcpjam/sdk";
-
- // Initialize with server configurations
- const manager = new MCPClientManager({
-   // STDIO server
-   filesystem: {
-     command: "npx",
-     args: ["-y", "@modelcontextprotocol/server-filesystem", "/tmp"],
-   },
-   // HTTP/SSE server with authentication
-   asana: {
-     url: new URL("https://mcp.asana.com/sse"),
-     requestInit: {
-       headers: {
-         Authorization: "Bearer YOUR_TOKEN",
+ import { MCPClientManager, TestAgent, EvalTest } from "@mcpjam/sdk";
+
+ describe("Asana MCP Evals", () => {
+   let manager: MCPClientManager;
+   let agent: TestAgent;
+
+   beforeAll(async () => {
+     manager = new MCPClientManager();
+     await manager.connectToServer("asana", {
+       url: "https://mcp.asana.com/sse",
+       requestInit: {
+         headers: { Authorization: `Bearer ${process.env.ASANA_TOKEN}` },
        },
-     },
-   },
- });
+     });
+
+     agent = new TestAgent({
+       tools: await manager.getToolsForAiSdk(["asana"]),
+       model: "openai/gpt-4o",
+       apiKey: process.env.OPENAI_API_KEY!,
+     });
+   });
+
+   afterAll(async () => {
+     await manager.disconnectServer("asana");
+   });
+
+   // Single-turn eval
+   test("list workspaces > 80% accuracy", async () => {
+     const evalTest = new EvalTest({
+       name: "list-workspaces",
+       test: async (agent) => {
+         const result = await agent.prompt("Show me all my Asana workspaces");
+         return result.hasToolCall("asana_list_workspaces");
+       },
+     });
+
+     await evalTest.run(agent, {
+       iterations: 10,
+       onFailure: (report) => console.error(report), // Print the report when a test iteration fails.
+     });
+
+     expect(evalTest.accuracy()).toBeGreaterThan(0.8); // Pass threshold
+   });
+
+   // Multi-turn eval
+   test("get user then list projects > 80% accuracy", async () => {
+     const evalTest = new EvalTest({
+       name: "user-then-projects",
+       test: async (agent) => {
+         const r1 = await agent.prompt("Who am I in Asana?");
+         if (!r1.hasToolCall("asana_get_user")) return false;
+
+         const r2 = await agent.prompt("Now list my projects", { context: [r1] }); // Continue the conversation from the previous prompt
+         return r2.hasToolCall("asana_get_projects");
+       },
+     });
+
+     await evalTest.run(agent, {
+       iterations: 5,
+       onFailure: (report) => console.error(report),
+     });
+
+     expect(evalTest.accuracy()).toBeGreaterThan(0.8);
+   });
+
+   // Validating tool arguments
+   test("search tasks passes correct workspace_gid", async () => {
+     const evalTest = new EvalTest({
+       name: "search-args",
+       test: async (agent) => {
+         const result = await agent.prompt("Search for tasks containing 'bug' in my workspace");
+         const args = result.getToolArguments("asana_search_tasks");
+         return result.hasToolCall("asana_search_tasks") && typeof args?.workspace_gid === "string";
+       },
+     });
+
+     await evalTest.run(agent, {
+       iterations: 5,
+       onFailure: (report) => console.error(report),
+     });
 
- // List and execute tools
- const tools = await manager.getTools(["filesystem"]);
- const result = await manager.executeTool("filesystem", "read_file", {
-   path: "/tmp/example.txt",
+     expect(evalTest.accuracy()).toBeGreaterThan(0.8);
+   });
  });
+ ```
+
+ ---
+
+ ## API Reference
+
+ <details>
+ <summary><strong>MCPClientManager</strong></summary>
+
+ Manages connections to one or more MCP servers.
+
+ ```ts
+ const manager = new MCPClientManager();
 
- // Integrate with Vercel AI SDK
- import { generateText } from "ai";
- import { openai } from "@ai-sdk/openai";
+ // Connect to STDIO server
+ await manager.connectToServer("everything", {
+   command: "npx",
+   args: ["-y", "@modelcontextprotocol/server-everything"],
+ });
 
- const response = await generateText({
-   model: openai("gpt-4o-mini"),
-   tools: manager.getToolsForAiSdk(),
-   messages: [{ role: "user", content: "List files in /tmp" }],
+ // Connect to HTTP/SSE server
+ await manager.connectToServer("asana", {
+   url: "https://mcp.asana.com/sse",
+   requestInit: {
+     headers: { Authorization: "Bearer TOKEN" },
+   },
  });
+
+ // Get tools for AI SDK integration
+ const tools = await manager.getToolsForAiSdk(["everything", "asana"]);
+
+ // Direct MCP operations
+ await manager.listTools("everything");
+ await manager.executeTool("everything", "add", { a: 1, b: 2 });
+ await manager.listResources("everything");
+ await manager.readResource("everything", { uri: "file:///tmp/test.txt" });
+ await manager.listPrompts("everything");
+ await manager.getPrompt("everything", { name: "greeting" });
+ await manager.pingServer("everything");
+
+ // Disconnect
+ await manager.disconnectServer("everything");
  ```
 
- ## Documentation
+ </details>
+
+ <details>
+ <summary><strong>TestAgent</strong></summary>
 
- For detailed documentation on `MCPClientManager` including:
+ Runs LLM prompts with MCP tool access.
 
- - Connection configuration (STDIO, HTTP/SSE)
- - Tool execution and resource management
- - Elicitation handling
- - Agent framework integrations
- - API reference
+ ```ts
+ const agent = new TestAgent({
+   tools: await manager.getToolsForAiSdk(),
+   model: "openai/gpt-4o", // provider/model format
+   apiKey: process.env.OPENAI_API_KEY!,
+   systemPrompt: "You are a helpful assistant.", // optional
+   temperature: 0.7, // optional, omit for reasoning models
+   maxSteps: 10, // optional, max tool call loops
+ });
 
- See the [MCPClientManager README](./mcp-client-manager/README.md).
+ // Run a prompt
+ const result = await agent.prompt("Add 2 and 3");
 
- ## Development
+ // Multi-turn with context
+ const r1 = await agent.prompt("Who am I?");
+ const r2 = await agent.prompt("List my projects", { context: [r1] });
+ ```
 
- ### Building Locally
+ **Supported providers:** `openai`, `anthropic`, `azure`, `google`, `mistral`, `deepseek`, `ollama`, `openrouter`, `xai`
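+
+ Because the `model` string uses the `provider/model` format, switching providers should only require a different model id and API key. A sketch (the Anthropic model id below is a placeholder, not an SDK default):
+
+ ```ts
+ const claudeAgent = new TestAgent({
+   tools: await manager.getToolsForAiSdk(),
+   model: "anthropic/claude-sonnet-4-5", // placeholder id; use whichever model your provider offers
+   apiKey: process.env.ANTHROPIC_API_KEY!,
+ });
+ ```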
 
- Build the entire SDK workspace:
+ </details>
 
- ```bash
- npm run build
+ <details>
+ <summary><strong>PromptResult</strong></summary>
+
+ Returned by `agent.prompt()`. Contains the LLM response and tool calls.
+
+ ```ts
+ const result = await agent.prompt("Add 2 and 3");
+
+ // Tool calls
+ result.hasToolCall("add"); // boolean
+ result.toolsCalled(); // ["add"]
+ result.getToolCalls(); // [{ toolName: "add", arguments: { a: 2, b: 3 } }]
+ result.getToolArguments("add"); // { a: 2, b: 3 }
+
+ // Response
+ result.text; // "The result is 5"
+
+ // Messages (full conversation)
+ result.getMessages(); // CoreMessage[]
+ result.getUserMessages(); // user messages only
+ result.getAssistantMessages(); // assistant messages only
+ result.getToolMessages(); // tool result messages only
+
+ // Latency
+ result.e2eLatencyMs(); // total wall-clock time
+ result.llmLatencyMs(); // LLM API time
+ result.mcpLatencyMs(); // MCP tool execution time
+
+ // Tokens
+ result.totalTokens();
+ result.inputTokens();
+ result.outputTokens();
+
+ // Errors
+ result.hasError();
+ result.getError();
+
+ // Debug trace (JSON dump of messages)
+ result.formatTrace();
  ```
 
- This compiles all sub-packages including `mcp-client-manager` and generates distributable bundles.
+ </details>
 
- ### Development Mode
+ <details>
+ <summary><strong>EvalTest</strong></summary>
 
- Watch for changes and rebuild automatically:
+ Runs a single test scenario with multiple iterations.
 
- ```bash
- npm run dev
+ ```ts
+ const test = new EvalTest({
+   name: "addition",
+   test: async (agent) => {
+     const result = await agent.prompt("Add 2 and 3");
+     return result.hasToolCall("add");
+   },
+ });
+
+ await test.run(agent, {
+   iterations: 30,
+   concurrency: 5, // parallel iterations (default: 5)
+   retries: 2, // retry failed iterations (default: 0)
+   timeoutMs: 30000, // timeout per iteration (default: 30000)
+   onProgress: (completed, total) => console.log(`${completed}/${total}`),
+   onFailure: (report) => console.error(report), // called if any iteration fails
+ });
+
+ // Metrics
+ test.accuracy(); // success rate (0-1)
+ test.averageTokenUse(); // avg tokens per iteration
+
+ // Iteration details
+ test.getAllIterations(); // all iteration results
+ test.getFailedIterations(); // failed iterations only
+ test.getSuccessfulIterations(); // successful iterations only
+ test.getFailureReport(); // formatted string of failed traces
  ```
 
- ## Resources
+ </details>
 
- - **💬 Discord**: [Join the MCPJam Community](https://discord.gg/JEnDtz8X6z)
- - **📖 MCP Protocol**: [Model Context Protocol Documentation](https://modelcontextprotocol.io/)
- - **🔧 GitHub**: [MCPJam Inspector Repository](https://github.com/MCPJam/inspector)
+ <details>
+ <summary><strong>EvalSuite</strong></summary>
 
- ## Contributing
+ Groups multiple `EvalTest` instances for aggregate metrics.
 
- We welcome contributions! The SDK is part of the [MCPJam Inspector monorepo](https://github.com/MCPJam/inspector). Please see our [Contributing Guide](https://docs.mcpjam.com/CONTRIBUTING) for guidelines.
+ ```ts
+ const suite = new EvalSuite({ name: "Math Operations" });
 
- ## License
+ suite.add(new EvalTest({
+   name: "addition",
+   test: async (agent) => {
+     const r = await agent.prompt("Add 2+3");
+     return r.hasToolCall("add");
+   },
+ }));
 
- Apache License 2.0 - see the [LICENSE](../LICENSE) file for details.
+ suite.add(new EvalTest({
+   name: "multiply",
+   test: async (agent) => {
+     const r = await agent.prompt("Multiply 4*5");
+     return r.hasToolCall("multiply");
+   },
+ }));
 
- ---
+ await suite.run(agent, { iterations: 30 });
+
+ // Aggregate metrics
+ suite.accuracy(); // overall accuracy
+ suite.averageTokenUse();
+
+ // Individual test access
+ suite.get("addition")?.accuracy();
+ suite.get("multiply")?.accuracy();
+ suite.getAll(); // all EvalTest instances
+ ```
+
+ </details>
+
+ <details>
+ <summary><strong>Validators</strong></summary>
+
+ Helper functions for matching tool calls.
+
+ ```ts
+ import {
+   matchToolCalls,
+   matchToolCallsSubset,
+   matchAnyToolCall,
+   matchToolCallCount,
+   matchNoToolCalls,
+   matchToolCallWithArgs,
+   matchToolCallWithPartialArgs,
+   matchToolArgument,
+   matchToolArgumentWith,
+ } from "@mcpjam/sdk";
+
+ const tools = result.toolsCalled(); // ["add", "multiply"]
+ const calls = result.getToolCalls(); // ToolCall[]
+
+ // Exact match (order matters)
+ matchToolCalls(["add", "multiply"], tools); // true
+ matchToolCalls(["multiply", "add"], tools); // false
+
+ // Subset match (order doesn't matter)
+ matchToolCallsSubset(["add"], tools); // true
+
+ // Any match (at least one)
+ matchAnyToolCall(["add", "subtract"], tools); // true
+
+ // Count match
+ matchToolCallCount("add", tools, 1); // true
+
+ // No tools called
+ matchNoToolCalls([]); // true
+
+ // Argument matching
+ matchToolCallWithArgs("add", { a: 2, b: 3 }, calls); // exact match
+ matchToolCallWithPartialArgs("add", { a: 2 }, calls); // partial match
+ matchToolArgument("add", "a", 2, calls); // single arg
+ matchToolArgumentWith("add", "a", (v) => v > 0, calls); // predicate
+ ```
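+
+ The validators also compose with `EvalTest`. A sketch built only from the APIs documented above:
+
+ ```ts
+ const evalTest = new EvalTest({
+   name: "add-with-correct-args",
+   test: async (agent) => {
+     const result = await agent.prompt("Add 2 and 3");
+     // Pass only if the add tool was called with a = 2 (other arguments are ignored)
+     return matchToolCallWithPartialArgs("add", { a: 2 }, result.getToolCalls());
+   },
+ });
+ ```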
 
- **Built with ❤️ for the MCP community** • [🌐 MCPJam.com](https://mcpjam.com)
+ </details>