npm - codeep - Versions diffs - 1.3.41 → 2.0.0 - Mend

codeep 1.3.41 → 2.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (59) hide show

package/README.md +208 -0
package/dist/acp/commands.js +770 -7
package/dist/acp/protocol.d.ts +11 -2
package/dist/acp/server.js +179 -11
package/dist/acp/session.d.ts +3 -0
package/dist/acp/session.js +5 -0
package/dist/api/index.js +39 -6
package/dist/config/index.d.ts +13 -0
package/dist/config/index.js +46 -1
package/dist/config/providers.js +76 -1
package/dist/renderer/App.d.ts +12 -0
package/dist/renderer/App.js +96 -4
package/dist/renderer/agentExecution.js +5 -0
package/dist/renderer/commands.js +348 -2
package/dist/renderer/components/Login.d.ts +1 -0
package/dist/renderer/components/Login.js +24 -9
package/dist/renderer/handlers.d.ts +11 -1
package/dist/renderer/handlers.js +30 -0
package/dist/renderer/main.js +73 -0
package/dist/utils/agent.d.ts +17 -0
package/dist/utils/agent.js +91 -7
package/dist/utils/agentChat.d.ts +10 -2
package/dist/utils/agentChat.js +48 -9
package/dist/utils/agentStream.js +6 -2
package/dist/utils/checkpoints.d.ts +93 -0
package/dist/utils/checkpoints.js +205 -0
package/dist/utils/context.d.ts +24 -0
package/dist/utils/context.js +57 -0
package/dist/utils/customCommands.d.ts +62 -0
package/dist/utils/customCommands.js +201 -0
package/dist/utils/hooks.d.ts +97 -0
package/dist/utils/hooks.js +223 -0
package/dist/utils/mcpClient.d.ts +229 -0
package/dist/utils/mcpClient.js +497 -0
package/dist/utils/mcpConfig.d.ts +55 -0
package/dist/utils/mcpConfig.js +177 -0
package/dist/utils/mcpMarketplace.d.ts +49 -0
package/dist/utils/mcpMarketplace.js +175 -0
package/dist/utils/mcpRegistry.d.ts +129 -0
package/dist/utils/mcpRegistry.js +427 -0
package/dist/utils/mcpSamplingBridge.d.ts +32 -0
package/dist/utils/mcpSamplingBridge.js +88 -0
package/dist/utils/mcpStreamableHttp.d.ts +65 -0
package/dist/utils/mcpStreamableHttp.js +207 -0
package/dist/utils/openrouterPrefs.d.ts +36 -0
package/dist/utils/openrouterPrefs.js +83 -0
package/dist/utils/skillBundles.d.ts +84 -0
package/dist/utils/skillBundles.js +257 -0
package/dist/utils/skillBundlesCloud.d.ts +66 -0
package/dist/utils/skillBundlesCloud.js +196 -0
package/dist/utils/tokenTracker.d.ts +14 -2
package/dist/utils/tokenTracker.js +59 -45
package/dist/utils/toolExecution.d.ts +17 -1
package/dist/utils/toolExecution.js +184 -6
package/dist/utils/tools.d.ts +22 -6
package/dist/utils/tools.js +83 -8
package/package.json +3 -2
package/bin/codeep-macos-arm64 +0 -0
package/bin/codeep-macos-x64 +0 -0

package/dist/utils/mcpRegistry.js ADDED Viewed

@@ -0,0 +1,427 @@
+/**
+ * Per-session registry of MCP servers.
+ *
+ * `acp/server.ts handleSessionNew/Load/Resume` receives an optional
+ * `mcpServers: McpServer[]` from the ACP client. We spawn each one via
+ * `McpClient`, list its tools, and surface them under a flat namespace so
+ * the agent can call them like any built-in tool.
+ *
+ * Naming: tools are surfaced as `<serverName>__<toolName>` to avoid
+ * collisions across servers and with built-in agent tools. Underscores are
+ * legal in MCP tool names; `__` is rare enough in practice to serve as a
+ * delimiter without escaping.
+ */
+import { McpClient } from './mcpClient.js';
+const NAMESPACE_DELIM = '__'; // joins server name and tool name in agent-facing tool names
+/**
+ * Virtual-tool suffixes for the resource/prompt wrappers we generate per
+ * server. Keep these in lockstep with the dispatch switch in
+ * toolExecution.ts — adding a new wrapper requires both ends.
+ *
+ * Each value is appended after `<serverName>__` to form the agent-facing
+ * name of a wrapper tool, e.g. `<serverName>__resource_list`.
+ */
+export const VIRTUAL_TOOL_SUFFIXES = {
+    resourceList: 'resource_list',
+    resourceRead: 'resource_read',
+    promptList: 'prompt_list',
+    promptGet: 'prompt_get',
+};
+/**
+ * Map of ACP session id → list of clients started for that session.
+ * An entry holding an empty array means registration ran with no servers,
+ * or every server failed to start.
+ */
+const sessionClients = new Map();
+/**
+ * In-progress registration promises. `callSessionTool` awaits these so a
+ * tool call that lands between session/new and "all servers spawned" waits
+ * for registration to finish instead of erroring with "no servers".
+ *
+ * The stored promises are derived so that they never reject; awaiting one
+ * only signals "registration is over", not whether it succeeded.
+ */
+const registrationInProgress = new Map();
+/**
+ * Per-session spawn errors, kept around so `/mcp` can surface them.
+ * Each entry is a `{ server, error }` pair of strings.
+ */
+const sessionErrors = new Map();
+/**
+ * Per-session catalog dirty flags. The agent loop polls and clears these
+ * between iterations so a `tools/list_changed` notification mid-run causes
+ * a fresh re-list before the next tool dispatch.
+ *
+ * Values are Sets of catalog kinds; a client restart marks 'tools',
+ * 'resources' and 'prompts' all at once.
+ */
+const sessionCatalogDirty = new Map();
+/**
+ * Spawn the given servers and discover their tools. Failures on individual
+ * servers are reported in the result but don't abort the whole registration
+ * (one broken server shouldn't kill the rest).
+ *
+ * Idempotent: calling twice for the same sessionId disposes the prior set
+ * first.
+ */
+export async function registerSessionServers(sessionId, servers, opts = {}) {
+    await disposeSession(sessionId);
+    if (servers.length === 0) {
+        sessionClients.set(sessionId, []);
+        sessionErrors.set(sessionId, []);
+        return { registered: [], errors: [] };
+    }
+    // Build the registration as a Promise so concurrent `callSessionTool`
+    // calls can `awaitSessionReady` instead of seeing an empty registry.
+    const registrationPromise = (async () => {
+        const clients = [];
+        const registered = [];
+        const errors = [];
+        // Start in parallel — server startup tends to dominate session/new
+        // latency, and the work is independent per server.
+        await Promise.all(servers.map(async (cfg) => {
+            const client = new McpClient(cfg, {
+                workspaceRoot: opts.workspaceRoot,
+                onSamplingRequest: opts.onSamplingRequest
+                    ? (params) => opts.onSamplingRequest(params, cfg.name)
+                    : undefined,
+            });
+            // Catalog-changed signals from the server flip a dirty bit the agent
+            // loop reads between iterations. Plus restart already invalidates
+            // tools cache on the client side — we flip the same bit so the agent
+            // re-fetches even though the registry doesn't directly know about
+            // the restart.
+            client.onRestart = () => {
+                const dirty = sessionCatalogDirty.get(sessionId) ?? new Set();
+                dirty.add('tools');
+                dirty.add('resources');
+                dirty.add('prompts');
+                sessionCatalogDirty.set(sessionId, dirty);
+            };
+            client.onCatalogChanged = (kind) => {
+                const dirty = sessionCatalogDirty.get(sessionId) ?? new Set();
+                dirty.add(kind);
+                sessionCatalogDirty.set(sessionId, dirty);
+            };
+            client.onGaveUp = (reason) => {
+                const list = sessionErrors.get(sessionId) ?? [];
+                list.push({ server: cfg.name, error: `gave up auto-restart (${reason})` });
+                sessionErrors.set(sessionId, list);
+            };
+            try {
+                await client.start();
+                const tools = await client.listTools();
+                for (const t of tools) {
+                    registered.push(toRegistered(cfg.name, t));
+                }
+                clients.push(client);
+            }
+            catch (err) {
+                errors.push({ server: cfg.name, error: err.message });
+                await client.stop().catch(() => { });
+            }
+        }));
+        sessionClients.set(sessionId, clients);
+        sessionErrors.set(sessionId, errors);
+        return { registered, errors };
+    })();
+    registrationInProgress.set(sessionId, registrationPromise.then(() => { }, () => { }));
+    try {
+        return await registrationPromise;
+    }
+    finally {
+        registrationInProgress.delete(sessionId);
+    }
+}
+/**
+ * Wait for any in-flight `registerSessionServers` for this session to
+ * finish. No-op once registration has completed. Lets `callSessionTool`
+ * be tolerant of the race between session/new returning and the user
+ * sending their first prompt.
+ */
+export async function awaitSessionReady(sessionId) {
+    const pending = registrationInProgress.get(sessionId);
+    if (pending)
+        await pending;
+}
+/** Return spawn errors recorded for a session, for the /mcp inspector. */
+export function getSessionRegistrationErrors(sessionId) {
+    return sessionErrors.get(sessionId) ?? [];
+}
+/**
+ * Atomically read + clear the catalog-dirty flags for a session.
+ * Called by the agent loop between iterations: if any flag is set,
+ * the relevant cached lists (tools / resources / prompts) should be
+ * re-fetched before the next dispatch. Returns the set of dirty kinds.
+ */
+export function consumeSessionCatalogChanges(sessionId) {
+    const dirty = sessionCatalogDirty.get(sessionId);
+    if (!dirty || dirty.size === 0)
+        return new Set();
+    sessionCatalogDirty.delete(sessionId);
+    // Also blow away client-side tool caches so the next listTools() actually
+    // re-queries the server (the per-client cache is what
+    // `getSessionTools` reads from).
+    if (dirty.has('tools')) {
+        const clients = sessionClients.get(sessionId);
+        if (clients) {
+            for (const c of clients) {
+                // Reach in to clear the cache — purposely loose typing so we don't
+                // export a "clear cache" method that callers might mis-use.
+                c.toolsCache = null;
+            }
+        }
+    }
+    return dirty;
+}
+function toRegistered(serverName, tool) {
+    return {
+        agentName: `${serverName}${NAMESPACE_DELIM}${tool.name}`,
+        toolName: tool.name,
+        serverName,
+        description: tool.description,
+        inputSchema: tool.inputSchema,
+    };
+}
+/** Return all tools registered for a session (built from cached server tool lists). */
+export async function getSessionTools(sessionId) {
+    const clients = sessionClients.get(sessionId);
+    if (!clients?.length)
+        return [];
+    const all = [];
+    for (const client of clients) {
+        try {
+            const tools = await client.listTools();
+            for (const t of tools)
+                all.push(toRegistered(client.server.name, t));
+        }
+        catch {
+            // Skip a flaky server rather than fail the entire list.
+        }
+    }
+    return all;
+}
+/**
+ * Build the set of virtual tools that wrap the resource/prompt primitives
+ * for every server in the session. The agent calls these like normal
+ * `<server>__<tool>` entries; toolExecution.ts dispatches them through
+ * `callSessionResourceTool` below.
+ *
+ * We only emit a wrapper when the server actually exposes resources or
+ * prompts (probed via `listResources`/`listPrompts`) — no point teaching
+ * the model about a `read_resource` tool that always returns "no such
+ * resource".
+ */
+export async function getSessionVirtualTools(sessionId) {
+    const clients = sessionClients.get(sessionId);
+    if (!clients?.length)
+        return [];
+    const out = [];
+    for (const client of clients) {
+        const serverName = client.server.name;
+        // Resources
+        try {
+            const resources = await client.listResources();
+            if (resources.length > 0) {
+                out.push({
+                    agentName: `${serverName}${NAMESPACE_DELIM}${VIRTUAL_TOOL_SUFFIXES.resourceList}`,
+                    toolName: VIRTUAL_TOOL_SUFFIXES.resourceList,
+                    serverName,
+                    description: `List MCP resources exposed by the "${serverName}" server. Returns the URIs you can pass to ${serverName}__${VIRTUAL_TOOL_SUFFIXES.resourceRead}.`,
+                    inputSchema: { type: 'object', properties: {}, additionalProperties: false },
+                });
+                out.push({
+                    agentName: `${serverName}${NAMESPACE_DELIM}${VIRTUAL_TOOL_SUFFIXES.resourceRead}`,
+                    toolName: VIRTUAL_TOOL_SUFFIXES.resourceRead,
+                    serverName,
+                    description: `Read the contents of an MCP resource from the "${serverName}" server by its URI.`,
+                    inputSchema: {
+                        type: 'object',
+                        properties: { uri: { type: 'string', description: 'Resource URI (use resource_list to discover available URIs).' } },
+                        required: ['uri'],
+                    },
+                });
+            }
+        }
+        catch { /* server doesn't support resources — skip */ }
+        // Prompts
+        try {
+            const prompts = await client.listPrompts();
+            if (prompts.length > 0) {
+                out.push({
+                    agentName: `${serverName}${NAMESPACE_DELIM}${VIRTUAL_TOOL_SUFFIXES.promptList}`,
+                    toolName: VIRTUAL_TOOL_SUFFIXES.promptList,
+                    serverName,
+                    description: `List prompt templates exposed by the "${serverName}" MCP server.`,
+                    inputSchema: { type: 'object', properties: {}, additionalProperties: false },
+                });
+                out.push({
+                    agentName: `${serverName}${NAMESPACE_DELIM}${VIRTUAL_TOOL_SUFFIXES.promptGet}`,
+                    toolName: VIRTUAL_TOOL_SUFFIXES.promptGet,
+                    serverName,
+                    description: `Materialise an MCP prompt template from the "${serverName}" server.`,
+                    inputSchema: {
+                        type: 'object',
+                        properties: {
+                            name: { type: 'string', description: 'Prompt name (use prompt_list to discover).' },
+                            arguments: { type: 'object', additionalProperties: true, description: 'Key/value arguments per the prompt template.' },
+                        },
+                        required: ['name'],
+                    },
+                });
+            }
+        }
+        catch { /* server doesn't support prompts — skip */ }
+    }
+    return out;
+}
+/**
+ * Dispatch a virtual MCP tool (resource_list, resource_read, prompt_list,
+ * prompt_get) and return a JSON-serialised string the agent can consume.
+ * Throws if the tool name doesn't match a virtual wrapper.
+ */
+export async function callSessionVirtualTool(sessionId, agentName, args) {
+    const clients = sessionClients.get(sessionId);
+    if (!clients?.length)
+        throw new Error(`No MCP servers registered for session ${sessionId}`);
+    const idx = agentName.indexOf(NAMESPACE_DELIM);
+    if (idx < 0)
+        throw new Error(`"${agentName}" is not a namespaced MCP tool`);
+    const serverName = agentName.slice(0, idx);
+    const suffix = agentName.slice(idx + NAMESPACE_DELIM.length);
+    const client = clients.find(c => c.server.name === serverName);
+    if (!client)
+        throw new Error(`No MCP server named "${serverName}" in this session`);
+    if (suffix === VIRTUAL_TOOL_SUFFIXES.resourceList) {
+        const resources = await client.listResources();
+        return JSON.stringify(resources, null, 2);
+    }
+    if (suffix === VIRTUAL_TOOL_SUFFIXES.resourceRead) {
+        const uri = String(args.uri ?? '');
+        if (!uri)
+            throw new Error('resource_read requires a `uri` argument');
+        const contents = await client.readResource(uri);
+        // Inline text content directly; surface blob with a placeholder so the
+        // model knows there was binary data without us blowing up the context.
+        return contents.map(c => c.text ?? `[binary ${c.mimeType ?? 'blob'}, ${c.blob?.length ?? 0} chars]`).join('\n\n');
+    }
+    if (suffix === VIRTUAL_TOOL_SUFFIXES.promptList) {
+        const prompts = await client.listPrompts();
+        return JSON.stringify(prompts, null, 2);
+    }
+    if (suffix === VIRTUAL_TOOL_SUFFIXES.promptGet) {
+        const name = String(args.name ?? '');
+        if (!name)
+            throw new Error('prompt_get requires a `name` argument');
+        const promptArgs = (args.arguments && typeof args.arguments === 'object') ? args.arguments : {};
+        const result = await client.getPrompt(name, promptArgs);
+        return JSON.stringify(result, null, 2);
+    }
+    throw new Error(`Unknown virtual MCP tool suffix: ${suffix}`);
+}
+/** Return true if a tool name matches one of the four virtual wrappers. */
+export function isVirtualMcpToolName(name) {
+    const idx = name.indexOf(NAMESPACE_DELIM);
+    if (idx < 0)
+        return false;
+    const suffix = name.slice(idx + NAMESPACE_DELIM.length);
+    return Object.values(VIRTUAL_TOOL_SUFFIXES).includes(suffix);
+}
+/** Return resources advertised by all session servers, grouped by server. */
+export async function getSessionResources(sessionId) {
+    const clients = sessionClients.get(sessionId);
+    if (!clients?.length)
+        return [];
+    const out = [];
+    for (const client of clients) {
+        try {
+            const resources = await client.listResources();
+            if (resources.length > 0)
+                out.push({ serverName: client.server.name, resources });
+        }
+        catch {
+            // Per-server failures should not poison the whole list.
+        }
+    }
+    return out;
+}
+/** Read a resource URI from any session server that advertises it. */
+export async function readSessionResource(sessionId, uri) {
+    const clients = sessionClients.get(sessionId);
+    if (!clients?.length)
+        throw new Error(`No MCP servers registered for session ${sessionId}`);
+    // Try each server in registration order; first success wins. Most URI
+    // schemes are server-specific so this rarely needs more than one try.
+    let lastError = null;
+    for (const client of clients) {
+        try {
+            const contents = await client.readResource(uri);
+            if (contents.length > 0)
+                return contents;
+        }
+        catch (err) {
+            lastError = err;
+        }
+    }
+    throw lastError ?? new Error(`No MCP server returned content for ${uri}`);
+}
+/** Return prompts advertised by all session servers, grouped by server. */
+export async function getSessionPrompts(sessionId) {
+    const clients = sessionClients.get(sessionId);
+    if (!clients?.length)
+        return [];
+    const out = [];
+    for (const client of clients) {
+        try {
+            const prompts = await client.listPrompts();
+            if (prompts.length > 0)
+                out.push({ serverName: client.server.name, prompts });
+        }
+        catch {
+            // Skip servers that don't expose prompts.
+        }
+    }
+    return out;
+}
+/** Resolve a `<server>__<name>` prompt reference, returning the materialised messages. */
+export async function getSessionPrompt(sessionId, serverName, name, args = {}) {
+    const clients = sessionClients.get(sessionId);
+    if (!clients?.length)
+        throw new Error(`No MCP servers registered for session ${sessionId}`);
+    const client = clients.find(c => c.server.name === serverName);
+    if (!client)
+        throw new Error(`No MCP server named "${serverName}" in this session`);
+    return client.getPrompt(name, args);
+}
+/** Forward a tool call to the right MCP server. Returns the tool's text output. */
+export async function callSessionTool(sessionId, agentName, args) {
+    // Wait for any pending session registration before checking the registry.
+    // Avoids the "spawn race" where the agent fires a tool call between
+    // session/new returning and the MCP server child processes finishing
+    // their initialize handshake.
+    await awaitSessionReady(sessionId);
+    const clients = sessionClients.get(sessionId);
+    if (!clients?.length)
+        throw new Error(`No MCP servers registered for session ${sessionId}`);
+    const idx = agentName.indexOf(NAMESPACE_DELIM);
+    if (idx < 0)
+        throw new Error(`Tool name "${agentName}" is not in the expected "server__tool" form`);
+    const serverName = agentName.slice(0, idx);
+    const toolName = agentName.slice(idx + NAMESPACE_DELIM.length);
+    const client = clients.find(c => c.server.name === serverName);
+    if (!client)
+        throw new Error(`No MCP server named "${serverName}" in this session`);
+    return client.callTool(toolName, args);
+}
+/** True when an agent tool name looks like an MCP-prefixed tool. */
+export function isMcpToolName(name) {
+    return name.includes(NAMESPACE_DELIM);
+}
+/** Stop all MCP clients for a session and drop the registry entry. */
+export async function disposeSession(sessionId) {
+    sessionErrors.delete(sessionId);
+    sessionCatalogDirty.delete(sessionId);
+    const clients = sessionClients.get(sessionId);
+    if (!clients?.length) {
+        sessionClients.delete(sessionId);
+        return;
+    }
+    await Promise.all(clients.map(c => c.stop().catch(() => { })));
+    sessionClients.delete(sessionId);
+}
+/**
+ * Tear down every active MCP session. Wired up as a SIGINT/SIGTERM handler
+ * in `acp/server.ts` so killing the CLI doesn't leave orphan child processes.
+ */
+export async function disposeAllSessions() {
+    const ids = [...sessionClients.keys()];
+    await Promise.all(ids.map(id => disposeSession(id)));
+}
+/** For tests / debugging — how many sessions have active MCP clients. */
+export function sessionCount() {
+    return sessionClients.size;
+}

package/dist/utils/mcpSamplingBridge.d.ts ADDED Viewed

@@ -0,0 +1,32 @@
+/**
+ * Bridges MCP `sampling/createMessage` server requests to Codeep's host LLM.
+ *
+ * MCP servers that opt into the `sampling` capability send the host
+ * (Codeep) a request to generate a completion on their behalf — usually
+ * because they want LLM reasoning without their own provider keys. Per
+ * spec, the host is free to refuse, swap models, or strip context; we
+ * forward the messages to the active provider via `chat()` and return
+ * just the assistant text.
+ *
+ * Notes on the bridge surface:
+ *   - We strip image content (provider matrix varies; safer to skip than
+ *     surprise the model). A future iteration can route images through
+ *     the vision integration in mcpIntegration.ts.
+ *   - `params.modelPreferences.hints[].name` is meant to act as an
+ *     *advisory* model override — only if the user has the provider for
+ *     it configured. The implementation does not read it yet, so every
+ *     request currently stays on the active model.
+ *   - `temperature`, `maxTokens`, `stopSequences` are honoured only where
+ *     the underlying chat() path supports them (today: none — chat() uses
+ *     the agent's configured temperature/maxTokens), so they are
+ *     currently not forwarded; pass them through if/when chat() grows
+ *     those knobs.
+ *
+ * Cost guard: every sampling request bills the user's active provider, so
+ * a misbehaving server can drain credits. We enforce a per-server rate
+ * limit (≥1 s spacing) and a per-server request cap that lasts until the
+ * counters are reset, and surface every accepted request on stderr so the
+ * user can see what's happening.
+ *
+ * Exported surface:
+ *   - `resetSamplingBudget()` clears the per-server counters and timestamps.
+ *   - `handleMcpSamplingRequest(params, serverName?)` resolves with the
+ *     assistant's text reply and rejects when the cap or the rate limit
+ *     refuses the request.
+ */
+import type { SamplingCreateMessageParams, SamplingCreateMessageResult } from './mcpClient.js';
+/** Reset the per-server counters. Called on session boundaries. */
+export declare function resetSamplingBudget(): void;
+export declare function handleMcpSamplingRequest(params: SamplingCreateMessageParams, serverName?: string): Promise<SamplingCreateMessageResult>;

package/dist/utils/mcpSamplingBridge.js ADDED Viewed

@@ -0,0 +1,88 @@
+/**
+ * Bridges MCP `sampling/createMessage` server requests to Codeep's host LLM.
+ *
+ * MCP servers that opt into the `sampling` capability send the host
+ * (Codeep) a request to generate a completion on their behalf — usually
+ * because they want LLM reasoning without their own provider keys. Per
+ * spec, the host is free to refuse, swap models, or strip context; we
+ * forward the messages to the active provider via `chat()` and return
+ * just the assistant text.
+ *
+ * Notes on the bridge surface:
+ *   - We strip image content (provider matrix varies; safer to skip than
+ *     surprise the model). A future iteration can route images through
+ *     the vision integration in mcpIntegration.ts.
+ *   - `params.modelPreferences.hints[].name` is meant to act as an
+ *     *advisory* model override — only if the user has the provider for
+ *     it configured. This module does not read it yet, so every request
+ *     currently stays on the active model.
+ *   - `temperature`, `maxTokens`, `stopSequences` are honoured only where
+ *     the underlying chat() path supports them (today: none — chat() uses
+ *     the agent's configured temperature/maxTokens), so they are
+ *     currently not forwarded; pass them through if/when chat() grows
+ *     those knobs.
+ *
+ * Cost guard: every sampling request bills the user's active provider, so
+ * a misbehaving server can drain credits. We enforce a per-server rate
+ * limit (≥1 s spacing) and a per-server request cap that lasts until the
+ * counters are reset, and surface every accepted request on stderr so the
+ * user can see what's happening.
+ */
+const MIN_INTERVAL_MS = 1000; // minimum spacing between two accepted requests from the same server
+const MAX_PER_SERVER = 100; // accepted requests allowed per server until the counters are reset
+const lastRequestAt = new Map(); // server name → Date.now() of its last accepted request
+const requestCount = new Map(); // server name → number of accepted requests so far
+/** Reset the per-server counters. Called on session boundaries. */
+export function resetSamplingBudget() {
+    lastRequestAt.clear();
+    requestCount.clear();
+}
+export async function handleMcpSamplingRequest(params, serverName = 'unknown') {
+    const now = Date.now();
+    const count = (requestCount.get(serverName) ?? 0) + 1;
+    if (count > MAX_PER_SERVER) {
+        process.stderr.write(`[codeep] mcp:${serverName} sampling refused — exceeded ${MAX_PER_SERVER}/process cap; restart codeep to reset\n`);
+        throw new Error(`sampling budget exceeded for "${serverName}" (${MAX_PER_SERVER}/process)`);
+    }
+    const last = lastRequestAt.get(serverName) ?? 0;
+    if (now - last < MIN_INTERVAL_MS) {
+        process.stderr.write(`[codeep] mcp:${serverName} sampling refused — exceeds 1/sec rate limit\n`);
+        throw new Error(`sampling rate limit for "${serverName}" (max 1/sec)`);
+    }
+    lastRequestAt.set(serverName, now);
+    requestCount.set(serverName, count);
+    process.stderr.write(`[codeep] mcp:${serverName} sampling/createMessage (${count}/${MAX_PER_SERVER} this session)\n`);
+    // Collapse text-content messages into a normalised Message[] for chat().
+    // Images dropped per the surface note above.
+    const history = [];
+    let lastUserText = '';
+    for (const m of params.messages) {
+        if (m.content.type !== 'text')
+            continue;
+        if (m.role === 'assistant') {
+            history.push({ role: 'assistant', content: m.content.text });
+        }
+        else {
+            history.push({ role: 'user', content: m.content.text });
+            lastUserText = m.content.text;
+        }
+    }
+    // chat() takes (message, history, ...) — last user turn becomes the
+    // "message" arg and the rest becomes the prior history.
+    const message = lastUserText || (history[history.length - 1]?.content ?? '');
+    const prior = history.slice(0, -1);
+    // System prompt: server-provided overrides our agent default for this
+    // single call. We don't wire it through chat() (no parameter slot), so
+    // we prepend a synthetic system turn to history. chat() collapses
+    // duplicate system messages, so this is safe.
+    if (params.systemPrompt) {
+        prior.unshift({ role: 'system', content: params.systemPrompt });
+    }
+    const { chat } = await import('../api/index.js');
+    const { config } = await import('../config/index.js');
+    const text = await chat(message, prior);
+    return {
+        role: 'assistant',
+        content: { type: 'text', text },
+        model: config.get('model'),
+        stopReason: 'endTurn',
+    };
+}

package/dist/utils/mcpStreamableHttp.d.ts ADDED Viewed

@@ -0,0 +1,65 @@
+/**
+ * MCP Streamable HTTP transport — the spec successor to the original
+ * HTTP+SSE transport, used by cloud-hosted MCP servers (Anthropic remote
+ * servers, internal HTTP wrappers, etc.).
+ *
+ * Per the 2025-03 spec, a single URL endpoint accepts both:
+ *   - POST { jsonrpc, id, method, params } → JSON response, or
+ *     text/event-stream of one-or-more JSON-RPC frames.
+ *   - GET                                  → text/event-stream channel
+ *     for server-initiated notifications and requests (sampling, etc.).
+ *
+ * This client opens the GET stream lazily on the first message the server
+ * tells us to expect — many simple HTTP servers never send anything
+ * unsolicited, so we don't burn a TCP connection waiting.
+ *
+ * Session continuity uses the `mcp-session-id` header. The server sets it
+ * on the initialize response; we echo it on every subsequent request.
+ */
+export interface StreamableHttpOptions {
+    /** Endpoint URL of the MCP server. */
+    url: string;
+    /**
+     * Optional headers (Authorization, custom auth, etc.).
+     * NOTE(review): presumably attached to every request — confirm in the
+     * implementation.
+     */
+    headers?: Record<string, string>;
+    /**
+     * Called for every JSON-RPC frame the server sends, from either channel.
+     * The frame is typed `unknown`, so the callback has to narrow it before
+     * reading any field.
+     */
+    onFrame: (msg: unknown) => void;
+    /**
+     * Called when the server's notification stream errors or closes
+     * unexpectedly. Optional.
+     */
+    onError?: (err: Error) => void;
+}
+export declare class StreamableHttpClient {
+    private readonly opts;
+    private sessionId;
+    private notificationAbort;
+    private stopped;
+    /** True after the server has set a session id (i.e. it tracks state). */
+    private get hasServerSession();
+    constructor(opts: StreamableHttpOptions);
+    /**
+     * Issue a JSON-RPC frame as POST. Reply may be a single JSON response
+     * (synchronous tools/call), or an SSE stream of one-or-more responses
+     * + notifications. The transport invokes `onFrame` for every message
+     * it sees on the response, regardless of shape.
+     *
+     * @param frame JSON-RPC frame to send.
+     * @returns A promise with no value; replies are delivered through
+     *          `onFrame`, not through the return value.
+     */
+    send(frame: object): Promise<void>;
+    /**
+     * Open the server-push SSE channel. Idempotent — won't open twice if
+     * already streaming. Errors are surfaced via `onError`, not thrown, so
+     * a transient network blip doesn't crash the agent loop.
+     */
+    private openNotificationStream;
+    /**
+     * Parse a `text/event-stream` body, invoking `onFrame` for each JSON
+     * payload. SSE framing is intentionally permissive — we treat any line
+     * starting with `data:` as one event's payload and join multi-line
+     * data: blocks until a blank line.
+     *
+     * Bounded by `MAX_SSE_BYTES`: a misbehaving or malicious remote server
+     * can push unbounded data on an SSE channel — without a cap, the
+     * accumulating buffer would OOM the agent. We track cumulative bytes
+     * read and bail with `onError` past the cap.
+     */
+    private consumeSseBody;
+    private dispatchSseEvent;
+    /**
+     * Tear down the notification stream and refuse further sends.
+     * NOTE(review): whether a later `send()` rejects or silently returns is
+     * not visible from this declaration — confirm in the implementation.
+     */
+    stop(): Promise<void>;
+}