sunpeak 0.19.10 → 0.20.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +3 -3
- package/bin/commands/inspect.mjs +321 -6
- package/bin/commands/new.mjs +85 -7
- package/bin/commands/test-init.mjs +190 -59
- package/bin/commands/test.mjs +60 -10
- package/bin/lib/eval/eval-providers.mjs +34 -0
- package/bin/lib/eval/eval-runner.mjs +54 -2
- package/bin/lib/eval/eval-vitest-plugin.mjs +3 -14
- package/bin/lib/eval/model-registry.mjs +2 -2
- package/bin/lib/inspect/inspect-config.mjs +16 -1
- package/bin/lib/inspect/inspect-server.d.mts +32 -0
- package/bin/lib/inspect/inspect-server.mjs +11 -0
- package/bin/lib/resolve-bin.mjs +39 -0
- package/bin/lib/test/base-config.mjs +3 -2
- package/bin/lib/test/matchers.mjs +2 -2
- package/bin/lib/test/test-config.mjs +18 -7
- package/bin/lib/test/test-fixtures.d.mts +52 -92
- package/bin/lib/test/test-fixtures.mjs +174 -147
- package/dist/chatgpt/index.cjs +1 -1
- package/dist/chatgpt/index.js +1 -1
- package/dist/claude/index.cjs +1 -1
- package/dist/claude/index.js +1 -1
- package/dist/host/chatgpt/index.cjs +1 -1
- package/dist/host/chatgpt/index.js +1 -1
- package/dist/index.cjs +4 -4
- package/dist/index.cjs.map +1 -1
- package/dist/index.js +3 -3
- package/dist/index.js.map +1 -1
- package/dist/inspector/index.cjs +1 -1
- package/dist/inspector/index.js +1 -1
- package/dist/{inspector-D5DckQuU.js → inspector-BBDa5yCm.js} +57 -23
- package/dist/inspector-BBDa5yCm.js.map +1 -0
- package/dist/{inspector-jY9O18z9.cjs → inspector-DAA1Wiyh.cjs} +58 -24
- package/dist/inspector-DAA1Wiyh.cjs.map +1 -0
- package/dist/lib/discovery-cli.cjs +1 -1
- package/dist/mcp/index.cjs +22 -25
- package/dist/mcp/index.cjs.map +1 -1
- package/dist/mcp/index.js +19 -22
- package/dist/mcp/index.js.map +1 -1
- package/dist/{use-app-Bfargfa3.js → use-app-Cr0auUa1.js} +2 -2
- package/dist/{use-app-Bfargfa3.js.map → use-app-Cr0auUa1.js.map} +1 -1
- package/dist/{use-app-CbsBEmwv.cjs → use-app-DPkj5Jp_.cjs} +2 -2
- package/dist/{use-app-CbsBEmwv.cjs.map → use-app-DPkj5Jp_.cjs.map} +1 -1
- package/package.json +27 -15
- package/template/README.md +1 -1
- package/template/dist/albums/albums.html +4 -4
- package/template/dist/albums/albums.json +1 -1
- package/template/dist/carousel/carousel.html +4 -4
- package/template/dist/carousel/carousel.json +1 -1
- package/template/dist/map/map.html +6 -6
- package/template/dist/map/map.json +1 -1
- package/template/dist/review/review.html +4 -4
- package/template/dist/review/review.json +1 -1
- package/template/node_modules/.bin/vite +2 -2
- package/template/node_modules/.bin/vitest +2 -2
- package/template/node_modules/.vite/deps/_metadata.json +4 -4
- package/template/node_modules/.vite-mcp/deps/@modelcontextprotocol_ext-apps.js +1 -1
- package/template/node_modules/.vite-mcp/deps/@modelcontextprotocol_ext-apps.js.map +1 -1
- package/template/node_modules/.vite-mcp/deps/@modelcontextprotocol_ext-apps_app-bridge.js +1 -1
- package/template/node_modules/.vite-mcp/deps/@modelcontextprotocol_ext-apps_app-bridge.js.map +1 -1
- package/template/node_modules/.vite-mcp/deps/@modelcontextprotocol_ext-apps_react.js +1 -1
- package/template/node_modules/.vite-mcp/deps/@modelcontextprotocol_ext-apps_react.js.map +1 -1
- package/template/node_modules/.vite-mcp/deps/@testing-library_react.js +4 -4
- package/template/node_modules/.vite-mcp/deps/@testing-library_react.js.map +1 -1
- package/template/node_modules/.vite-mcp/deps/_metadata.json +33 -33
- package/template/node_modules/.vite-mcp/deps/{client-CU1wWud4.js → client-B_5CX--u.js} +7 -7
- package/template/node_modules/.vite-mcp/deps/{client-CU1wWud4.js.map → client-B_5CX--u.js.map} +1 -1
- package/template/node_modules/.vite-mcp/deps/embla-carousel-react.js +1 -1
- package/template/node_modules/.vite-mcp/deps/embla-carousel-react.js.map +1 -1
- package/template/node_modules/.vite-mcp/deps/react-dom.js +3 -3
- package/template/node_modules/.vite-mcp/deps/react-dom.js.map +1 -1
- package/template/node_modules/.vite-mcp/deps/react-dom_client.js +1 -1
- package/template/node_modules/.vite-mcp/deps/react.js +3 -3
- package/template/node_modules/.vite-mcp/deps/react.js.map +1 -1
- package/template/node_modules/.vite-mcp/deps/react_jsx-dev-runtime.js +2 -2
- package/template/node_modules/.vite-mcp/deps/react_jsx-dev-runtime.js.map +1 -1
- package/template/node_modules/.vite-mcp/deps/react_jsx-runtime.js +2 -2
- package/template/node_modules/.vite-mcp/deps/react_jsx-runtime.js.map +1 -1
- package/template/node_modules/.vite-mcp/deps/vitest.js +1024 -622
- package/template/node_modules/.vite-mcp/deps/vitest.js.map +1 -1
- package/template/package.json +6 -6
- package/template/tests/e2e/albums.spec.ts +24 -52
- package/template/tests/e2e/carousel.spec.ts +36 -58
- package/template/tests/e2e/map.spec.ts +35 -56
- package/template/tests/e2e/review.spec.ts +56 -85
- package/template/tests/e2e/visual.spec.ts +14 -12
- package/template/tests/evals/albums.eval.ts +12 -9
- package/template/tests/evals/carousel.eval.ts +4 -14
- package/template/tests/evals/eval.config.ts +6 -6
- package/template/tests/evals/map.eval.ts +2 -9
- package/template/tests/evals/review.eval.ts +27 -22
- package/dist/inspector-D5DckQuU.js.map +0 -1
- package/dist/inspector-jY9O18z9.cjs.map +0 -1
- /package/template/tests/evals/{.env.example → _env.example} +0 -0
package/README.md
CHANGED
|
@@ -53,8 +53,8 @@ Automatically test any MCP server against replicated ChatGPT and Claude runtimes
|
|
|
53
53
|
```ts
|
|
54
54
|
import { test, expect } from 'sunpeak/test';
|
|
55
55
|
|
|
56
|
-
test('review tool renders title', async ({
|
|
57
|
-
const result = await
|
|
56
|
+
test('review tool renders title', async ({ inspector }) => {
|
|
57
|
+
const result = await inspector.renderTool('review-diff');
|
|
58
58
|
const app = result.app();
|
|
59
59
|
await expect(app.locator('h1:has-text("Refactor")')).toBeVisible();
|
|
60
60
|
});
|
|
@@ -132,7 +132,7 @@ sunpeak new
|
|
|
132
132
|
Install the sunpeak skills to give your coding agent (Claude Code, Cursor, etc.) built-in knowledge of sunpeak patterns, hooks, and testing:
|
|
133
133
|
|
|
134
134
|
```bash
|
|
135
|
-
|
|
135
|
+
pnpm dlx skills add Sunpeak-AI/sunpeak@create-sunpeak-app Sunpeak-AI/sunpeak@test-mcp-server
|
|
136
136
|
```
|
|
137
137
|
|
|
138
138
|
## Troubleshooting
|
package/bin/commands/inspect.mjs
CHANGED
|
@@ -18,6 +18,7 @@ import * as path from 'path';
|
|
|
18
18
|
const { existsSync, readdirSync, readFileSync } = fs;
|
|
19
19
|
const { join, resolve, dirname } = path;
|
|
20
20
|
import { fileURLToPath, pathToFileURL } from 'url';
|
|
21
|
+
import { createServer as createHttpServer } from 'http';
|
|
21
22
|
import { getPort } from '../lib/get-port.mjs';
|
|
22
23
|
import { startSandboxServer } from '../lib/sandbox-server.mjs';
|
|
23
24
|
import { getDevOverlayScript } from '../lib/dev-overlay.mjs';
|
|
@@ -35,6 +36,8 @@ function parseArgs(args) {
|
|
|
35
36
|
simulations: undefined,
|
|
36
37
|
port: undefined,
|
|
37
38
|
name: undefined,
|
|
39
|
+
env: undefined,
|
|
40
|
+
cwd: undefined,
|
|
38
41
|
};
|
|
39
42
|
|
|
40
43
|
for (let i = 0; i < args.length; i++) {
|
|
@@ -47,6 +50,16 @@ function parseArgs(args) {
|
|
|
47
50
|
opts.port = Number(args[++i]);
|
|
48
51
|
} else if (arg === '--name' && i + 1 < args.length) {
|
|
49
52
|
opts.name = args[++i];
|
|
53
|
+
} else if (arg === '--env' && i + 1 < args.length) {
|
|
54
|
+
// Repeatable: --env KEY=VALUE --env KEY2=VALUE2
|
|
55
|
+
const pair = args[++i];
|
|
56
|
+
const eqIdx = pair.indexOf('=');
|
|
57
|
+
if (eqIdx > 0) {
|
|
58
|
+
opts.env = opts.env || {};
|
|
59
|
+
opts.env[pair.slice(0, eqIdx)] = pair.slice(eqIdx + 1);
|
|
60
|
+
}
|
|
61
|
+
} else if (arg === '--cwd' && i + 1 < args.length) {
|
|
62
|
+
opts.cwd = args[++i];
|
|
50
63
|
} else if (arg === '--help' || arg === '-h') {
|
|
51
64
|
printHelp();
|
|
52
65
|
process.exit(0);
|
|
@@ -68,11 +81,14 @@ Options:
|
|
|
68
81
|
--simulations <dir> Simulation JSON directory (opt-in, no default)
|
|
69
82
|
--port, -p <number> Dev server port (default: 3000)
|
|
70
83
|
--name <string> App name in inspector chrome
|
|
84
|
+
--env <KEY=VALUE> Environment variable for stdio servers (repeatable)
|
|
85
|
+
--cwd <path> Working directory for stdio servers
|
|
71
86
|
--help, -h Show this help
|
|
72
87
|
|
|
73
88
|
Examples:
|
|
74
89
|
sunpeak inspect --server http://localhost:8000/mcp
|
|
75
90
|
sunpeak inspect --server "python my_server.py"
|
|
91
|
+
sunpeak inspect --server "python server.py" --env API_KEY=sk-123 --cwd ./backend
|
|
76
92
|
sunpeak inspect --server http://localhost:8000/mcp --simulations tests/simulations
|
|
77
93
|
`);
|
|
78
94
|
}
|
|
@@ -160,11 +176,219 @@ function createInMemoryOAuthProvider(redirectUrl, opts = {}) {
|
|
|
160
176
|
};
|
|
161
177
|
}
|
|
162
178
|
|
|
179
|
+
/**
|
|
180
|
+
* Negotiate OAuth with an MCP server and return an authenticated provider.
|
|
181
|
+
*
|
|
182
|
+
* Handles two cases:
|
|
183
|
+
* 1. Anonymous/auto-approved OAuth: the authorization endpoint redirects
|
|
184
|
+
* immediately back with a code (no user interaction needed).
|
|
185
|
+
* 2. Interactive OAuth: opens the authorization URL in the user's browser
|
|
186
|
+
* and waits for the callback.
|
|
187
|
+
*
|
|
188
|
+
* @param {string} serverUrl - The MCP server URL
|
|
189
|
+
* @returns {Promise<import('@modelcontextprotocol/sdk/client/auth.js').OAuthClientProvider>}
|
|
190
|
+
*/
|
|
191
|
+
async function negotiateOAuth(serverUrl) {
|
|
192
|
+
const { auth } = await import('@modelcontextprotocol/sdk/client/auth.js');
|
|
193
|
+
|
|
194
|
+
// Start a temporary callback server for receiving the OAuth code.
|
|
195
|
+
const callbackPort = await getPort(24681);
|
|
196
|
+
const callbackUrl = `http://localhost:${callbackPort}/oauth/callback`;
|
|
197
|
+
|
|
198
|
+
const oauthState = createInMemoryOAuthProvider(callbackUrl);
|
|
199
|
+
const { provider } = oauthState;
|
|
200
|
+
|
|
201
|
+
// First call to auth() — discovers metadata, registers client, and either
|
|
202
|
+
// returns AUTHORIZED (client_credentials) or REDIRECT (authorization_code).
|
|
203
|
+
const result = await auth(provider, { serverUrl: new URL(serverUrl) });
|
|
204
|
+
|
|
205
|
+
if (result === 'AUTHORIZED') {
|
|
206
|
+
return provider;
|
|
207
|
+
}
|
|
208
|
+
|
|
209
|
+
// result === 'REDIRECT': we need to follow the authorization URL.
|
|
210
|
+
const authUrl = oauthState.getAuthUrl();
|
|
211
|
+
if (!authUrl) {
|
|
212
|
+
throw new Error('OAuth flow returned REDIRECT but no authorization URL was captured');
|
|
213
|
+
}
|
|
214
|
+
|
|
215
|
+
// Try the anonymous/auto-approved path first: follow the authorization URL
|
|
216
|
+
// without a browser and see if it immediately redirects with a code.
|
|
217
|
+
const code = await tryAnonymousOAuth(authUrl.toString(), callbackUrl);
|
|
218
|
+
if (code) {
|
|
219
|
+
// Complete the flow with the authorization code.
|
|
220
|
+
const tokenResult = await auth(provider, {
|
|
221
|
+
serverUrl: new URL(serverUrl),
|
|
222
|
+
authorizationCode: code,
|
|
223
|
+
});
|
|
224
|
+
if (tokenResult === 'AUTHORIZED') {
|
|
225
|
+
return provider;
|
|
226
|
+
}
|
|
227
|
+
throw new Error('OAuth token exchange failed after anonymous authorization');
|
|
228
|
+
}
|
|
229
|
+
|
|
230
|
+
// Anonymous path didn't work — this server requires interactive login.
|
|
231
|
+
// Start a callback server and open the auth URL in the user's browser.
|
|
232
|
+
const interactiveCode = await waitForInteractiveOAuth(
|
|
233
|
+
authUrl.toString(),
|
|
234
|
+
callbackUrl,
|
|
235
|
+
callbackPort
|
|
236
|
+
);
|
|
237
|
+
|
|
238
|
+
const tokenResult = await auth(provider, {
|
|
239
|
+
serverUrl: new URL(serverUrl),
|
|
240
|
+
authorizationCode: interactiveCode,
|
|
241
|
+
});
|
|
242
|
+
if (tokenResult === 'AUTHORIZED') {
|
|
243
|
+
return provider;
|
|
244
|
+
}
|
|
245
|
+
throw new Error('OAuth token exchange failed after interactive authorization');
|
|
246
|
+
}
|
|
247
|
+
|
|
248
|
+
/**
|
|
249
|
+
* Try to complete OAuth without user interaction by following redirects.
|
|
250
|
+
* Returns the authorization code if the server auto-approves, or null if
|
|
251
|
+
* the server requires interactive login (returns an HTML page).
|
|
252
|
+
*
|
|
253
|
+
* @param {string} authUrl - The authorization URL
|
|
254
|
+
* @param {string} callbackUrl - The expected callback URL prefix
|
|
255
|
+
* @returns {Promise<string | null>}
|
|
256
|
+
*/
|
|
257
|
+
async function tryAnonymousOAuth(authUrl, callbackUrl) {
|
|
258
|
+
// Follow redirects manually to detect when the server redirects back
|
|
259
|
+
// to our callback URL with a code parameter.
|
|
260
|
+
let url = authUrl;
|
|
261
|
+
const maxRedirects = 10;
|
|
262
|
+
for (let i = 0; i < maxRedirects; i++) {
|
|
263
|
+
const response = await fetch(url, { redirect: 'manual' });
|
|
264
|
+
const location = response.headers.get('location');
|
|
265
|
+
|
|
266
|
+
if (!location) {
|
|
267
|
+
// No redirect — server returned a page (login form). Not auto-approved.
|
|
268
|
+
// Drain the response body to free the socket.
|
|
269
|
+
await response.text().catch(() => {});
|
|
270
|
+
return null;
|
|
271
|
+
}
|
|
272
|
+
|
|
273
|
+
// Resolve relative redirects.
|
|
274
|
+
const resolved = new URL(location, url).toString();
|
|
275
|
+
|
|
276
|
+
// Check if the redirect goes to our callback URL.
|
|
277
|
+
if (resolved.startsWith(callbackUrl)) {
|
|
278
|
+
const params = new URL(resolved).searchParams;
|
|
279
|
+
const code = params.get('code');
|
|
280
|
+
if (code) return code;
|
|
281
|
+
const error = params.get('error');
|
|
282
|
+
if (error) {
|
|
283
|
+
throw new Error(`OAuth authorization failed: ${error} — ${params.get('error_description') || ''}`);
|
|
284
|
+
}
|
|
285
|
+
return null;
|
|
286
|
+
}
|
|
287
|
+
|
|
288
|
+
url = resolved;
|
|
289
|
+
}
|
|
290
|
+
|
|
291
|
+
return null;
|
|
292
|
+
}
|
|
293
|
+
|
|
294
|
+
/**
|
|
295
|
+
* Wait for the user to complete an interactive OAuth flow in their browser.
|
|
296
|
+
* Starts a temporary HTTP server to receive the callback, opens the auth URL,
|
|
297
|
+
* and resolves with the authorization code.
|
|
298
|
+
*
|
|
299
|
+
* @param {string} authUrl - The authorization URL to open in the browser
|
|
300
|
+
* @param {string} callbackUrl - Our callback URL
|
|
301
|
+
* @param {number} callbackPort - Port for the callback server
|
|
302
|
+
* @returns {Promise<string>}
|
|
303
|
+
*/
|
|
304
|
+
async function waitForInteractiveOAuth(authUrl, callbackUrl, callbackPort) {
|
|
305
|
+
return new Promise((resolve, reject) => {
|
|
306
|
+
let settled = false;
|
|
307
|
+
const settle = (fn, value) => {
|
|
308
|
+
if (settled) return;
|
|
309
|
+
settled = true;
|
|
310
|
+
clearTimeout(timer);
|
|
311
|
+
server.close();
|
|
312
|
+
fn(value);
|
|
313
|
+
};
|
|
314
|
+
|
|
315
|
+
const server = createHttpServer((req, res) => {
|
|
316
|
+
const reqUrl = new URL(req.url, callbackUrl);
|
|
317
|
+
if (!reqUrl.pathname.startsWith('/oauth/callback')) {
|
|
318
|
+
res.writeHead(404);
|
|
319
|
+
res.end('Not found');
|
|
320
|
+
return;
|
|
321
|
+
}
|
|
322
|
+
|
|
323
|
+
const code = reqUrl.searchParams.get('code');
|
|
324
|
+
const error = reqUrl.searchParams.get('error');
|
|
325
|
+
|
|
326
|
+
// Serve a simple page that tells the user they can close the tab.
|
|
327
|
+
const escHtml = (s) => s.replace(/[<>&"']/g, (c) =>
|
|
328
|
+
({ '<': '<', '>': '>', '&': '&', '"': '"', "'": ''' })[c]
|
|
329
|
+
);
|
|
330
|
+
const message = code
|
|
331
|
+
? 'Authorization complete. You can close this tab.'
|
|
332
|
+
: `Authorization failed: ${escHtml(error || 'unknown error')}`;
|
|
333
|
+
res.writeHead(200, { 'Content-Type': 'text/html' });
|
|
334
|
+
res.end(`<!DOCTYPE html><html><body><p>${message}</p></body></html>`);
|
|
335
|
+
|
|
336
|
+
if (code) {
|
|
337
|
+
settle(resolve, code);
|
|
338
|
+
} else {
|
|
339
|
+
settle(reject, new Error(`OAuth authorization failed: ${error || 'unknown error'}`));
|
|
340
|
+
}
|
|
341
|
+
});
|
|
342
|
+
|
|
343
|
+
server.on('error', (err) => {
|
|
344
|
+
settle(reject, new Error(`OAuth callback server failed: ${err.message}`));
|
|
345
|
+
});
|
|
346
|
+
|
|
347
|
+
server.listen(callbackPort, async () => {
|
|
348
|
+
console.log('Opening browser for OAuth authorization...');
|
|
349
|
+
// Use execFile with array args to avoid shell injection from the auth URL.
|
|
350
|
+
const { execFile } = await import('child_process');
|
|
351
|
+
const cmd = process.platform === 'darwin' ? 'open' :
|
|
352
|
+
process.platform === 'win32' ? 'start' : 'xdg-open';
|
|
353
|
+
execFile(cmd, [authUrl], (err) => {
|
|
354
|
+
if (err) console.error(`Failed to open browser: ${err.message}`);
|
|
355
|
+
});
|
|
356
|
+
});
|
|
357
|
+
|
|
358
|
+
// Timeout after 2 minutes.
|
|
359
|
+
const timer = setTimeout(() => {
|
|
360
|
+
settle(reject, new Error('OAuth authorization timed out (2 minutes)'));
|
|
361
|
+
}, 120_000);
|
|
362
|
+
});
|
|
363
|
+
}
|
|
364
|
+
|
|
365
|
+
/**
|
|
366
|
+
* Detect if an error from createMcpConnection is an auth error (401/Unauthorized).
|
|
367
|
+
* @param {Error} err
|
|
368
|
+
* @returns {boolean}
|
|
369
|
+
*/
|
|
370
|
+
function isAuthError(err) {
|
|
371
|
+
// The MCP SDK throws UnauthorizedError for auth failures.
|
|
372
|
+
if (err.constructor?.name === 'UnauthorizedError') return true;
|
|
373
|
+
|
|
374
|
+
// StreamableHTTPError includes a status code in its message.
|
|
375
|
+
// Check for the specific "401" HTTP status pattern, not substring matches.
|
|
376
|
+
const msg = err.message || '';
|
|
377
|
+
if (msg.includes('invalid_token')) return true;
|
|
378
|
+
|
|
379
|
+
// Connection errors (ECONNREFUSED, ETIMEDOUT, etc.) are never auth errors.
|
|
380
|
+
if (msg.includes('ECONNREFUSED') || msg.includes('ETIMEDOUT') || msg.includes('ENOTFOUND')) {
|
|
381
|
+
return false;
|
|
382
|
+
}
|
|
383
|
+
|
|
384
|
+
return false;
|
|
385
|
+
}
|
|
386
|
+
|
|
163
387
|
/**
|
|
164
388
|
* Create an MCP client connection.
|
|
165
389
|
* @param {string} serverArg - URL or command string
|
|
166
|
-
* @param {{ type?: 'none' | 'bearer' | 'oauth', bearerToken?: string, authProvider?: import('@modelcontextprotocol/sdk/client/auth.js').OAuthClientProvider }} [authConfig]
|
|
167
|
-
* @returns {Promise<{ client: import('@modelcontextprotocol/sdk/client/index.js').Client, transport: import('@modelcontextprotocol/sdk/types.js').Transport }>}
|
|
390
|
+
* @param {{ type?: 'none' | 'bearer' | 'oauth', bearerToken?: string, authProvider?: import('@modelcontextprotocol/sdk/client/auth.js').OAuthClientProvider, env?: Record<string, string>, cwd?: string }} [authConfig]
|
|
391
|
+
* @returns {Promise<{ client: import('@modelcontextprotocol/sdk/client/index.js').Client, transport: import('@modelcontextprotocol/sdk/types.js').Transport, stderrOutput?: string[] }>}
|
|
168
392
|
*/
|
|
169
393
|
async function createMcpConnection(serverArg, authConfig) {
|
|
170
394
|
const { Client } = await import('@modelcontextprotocol/sdk/client/index.js');
|
|
@@ -197,9 +421,47 @@ async function createMcpConnection(serverArg, authConfig) {
|
|
|
197
421
|
const { StdioClientTransport } = await import(
|
|
198
422
|
'@modelcontextprotocol/sdk/client/stdio.js'
|
|
199
423
|
);
|
|
200
|
-
|
|
201
|
-
|
|
202
|
-
|
|
424
|
+
|
|
425
|
+
const transportOpts = {
|
|
426
|
+
command,
|
|
427
|
+
args: cmdArgs,
|
|
428
|
+
stderr: 'pipe',
|
|
429
|
+
...(authConfig?.env ? { env: { ...process.env, ...authConfig.env } } : {}),
|
|
430
|
+
...(authConfig?.cwd ? { cwd: authConfig.cwd } : {}),
|
|
431
|
+
};
|
|
432
|
+
|
|
433
|
+
const transport = new StdioClientTransport(transportOpts);
|
|
434
|
+
|
|
435
|
+
// Buffer stderr lines so we can surface them on connection failure,
|
|
436
|
+
// while still printing them in real time (preserving the SDK's default
|
|
437
|
+
// 'inherit' behavior for interactive use).
|
|
438
|
+
const stderrOutput = [];
|
|
439
|
+
const MAX_STDERR_LINES = 50;
|
|
440
|
+
if (transport.stderr) {
|
|
441
|
+
transport.stderr.on('data', (chunk) => {
|
|
442
|
+
process.stderr.write(chunk);
|
|
443
|
+
const lines = chunk.toString().split('\n');
|
|
444
|
+
for (const line of lines) {
|
|
445
|
+
if (line) {
|
|
446
|
+
stderrOutput.push(line);
|
|
447
|
+
if (stderrOutput.length > MAX_STDERR_LINES) {
|
|
448
|
+
stderrOutput.shift();
|
|
449
|
+
}
|
|
450
|
+
}
|
|
451
|
+
}
|
|
452
|
+
});
|
|
453
|
+
}
|
|
454
|
+
|
|
455
|
+
try {
|
|
456
|
+
await client.connect(transport);
|
|
457
|
+
} catch (err) {
|
|
458
|
+
// Attach captured stderr so callers can surface it for diagnostics.
|
|
459
|
+
err._stderrOutput = stderrOutput;
|
|
460
|
+
// Clean up the spawned process so it doesn't linger.
|
|
461
|
+
try { await transport.close(); } catch { /* best-effort */ }
|
|
462
|
+
throw err;
|
|
463
|
+
}
|
|
464
|
+
return { client, transport, stderrOutput };
|
|
203
465
|
}
|
|
204
466
|
}
|
|
205
467
|
|
|
@@ -405,6 +667,20 @@ function sunpeakInspectEndpointsPlugin(getClient, setClient, pluginOpts = {}) {
|
|
|
405
667
|
}
|
|
406
668
|
});
|
|
407
669
|
|
|
670
|
+
// List resources from connected server
|
|
671
|
+
server.middlewares.use('/__sunpeak/list-resources', async (_req, res) => {
|
|
672
|
+
try {
|
|
673
|
+
const client = getClient();
|
|
674
|
+
const result = await client.listResources();
|
|
675
|
+
res.writeHead(200, { 'Content-Type': 'application/json' });
|
|
676
|
+
res.end(JSON.stringify(result));
|
|
677
|
+
} catch (err) {
|
|
678
|
+
// Server may not support resources — return empty list
|
|
679
|
+
res.writeHead(200, { 'Content-Type': 'application/json' });
|
|
680
|
+
res.end(JSON.stringify({ resources: [] }));
|
|
681
|
+
}
|
|
682
|
+
});
|
|
683
|
+
|
|
408
684
|
// Call tool on connected server
|
|
409
685
|
server.middlewares.use('/__sunpeak/call-tool', async (req, res) => {
|
|
410
686
|
if (req.method !== 'POST') {
|
|
@@ -911,6 +1187,8 @@ function readRequestBody(req) {
|
|
|
911
1187
|
* @param {Record<string, string>} [opts.resolveAlias] - Vite resolve aliases (e.g., to map sunpeak imports to source)
|
|
912
1188
|
* @param {object[]} [opts.vitePlugins] - Additional Vite plugins (e.g., Tailwind for source CSS)
|
|
913
1189
|
* @param {object} [opts.viteCssConfig] - Vite css config override (e.g., lightningcss customAtRules)
|
|
1190
|
+
* @param {Record<string, string>} [opts.env] - Extra environment variables for stdio server processes
|
|
1191
|
+
* @param {string} [opts.cwd] - Working directory for stdio server processes
|
|
914
1192
|
*/
|
|
915
1193
|
export async function inspectServer(opts) {
|
|
916
1194
|
const {
|
|
@@ -928,6 +1206,8 @@ export async function inspectServer(opts) {
|
|
|
928
1206
|
resolveAlias,
|
|
929
1207
|
vitePlugins: extraVitePlugins = [],
|
|
930
1208
|
viteCssConfig,
|
|
1209
|
+
env: serverEnv,
|
|
1210
|
+
cwd: serverCwd,
|
|
931
1211
|
} = opts;
|
|
932
1212
|
|
|
933
1213
|
// Load favicon from sunpeak package for the inspector UI.
|
|
@@ -948,14 +1228,47 @@ export async function inspectServer(opts) {
|
|
|
948
1228
|
|
|
949
1229
|
// Connect to the MCP server (with retry for local servers that may still be starting)
|
|
950
1230
|
let mcpConnection;
|
|
1231
|
+
let lastStderrOutput = [];
|
|
951
1232
|
const maxRetries = 5;
|
|
1233
|
+
const connectionOpts = {};
|
|
1234
|
+
if (serverEnv) connectionOpts.env = serverEnv;
|
|
1235
|
+
if (serverCwd) connectionOpts.cwd = serverCwd;
|
|
952
1236
|
for (let attempt = 1; attempt <= maxRetries; attempt++) {
|
|
953
1237
|
try {
|
|
954
|
-
mcpConnection = await createMcpConnection(serverArg);
|
|
1238
|
+
mcpConnection = await createMcpConnection(serverArg, connectionOpts);
|
|
955
1239
|
break;
|
|
956
1240
|
} catch (err) {
|
|
1241
|
+
// Capture stderr from the failed connection attempt for diagnostics.
|
|
1242
|
+
if (err._stderrOutput?.length) {
|
|
1243
|
+
lastStderrOutput = err._stderrOutput;
|
|
1244
|
+
}
|
|
1245
|
+
|
|
1246
|
+
// If the server requires OAuth, negotiate it and retry once.
|
|
1247
|
+
if (isAuthError(err) && serverArg.startsWith('http')) {
|
|
1248
|
+
console.log('Server requires authentication. Negotiating OAuth...');
|
|
1249
|
+
try {
|
|
1250
|
+
const authProvider = await negotiateOAuth(serverArg);
|
|
1251
|
+
console.log('OAuth authorized. Reconnecting...');
|
|
1252
|
+
mcpConnection = await createMcpConnection(serverArg, {
|
|
1253
|
+
...connectionOpts,
|
|
1254
|
+
type: 'oauth',
|
|
1255
|
+
authProvider,
|
|
1256
|
+
});
|
|
1257
|
+
break;
|
|
1258
|
+
} catch (oauthErr) {
|
|
1259
|
+
console.error(`OAuth negotiation failed: ${oauthErr.message}`);
|
|
1260
|
+
process.exit(1);
|
|
1261
|
+
}
|
|
1262
|
+
}
|
|
1263
|
+
|
|
957
1264
|
if (attempt === maxRetries) {
|
|
958
1265
|
console.error(`Failed to connect to MCP server: ${err.message}`);
|
|
1266
|
+
if (lastStderrOutput.length) {
|
|
1267
|
+
console.error('\nServer stderr output:');
|
|
1268
|
+
for (const line of lastStderrOutput) {
|
|
1269
|
+
console.error(` ${line}`);
|
|
1270
|
+
}
|
|
1271
|
+
}
|
|
959
1272
|
process.exit(1);
|
|
960
1273
|
}
|
|
961
1274
|
console.log(`Connection attempt ${attempt}/${maxRetries} failed, retrying...`);
|
|
@@ -1195,5 +1508,7 @@ export async function inspect(args) {
|
|
|
1195
1508
|
simulationsDir,
|
|
1196
1509
|
port: opts.port,
|
|
1197
1510
|
name: opts.name,
|
|
1511
|
+
env: opts.env,
|
|
1512
|
+
cwd: opts.cwd,
|
|
1198
1513
|
});
|
|
1199
1514
|
}
|
package/bin/commands/new.mjs
CHANGED
|
@@ -9,6 +9,7 @@ const execAsync = promisify(exec);
|
|
|
9
9
|
import * as clack from '@clack/prompts';
|
|
10
10
|
import { discoverResources } from '../lib/patterns.mjs';
|
|
11
11
|
import { detectPackageManager } from '../utils.mjs';
|
|
12
|
+
import { EVAL_PROVIDERS } from '../lib/eval/eval-providers.mjs';
|
|
12
13
|
|
|
13
14
|
const __dirname = dirname(fileURLToPath(import.meta.url));
|
|
14
15
|
|
|
@@ -57,6 +58,21 @@ async function defaultSelectResources(availableResources) {
|
|
|
57
58
|
return selected;
|
|
58
59
|
}
|
|
59
60
|
|
|
61
|
+
/**
|
|
62
|
+
* Default prompt for eval provider selection.
|
|
63
|
+
* @returns {Promise<Array<{ pkg: string, models: string[] }>>}
|
|
64
|
+
*/
|
|
65
|
+
async function defaultSelectProviders() {
|
|
66
|
+
const selected = await clack.multiselect({
|
|
67
|
+
message: 'AI providers for evals (space to toggle, enter to skip)',
|
|
68
|
+
options: EVAL_PROVIDERS.map((p) => ({ value: p, label: p.label })),
|
|
69
|
+
initialValues: [],
|
|
70
|
+
required: false,
|
|
71
|
+
});
|
|
72
|
+
if (clack.isCancel(selected)) return [];
|
|
73
|
+
return selected;
|
|
74
|
+
}
|
|
75
|
+
|
|
60
76
|
/**
|
|
61
77
|
* Default dependencies (real implementations)
|
|
62
78
|
*/
|
|
@@ -73,6 +89,8 @@ export const defaultDeps = {
|
|
|
73
89
|
execAsync,
|
|
74
90
|
promptName: defaultPromptName,
|
|
75
91
|
selectResources: defaultSelectResources,
|
|
92
|
+
selectProviders: defaultSelectProviders,
|
|
93
|
+
password: clack.password,
|
|
76
94
|
confirm: clack.confirm,
|
|
77
95
|
intro: clack.intro,
|
|
78
96
|
outro: clack.outro,
|
|
@@ -233,6 +251,15 @@ export async function init(projectName, resourcesArg, deps = defaultDeps) {
|
|
|
233
251
|
d.renameSync(srcPath, destPath);
|
|
234
252
|
}
|
|
235
253
|
}
|
|
254
|
+
// Rename nested dotfiles (underscore convention for npm compatibility)
|
|
255
|
+
const nestedDotfiles = [['tests/evals/_env.example', 'tests/evals/.env.example']];
|
|
256
|
+
for (const [from, to] of nestedDotfiles) {
|
|
257
|
+
const srcPath = join(targetDir, from);
|
|
258
|
+
const destPath = join(targetDir, to);
|
|
259
|
+
if (d.existsSync(srcPath)) {
|
|
260
|
+
d.renameSync(srcPath, destPath);
|
|
261
|
+
}
|
|
262
|
+
}
|
|
236
263
|
|
|
237
264
|
// Read sunpeak version from root package.json
|
|
238
265
|
const rootPkg = JSON.parse(d.readFileSync(d.rootPkgPath, 'utf-8'));
|
|
@@ -282,6 +309,56 @@ export async function init(projectName, resourcesArg, deps = defaultDeps) {
|
|
|
282
309
|
s.stop(`Install failed. You can try running "${pm} install" manually.`);
|
|
283
310
|
}
|
|
284
311
|
|
|
312
|
+
// Offer to configure eval providers (only in interactive mode)
|
|
313
|
+
if (resourcesArg === undefined) {
|
|
314
|
+
const providers = await d.selectProviders();
|
|
315
|
+
if (!clack.isCancel(providers) && providers.length > 0) {
|
|
316
|
+
// Install AI SDK core + selected provider packages
|
|
317
|
+
const pkgsToInstall = ['ai', ...providers.map((p) => p.pkg)];
|
|
318
|
+
try {
|
|
319
|
+
await d.execAsync(`${pm} add -D ${pkgsToInstall.join(' ')}`, { cwd: targetDir });
|
|
320
|
+
} catch {
|
|
321
|
+
d.console.log(`Provider install failed. Install manually: ${pm} add -D ${pkgsToInstall.join(' ')}`);
|
|
322
|
+
}
|
|
323
|
+
|
|
324
|
+
// Uncomment selected models in eval.config.ts
|
|
325
|
+
const evalConfigPath = join(targetDir, 'tests', 'evals', 'eval.config.ts');
|
|
326
|
+
if (d.existsSync(evalConfigPath)) {
|
|
327
|
+
let config = d.readFileSync(evalConfigPath, 'utf-8');
|
|
328
|
+
for (const p of providers) {
|
|
329
|
+
for (const model of p.models) {
|
|
330
|
+
// Uncomment lines matching this model (e.g., " // 'gpt-4o'," → " 'gpt-4o',")
|
|
331
|
+
config = config.replace(
|
|
332
|
+
new RegExp(`^(\\s*)// ('${model.replace(/[.*+?^${}()|[\]\\]/g, '\\$&')}',?.*)$`, 'm'),
|
|
333
|
+
'$1$2'
|
|
334
|
+
);
|
|
335
|
+
}
|
|
336
|
+
}
|
|
337
|
+
d.writeFileSync(evalConfigPath, config);
|
|
338
|
+
}
|
|
339
|
+
|
|
340
|
+
// Prompt for API keys and write .env
|
|
341
|
+
const envLines = [];
|
|
342
|
+
const seen = new Set();
|
|
343
|
+
for (const p of providers) {
|
|
344
|
+
if (seen.has(p.envVar)) continue;
|
|
345
|
+
seen.add(p.envVar);
|
|
346
|
+
const key = await d.password({
|
|
347
|
+
message: `${p.envVar} (enter to skip)`,
|
|
348
|
+
mask: '*',
|
|
349
|
+
});
|
|
350
|
+
if (!clack.isCancel(key) && key) {
|
|
351
|
+
envLines.push(`${p.envVar}=${key}`);
|
|
352
|
+
}
|
|
353
|
+
}
|
|
354
|
+
const envPath = join(targetDir, 'tests', 'evals', '.env');
|
|
355
|
+
if (envLines.length > 0) {
|
|
356
|
+
d.writeFileSync(envPath, envLines.join('\n') + '\n');
|
|
357
|
+
clack.log.info(`API keys saved to tests/evals/.env (gitignored)`);
|
|
358
|
+
}
|
|
359
|
+
}
|
|
360
|
+
}
|
|
361
|
+
|
|
285
362
|
// Offer to install the sunpeak skills (only in interactive mode)
|
|
286
363
|
if (resourcesArg === undefined) {
|
|
287
364
|
const installSkill = await d.confirm({
|
|
@@ -290,18 +367,16 @@ export async function init(projectName, resourcesArg, deps = defaultDeps) {
|
|
|
290
367
|
});
|
|
291
368
|
if (!clack.isCancel(installSkill) && installSkill) {
|
|
292
369
|
try {
|
|
293
|
-
d.execSync('
|
|
370
|
+
d.execSync('pnpm dlx skills add Sunpeak-AI/sunpeak@create-sunpeak-app Sunpeak-AI/sunpeak@test-mcp-server', {
|
|
294
371
|
cwd: targetDir,
|
|
295
372
|
stdio: 'inherit',
|
|
296
373
|
});
|
|
297
374
|
} catch {
|
|
298
|
-
d.console.log('Skill install skipped. You can install later with:
|
|
375
|
+
d.console.log('Skill install skipped. You can install later with: pnpm dlx skills add Sunpeak-AI/sunpeak@create-sunpeak-app Sunpeak-AI/sunpeak@test-mcp-server');
|
|
299
376
|
}
|
|
300
377
|
}
|
|
301
378
|
}
|
|
302
379
|
|
|
303
|
-
const runCmd = pm === 'npm' ? 'npm run' : pm;
|
|
304
|
-
|
|
305
380
|
d.outro(`Done! To get started:
|
|
306
381
|
|
|
307
382
|
cd ${projectName}
|
|
@@ -309,9 +384,12 @@ export async function init(projectName, resourcesArg, deps = defaultDeps) {
|
|
|
309
384
|
|
|
310
385
|
Your project commands:
|
|
311
386
|
|
|
312
|
-
sunpeak dev
|
|
313
|
-
sunpeak build
|
|
314
|
-
|
|
387
|
+
sunpeak dev # Start dev server + MCP endpoint
|
|
388
|
+
sunpeak build # Build for production
|
|
389
|
+
sunpeak test # Run unit + e2e tests
|
|
390
|
+
sunpeak test --eval # Run LLM evals (configure models in tests/evals/eval.config.ts)
|
|
391
|
+
sunpeak test --visual # Run visual regression tests
|
|
392
|
+
sunpeak test --live # Run live tests against real AI hosts`);
|
|
315
393
|
}
|
|
316
394
|
|
|
317
395
|
// Allow running directly
|