@inspectr/mcplab 1.12.1 → 1.14.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/app/assets/index-B3_k1eZO.js +250 -0
- package/dist/app/assets/index-C3E9mFQO.css +1 -0
- package/dist/app/index.html +2 -2
- package/dist/app-server/app-context.d.ts +91 -141
- package/dist/app-server/app-context.d.ts.map +1 -1
- package/dist/app-server/http.d.ts +2 -1
- package/dist/app-server/http.d.ts.map +1 -1
- package/dist/app-server/http.js +5 -0
- package/dist/app-server/http.js.map +1 -1
- package/dist/app-server/oauth-debugger-domain.d.ts +182 -202
- package/dist/app-server/oauth-debugger-domain.d.ts.map +1 -1
- package/dist/app-server/oauth-debugger-domain.js +58 -10
- package/dist/app-server/oauth-debugger-domain.js.map +1 -1
- package/dist/app-server/oauth-debugger.d.ts +10 -17
- package/dist/app-server/oauth-debugger.d.ts.map +1 -1
- package/dist/app-server/oauth-debugger.js +233 -2
- package/dist/app-server/oauth-debugger.js.map +1 -1
- package/dist/app-server/result-assistant-domain.js +1 -1
- package/dist/app-server/result-assistant-domain.js.map +1 -1
- package/dist/app-server/result-assistant-tools.d.ts.map +1 -1
- package/dist/app-server/result-assistant-tools.js +3 -2
- package/dist/app-server/result-assistant-tools.js.map +1 -1
- package/dist/app-server/router.d.ts.map +1 -1
- package/dist/app-server/router.js +2 -1
- package/dist/app-server/router.js.map +1 -1
- package/dist/app-server/tool-analysis-domain.d.ts +163 -178
- package/dist/app-server/tool-analysis-domain.d.ts.map +1 -1
- package/dist/app-server/tool-analysis-domain.js +17 -4
- package/dist/app-server/tool-analysis-domain.js.map +1 -1
- package/dist/app-server/tool-analysis.d.ts.map +1 -1
- package/dist/app-server/tool-analysis.js +24 -1
- package/dist/app-server/tool-analysis.js.map +1 -1
- package/dist/cli.js +159 -0
- package/dist/cli.js.map +1 -1
- package/dist/results/context.d.ts +3 -0
- package/dist/results/context.d.ts.map +1 -0
- package/dist/results/context.js +2 -0
- package/dist/results/context.js.map +1 -0
- package/dist/results/format.d.ts +21 -0
- package/dist/results/format.d.ts.map +1 -0
- package/dist/results/format.js +92 -0
- package/dist/results/format.js.map +1 -0
- package/dist/results/indexer.d.ts +9 -0
- package/dist/results/indexer.d.ts.map +1 -0
- package/dist/results/indexer.js +2 -0
- package/dist/results/indexer.js.map +1 -0
- package/dist/results/search.d.ts +2 -0
- package/dist/results/search.d.ts.map +1 -0
- package/dist/results/search.js +2 -0
- package/dist/results/search.js.map +1 -0
- package/dist/results/types.d.ts +11 -0
- package/dist/results/types.d.ts.map +1 -0
- package/dist/results/types.js +2 -0
- package/dist/results/types.js.map +1 -0
- package/dist/test-results-fixture.d.ts +7 -0
- package/dist/test-results-fixture.d.ts.map +1 -0
- package/dist/test-results-fixture.js +82 -0
- package/dist/test-results-fixture.js.map +1 -0
- package/package.json +6 -6
- package/dist/app/assets/index-Djwh_08m.js +0 -249
- package/dist/app/assets/index-cqsnfkao.css +0 -1
|
@@ -0,0 +1,92 @@
|
|
|
1
|
+
import { existsSync, readFileSync } from 'node:fs';
|
|
2
|
+
import { listRunIdsDesc, resolveRunArtifactPath } from '@inspectr/mcplab-core';
|
|
3
|
+
function listRunIds(runsDir) {
|
|
4
|
+
return listRunIdsDesc(runsDir);
|
|
5
|
+
}
|
|
6
|
+
export function listRuns(runsDir) {
|
|
7
|
+
return listRunIds(runsDir).map((runId) => {
|
|
8
|
+
const resultsPath = resolveRunArtifactPath(runsDir, runId, 'results.json');
|
|
9
|
+
if (!existsSync(resultsPath)) {
|
|
10
|
+
return { run_id: runId };
|
|
11
|
+
}
|
|
12
|
+
try {
|
|
13
|
+
const parsed = JSON.parse(readFileSync(resultsPath, 'utf8'));
|
|
14
|
+
return {
|
|
15
|
+
run_id: runId,
|
|
16
|
+
timestamp: parsed.metadata.timestamp,
|
|
17
|
+
pass_rate: typeof parsed.summary.pass_rate === 'number' ? parsed.summary.pass_rate : null,
|
|
18
|
+
total_runs: parsed.summary.total_runs
|
|
19
|
+
};
|
|
20
|
+
}
|
|
21
|
+
catch {
|
|
22
|
+
return { run_id: runId };
|
|
23
|
+
}
|
|
24
|
+
});
|
|
25
|
+
}
|
|
26
|
+
export function showRun(runsDir, runId, format) {
|
|
27
|
+
if (format === 'markdown') {
|
|
28
|
+
const summaryPath = resolveRunArtifactPath(runsDir, runId, 'summary.md');
|
|
29
|
+
if (existsSync(summaryPath)) {
|
|
30
|
+
return readFileSync(summaryPath, 'utf8');
|
|
31
|
+
}
|
|
32
|
+
}
|
|
33
|
+
const resultsPath = resolveRunArtifactPath(runsDir, runId, 'results.json');
|
|
34
|
+
if (!existsSync(resultsPath)) {
|
|
35
|
+
throw new Error(`results.json not found for run ${runId}`);
|
|
36
|
+
}
|
|
37
|
+
try {
|
|
38
|
+
const parsed = JSON.parse(readFileSync(resultsPath, 'utf8'));
|
|
39
|
+
return JSON.stringify(parsed, null, 2);
|
|
40
|
+
}
|
|
41
|
+
catch (error) {
|
|
42
|
+
const msg = error instanceof Error ? error.message : String(error);
|
|
43
|
+
throw new Error(`Could not parse results.json for run ${runId}: ${msg}`);
|
|
44
|
+
}
|
|
45
|
+
}
|
|
46
|
+
export function formatRunList(list, format) {
|
|
47
|
+
if (format === 'json') {
|
|
48
|
+
return JSON.stringify(list, null, 2);
|
|
49
|
+
}
|
|
50
|
+
const lines = ['RUN_ID\tTIMESTAMP\tPASS_RATE\tTOTAL_RUNS'];
|
|
51
|
+
for (const item of list) {
|
|
52
|
+
lines.push(`${item.run_id}\t${item.timestamp ?? '-'}\t${item.pass_rate === undefined || item.pass_rate === null
|
|
53
|
+
? '-'
|
|
54
|
+
: (item.pass_rate * 100).toFixed(1) + '%'}\t${item.total_runs ?? '-'}`);
|
|
55
|
+
}
|
|
56
|
+
return lines.join('\n');
|
|
57
|
+
}
|
|
58
|
+
export function formatSearchHits(hits, format) {
|
|
59
|
+
if (format === 'json')
|
|
60
|
+
return JSON.stringify(hits, null, 2);
|
|
61
|
+
if (format === 'jsonl')
|
|
62
|
+
return hits.map((hit) => JSON.stringify(hit)).join('\n');
|
|
63
|
+
const lines = ['# Search Results', ''];
|
|
64
|
+
hits.forEach((hit, idx) => {
|
|
65
|
+
lines.push(`${idx + 1}. run=${hit.run_id} scenario=${hit.scenario_id ?? '-'} agent=${hit.agent ?? '-'} status=${hit.status ?? '-'} score=${hit.score}`);
|
|
66
|
+
lines.push(` source=${hit.source} file=${hit.file}${hit.line_start ? `:${hit.line_start}` : ''}`);
|
|
67
|
+
lines.push(` snippet: ${hit.snippet}`);
|
|
68
|
+
if (hit.context_command) {
|
|
69
|
+
lines.push(` next: ${hit.context_command}`);
|
|
70
|
+
}
|
|
71
|
+
});
|
|
72
|
+
return lines.join('\n');
|
|
73
|
+
}
|
|
74
|
+
export function formatContext(result, format) {
|
|
75
|
+
if (format === 'json')
|
|
76
|
+
return JSON.stringify(result, null, 2);
|
|
77
|
+
return [
|
|
78
|
+
`# Context ${result.run_id}/${result.scenario_id}`,
|
|
79
|
+
'',
|
|
80
|
+
`run: ${result.run_id}`,
|
|
81
|
+
`scenario: ${result.scenario_id}`,
|
|
82
|
+
`source: ${result.source}`,
|
|
83
|
+
result.line_start ? `lines: ${result.line_start}-${result.line_end}` : '',
|
|
84
|
+
'',
|
|
85
|
+
'```',
|
|
86
|
+
result.excerpt,
|
|
87
|
+
'```'
|
|
88
|
+
]
|
|
89
|
+
.filter(Boolean)
|
|
90
|
+
.join('\n');
|
|
91
|
+
}
|
|
92
|
+
//# sourceMappingURL=format.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"format.js","sourceRoot":"","sources":["../../src/results/format.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,UAAU,EAAE,YAAY,EAAE,MAAM,SAAS,CAAC;AACnD,OAAO,EAAE,cAAc,EAAE,sBAAsB,EAAoB,MAAM,uBAAuB,CAAC;AAWjG,SAAS,UAAU,CAAC,OAAe;IACjC,OAAO,cAAc,CAAC,OAAO,CAAC,CAAC;AACjC,CAAC;AAED,MAAM,UAAU,QAAQ,CAAC,OAAe;IACtC,OAAO,UAAU,CAAC,OAAO,CAAC,CAAC,GAAG,CAAC,CAAC,KAAK,EAAE,EAAE;QACvC,MAAM,WAAW,GAAG,sBAAsB,CAAC,OAAO,EAAE,KAAK,EAAE,cAAc,CAAC,CAAC;QAC3E,IAAI,CAAC,UAAU,CAAC,WAAW,CAAC,EAAE,CAAC;YAC7B,OAAO,EAAE,MAAM,EAAE,KAAK,EAAE,CAAC;QAC3B,CAAC;QACD,IAAI,CAAC;YACH,MAAM,MAAM,GAAG,IAAI,CAAC,KAAK,CAAC,YAAY,CAAC,WAAW,EAAE,MAAM,CAAC,CAAgB,CAAC;YAC5E,OAAO;gBACL,MAAM,EAAE,KAAK;gBACb,SAAS,EAAE,MAAM,CAAC,QAAQ,CAAC,SAAS;gBACpC,SAAS,EAAE,OAAO,MAAM,CAAC,OAAO,CAAC,SAAS,KAAK,QAAQ,CAAC,CAAC,CAAC,MAAM,CAAC,OAAO,CAAC,SAAS,CAAC,CAAC,CAAC,IAAI;gBACzF,UAAU,EAAE,MAAM,CAAC,OAAO,CAAC,UAAU;aACtC,CAAC;QACJ,CAAC;QAAC,MAAM,CAAC;YACP,OAAO,EAAE,MAAM,EAAE,KAAK,EAAE,CAAC;QAC3B,CAAC;IACH,CAAC,CAAC,CAAC;AACL,CAAC;AAED,MAAM,UAAU,OAAO,CAAC,OAAe,EAAE,KAAa,EAAE,MAA2B;IACjF,IAAI,MAAM,KAAK,UAAU,EAAE,CAAC;QAC1B,MAAM,WAAW,GAAG,sBAAsB,CAAC,OAAO,EAAE,KAAK,EAAE,YAAY,CAAC,CAAC;QACzE,IAAI,UAAU,CAAC,WAAW,CAAC,EAAE,CAAC;YAC5B,OAAO,YAAY,CAAC,WAAW,EAAE,MAAM,CAAC,CAAC;QAC3C,CAAC;IACH,CAAC;IACD,MAAM,WAAW,GAAG,sBAAsB,CAAC,OAAO,EAAE,KAAK,EAAE,cAAc,CAAC,CAAC;IAC3E,IAAI,CAAC,UAAU,CAAC,WAAW,CAAC,EAAE,CAAC;QAC7B,MAAM,IAAI,KAAK,CAAC,kCAAkC,KAAK,EAAE,CAAC,CAAC;IAC7D,CAAC;IACD,IAAI,CAAC;QACH,MAAM,MAAM,GAAG,IAAI,CAAC,KAAK,CAAC,YAAY,CAAC,WAAW,EAAE,MAAM,CAAC,CAAgB,CAAC;QAC5E,OAAO,IAAI,CAAC,SAAS,CAAC,MAAM,EAAE,IAAI,EAAE,CAAC,CAAC,CAAC;IACzC,CAAC;IAAC,OAAO,KAAK,EAAE,CAAC;QACf,MAAM,GAAG,GAAG,KAAK,YAAY,KAAK,CAAC,CAAC,CAAC,KAAK,CAAC,OAAO,CAAC,CAAC,CAAC,MAAM,CAAC,KAAK,CAAC,CAAC;QACnE,MAAM,IAAI,KAAK,CAAC,wCAAwC,KAAK,KAAK,GAAG,EAAE,CAAC,CAAC;IAC3E,CAAC;AACH,CAAC;AAED,MAAM,UAAU,aAAa,CAAC,IAAmB,EAAE,MAAwB;IACzE,IAAI,MAAM,KAAK,MAAM,EAAE,CAAC;QACtB,OAAO,IAAI,CAAC,SAAS,CAAC,IAAI,EAAE,IAAI,EAAE,CAAC,CAAC,CAAC;IACvC,CAAC;IACD,MAAM,KAAK,GAAG,CAAC,0CAA0C,CAAC,CAAC;IAC3D,KAAK,MAAM,IAAI,IAAI,IAAI,EAAE,CAAC;QACxB,KAAK,CAAC,IAAI,CACR,GAAG,IAAI,CAAC,MAAM,KAAK,IAAI,CAAC,SAAS,IAAI,GAAG,KACtC,IAAI,CAAC,SAAS,KAAK,SAAS,IAAI,IAAI,CAAC,SAAS,KAAK,IAAI;YACrD,CAAC,CAAC,GAAG;YACL,CAAC,CAAC,CAAC,IAAI,CAAC,SAAS,GAAG,GAAG,CAAC,CAAC,OAAO,CAAC,CAAC,CAAC,GAAG,GAC1C,KAAK,IAAI,CAAC,UAAU,IAAI,GAAG,EAAE,CAC9B,CAAC;IACJ,CAAC;IACD,OAAO,KAAK,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;AAC1B,CAAC;AAED,MAAM,UAAU,gBAAgB,CAAC,IAAiB,EAAE,MAAqC;IACvF,IAAI,MAAM,KAAK,MAAM;QAAE,OAAO,IAAI,CAAC,SAAS,CAAC,IAAI,EAAE,IAAI,EAAE,CAAC,CAAC,CAAC;IAC5D,IAAI,MAAM,KAAK,OAAO;QAAE,OAAO,IAAI,CAAC,GAAG,CAAC,CAAC,GAAG,EAAE,EAAE,CAAC,IAAI,CAAC,SAAS,CAAC,GAAG,CAAC,CAAC,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;IACjF,MAAM,KAAK,GAAG,CAAC,kBAAkB,EAAE,EAAE,CAAC,CAAC;IACvC,IAAI,CAAC,OAAO,CAAC,CAAC,GAAG,EAAE,GAAG,EAAE,EAAE;QACxB,KAAK,CAAC,IAAI,CACR,GAAG,GAAG,GAAG,CAAC,SAAS,GAAG,CAAC,MAAM,aAAa,GAAG,CAAC,WAAW,IAAI,GAAG,UAC9D,GAAG,CAAC,KAAK,IAAI,GACf,WAAW,GAAG,CAAC,MAAM,IAAI,GAAG,UAAU,GAAG,CAAC,KAAK,EAAE,CAClD,CAAC;QACF,KAAK,CAAC,IAAI,CACR,aAAa,GAAG,CAAC,MAAM,SAAS,GAAG,CAAC,IAAI,GAAG,GAAG,CAAC,UAAU,CAAC,CAAC,CAAC,IAAI,GAAG,CAAC,UAAU,EAAE,CAAC,CAAC,CAAC,EAAE,EAAE,CACxF,CAAC;QACF,KAAK,CAAC,IAAI,CAAC,eAAe,GAAG,CAAC,OAAO,EAAE,CAAC,CAAC;QACzC,IAAI,GAAG,CAAC,eAAe,EAAE,CAAC;YACxB,KAAK,CAAC,IAAI,CAAC,YAAY,GAAG,CAAC,eAAe,EAAE,CAAC,CAAC;QAChD,CAAC;IACH,CAAC,CAAC,CAAC;IACH,OAAO,KAAK,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;AAC1B,CAAC;AAED,MAAM,UAAU,aAAa,CAAC,MAAqB,EAAE,MAA2B;IAC9E,IAAI,MAAM,KAAK,MAAM;QAAE,OAAO,IAAI,CAAC,SAAS,CAAC,MAAM,EAAE,IAAI,EAAE,CAAC,CAAC,CAAC;IAC9D,OAAO;QACL,aAAa,MAAM,CAAC,MAAM,IAAI,MAAM,CAAC,WAAW,EAAE;QAClD,EAAE;QACF,QAAQ,MAAM,CAAC,MAAM,EAAE;QACvB,aAAa,MAAM,CAAC,WAAW,EAAE;QACjC,WAAW,MAAM,CAAC,MAAM,EAAE;QAC1B,MAAM,CAAC,UAAU,CAAC,CAAC,CAAC,UAAU,MAAM,CAAC,UAAU,IAAI,MAAM,CAAC,QAAQ,EAAE,CAAC,CAAC,CAAC,EAAE;QACzE,EAAE;QACF,KAAK;QACL,MAAM,CAAC,OAAO;QACd,KAAK;KACN;SACE,MAAM,CAAC,OAAO,CAAC;SACf,IAAI,CAAC,IAAI,CAAC,CAAC;AAChB,CAAC"}
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"indexer.d.ts","sourceRoot":"","sources":["../../src/results/indexer.ts"],"names":[],"mappings":"AAAA,OAAO,EACL,gBAAgB,EAChB,iBAAiB,EACjB,sBAAsB,EACtB,eAAe,EACf,gBAAgB,EAChB,oBAAoB,EACrB,MAAM,uBAAuB,CAAC"}
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"indexer.js","sourceRoot":"","sources":["../../src/results/indexer.ts"],"names":[],"mappings":"AAAA,OAAO,EACL,gBAAgB,EAChB,iBAAiB,EACjB,sBAAsB,EACtB,eAAe,EACf,gBAAgB,EAChB,oBAAoB,EACrB,MAAM,uBAAuB,CAAC"}
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"search.d.ts","sourceRoot":"","sources":["../../src/results/search.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,QAAQ,EAAE,WAAW,EAAE,QAAQ,EAAE,cAAc,EAAE,UAAU,EAAE,MAAM,uBAAuB,CAAC"}
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"search.js","sourceRoot":"","sources":["../../src/results/search.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,QAAQ,EAAE,WAAW,EAAE,QAAQ,EAAE,cAAc,EAAE,UAAU,EAAE,MAAM,uBAAuB,CAAC"}
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"types.d.ts","sourceRoot":"","sources":["../../src/results/types.ts"],"names":[],"mappings":"AAAA,YAAY,EACV,YAAY,EACZ,YAAY,EACZ,SAAS,EACT,SAAS,EACT,aAAa,EACb,aAAa,EACb,cAAc,EACd,aAAa,EACd,MAAM,uBAAuB,CAAC"}
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"types.js","sourceRoot":"","sources":["../../src/results/types.ts"],"names":[],"mappings":""}
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"test-results-fixture.d.ts","sourceRoot":"","sources":["../src/test-results-fixture.ts"],"names":[],"mappings":"AAKA,MAAM,MAAM,UAAU,GAAG;IAAE,IAAI,EAAE,MAAM,CAAC;IAAC,OAAO,EAAE,MAAM,CAAC;IAAC,KAAK,EAAE,MAAM,CAAA;CAAE,CAAC;AAE1E,wBAAgB,uBAAuB,IAAI,UAAU,CAwFpD"}
|
|
@@ -0,0 +1,82 @@
|
|
|
1
|
+
import { mkdtempSync, mkdirSync, writeFileSync } from 'node:fs';
|
|
2
|
+
import { tmpdir } from 'node:os';
|
|
3
|
+
import { join } from 'node:path';
|
|
4
|
+
export function createResultsRunFixture() {
|
|
5
|
+
const root = mkdtempSync(join(tmpdir(), 'mcplab-results-'));
|
|
6
|
+
const runsDir = join(root, 'mcplab', 'results', 'evaluation-runs');
|
|
7
|
+
const runId = '20260206-212239';
|
|
8
|
+
const runDir = join(runsDir, runId);
|
|
9
|
+
mkdirSync(runDir, { recursive: true });
|
|
10
|
+
const results = {
|
|
11
|
+
metadata: {
|
|
12
|
+
run_id: runId,
|
|
13
|
+
timestamp: '2026-02-06T21:22:39.000Z',
|
|
14
|
+
config_hash: 'abc123',
|
|
15
|
+
cli_version: '1.0.0',
|
|
16
|
+
mcp_server_versions: {}
|
|
17
|
+
},
|
|
18
|
+
summary: {
|
|
19
|
+
total_scenarios: 1,
|
|
20
|
+
total_runs: 1,
|
|
21
|
+
pass_rate: 0,
|
|
22
|
+
avg_tool_calls_per_run: 1,
|
|
23
|
+
avg_tool_latency_ms: 50
|
|
24
|
+
},
|
|
25
|
+
scenarios: [
|
|
26
|
+
{
|
|
27
|
+
scenario_id: 'search-tags',
|
|
28
|
+
agent: 'claude-haiku',
|
|
29
|
+
runs: [
|
|
30
|
+
{
|
|
31
|
+
run_index: 0,
|
|
32
|
+
pass: false,
|
|
33
|
+
failures: ['response assertion failed'],
|
|
34
|
+
tool_calls: ['search_tags'],
|
|
35
|
+
tool_call_count: 1,
|
|
36
|
+
tool_sequence: ['search_tags'],
|
|
37
|
+
tool_usage: { search_tags: 1 },
|
|
38
|
+
tool_durations_ms: [50],
|
|
39
|
+
final_text: 'Could not complete request because timeout',
|
|
40
|
+
extracted: {},
|
|
41
|
+
error: 'timeout'
|
|
42
|
+
}
|
|
43
|
+
],
|
|
44
|
+
pass_rate: 0,
|
|
45
|
+
distinct_sequences: { '["search_tags"]': 1 },
|
|
46
|
+
tool_usage_frequency: { search_tags: 1 },
|
|
47
|
+
extracted_values: {},
|
|
48
|
+
last_final_answer: 'Could not complete request because timeout'
|
|
49
|
+
}
|
|
50
|
+
]
|
|
51
|
+
};
|
|
52
|
+
writeFileSync(join(runDir, 'results.json'), `${JSON.stringify(results, null, 2)}\n`, 'utf8');
|
|
53
|
+
writeFileSync(join(runDir, 'summary.md'), '# MCP Eval Summary\n\n| Scenario | Agent | Runs | Pass rate |\n|---|---|---|---|\n| search-tags | claude-haiku | 1 | 0% |\n', 'utf8');
|
|
54
|
+
writeFileSync(join(runDir, 'trace.jsonl'), `${JSON.stringify({
|
|
55
|
+
type: 'scenario_run',
|
|
56
|
+
trace_version: 3,
|
|
57
|
+
run_index: 0,
|
|
58
|
+
scenario_id: 'search-tags',
|
|
59
|
+
agent: 'claude-haiku',
|
|
60
|
+
provider: 'anthropic',
|
|
61
|
+
model: 'claude-3-haiku',
|
|
62
|
+
ts_start: '2026-02-06T21:22:39.000Z',
|
|
63
|
+
ts_end: '2026-02-06T21:22:40.000Z',
|
|
64
|
+
pass: false,
|
|
65
|
+
messages: [
|
|
66
|
+
{
|
|
67
|
+
role: 'assistant',
|
|
68
|
+
content: [
|
|
69
|
+
{
|
|
70
|
+
type: 'tool_result',
|
|
71
|
+
tool_use_id: 'call_1',
|
|
72
|
+
name: 'search_tags',
|
|
73
|
+
content: [{ type: 'text', text: 'tool search_tags returned timeout after 5000ms' }],
|
|
74
|
+
is_error: true
|
|
75
|
+
}
|
|
76
|
+
]
|
|
77
|
+
}
|
|
78
|
+
]
|
|
79
|
+
})}\nnot-json\n`, 'utf8');
|
|
80
|
+
return { root, runsDir, runId };
|
|
81
|
+
}
|
|
82
|
+
//# sourceMappingURL=test-results-fixture.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"test-results-fixture.js","sourceRoot":"","sources":["../src/test-results-fixture.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,WAAW,EAAE,SAAS,EAAE,aAAa,EAAE,MAAM,SAAS,CAAC;AAChE,OAAO,EAAE,MAAM,EAAE,MAAM,SAAS,CAAC;AACjC,OAAO,EAAE,IAAI,EAAE,MAAM,WAAW,CAAC;AAKjC,MAAM,UAAU,uBAAuB;IACrC,MAAM,IAAI,GAAG,WAAW,CAAC,IAAI,CAAC,MAAM,EAAE,EAAE,iBAAiB,CAAC,CAAC,CAAC;IAC5D,MAAM,OAAO,GAAG,IAAI,CAAC,IAAI,EAAE,QAAQ,EAAE,SAAS,EAAE,iBAAiB,CAAC,CAAC;IACnE,MAAM,KAAK,GAAG,iBAAiB,CAAC;IAChC,MAAM,MAAM,GAAG,IAAI,CAAC,OAAO,EAAE,KAAK,CAAC,CAAC;IACpC,SAAS,CAAC,MAAM,EAAE,EAAE,SAAS,EAAE,IAAI,EAAE,CAAC,CAAC;IAEvC,MAAM,OAAO,GAAgB;QAC3B,QAAQ,EAAE;YACR,MAAM,EAAE,KAAK;YACb,SAAS,EAAE,0BAA0B;YACrC,WAAW,EAAE,QAAQ;YACrB,WAAW,EAAE,OAAO;YACpB,mBAAmB,EAAE,EAAE;SACxB;QACD,OAAO,EAAE;YACP,eAAe,EAAE,CAAC;YAClB,UAAU,EAAE,CAAC;YACb,SAAS,EAAE,CAAC;YACZ,sBAAsB,EAAE,CAAC;YACzB,mBAAmB,EAAE,EAAE;SACxB;QACD,SAAS,EAAE;YACT;gBACE,WAAW,EAAE,aAAa;gBAC1B,KAAK,EAAE,cAAc;gBACrB,IAAI,EAAE;oBACJ;wBACE,SAAS,EAAE,CAAC;wBACZ,IAAI,EAAE,KAAK;wBACX,QAAQ,EAAE,CAAC,2BAA2B,CAAC;wBACvC,UAAU,EAAE,CAAC,aAAa,CAAC;wBAC3B,eAAe,EAAE,CAAC;wBAClB,aAAa,EAAE,CAAC,aAAa,CAAC;wBAC9B,UAAU,EAAE,EAAE,WAAW,EAAE,CAAC,EAAE;wBAC9B,iBAAiB,EAAE,CAAC,EAAE,CAAC;wBACvB,UAAU,EAAE,4CAA4C;wBACxD,SAAS,EAAE,EAAE;wBACb,KAAK,EAAE,SAAS;qBACjB;iBACF;gBACD,SAAS,EAAE,CAAC;gBACZ,kBAAkB,EAAE,EAAE,iBAAiB,EAAE,CAAC,EAAE;gBAC5C,oBAAoB,EAAE,EAAE,WAAW,EAAE,CAAC,EAAE;gBACxC,gBAAgB,EAAE,EAAE;gBACpB,iBAAiB,EAAE,4CAA4C;aAChE;SACF;KACF,CAAC;IAEF,aAAa,CAAC,IAAI,CAAC,MAAM,EAAE,cAAc,CAAC,EAAE,GAAG,IAAI,CAAC,SAAS,CAAC,OAAO,EAAE,IAAI,EAAE,CAAC,CAAC,IAAI,EAAE,MAAM,CAAC,CAAC;IAC7F,aAAa,CACX,IAAI,CAAC,MAAM,EAAE,YAAY,CAAC,EAC1B,6HAA6H,EAC7H,MAAM,CACP,CAAC;IACF,aAAa,CACX,IAAI,CAAC,MAAM,EAAE,aAAa,CAAC,EAC3B,GAAG,IAAI,CAAC,SAAS,CAAC;QAChB,IAAI,EAAE,cAAc;QACpB,aAAa,EAAE,CAAC;QAChB,SAAS,EAAE,CAAC;QACZ,WAAW,EAAE,aAAa;QAC1B,KAAK,EAAE,cAAc;QACrB,QAAQ,EAAE,WAAW;QACrB,KAAK,EAAE,gBAAgB;QACvB,QAAQ,EAAE,0BAA0B;QACpC,MAAM,EAAE,0BAA0B;QAClC,IAAI,EAAE,KAAK;QACX,QAAQ,EAAE;YACR;gBACE,IAAI,EAAE,WAAW;gBACjB,OAAO,EAAE;oBACP;wBACE,IAAI,EAAE,aAAa;wBACnB,WAAW,EAAE,QAAQ;wBACrB,IAAI,EAAE,aAAa;wBACnB,OAAO,EAAE,CAAC,EAAE,IAAI,EAAE,MAAM,EAAE,IAAI,EAAE,gDAAgD,EAAE,CAAC;wBACnF,QAAQ,EAAE,IAAI;qBACf;iBACF;aACF;SACF;KACF,CAAC,cAAc,EAChB,MAAM,CACP,CAAC;IAEF,OAAO,EAAE,IAAI,EAAE,OAAO,EAAE,KAAK,EAAE,CAAC;AAClC,CAAC"}
|
package/package.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
{
|
|
2
2
|
"name": "@inspectr/mcplab",
|
|
3
|
-
"version": "1.
|
|
3
|
+
"version": "1.14.0",
|
|
4
4
|
"description": "MCPLab - Test and evaluate MCP servers with LLMs — run evals, compare agents and launch the MCPLab web app",
|
|
5
5
|
"license": "MIT",
|
|
6
6
|
"homepage": "https://mcplab.inspectr.dev",
|
|
@@ -44,12 +44,12 @@
|
|
|
44
44
|
"vitest": "^3.2.4"
|
|
45
45
|
},
|
|
46
46
|
"dependencies": {
|
|
47
|
-
"@inspectr/mcplab-core": "1.
|
|
48
|
-
"@inspectr/mcplab-mcp-server": "1.
|
|
49
|
-
"@inspectr/mcplab-reporting": "1.1.
|
|
47
|
+
"@inspectr/mcplab-core": "1.11.0",
|
|
48
|
+
"@inspectr/mcplab-mcp-server": "1.3.1",
|
|
49
|
+
"@inspectr/mcplab-reporting": "1.1.11",
|
|
50
50
|
"commander": "^12.1.0",
|
|
51
|
-
"dotenv": "^16.
|
|
51
|
+
"dotenv": "^16.6.1",
|
|
52
52
|
"kleur": "^4.1.5",
|
|
53
|
-
"yaml": "^2.
|
|
53
|
+
"yaml": "^2.8.4"
|
|
54
54
|
}
|
|
55
55
|
}
|