backend-manager 5.6.4 → 5.7.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/CHANGELOG.md +35 -0
- package/CLAUDE.md +4 -3
- package/PROGRESS.md +34 -0
- package/docs/ai-library.md +62 -11
- package/docs/cdp-debugging.md +44 -0
- package/docs/cli-output.md +22 -10
- package/docs/mcp.md +166 -43
- package/package.json +1 -1
- package/plans/mcp2.md +247 -0
- package/src/cli/commands/mcp.js +8 -2
- package/src/cli/commands/serve.js +155 -29
- package/src/cli/commands/setup-tests/base-test.js +8 -0
- package/src/cli/commands/setup-tests/firebase-auth.js +26 -0
- package/src/cli/commands/setup-tests/firebase-cli.js +9 -13
- package/src/cli/commands/setup-tests/index.js +4 -0
- package/src/cli/commands/setup-tests/java-installed.js +26 -0
- package/src/cli/commands/setup.js +2 -1
- package/src/cli/commands/test.js +8 -0
- package/src/cli/index.js +14 -0
- package/src/cli/utils/ui.js +27 -5
- package/src/manager/index.js +8 -3
- package/src/manager/libraries/ai/index.js +45 -1
- package/src/manager/libraries/ai/providers/anthropic-format.js +234 -0
- package/src/manager/libraries/ai/providers/anthropic.js +28 -49
- package/src/manager/libraries/ai/providers/claude-code.js +21 -47
- package/src/manager/libraries/ai/providers/openai.js +154 -19
- package/src/manager/libraries/ai/providers/test.js +242 -0
- package/src/manager/libraries/email/data/disposable-domains.json +465 -0
- package/src/mcp/client.js +48 -13
- package/src/mcp/handler.js +222 -69
- package/src/mcp/index.js +48 -18
- package/src/mcp/tools.js +150 -0
- package/src/mcp/utils.js +108 -0
- package/src/test/fixtures/firebase-project/firebase.json +1 -1
- package/test/ai/tools-live.js +170 -0
- package/test/helpers/ai-test-provider.js +202 -0
- package/test/helpers/ai-tools-format.js +350 -0
- package/test/mcp/discovery.js +53 -0
- package/test/mcp/oauth.js +161 -0
- package/test/mcp/protocol.js +268 -0
- package/test/mcp/roles.js +168 -0
- package/test/mcp/utils.js +245 -0
- package/.claude/settings.local.json +0 -12
|
@@ -0,0 +1,202 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Test: deterministic AI test provider (libraries/ai/providers/test.js)
|
|
3
|
+
*
|
|
4
|
+
* The test provider is a first-class provider (the `test` payment-processor
|
|
5
|
+
* precedent) that consumer suites drive with directives embedded in the last
|
|
6
|
+
* user message. These tests exercise the full request() surface directly —
|
|
7
|
+
* no network involved by design.
|
|
8
|
+
*/
|
|
9
|
+
const TestProvider = require('../../src/manager/libraries/ai/providers/test.js');
|
|
10
|
+
const { parseScript } = TestProvider._internals;
|
|
11
|
+
|
|
12
|
+
function makeProvider() {
|
|
13
|
+
// No Manager — the provider falls back to the BEM_TESTING signal, which the
|
|
14
|
+
// test runner sets
|
|
15
|
+
return new TestProvider({});
|
|
16
|
+
}
|
|
17
|
+
|
|
18
|
+
module.exports = {
|
|
19
|
+
description: 'AI test provider (scripted sequences)',
|
|
20
|
+
type: 'group',
|
|
21
|
+
tests: [
|
|
22
|
+
// ─── Script parsing ───
|
|
23
|
+
|
|
24
|
+
{
|
|
25
|
+
name: 'parse-script-orders-steps-and-strips-directives',
|
|
26
|
+
async run({ assert }) {
|
|
27
|
+
const { steps, cleanText } = parseScript(
|
|
28
|
+
'Check my order [[tool:check_order {"orderNumber":"1"}]] please [[reply:{"message":"done"}]]',
|
|
29
|
+
);
|
|
30
|
+
|
|
31
|
+
assert.equal(steps.length, 2, 'two steps');
|
|
32
|
+
assert.equal(steps[0].type, 'tools', 'first step is a tool call');
|
|
33
|
+
assert.equal(steps[0].calls[0].name, 'check_order', 'tool name parsed');
|
|
34
|
+
assert.deepEqual(steps[0].calls[0].arguments, { orderNumber: '1' }, 'tool args parsed');
|
|
35
|
+
assert.equal(steps[1].type, 'reply', 'second step is the reply');
|
|
36
|
+
assert.equal(cleanText, 'Check my order please', 'directives stripped from echo text');
|
|
37
|
+
},
|
|
38
|
+
},
|
|
39
|
+
|
|
40
|
+
{
|
|
41
|
+
name: 'parse-script-delay-attaches-to-next-step',
|
|
42
|
+
async run({ assert }) {
|
|
43
|
+
const { steps } = parseScript('[[delay:50]][[tool:slow_tool]]');
|
|
44
|
+
|
|
45
|
+
assert.equal(steps.length, 1, 'one step');
|
|
46
|
+
assert.equal(steps[0].delay, 50, 'delay attached to the tool step');
|
|
47
|
+
},
|
|
48
|
+
},
|
|
49
|
+
|
|
50
|
+
// ─── Echo default ───
|
|
51
|
+
|
|
52
|
+
{
|
|
53
|
+
name: 'echo-reply-without-directives',
|
|
54
|
+
async run({ assert }) {
|
|
55
|
+
const provider = makeProvider();
|
|
56
|
+
const result = await provider.request({
|
|
57
|
+
messages: [
|
|
58
|
+
{ role: 'system', content: 'sys' },
|
|
59
|
+
{ role: 'user', content: 'hello there' },
|
|
60
|
+
],
|
|
61
|
+
});
|
|
62
|
+
|
|
63
|
+
assert.equal(result.content, 'Echo: hello there', 'echoes the user message');
|
|
64
|
+
assert.equal(result.stopReason, 'end', 'final turn');
|
|
65
|
+
assert.deepEqual(result.toolCalls, [], 'no tool calls');
|
|
66
|
+
assert.equal(result.tokens.total.count > 0, true, 'tokens accounted');
|
|
67
|
+
},
|
|
68
|
+
},
|
|
69
|
+
|
|
70
|
+
{
|
|
71
|
+
name: 'echo-reply-json-mode-wraps-message',
|
|
72
|
+
async run({ assert }) {
|
|
73
|
+
const provider = makeProvider();
|
|
74
|
+
const result = await provider.request({
|
|
75
|
+
response: 'json',
|
|
76
|
+
messages: [{ role: 'user', content: 'hi' }],
|
|
77
|
+
});
|
|
78
|
+
|
|
79
|
+
assert.equal(typeof result.content, 'object', 'parsed object');
|
|
80
|
+
assert.equal(result.content.message, 'Echo: hi', 'wrapped message');
|
|
81
|
+
},
|
|
82
|
+
},
|
|
83
|
+
|
|
84
|
+
// ─── Scripted reply ───
|
|
85
|
+
|
|
86
|
+
{
|
|
87
|
+
name: 'scripted-json-reply',
|
|
88
|
+
async run({ assert }) {
|
|
89
|
+
const provider = makeProvider();
|
|
90
|
+
const result = await provider.request({
|
|
91
|
+
response: 'json',
|
|
92
|
+
messages: [
|
|
93
|
+
{ role: 'user', content: 'whatever [[reply:{"message":"Hi!","actions":[{"type":"reply","label":"More"}]}]]' },
|
|
94
|
+
],
|
|
95
|
+
});
|
|
96
|
+
|
|
97
|
+
assert.equal(result.content.message, 'Hi!', 'scripted message');
|
|
98
|
+
assert.equal(result.content.actions[0].label, 'More', 'scripted actions');
|
|
99
|
+
assert.equal(result.stopReason, 'end', 'final turn');
|
|
100
|
+
},
|
|
101
|
+
},
|
|
102
|
+
|
|
103
|
+
// ─── Tool loop sequence ───
|
|
104
|
+
|
|
105
|
+
{
|
|
106
|
+
name: 'tool-then-reply-sequence-across-turns',
|
|
107
|
+
async run({ assert }) {
|
|
108
|
+
const provider = makeProvider();
|
|
109
|
+
const script = 'check it [[tool:check_order {"orderNumber":"42"}]] [[reply:{"message":"Order 42 shipped"}]]';
|
|
110
|
+
|
|
111
|
+
// Turn 1: the provider emits the tool call
|
|
112
|
+
const first = await provider.request({
|
|
113
|
+
response: 'json',
|
|
114
|
+
messages: [
|
|
115
|
+
{ role: 'system', content: 'sys' },
|
|
116
|
+
{ role: 'user', content: script },
|
|
117
|
+
],
|
|
118
|
+
});
|
|
119
|
+
|
|
120
|
+
assert.equal(first.stopReason, 'tool_use', 'first turn requests the tool');
|
|
121
|
+
assert.equal(first.toolCalls.length, 1, 'one call');
|
|
122
|
+
assert.equal(first.toolCalls[0].name, 'check_order', 'tool name');
|
|
123
|
+
assert.deepEqual(first.toolCalls[0].arguments, { orderNumber: '42' }, 'tool args');
|
|
124
|
+
|
|
125
|
+
// Turn 2: caller appended the assistant turn + tool result — provider
|
|
126
|
+
// moves to the next step (the reply)
|
|
127
|
+
const second = await provider.request({
|
|
128
|
+
response: 'json',
|
|
129
|
+
messages: [
|
|
130
|
+
{ role: 'system', content: 'sys' },
|
|
131
|
+
{ role: 'user', content: script },
|
|
132
|
+
{ role: 'assistant', toolCalls: first.toolCalls },
|
|
133
|
+
{ role: 'tool', toolCallId: first.toolCalls[0].id, content: '{"status":"shipped"}' },
|
|
134
|
+
],
|
|
135
|
+
});
|
|
136
|
+
|
|
137
|
+
assert.equal(second.stopReason, 'end', 'second turn is final');
|
|
138
|
+
assert.equal(second.content.message, 'Order 42 shipped', 'scripted final reply');
|
|
139
|
+
},
|
|
140
|
+
},
|
|
141
|
+
|
|
142
|
+
{
|
|
143
|
+
name: 'parallel-tools-directive-emits-multiple-calls',
|
|
144
|
+
async run({ assert }) {
|
|
145
|
+
const provider = makeProvider();
|
|
146
|
+
const result = await provider.request({
|
|
147
|
+
messages: [
|
|
148
|
+
{ role: 'user', content: '[[tools:[{"name":"a","arguments":{"x":1}},{"name":"b","arguments":{"y":2}}]]]' },
|
|
149
|
+
],
|
|
150
|
+
});
|
|
151
|
+
|
|
152
|
+
assert.equal(result.stopReason, 'tool_use', 'tool turn');
|
|
153
|
+
assert.equal(result.toolCalls.length, 2, 'two parallel calls');
|
|
154
|
+
assert.equal(result.toolCalls[0].name, 'a', 'first call');
|
|
155
|
+
assert.equal(result.toolCalls[1].name, 'b', 'second call');
|
|
156
|
+
assert.deepEqual(result.toolCalls[1].arguments, { y: 2 }, 'second args');
|
|
157
|
+
},
|
|
158
|
+
},
|
|
159
|
+
|
|
160
|
+
// ─── Scripted error ───
|
|
161
|
+
|
|
162
|
+
{
|
|
163
|
+
name: 'scripted-error-throws',
|
|
164
|
+
async run({ assert }) {
|
|
165
|
+
const provider = makeProvider();
|
|
166
|
+
let threw = false;
|
|
167
|
+
|
|
168
|
+
try {
|
|
169
|
+
await provider.request({
|
|
170
|
+
messages: [{ role: 'user', content: '[[error:boom]]' }],
|
|
171
|
+
});
|
|
172
|
+
} catch (e) {
|
|
173
|
+
threw = true;
|
|
174
|
+
assert.equal(e.message, 'boom', 'scripted error message');
|
|
175
|
+
}
|
|
176
|
+
|
|
177
|
+
assert.equal(threw, true, 'throws the scripted error');
|
|
178
|
+
},
|
|
179
|
+
},
|
|
180
|
+
|
|
181
|
+
// ─── Script exhaustion ───
|
|
182
|
+
|
|
183
|
+
{
|
|
184
|
+
name: 'exhausted-script-falls-back-to-echo',
|
|
185
|
+
async run({ assert }) {
|
|
186
|
+
const provider = makeProvider();
|
|
187
|
+
const script = 'hi [[tool:t1]]';
|
|
188
|
+
|
|
189
|
+
const second = await provider.request({
|
|
190
|
+
messages: [
|
|
191
|
+
{ role: 'user', content: script },
|
|
192
|
+
{ role: 'assistant', toolCalls: [{ id: 'c', name: 't1', arguments: {} }] },
|
|
193
|
+
{ role: 'tool', toolCallId: 'c', content: 'r' },
|
|
194
|
+
],
|
|
195
|
+
});
|
|
196
|
+
|
|
197
|
+
assert.equal(second.stopReason, 'end', 'falls back to a final turn');
|
|
198
|
+
assert.equal(String(second.content).startsWith('Echo:'), true, 'echo fallback');
|
|
199
|
+
},
|
|
200
|
+
},
|
|
201
|
+
],
|
|
202
|
+
};
|
|
@@ -0,0 +1,350 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Test: cross-provider AI tools formatting (libraries/ai)
|
|
3
|
+
*
|
|
4
|
+
* Verifies the unified tools interface added for agentic tool loops:
|
|
5
|
+
* - anthropic-format.js — tool defs, tool choice, unified-message → Claude
|
|
6
|
+
* Messages API mapping (tool_use / tool_result blocks), stop reasons
|
|
7
|
+
* - openai.js formatMessages/normalizeToolEntry/normalizeToolChoice — the
|
|
8
|
+
* direct-messages path and Responses API tool envelopes
|
|
9
|
+
* - ai/index.js normalizeOptions — structured conversations are NOT
|
|
10
|
+
* string-flattened; system injections still apply
|
|
11
|
+
*
|
|
12
|
+
* All pure helpers — no network, no assistant.
|
|
13
|
+
*/
|
|
14
|
+
const format = require('../../src/manager/libraries/ai/providers/anthropic-format.js');
|
|
15
|
+
const OpenAI = require('../../src/manager/libraries/ai/providers/openai.js');
|
|
16
|
+
const AI = require('../../src/manager/libraries/ai/index.js');
|
|
17
|
+
|
|
18
|
+
const { formatMessages, normalizeToolEntry, normalizeToolChoice } = OpenAI._internals;
|
|
19
|
+
const { normalizeOptions, isStructuredMessages, SYSTEM_PROMPT_INJECTIONS } = AI._internals;
|
|
20
|
+
|
|
21
|
+
function noopLog() {}
|
|
22
|
+
|
|
23
|
+
const SAMPLE_TOOL = {
|
|
24
|
+
name: 'check_order',
|
|
25
|
+
description: 'Look up an order',
|
|
26
|
+
parameters: { type: 'object', properties: { orderNumber: { type: 'string' } }, required: ['orderNumber'] },
|
|
27
|
+
};
|
|
28
|
+
|
|
29
|
+
module.exports = {
|
|
30
|
+
description: 'AI cross-provider tools formatting',
|
|
31
|
+
type: 'group',
|
|
32
|
+
tests: [
|
|
33
|
+
// ─── anthropic-format: tool definitions ───
|
|
34
|
+
|
|
35
|
+
{
|
|
36
|
+
name: 'anthropic-tool-defs-map-parameters-to-input-schema',
|
|
37
|
+
async run({ assert }) {
|
|
38
|
+
const defs = format.buildToolDefs([SAMPLE_TOOL]);
|
|
39
|
+
|
|
40
|
+
assert.equal(defs.length, 1, 'one def');
|
|
41
|
+
assert.equal(defs[0].name, 'check_order', 'name preserved');
|
|
42
|
+
assert.equal(defs[0].description, 'Look up an order', 'description preserved');
|
|
43
|
+
assert.deepEqual(defs[0].input_schema, SAMPLE_TOOL.parameters, 'parameters → input_schema');
|
|
44
|
+
},
|
|
45
|
+
},
|
|
46
|
+
|
|
47
|
+
{
|
|
48
|
+
name: 'anthropic-tool-defs-accept-explicit-function-type',
|
|
49
|
+
async run({ assert }) {
|
|
50
|
+
const defs = format.buildToolDefs([{ ...SAMPLE_TOOL, type: 'function' }]);
|
|
51
|
+
|
|
52
|
+
assert.equal(defs[0].name, 'check_order', 'function-typed entry accepted');
|
|
53
|
+
},
|
|
54
|
+
},
|
|
55
|
+
|
|
56
|
+
{
|
|
57
|
+
name: 'anthropic-tool-defs-reject-hosted-tools',
|
|
58
|
+
async run({ assert }) {
|
|
59
|
+
let threw = false;
|
|
60
|
+
|
|
61
|
+
try {
|
|
62
|
+
format.buildToolDefs([{ type: 'web_search' }]);
|
|
63
|
+
} catch (e) {
|
|
64
|
+
threw = true;
|
|
65
|
+
}
|
|
66
|
+
|
|
67
|
+
assert.equal(threw, true, 'hosted tool types throw on Anthropic');
|
|
68
|
+
},
|
|
69
|
+
},
|
|
70
|
+
|
|
71
|
+
{
|
|
72
|
+
name: 'anthropic-tool-defs-empty-list-returns-empty',
|
|
73
|
+
async run({ assert }) {
|
|
74
|
+
assert.deepEqual(format.buildToolDefs(undefined), [], 'undefined → []');
|
|
75
|
+
assert.deepEqual(format.buildToolDefs([]), [], '[] → []');
|
|
76
|
+
},
|
|
77
|
+
},
|
|
78
|
+
|
|
79
|
+
// ─── anthropic-format: tool choice ───
|
|
80
|
+
|
|
81
|
+
{
|
|
82
|
+
name: 'anthropic-tool-choice-mapping',
|
|
83
|
+
async run({ assert }) {
|
|
84
|
+
assert.deepEqual(format.buildToolChoice('auto'), { type: 'auto' }, 'auto');
|
|
85
|
+
assert.deepEqual(format.buildToolChoice('required'), { type: 'any' }, 'required → any');
|
|
86
|
+
assert.deepEqual(format.buildToolChoice('none'), { type: 'none' }, 'none');
|
|
87
|
+
assert.deepEqual(format.buildToolChoice({ name: 'check_order' }), { type: 'tool', name: 'check_order' }, 'specific tool');
|
|
88
|
+
assert.equal(format.buildToolChoice(undefined), undefined, 'undefined passes through');
|
|
89
|
+
},
|
|
90
|
+
},
|
|
91
|
+
|
|
92
|
+
// ─── anthropic-format: message building ───
|
|
93
|
+
|
|
94
|
+
{
|
|
95
|
+
name: 'anthropic-messages-assistant-toolcalls-become-tool-use-blocks',
|
|
96
|
+
async run({ assert }) {
|
|
97
|
+
const { system, messages } = format.buildMessages({
|
|
98
|
+
messages: [
|
|
99
|
+
{ role: 'system', content: 'sys' },
|
|
100
|
+
{ role: 'user', content: 'check my order 123' },
|
|
101
|
+
{ role: 'assistant', content: 'Let me check.', toolCalls: [{ id: 'call_1', name: 'check_order', arguments: { orderNumber: '123' } }] },
|
|
102
|
+
],
|
|
103
|
+
});
|
|
104
|
+
|
|
105
|
+
assert.equal(system, 'sys', 'system extracted');
|
|
106
|
+
assert.equal(messages.length, 2, 'user + assistant');
|
|
107
|
+
|
|
108
|
+
const assistantTurn = messages[1];
|
|
109
|
+
assert.equal(assistantTurn.role, 'assistant', 'assistant role');
|
|
110
|
+
assert.equal(assistantTurn.content[0].type, 'text', 'text block first');
|
|
111
|
+
assert.equal(assistantTurn.content[0].text, 'Let me check.', 'text content');
|
|
112
|
+
assert.equal(assistantTurn.content[1].type, 'tool_use', 'tool_use block');
|
|
113
|
+
assert.equal(assistantTurn.content[1].id, 'call_1', 'call id');
|
|
114
|
+
assert.deepEqual(assistantTurn.content[1].input, { orderNumber: '123' }, 'arguments → input');
|
|
115
|
+
},
|
|
116
|
+
},
|
|
117
|
+
|
|
118
|
+
{
|
|
119
|
+
name: 'anthropic-messages-consecutive-tool-results-merge-into-one-user-turn',
|
|
120
|
+
async run({ assert }) {
|
|
121
|
+
const { messages } = format.buildMessages({
|
|
122
|
+
messages: [
|
|
123
|
+
{ role: 'user', content: 'hi' },
|
|
124
|
+
{ role: 'assistant', toolCalls: [
|
|
125
|
+
{ id: 'call_1', name: 'a', arguments: {} },
|
|
126
|
+
{ id: 'call_2', name: 'b', arguments: {} },
|
|
127
|
+
] },
|
|
128
|
+
{ role: 'tool', toolCallId: 'call_1', content: 'result A' },
|
|
129
|
+
{ role: 'tool', toolCallId: 'call_2', content: 'result B' },
|
|
130
|
+
],
|
|
131
|
+
});
|
|
132
|
+
|
|
133
|
+
assert.equal(messages.length, 3, 'user + assistant + ONE merged tool-result user turn');
|
|
134
|
+
|
|
135
|
+
const resultTurn = messages[2];
|
|
136
|
+
assert.equal(resultTurn.role, 'user', 'tool results ride a user turn');
|
|
137
|
+
assert.equal(resultTurn.content.length, 2, 'both results in one turn');
|
|
138
|
+
assert.equal(resultTurn.content[0].type, 'tool_result', 'tool_result block');
|
|
139
|
+
assert.equal(resultTurn.content[0].tool_use_id, 'call_1', 'first result id');
|
|
140
|
+
assert.equal(resultTurn.content[1].tool_use_id, 'call_2', 'second result id');
|
|
141
|
+
},
|
|
142
|
+
},
|
|
143
|
+
|
|
144
|
+
{
|
|
145
|
+
name: 'anthropic-messages-developer-role-folds-into-system',
|
|
146
|
+
async run({ assert }) {
|
|
147
|
+
const { system, messages } = format.buildMessages({
|
|
148
|
+
messages: [
|
|
149
|
+
{ role: 'system', content: 'platform' },
|
|
150
|
+
{ role: 'developer', content: 'operator' },
|
|
151
|
+
{ role: 'user', content: 'hi' },
|
|
152
|
+
],
|
|
153
|
+
});
|
|
154
|
+
|
|
155
|
+
assert.equal(system, 'platform\n\noperator', 'developer folded into system');
|
|
156
|
+
assert.equal(messages.length, 1, 'only the user turn remains');
|
|
157
|
+
},
|
|
158
|
+
},
|
|
159
|
+
|
|
160
|
+
{
|
|
161
|
+
name: 'anthropic-messages-raw-block-arrays-pass-through',
|
|
162
|
+
async run({ assert }) {
|
|
163
|
+
const rawBlocks = [{ type: 'text', text: 'hello' }, { type: 'tool_use', id: 'x', name: 't', input: {} }];
|
|
164
|
+
const { messages } = format.buildMessages({
|
|
165
|
+
messages: [
|
|
166
|
+
{ role: 'user', content: 'hi' },
|
|
167
|
+
{ role: 'assistant', content: rawBlocks },
|
|
168
|
+
],
|
|
169
|
+
});
|
|
170
|
+
|
|
171
|
+
assert.deepEqual(messages[1].content, rawBlocks, 'raw blocks untouched');
|
|
172
|
+
},
|
|
173
|
+
},
|
|
174
|
+
|
|
175
|
+
{
|
|
176
|
+
name: 'anthropic-messages-legacy-prompt-message-form-unchanged',
|
|
177
|
+
async run({ assert }) {
|
|
178
|
+
const { system, messages } = format.buildMessages({
|
|
179
|
+
prompt: { content: 'sys prompt' },
|
|
180
|
+
message: { content: 'user msg' },
|
|
181
|
+
});
|
|
182
|
+
|
|
183
|
+
assert.equal(system, 'sys prompt', 'system from prompt');
|
|
184
|
+
assert.deepEqual(messages, [{ role: 'user', content: 'user msg' }], 'single user turn');
|
|
185
|
+
},
|
|
186
|
+
},
|
|
187
|
+
|
|
188
|
+
// ─── anthropic-format: response extraction ───
|
|
189
|
+
|
|
190
|
+
{
|
|
191
|
+
name: 'anthropic-extract-tool-calls-and-stop-reasons',
|
|
192
|
+
async run({ assert }) {
|
|
193
|
+
const calls = format.extractToolCalls([
|
|
194
|
+
{ type: 'text', text: 'thinking...' },
|
|
195
|
+
{ type: 'tool_use', id: 'call_9', name: 'check_order', input: { orderNumber: '9' } },
|
|
196
|
+
]);
|
|
197
|
+
|
|
198
|
+
assert.equal(calls.length, 1, 'one call');
|
|
199
|
+
assert.deepEqual(calls[0], { id: 'call_9', name: 'check_order', arguments: { orderNumber: '9' } }, 'normalized shape');
|
|
200
|
+
|
|
201
|
+
assert.equal(format.mapStopReason('tool_use'), 'tool_use', 'tool_use');
|
|
202
|
+
assert.equal(format.mapStopReason('max_tokens'), 'max_tokens', 'max_tokens');
|
|
203
|
+
assert.equal(format.mapStopReason('end_turn'), 'end', 'end_turn → end');
|
|
204
|
+
assert.equal(format.mapStopReason('stop_sequence'), 'end', 'stop_sequence → end');
|
|
205
|
+
},
|
|
206
|
+
},
|
|
207
|
+
|
|
208
|
+
// ─── openai: direct-messages path ───
|
|
209
|
+
|
|
210
|
+
{
|
|
211
|
+
name: 'openai-format-messages-maps-toolcalls-to-function-call-items',
|
|
212
|
+
async run({ assert }) {
|
|
213
|
+
const input = formatMessages([
|
|
214
|
+
{ role: 'system', content: 'sys' },
|
|
215
|
+
{ role: 'user', content: 'check order 123' },
|
|
216
|
+
{ role: 'assistant', content: 'Checking.', toolCalls: [{ id: 'call_1', name: 'check_order', arguments: { orderNumber: '123' } }] },
|
|
217
|
+
{ role: 'tool', toolCallId: 'call_1', content: '{"status":"shipped"}' },
|
|
218
|
+
], noopLog);
|
|
219
|
+
|
|
220
|
+
assert.equal(input.length, 5, 'system + user + assistant text + function_call + function_call_output');
|
|
221
|
+
assert.equal(input[0].role, 'system', 'system turn');
|
|
222
|
+
assert.equal(input[1].role, 'user', 'user turn');
|
|
223
|
+
assert.equal(input[2].role, 'assistant', 'assistant text turn');
|
|
224
|
+
assert.equal(input[2].content[0].type, 'output_text', 'assistant uses output_text');
|
|
225
|
+
|
|
226
|
+
const callItem = input[3];
|
|
227
|
+
assert.equal(callItem.type, 'function_call', 'function_call item');
|
|
228
|
+
assert.equal(callItem.call_id, 'call_1', 'call id');
|
|
229
|
+
assert.equal(callItem.name, 'check_order', 'name');
|
|
230
|
+
assert.equal(callItem.arguments, JSON.stringify({ orderNumber: '123' }), 'arguments stringified');
|
|
231
|
+
|
|
232
|
+
const outputItem = input[4];
|
|
233
|
+
assert.equal(outputItem.type, 'function_call_output', 'function_call_output item');
|
|
234
|
+
assert.equal(outputItem.call_id, 'call_1', 'output call id');
|
|
235
|
+
assert.equal(outputItem.output, '{"status":"shipped"}', 'output string');
|
|
236
|
+
},
|
|
237
|
+
},
|
|
238
|
+
|
|
239
|
+
{
|
|
240
|
+
name: 'openai-format-messages-toolcall-turn-without-text-emits-no-message-item',
|
|
241
|
+
async run({ assert }) {
|
|
242
|
+
const input = formatMessages([
|
|
243
|
+
{ role: 'user', content: 'hi' },
|
|
244
|
+
{ role: 'assistant', toolCalls: [{ id: 'c1', name: 't', arguments: {} }] },
|
|
245
|
+
], noopLog);
|
|
246
|
+
|
|
247
|
+
assert.equal(input.length, 2, 'user + function_call only');
|
|
248
|
+
assert.equal(input[1].type, 'function_call', 'no empty assistant message item');
|
|
249
|
+
},
|
|
250
|
+
},
|
|
251
|
+
|
|
252
|
+
// ─── openai: tool envelopes ───
|
|
253
|
+
|
|
254
|
+
{
|
|
255
|
+
name: 'openai-tool-entry-normalization',
|
|
256
|
+
async run({ assert }) {
|
|
257
|
+
const normalized = normalizeToolEntry(SAMPLE_TOOL);
|
|
258
|
+
|
|
259
|
+
assert.equal(normalized.type, 'function', 'function envelope added');
|
|
260
|
+
assert.equal(normalized.name, 'check_order', 'name preserved');
|
|
261
|
+
assert.deepEqual(normalized.parameters, SAMPLE_TOOL.parameters, 'parameters preserved');
|
|
262
|
+
|
|
263
|
+
const hosted = normalizeToolEntry({ type: 'web_search' });
|
|
264
|
+
assert.deepEqual(hosted, { type: 'web_search' }, 'hosted tools pass verbatim');
|
|
265
|
+
},
|
|
266
|
+
},
|
|
267
|
+
|
|
268
|
+
{
|
|
269
|
+
name: 'openai-tool-choice-normalization',
|
|
270
|
+
async run({ assert }) {
|
|
271
|
+
assert.equal(normalizeToolChoice('auto'), 'auto', 'auto passes');
|
|
272
|
+
assert.equal(normalizeToolChoice('required'), 'required', 'required passes');
|
|
273
|
+
assert.equal(normalizeToolChoice('none'), 'none', 'none passes');
|
|
274
|
+
assert.deepEqual(normalizeToolChoice({ name: 'check_order' }), { type: 'function', name: 'check_order' }, 'specific tool');
|
|
275
|
+
},
|
|
276
|
+
},
|
|
277
|
+
|
|
278
|
+
// ─── index.js: normalizeOptions on structured conversations ───
|
|
279
|
+
|
|
280
|
+
{
|
|
281
|
+
name: 'structured-detection',
|
|
282
|
+
async run({ assert }) {
|
|
283
|
+
assert.equal(isStructuredMessages([{ role: 'user', content: 'hi' }]), false, 'plain text is not structured');
|
|
284
|
+
assert.equal(isStructuredMessages([{ role: 'tool', toolCallId: 'x', content: 'r' }]), true, 'tool turn is structured');
|
|
285
|
+
assert.equal(isStructuredMessages([{ role: 'assistant', toolCalls: [{ id: 'x', name: 't' }] }]), true, 'toolCalls turn is structured');
|
|
286
|
+
assert.equal(isStructuredMessages([{ role: 'assistant', content: [{ type: 'tool_use', id: 'x' }] }]), true, 'raw tool_use blocks are structured');
|
|
287
|
+
},
|
|
288
|
+
},
|
|
289
|
+
|
|
290
|
+
{
|
|
291
|
+
name: 'normalize-options-structured-keeps-turns-and-injects-system-rules',
|
|
292
|
+
async run({ assert }) {
|
|
293
|
+
const messages = [
|
|
294
|
+
{ role: 'system', content: 'agent instructions' },
|
|
295
|
+
{ role: 'user', content: 'check order 1' },
|
|
296
|
+
{ role: 'assistant', toolCalls: [{ id: 'c1', name: 'check_order', arguments: {} }] },
|
|
297
|
+
{ role: 'tool', toolCallId: 'c1', content: 'shipped' },
|
|
298
|
+
];
|
|
299
|
+
const out = normalizeOptions({ messages });
|
|
300
|
+
|
|
301
|
+
assert.equal(out.messages.length, 4, 'no turns added or dropped');
|
|
302
|
+
assert.equal(
|
|
303
|
+
out.messages[0].content.includes(SYSTEM_PROMPT_INJECTIONS[0]),
|
|
304
|
+
true,
|
|
305
|
+
'system rules injected into the system turn',
|
|
306
|
+
);
|
|
307
|
+
assert.equal(
|
|
308
|
+
out.messages[0].content.includes('agent instructions'),
|
|
309
|
+
true,
|
|
310
|
+
'original system content preserved',
|
|
311
|
+
);
|
|
312
|
+
assert.deepEqual(out.messages[2], messages[2], 'toolCalls turn untouched');
|
|
313
|
+
assert.deepEqual(out.messages[3], messages[3], 'tool result turn untouched');
|
|
314
|
+
assert.equal(out.prompt, undefined, 'prompt NOT synthesized in structured mode');
|
|
315
|
+
},
|
|
316
|
+
},
|
|
317
|
+
|
|
318
|
+
{
|
|
319
|
+
name: 'normalize-options-structured-without-system-prepends-rules-turn',
|
|
320
|
+
async run({ assert }) {
|
|
321
|
+
const out = normalizeOptions({
|
|
322
|
+
messages: [
|
|
323
|
+
{ role: 'user', content: 'hi' },
|
|
324
|
+
{ role: 'tool', toolCallId: 'c1', content: 'r' },
|
|
325
|
+
],
|
|
326
|
+
});
|
|
327
|
+
|
|
328
|
+
assert.equal(out.messages.length, 3, 'rules turn prepended');
|
|
329
|
+
assert.equal(out.messages[0].role, 'system', 'first turn is system');
|
|
330
|
+
assert.equal(out.messages[0].content.includes(SYSTEM_PROMPT_INJECTIONS[1]), true, 'rules content');
|
|
331
|
+
},
|
|
332
|
+
},
|
|
333
|
+
|
|
334
|
+
{
|
|
335
|
+
name: 'normalize-options-legacy-plain-messages-unchanged-behavior',
|
|
336
|
+
async run({ assert }) {
|
|
337
|
+
const out = normalizeOptions({
|
|
338
|
+
messages: [
|
|
339
|
+
{ role: 'system', content: 'sys' },
|
|
340
|
+
{ role: 'user', content: 'hello' },
|
|
341
|
+
],
|
|
342
|
+
});
|
|
343
|
+
|
|
344
|
+
assert.equal(typeof out.prompt?.content, 'string', 'prompt synthesized for legacy mode');
|
|
345
|
+
assert.equal(out.prompt.content.includes('sys'), true, 'prompt carries system content');
|
|
346
|
+
assert.equal(out.message?.content, 'hello', 'message carries last user turn');
|
|
347
|
+
},
|
|
348
|
+
},
|
|
349
|
+
],
|
|
350
|
+
};
|
|
@@ -0,0 +1,53 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Test: MCP OAuth discovery endpoints
|
|
3
|
+
* Tests .well-known/oauth-authorization-server and .well-known/oauth-protected-resource
|
|
4
|
+
*
|
|
5
|
+
* Run: npx mgr test bem:mcp/discovery
|
|
6
|
+
*/
|
|
7
|
+
const fetch = require('wonderful-fetch');
|
|
8
|
+
|
|
9
|
+
const BASE_URL = 'http://localhost:5002';
|
|
10
|
+
|
|
11
|
+
module.exports = {
|
|
12
|
+
description: 'MCP OAuth discovery endpoints',
|
|
13
|
+
type: 'group',
|
|
14
|
+
|
|
15
|
+
tests: [
|
|
16
|
+
{
|
|
17
|
+
name: 'oauth-authorization-server returns valid metadata',
|
|
18
|
+
async run({ assert }) {
|
|
19
|
+
const response = await fetch(`${BASE_URL}/.well-known/oauth-authorization-server`, {
|
|
20
|
+
method: 'GET',
|
|
21
|
+
response: 'json',
|
|
22
|
+
timeout: 10000,
|
|
23
|
+
});
|
|
24
|
+
|
|
25
|
+
assert.ok(response, 'Discovery endpoint should return a response');
|
|
26
|
+
assert.ok(response.issuer, 'Should have issuer');
|
|
27
|
+
assert.ok(response.authorization_endpoint, 'Should have authorization_endpoint');
|
|
28
|
+
assert.ok(response.token_endpoint, 'Should have token_endpoint');
|
|
29
|
+
assert.ok(response.authorization_endpoint.includes('/backend-manager/mcp/authorize'), 'authorization_endpoint should point to mcp/authorize');
|
|
30
|
+
assert.ok(response.token_endpoint.includes('/backend-manager/mcp/token'), 'token_endpoint should point to mcp/token');
|
|
31
|
+
assert.ok(response.response_types_supported.includes('code'), 'Should support code response type');
|
|
32
|
+
assert.ok(response.code_challenge_methods_supported.includes('S256'), 'Should support PKCE S256');
|
|
33
|
+
},
|
|
34
|
+
},
|
|
35
|
+
|
|
36
|
+
{
|
|
37
|
+
name: 'oauth-protected-resource returns valid metadata',
|
|
38
|
+
async run({ assert }) {
|
|
39
|
+
const response = await fetch(`${BASE_URL}/.well-known/oauth-protected-resource`, {
|
|
40
|
+
method: 'GET',
|
|
41
|
+
response: 'json',
|
|
42
|
+
timeout: 10000,
|
|
43
|
+
});
|
|
44
|
+
|
|
45
|
+
assert.ok(response, 'Protected resource endpoint should return a response');
|
|
46
|
+
assert.ok(response.resource, 'Should have resource');
|
|
47
|
+
assert.ok(response.resource.includes('/backend-manager/mcp'), 'resource should point to MCP endpoint');
|
|
48
|
+
assert.ok(Array.isArray(response.authorization_servers), 'Should have authorization_servers array');
|
|
49
|
+
assert.ok(response.authorization_servers.length > 0, 'Should have at least one authorization server');
|
|
50
|
+
},
|
|
51
|
+
},
|
|
52
|
+
],
|
|
53
|
+
};
|