@wingman-ai/gateway 0.4.2 → 0.4.3
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +14 -0
- package/dist/agent/config/mcpClientManager.cjs +104 -1
- package/dist/agent/config/mcpClientManager.d.ts +30 -0
- package/dist/agent/config/mcpClientManager.js +104 -1
- package/dist/agent/config/modelFactory.cjs +10 -0
- package/dist/agent/config/modelFactory.js +10 -0
- package/dist/agent/config/xaiImageModel.cjs +242 -0
- package/dist/agent/config/xaiImageModel.d.ts +33 -0
- package/dist/agent/config/xaiImageModel.js +202 -0
- package/dist/agent/tests/mcpClientManager.test.cjs +116 -0
- package/dist/agent/tests/mcpClientManager.test.js +117 -1
- package/dist/agent/tests/mcpResourceTools.test.cjs +101 -0
- package/dist/agent/tests/mcpResourceTools.test.d.ts +1 -0
- package/dist/agent/tests/mcpResourceTools.test.js +95 -0
- package/dist/agent/tests/modelFactory.test.cjs +16 -2
- package/dist/agent/tests/modelFactory.test.js +16 -2
- package/dist/agent/tests/xaiImageModel.test.cjs +194 -0
- package/dist/agent/tests/xaiImageModel.test.d.ts +1 -0
- package/dist/agent/tests/xaiImageModel.test.js +188 -0
- package/dist/agent/tools/mcp_resources.cjs +111 -0
- package/dist/agent/tools/mcp_resources.d.ts +3 -0
- package/dist/agent/tools/mcp_resources.js +77 -0
- package/dist/bench/adapters/commandAdapter.cjs +93 -0
- package/dist/bench/adapters/commandAdapter.d.ts +6 -0
- package/dist/bench/adapters/commandAdapter.js +59 -0
- package/dist/bench/adapters/helpers.cjs +170 -0
- package/dist/bench/adapters/helpers.d.ts +7 -0
- package/dist/bench/adapters/helpers.js +133 -0
- package/dist/bench/adapters/index.cjs +41 -0
- package/dist/bench/adapters/index.d.ts +2 -0
- package/dist/bench/adapters/index.js +7 -0
- package/dist/bench/adapters/wingmanCliAdapter.cjs +100 -0
- package/dist/bench/adapters/wingmanCliAdapter.d.ts +6 -0
- package/dist/bench/adapters/wingmanCliAdapter.js +66 -0
- package/dist/bench/cleanup.cjs +122 -0
- package/dist/bench/cleanup.d.ts +9 -0
- package/dist/bench/cleanup.js +85 -0
- package/dist/bench/config.cjs +190 -0
- package/dist/bench/config.d.ts +2 -0
- package/dist/bench/config.js +156 -0
- package/dist/bench/index.cjs +43 -0
- package/dist/bench/index.d.ts +3 -0
- package/dist/bench/index.js +3 -0
- package/dist/bench/official.cjs +616 -0
- package/dist/bench/official.d.ts +80 -0
- package/dist/bench/official.js +546 -0
- package/dist/bench/officialCli.cjs +204 -0
- package/dist/bench/officialCli.d.ts +5 -0
- package/dist/bench/officialCli.js +170 -0
- package/dist/bench/process.cjs +78 -0
- package/dist/bench/process.d.ts +14 -0
- package/dist/bench/process.js +44 -0
- package/dist/bench/runner.cjs +237 -0
- package/dist/bench/runner.d.ts +7 -0
- package/dist/bench/runner.js +197 -0
- package/dist/bench/scoring.cjs +171 -0
- package/dist/bench/scoring.d.ts +9 -0
- package/dist/bench/scoring.js +137 -0
- package/dist/bench/types.cjs +18 -0
- package/dist/bench/types.d.ts +200 -0
- package/dist/bench/types.js +0 -0
- package/dist/bench/validator.cjs +92 -0
- package/dist/bench/validator.d.ts +2 -0
- package/dist/bench/validator.js +58 -0
- package/dist/cli/config/schema.cjs +36 -1
- package/dist/cli/config/schema.d.ts +46 -0
- package/dist/cli/config/schema.js +36 -1
- package/dist/cli/config/warnings.cjs +119 -51
- package/dist/cli/config/warnings.js +119 -51
- package/dist/cli/core/agentInvoker.cjs +9 -2
- package/dist/cli/core/agentInvoker.d.ts +1 -0
- package/dist/cli/core/agentInvoker.js +9 -2
- package/dist/cli/core/imagePersistence.cjs +17 -1
- package/dist/cli/core/imagePersistence.d.ts +2 -0
- package/dist/cli/core/imagePersistence.js +13 -3
- package/dist/cli/core/sessionManager.cjs +2 -0
- package/dist/cli/core/sessionManager.js +3 -1
- package/dist/cli/types.d.ts +18 -0
- package/dist/gateway/adapters/teams.cjs +419 -0
- package/dist/gateway/adapters/teams.d.ts +47 -0
- package/dist/gateway/adapters/teams.js +361 -0
- package/dist/gateway/http/sms.cjs +286 -0
- package/dist/gateway/http/sms.d.ts +4 -0
- package/dist/gateway/http/sms.js +249 -0
- package/dist/gateway/server.cjs +54 -3
- package/dist/gateway/server.d.ts +2 -0
- package/dist/gateway/server.js +54 -3
- package/dist/gateway/sms/commands.cjs +116 -0
- package/dist/gateway/sms/commands.d.ts +15 -0
- package/dist/gateway/sms/commands.js +79 -0
- package/dist/gateway/sms/control.cjs +118 -0
- package/dist/gateway/sms/control.d.ts +18 -0
- package/dist/gateway/sms/control.js +84 -0
- package/dist/gateway/sms/policyStore.cjs +198 -0
- package/dist/gateway/sms/policyStore.d.ts +37 -0
- package/dist/gateway/sms/policyStore.js +161 -0
- package/dist/providers/registry.cjs +1 -0
- package/dist/providers/registry.js +1 -0
- package/dist/tests/cli-config-warnings.test.cjs +41 -0
- package/dist/tests/cli-config-warnings.test.js +41 -0
- package/dist/tests/cli-init.test.cjs +32 -26
- package/dist/tests/cli-init.test.js +32 -26
- package/dist/tests/gateway-http-security.test.cjs +21 -0
- package/dist/tests/gateway-http-security.test.js +21 -0
- package/dist/tests/gateway-origin-policy.test.cjs +22 -0
- package/dist/tests/gateway-origin-policy.test.js +22 -0
- package/dist/tests/gateway.test.cjs +57 -0
- package/dist/tests/gateway.test.js +57 -0
- package/dist/tests/imagePersistence.test.cjs +26 -0
- package/dist/tests/imagePersistence.test.js +27 -1
- package/dist/tests/run-terminal-bench-official-script.test.cjs +61 -0
- package/dist/tests/run-terminal-bench-official-script.test.d.ts +1 -0
- package/dist/tests/run-terminal-bench-official-script.test.js +55 -0
- package/dist/tests/sessions-api.test.cjs +69 -1
- package/dist/tests/sessions-api.test.js +70 -2
- package/dist/tests/sms-api.test.cjs +183 -0
- package/dist/tests/sms-api.test.d.ts +1 -0
- package/dist/tests/sms-api.test.js +177 -0
- package/dist/tests/sms-commands.test.cjs +90 -0
- package/dist/tests/sms-commands.test.d.ts +1 -0
- package/dist/tests/sms-commands.test.js +84 -0
- package/dist/tests/sms-policy-store.test.cjs +69 -0
- package/dist/tests/sms-policy-store.test.d.ts +1 -0
- package/dist/tests/sms-policy-store.test.js +63 -0
- package/dist/tests/teams-adapter.test.cjs +58 -0
- package/dist/tests/teams-adapter.test.d.ts +1 -0
- package/dist/tests/teams-adapter.test.js +52 -0
- package/dist/tests/terminal-bench-adapters-helpers.test.cjs +64 -0
- package/dist/tests/terminal-bench-adapters-helpers.test.d.ts +1 -0
- package/dist/tests/terminal-bench-adapters-helpers.test.js +58 -0
- package/dist/tests/terminal-bench-cleanup.test.cjs +93 -0
- package/dist/tests/terminal-bench-cleanup.test.d.ts +1 -0
- package/dist/tests/terminal-bench-cleanup.test.js +87 -0
- package/dist/tests/terminal-bench-config.test.cjs +62 -0
- package/dist/tests/terminal-bench-config.test.d.ts +1 -0
- package/dist/tests/terminal-bench-config.test.js +56 -0
- package/dist/tests/terminal-bench-official.test.cjs +194 -0
- package/dist/tests/terminal-bench-official.test.d.ts +1 -0
- package/dist/tests/terminal-bench-official.test.js +188 -0
- package/dist/tests/terminal-bench-runner.test.cjs +82 -0
- package/dist/tests/terminal-bench-runner.test.d.ts +1 -0
- package/dist/tests/terminal-bench-runner.test.js +76 -0
- package/dist/tests/terminal-bench-scoring.test.cjs +128 -0
- package/dist/tests/terminal-bench-scoring.test.d.ts +1 -0
- package/dist/tests/terminal-bench-scoring.test.js +122 -0
- package/dist/tools/mcp-fal-ai.cjs +1 -1
- package/dist/tools/mcp-fal-ai.js +1 -1
- package/dist/webui/assets/index-Cyg_Hs57.css +11 -0
- package/dist/webui/assets/{index-BMekSELC.js → index-DZXLLjaA.js} +109 -109
- package/dist/webui/index.html +2 -2
- package/package.json +11 -2
- package/templates/agents/game-dev/agent.md +122 -63
- package/templates/agents/game-dev/art-director.md +106 -0
- package/templates/agents/game-dev/game-designer.md +87 -0
- package/templates/agents/game-dev/scene-engineer.md +474 -0
- package/dist/webui/assets/index-Cwkg4DKj.css +0 -11
- package/templates/agents/game-dev/art-generation.md +0 -38
- package/templates/agents/game-dev/asset-refinement.md +0 -17
- package/templates/agents/game-dev/planning-idea.md +0 -17
- package/templates/agents/game-dev/ui-specialist.md +0 -17
|
@@ -0,0 +1,204 @@
|
|
|
1
|
+
"use strict";
|
|
2
|
+
var __webpack_require__ = {};
|
|
3
|
+
// Bundler runtime helper `d`: for each own key of `definition` that is not
// already an own property of `exports1`, defines an enumerable getter on
// `exports1` whose getter function is `definition[key]`.
(()=>{
|
|
4
|
+
__webpack_require__.d = (exports1, definition)=>{
|
|
5
|
+
for(var key in definition)if (__webpack_require__.o(definition, key) && !__webpack_require__.o(exports1, key)) Object.defineProperty(exports1, key, {
|
|
6
|
+
enumerable: true,
|
|
7
|
+
get: definition[key]
|
|
8
|
+
});
|
|
9
|
+
};
|
|
10
|
+
})();
|
|
11
|
+
// Bundler runtime helper `o`: own-property test that goes through
// Object.prototype.hasOwnProperty.call, so it works on any object.
(()=>{
|
|
12
|
+
__webpack_require__.o = (obj, prop)=>Object.prototype.hasOwnProperty.call(obj, prop);
|
|
13
|
+
})();
|
|
14
|
+
// Bundler runtime helper `r`: marks `exports1` as an ES module namespace.
// It sets Symbol.toStringTag to 'Module' when Symbol is available
// (`"u" > typeof Symbol` is a minified "typeof Symbol is not 'undefined'" test)
// and always defines `__esModule: true`.
(()=>{
|
|
15
|
+
__webpack_require__.r = (exports1)=>{
|
|
16
|
+
if ("u" > typeof Symbol && Symbol.toStringTag) Object.defineProperty(exports1, Symbol.toStringTag, {
|
|
17
|
+
value: 'Module'
|
|
18
|
+
});
|
|
19
|
+
Object.defineProperty(exports1, '__esModule', {
|
|
20
|
+
value: true
|
|
21
|
+
});
|
|
22
|
+
};
|
|
23
|
+
})();
|
|
24
|
+
// Module export table: flagged as an ES module, then given a lazy getter for
// `parseOfficialBenchArgs` (the getter resolves the hoisted function below).
var __webpack_exports__ = {};
|
|
25
|
+
__webpack_require__.r(__webpack_exports__);
|
|
26
|
+
__webpack_require__.d(__webpack_exports__, {
|
|
27
|
+
parseOfficialBenchArgs: ()=>parseOfficialBenchArgs
|
|
28
|
+
});
|
|
29
|
+
const external_node_path_namespaceObject = require("node:path");
|
|
30
|
+
/**
 * Converts a `provider/model` identifier into `provider:model` form.
 *
 * The input is trimmed first. A value that already contains ":" is returned
 * as-is. Otherwise only the FIRST "/" is replaced, and only when there is text
 * on both sides of it; anything else is returned trimmed but unchanged.
 *
 * @param value Raw model identifier from the command line.
 * @returns The normalized identifier.
 */
function normalizeWingmanModel(value) {
    const trimmed = value.trim();
    if (trimmed.includes(":")) return trimmed;
    const slash = trimmed.indexOf("/");
    if (slash > 0 && slash < trimmed.length - 1) return `${trimmed.slice(0, slash)}:${trimmed.slice(slash + 1)}`;
    return trimmed;
}

/**
 * Parses the command line of the official benchmark runner.
 *
 * Every value flag is accepted as `--flag value` and as `--flag=value`;
 * `-c value` is an alias for `--config value` (space form only). Unknown
 * arguments, and value flags with a missing/empty following argument, are
 * ignored. Parsing is deliberately lenient and never throws on bad flags.
 *
 * Integer flags (`--n-concurrent`, `--n-attempts`, `--n-tasks`,
 * `--timeout-ms`) are parsed with `Number.parseInt(value, 10)`. A value that
 * does not parse to a number is skipped instead of being stored as `NaN`.
 *
 * @param argv Full argv array; the first two entries are skipped.
 * @returns `configPath` resolved against the current working directory
 *   (default `bench/config.tb2.json`) and the collected `overrides`.
 *   `overrides.taskNames` is `[]` when `--all-tasks` is given, the collected
 *   task names when any were given, and absent otherwise.
 *   `overrides.agentKwargs` is present only when at least one kwarg was set.
 */
function parseOfficialBenchArgs(argv) {
    const args = argv.slice(2);
    let configPath = "bench/config.tb2.json";
    const taskNames = [];
    let useAllTasks = false;
    const agentKwargs = {};
    const overrides = {};

    const setOverride = (key)=>(value)=>{
            overrides[key] = value;
        };
    const setIntOverride = (key)=>(value)=>{
            const parsed = Number.parseInt(value, 10);
            // Never let NaN replace a valid value from the config file.
            if (!Number.isNaN(parsed)) overrides[key] = parsed;
        };
    const addTaskName = (value)=>{
        taskNames.push(value);
    };
    const addAgentKwarg = (pair)=>{
        // Split on the first "=" only so values may themselves contain "=".
        const eq = pair.indexOf("=");
        if (eq > 0) agentKwargs[pair.slice(0, eq)] = pair.slice(eq + 1);
    };

    // A Map (not a plain object) so that stray arguments such as "toString"
    // can never resolve to an inherited Object.prototype member.
    const valueFlags = new Map([
        [
            "--config",
            (value)=>{
                configPath = value;
            }
        ],
        [
            "--task-id",
            addTaskName
        ],
        [
            "--task-name",
            addTaskName
        ],
        [
            "--registry-url",
            setOverride("registryUrl")
        ],
        [
            "--registry-path",
            setOverride("registryPath")
        ],
        [
            "--agent",
            setOverride("agent")
        ],
        [
            "--agent-import-path",
            setOverride("agentImportPath")
        ],
        [
            "--agent-kwarg",
            addAgentKwarg
        ],
        [
            "--wingman-agent",
            (value)=>{
                agentKwargs.wingman_agent = value;
            }
        ],
        [
            "--wingman-model",
            (value)=>{
                agentKwargs.wingman_model = normalizeWingmanModel(value);
            }
        ],
        [
            "--model",
            setOverride("model")
        ],
        [
            "--dataset",
            setOverride("dataset")
        ],
        [
            "--n-concurrent",
            setIntOverride("nConcurrent")
        ],
        [
            "--n-attempts",
            setIntOverride("nAttempts")
        ],
        [
            "--n-tasks",
            setIntOverride("nTasks")
        ],
        [
            "--timeout-ms",
            setIntOverride("timeoutMs")
        ]
    ]);

    for(let i = 0; i < args.length; i += 1){
        const arg = args[i];
        if ("--all-tasks" === arg) {
            useAllTasks = true;
            continue;
        }
        // Inline form: "--flag=value". The value may be empty.
        const eq = arg.startsWith("--") ? arg.indexOf("=") : -1;
        if (-1 !== eq) {
            const inlineHandler = valueFlags.get(arg.slice(0, eq));
            if (inlineHandler) inlineHandler(arg.slice(eq + 1));
            continue;
        }
        // Space form: "--flag value". Needs a non-empty following argument,
        // which is then consumed.
        const handler = valueFlags.get("-c" === arg ? "--config" : arg);
        if (handler && args[i + 1]) {
            handler(args[i + 1]);
            i += 1;
        }
    }

    // "--all-tasks" wins over explicit task names.
    if (useAllTasks) overrides.taskNames = [];
    else if (taskNames.length > 0) overrides.taskNames = taskNames;
    if (Object.keys(agentKwargs).length > 0) overrides.agentKwargs = agentKwargs;
    return {
        configPath: (0, external_node_path_namespaceObject.resolve)(process.cwd(), configPath),
        overrides
    };
}
|
|
198
|
+
// CommonJS export footer: publishes `parseOfficialBenchArgs`, copies any other
// enumerable key of `__webpack_exports__` that is not in the explicit list,
// and marks `exports` with `__esModule: true`.
exports.parseOfficialBenchArgs = __webpack_exports__.parseOfficialBenchArgs;
|
|
199
|
+
for(var __rspack_i in __webpack_exports__)if (-1 === [
|
|
200
|
+
"parseOfficialBenchArgs"
|
|
201
|
+
].indexOf(__rspack_i)) exports[__rspack_i] = __webpack_exports__[__rspack_i];
|
|
202
|
+
Object.defineProperty(exports, '__esModule', {
|
|
203
|
+
value: true
|
|
204
|
+
});
|
|
@@ -0,0 +1,170 @@
|
|
|
1
|
+
import { resolve } from "node:path";
|
|
2
|
+
/**
 * Converts a `provider/model` identifier into `provider:model` form.
 *
 * The input is trimmed first. A value that already contains ":" is returned
 * as-is. Otherwise only the FIRST "/" is replaced, and only when there is text
 * on both sides of it; anything else is returned trimmed but unchanged.
 *
 * @param value Raw model identifier from the command line.
 * @returns The normalized identifier.
 */
function normalizeWingmanModel(value) {
    const trimmed = value.trim();
    if (trimmed.includes(":")) return trimmed;
    const slash = trimmed.indexOf("/");
    if (slash > 0 && slash < trimmed.length - 1) return `${trimmed.slice(0, slash)}:${trimmed.slice(slash + 1)}`;
    return trimmed;
}

/**
 * Parses the command line of the official benchmark runner.
 *
 * Every value flag is accepted as `--flag value` and as `--flag=value`;
 * `-c value` is an alias for `--config value` (space form only). Unknown
 * arguments, and value flags with a missing/empty following argument, are
 * ignored. Parsing is deliberately lenient and never throws on bad flags.
 *
 * Integer flags (`--n-concurrent`, `--n-attempts`, `--n-tasks`,
 * `--timeout-ms`) are parsed with `Number.parseInt(value, 10)`. A value that
 * does not parse to a number is skipped instead of being stored as `NaN`.
 *
 * @param argv Full argv array; the first two entries are skipped.
 * @returns `configPath` resolved against the current working directory
 *   (default `bench/config.tb2.json`) and the collected `overrides`.
 *   `overrides.taskNames` is `[]` when `--all-tasks` is given, the collected
 *   task names when any were given, and absent otherwise.
 *   `overrides.agentKwargs` is present only when at least one kwarg was set.
 */
function parseOfficialBenchArgs(argv) {
    const args = argv.slice(2);
    let configPath = "bench/config.tb2.json";
    const taskNames = [];
    let useAllTasks = false;
    const agentKwargs = {};
    const overrides = {};

    const setOverride = (key)=>(value)=>{
            overrides[key] = value;
        };
    const setIntOverride = (key)=>(value)=>{
            const parsed = Number.parseInt(value, 10);
            // Never let NaN replace a valid value from the config file.
            if (!Number.isNaN(parsed)) overrides[key] = parsed;
        };
    const addTaskName = (value)=>{
        taskNames.push(value);
    };
    const addAgentKwarg = (pair)=>{
        // Split on the first "=" only so values may themselves contain "=".
        const eq = pair.indexOf("=");
        if (eq > 0) agentKwargs[pair.slice(0, eq)] = pair.slice(eq + 1);
    };

    // A Map (not a plain object) so that stray arguments such as "toString"
    // can never resolve to an inherited Object.prototype member.
    const valueFlags = new Map([
        [
            "--config",
            (value)=>{
                configPath = value;
            }
        ],
        [
            "--task-id",
            addTaskName
        ],
        [
            "--task-name",
            addTaskName
        ],
        [
            "--registry-url",
            setOverride("registryUrl")
        ],
        [
            "--registry-path",
            setOverride("registryPath")
        ],
        [
            "--agent",
            setOverride("agent")
        ],
        [
            "--agent-import-path",
            setOverride("agentImportPath")
        ],
        [
            "--agent-kwarg",
            addAgentKwarg
        ],
        [
            "--wingman-agent",
            (value)=>{
                agentKwargs.wingman_agent = value;
            }
        ],
        [
            "--wingman-model",
            (value)=>{
                agentKwargs.wingman_model = normalizeWingmanModel(value);
            }
        ],
        [
            "--model",
            setOverride("model")
        ],
        [
            "--dataset",
            setOverride("dataset")
        ],
        [
            "--n-concurrent",
            setIntOverride("nConcurrent")
        ],
        [
            "--n-attempts",
            setIntOverride("nAttempts")
        ],
        [
            "--n-tasks",
            setIntOverride("nTasks")
        ],
        [
            "--timeout-ms",
            setIntOverride("timeoutMs")
        ]
    ]);

    for(let i = 0; i < args.length; i += 1){
        const arg = args[i];
        if ("--all-tasks" === arg) {
            useAllTasks = true;
            continue;
        }
        // Inline form: "--flag=value". The value may be empty.
        const eq = arg.startsWith("--") ? arg.indexOf("=") : -1;
        if (-1 !== eq) {
            const inlineHandler = valueFlags.get(arg.slice(0, eq));
            if (inlineHandler) inlineHandler(arg.slice(eq + 1));
            continue;
        }
        // Space form: "--flag value". Needs a non-empty following argument,
        // which is then consumed.
        const handler = valueFlags.get("-c" === arg ? "--config" : arg);
        if (handler && args[i + 1]) {
            handler(args[i + 1]);
            i += 1;
        }
    }

    // "--all-tasks" wins over explicit task names.
    if (useAllTasks) overrides.taskNames = [];
    else if (taskNames.length > 0) overrides.taskNames = taskNames;
    if (Object.keys(agentKwargs).length > 0) overrides.agentKwargs = agentKwargs;
    return {
        configPath: resolve(process.cwd(), configPath),
        overrides
    };
}
|
|
170
|
+
export { parseOfficialBenchArgs };
|
|
@@ -0,0 +1,78 @@
|
|
|
1
|
+
"use strict";
|
|
2
|
+
var __webpack_require__ = {};
|
|
3
|
+
// Bundler runtime helper `d`: for each own key of `definition` that is not
// already an own property of `exports1`, defines an enumerable getter on
// `exports1` whose getter function is `definition[key]`.
(()=>{
|
|
4
|
+
__webpack_require__.d = (exports1, definition)=>{
|
|
5
|
+
for(var key in definition)if (__webpack_require__.o(definition, key) && !__webpack_require__.o(exports1, key)) Object.defineProperty(exports1, key, {
|
|
6
|
+
enumerable: true,
|
|
7
|
+
get: definition[key]
|
|
8
|
+
});
|
|
9
|
+
};
|
|
10
|
+
})();
|
|
11
|
+
// Bundler runtime helper `o`: own-property test that goes through
// Object.prototype.hasOwnProperty.call, so it works on any object.
(()=>{
|
|
12
|
+
__webpack_require__.o = (obj, prop)=>Object.prototype.hasOwnProperty.call(obj, prop);
|
|
13
|
+
})();
|
|
14
|
+
// Bundler runtime helper `r`: marks `exports1` as an ES module namespace.
// It sets Symbol.toStringTag to 'Module' when Symbol is available
// (`"u" > typeof Symbol` is a minified "typeof Symbol is not 'undefined'" test)
// and always defines `__esModule: true`.
(()=>{
|
|
15
|
+
__webpack_require__.r = (exports1)=>{
|
|
16
|
+
if ("u" > typeof Symbol && Symbol.toStringTag) Object.defineProperty(exports1, Symbol.toStringTag, {
|
|
17
|
+
value: 'Module'
|
|
18
|
+
});
|
|
19
|
+
Object.defineProperty(exports1, '__esModule', {
|
|
20
|
+
value: true
|
|
21
|
+
});
|
|
22
|
+
};
|
|
23
|
+
})();
|
|
24
|
+
// Module export table: flagged as an ES module, then given a lazy getter for
// `runCommand` (the getter resolves the hoisted function below).
var __webpack_exports__ = {};
|
|
25
|
+
__webpack_require__.r(__webpack_exports__);
|
|
26
|
+
__webpack_require__.d(__webpack_exports__, {
|
|
27
|
+
runCommand: ()=>runCommand
|
|
28
|
+
});
|
|
29
|
+
const external_node_child_process_namespaceObject = require("node:child_process");
|
|
30
|
+
const external_node_events_namespaceObject = require("node:events");
|
|
31
|
+
/**
 * Runs `command` with `args` as a child process and captures its output.
 *
 * stdin is ignored; stdout and stderr are collected as UTF-8 text. When the
 * process is still running after `options.timeoutMs`, it is sent SIGTERM and
 * the result is flagged `timedOut`. If it has still not exited 500 ms later,
 * it is sent SIGKILL.
 *
 * @param command Executable (or shell command line when `options.shell` is true).
 * @param args Arguments passed to the executable.
 * @param options `cwd`, `timeoutMs`, optional `env` (merged over `process.env`)
 *   and optional `shell` (enabled only when exactly `true`).
 * @returns Exit code (1 when the process reported none, e.g. it was killed by
 *   a signal), the timeout flag, wall-clock duration in ms, and captured output.
 * @throws Rejects with the child's `error` event (e.g. ENOENT when the
 *   executable cannot be spawned). Timers are cleared in that case too.
 */
async function runCommand(command, args, options) {
    const startedAt = Date.now();
    const child = (0, external_node_child_process_namespaceObject.spawn)(command, args, {
        cwd: options.cwd,
        // Caller-supplied variables override the inherited environment.
        env: {
            ...process.env,
            ...options.env || {}
        },
        shell: true === options.shell,
        stdio: [
            "ignore",
            "pipe",
            "pipe"
        ]
    });
    let stdout = "";
    let stderr = "";
    // Decode at the stream level so a multi-byte UTF-8 character that is split
    // across two chunks is not corrupted by per-chunk toString().
    child.stdout?.setEncoding("utf8");
    child.stderr?.setEncoding("utf8");
    child.stdout?.on("data", (chunk)=>{
        stdout += chunk;
    });
    child.stderr?.on("data", (chunk)=>{
        stderr += chunk;
    });
    let timedOut = false;
    let killTimer;
    const timer = setTimeout(()=>{
        timedOut = true;
        child.kill("SIGTERM");
        killTimer = setTimeout(()=>{
            // `child.killed` only says a signal was delivered, not that the
            // process ended, so it is already true after SIGTERM. Check the
            // real exit state before escalating.
            if (null === child.exitCode && null === child.signalCode) child.kill("SIGKILL");
        }, 500);
    }, options.timeoutMs);
    try {
        const [code] = await (0, external_node_events_namespaceObject.once)(child, "close");
        return {
            exitCode: code ?? 1,
            timedOut,
            durationMs: Date.now() - startedAt,
            stdout,
            stderr
        };
    } finally{
        // Runs on success and on spawn failure, so no timer outlives the call.
        clearTimeout(timer);
        clearTimeout(killTimer);
    }
}
|
|
72
|
+
// CommonJS export footer: publishes `runCommand`, copies any other enumerable
// key of `__webpack_exports__` that is not in the explicit list, and marks
// `exports` with `__esModule: true`.
exports.runCommand = __webpack_exports__.runCommand;
|
|
73
|
+
for(var __rspack_i in __webpack_exports__)if (-1 === [
|
|
74
|
+
"runCommand"
|
|
75
|
+
].indexOf(__rspack_i)) exports[__rspack_i] = __webpack_exports__[__rspack_i];
|
|
76
|
+
Object.defineProperty(exports, '__esModule', {
|
|
77
|
+
value: true
|
|
78
|
+
});
|
|
@@ -0,0 +1,14 @@
|
|
|
1
|
+
/** Options accepted by `runCommand`. */
export interface CommandExecutionOptions {
|
|
2
|
+
/** Working directory the child process is spawned in. */
cwd: string;
|
|
3
|
+
/** Milliseconds before the child is sent SIGTERM and the run is flagged as timed out. */
timeoutMs: number;
|
|
4
|
+
/** Extra environment variables; merged over `process.env`, so they win on conflict. */
env?: Record<string, string>;
|
|
5
|
+
/** Spawn through a shell. Only an exact `true` enables it. */
shell?: boolean;
|
|
6
|
+
}
|
|
7
|
+
/** Outcome of a `runCommand` call. */
export interface CommandExecutionResult {
|
|
8
|
+
/** Exit code reported when the child closed; 1 when no code was reported. */
exitCode: number;
|
|
9
|
+
/** True when the `timeoutMs` timer fired before the child closed. */
timedOut: boolean;
|
|
10
|
+
/** Wall-clock milliseconds from just before spawn until the child closed. */
durationMs: number;
|
|
11
|
+
/** Everything the child wrote to stdout, as text. */
stdout: string;
|
|
12
|
+
/** Everything the child wrote to stderr, as text. */
stderr: string;
|
|
13
|
+
}
|
|
14
|
+
/**
 * Spawns `command` with `args`, captures stdout/stderr, and resolves once the
 * child process has closed.
 *
 * @param command Executable to run (or a shell command when `options.shell` is true).
 * @param args Arguments passed to the executable.
 * @param options Working directory, timeout, and optional env/shell settings.
 * @returns The exit code, timeout flag, duration and captured output.
 */
export declare function runCommand(command: string, args: string[], options: CommandExecutionOptions): Promise<CommandExecutionResult>;
|
|
@@ -0,0 +1,44 @@
|
|
|
1
|
+
import { spawn } from "node:child_process";
|
|
2
|
+
import { once } from "node:events";
|
|
3
|
+
/**
 * Runs `command` with `args` as a child process and captures its output.
 *
 * stdin is ignored; stdout and stderr are collected as UTF-8 text. When the
 * process is still running after `options.timeoutMs`, it is sent SIGTERM and
 * the result is flagged `timedOut`. If it has still not exited 500 ms later,
 * it is sent SIGKILL.
 *
 * @param command Executable (or shell command line when `options.shell` is true).
 * @param args Arguments passed to the executable.
 * @param options `cwd`, `timeoutMs`, optional `env` (merged over `process.env`)
 *   and optional `shell` (enabled only when exactly `true`).
 * @returns Exit code (1 when the process reported none, e.g. it was killed by
 *   a signal), the timeout flag, wall-clock duration in ms, and captured output.
 * @throws Rejects with the child's `error` event (e.g. ENOENT when the
 *   executable cannot be spawned). Timers are cleared in that case too.
 */
async function runCommand(command, args, options) {
    const startedAt = Date.now();
    const child = spawn(command, args, {
        cwd: options.cwd,
        // Caller-supplied variables override the inherited environment.
        env: {
            ...process.env,
            ...options.env || {}
        },
        shell: true === options.shell,
        stdio: [
            "ignore",
            "pipe",
            "pipe"
        ]
    });
    let stdout = "";
    let stderr = "";
    // Decode at the stream level so a multi-byte UTF-8 character that is split
    // across two chunks is not corrupted by per-chunk toString().
    child.stdout?.setEncoding("utf8");
    child.stderr?.setEncoding("utf8");
    child.stdout?.on("data", (chunk)=>{
        stdout += chunk;
    });
    child.stderr?.on("data", (chunk)=>{
        stderr += chunk;
    });
    let timedOut = false;
    let killTimer;
    const timer = setTimeout(()=>{
        timedOut = true;
        child.kill("SIGTERM");
        killTimer = setTimeout(()=>{
            // `child.killed` only says a signal was delivered, not that the
            // process ended, so it is already true after SIGTERM. Check the
            // real exit state before escalating.
            if (null === child.exitCode && null === child.signalCode) child.kill("SIGKILL");
        }, 500);
    }, options.timeoutMs);
    try {
        const [code] = await once(child, "close");
        return {
            exitCode: code ?? 1,
            timedOut,
            durationMs: Date.now() - startedAt,
            stdout,
            stderr
        };
    } finally{
        // Runs on success and on spawn failure, so no timer outlives the call.
        clearTimeout(timer);
        clearTimeout(killTimer);
    }
}
|
|
44
|
+
export { runCommand };
|