@workbench-ai/workbench 0.0.67 → 0.0.69

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (82)
  1. package/dist/dev-open/client.css +387 -287
  2. package/dist/dev-open/client.js +202 -202
  3. package/dist/dev-open/fonts/ibm-plex-mono-cyrillic-400-normal.woff +0 -0
  4. package/dist/dev-open/fonts/ibm-plex-mono-cyrillic-400-normal.woff2 +0 -0
  5. package/dist/dev-open/fonts/ibm-plex-mono-cyrillic-500-normal.woff +0 -0
  6. package/dist/dev-open/fonts/ibm-plex-mono-cyrillic-500-normal.woff2 +0 -0
  7. package/dist/dev-open/fonts/ibm-plex-mono-cyrillic-600-normal.woff +0 -0
  8. package/dist/dev-open/fonts/ibm-plex-mono-cyrillic-600-normal.woff2 +0 -0
  9. package/dist/dev-open/fonts/ibm-plex-mono-cyrillic-ext-400-normal.woff +0 -0
  10. package/dist/dev-open/fonts/ibm-plex-mono-cyrillic-ext-400-normal.woff2 +0 -0
  11. package/dist/dev-open/fonts/ibm-plex-mono-cyrillic-ext-500-normal.woff +0 -0
  12. package/dist/dev-open/fonts/ibm-plex-mono-cyrillic-ext-500-normal.woff2 +0 -0
  13. package/dist/dev-open/fonts/ibm-plex-mono-cyrillic-ext-600-normal.woff +0 -0
  14. package/dist/dev-open/fonts/ibm-plex-mono-cyrillic-ext-600-normal.woff2 +0 -0
  15. package/dist/dev-open/fonts/ibm-plex-mono-latin-400-normal.woff +0 -0
  16. package/dist/dev-open/fonts/ibm-plex-mono-latin-400-normal.woff2 +0 -0
  17. package/dist/dev-open/fonts/ibm-plex-mono-latin-500-normal.woff +0 -0
  18. package/dist/dev-open/fonts/ibm-plex-mono-latin-500-normal.woff2 +0 -0
  19. package/dist/dev-open/fonts/ibm-plex-mono-latin-600-normal.woff +0 -0
  20. package/dist/dev-open/fonts/ibm-plex-mono-latin-600-normal.woff2 +0 -0
  21. package/dist/dev-open/fonts/ibm-plex-mono-latin-ext-400-normal.woff +0 -0
  22. package/dist/dev-open/fonts/ibm-plex-mono-latin-ext-400-normal.woff2 +0 -0
  23. package/dist/dev-open/fonts/ibm-plex-mono-latin-ext-500-normal.woff +0 -0
  24. package/dist/dev-open/fonts/ibm-plex-mono-latin-ext-500-normal.woff2 +0 -0
  25. package/dist/dev-open/fonts/ibm-plex-mono-latin-ext-600-normal.woff +0 -0
  26. package/dist/dev-open/fonts/ibm-plex-mono-latin-ext-600-normal.woff2 +0 -0
  27. package/dist/dev-open/fonts/ibm-plex-mono-vietnamese-400-normal.woff +0 -0
  28. package/dist/dev-open/fonts/ibm-plex-mono-vietnamese-400-normal.woff2 +0 -0
  29. package/dist/dev-open/fonts/ibm-plex-mono-vietnamese-500-normal.woff +0 -0
  30. package/dist/dev-open/fonts/ibm-plex-mono-vietnamese-500-normal.woff2 +0 -0
  31. package/dist/dev-open/fonts/ibm-plex-mono-vietnamese-600-normal.woff +0 -0
  32. package/dist/dev-open/fonts/ibm-plex-mono-vietnamese-600-normal.woff2 +0 -0
  33. package/dist/dev-open/fonts/libre-caslon-display-latin-400-normal.woff +0 -0
  34. package/dist/dev-open/fonts/libre-caslon-display-latin-400-normal.woff2 +0 -0
  35. package/dist/dev-open/fonts/libre-caslon-display-latin-ext-400-normal.woff +0 -0
  36. package/dist/dev-open/fonts/libre-caslon-display-latin-ext-400-normal.woff2 +0 -0
  37. package/dist/index.d.ts +2 -6
  38. package/dist/index.d.ts.map +1 -1
  39. package/dist/index.js +2035 -5100
  40. package/dist/install-targets.d.ts +35 -0
  41. package/dist/install-targets.d.ts.map +1 -0
  42. package/dist/install-targets.js +188 -0
  43. package/dist/open-server.d.ts +12 -0
  44. package/dist/open-server.d.ts.map +1 -0
  45. package/dist/open-server.js +248 -0
  46. package/dist/output.d.ts +22 -0
  47. package/dist/output.d.ts.map +1 -0
  48. package/dist/output.js +38 -0
  49. package/package.json +5 -5
  50. package/dist/adapter-command-env.d.ts +0 -8
  51. package/dist/adapter-command-env.d.ts.map +0 -1
  52. package/dist/adapter-command-env.js +0 -80
  53. package/dist/adapter-project.d.ts +0 -29
  54. package/dist/adapter-project.d.ts.map +0 -1
  55. package/dist/adapter-project.js +0 -332
  56. package/dist/benchmark-fingerprint.d.ts +0 -6
  57. package/dist/benchmark-fingerprint.d.ts.map +0 -1
  58. package/dist/benchmark-fingerprint.js +0 -42
  59. package/dist/command-model.d.ts +0 -5
  60. package/dist/command-model.d.ts.map +0 -1
  61. package/dist/command-model.js +0 -537
  62. package/dist/dev-open-server.d.ts +0 -18
  63. package/dist/dev-open-server.d.ts.map +0 -1
  64. package/dist/dev-open-server.js +0 -297
  65. package/dist/init-scaffold.d.ts +0 -22
  66. package/dist/init-scaffold.d.ts.map +0 -1
  67. package/dist/init-scaffold.js +0 -30
  68. package/dist/init-template-pack.d.ts +0 -19
  69. package/dist/init-template-pack.d.ts.map +0 -1
  70. package/dist/init-template-pack.js +0 -262
  71. package/dist/local-archive.d.ts +0 -48
  72. package/dist/local-archive.d.ts.map +0 -1
  73. package/dist/local-archive.js +0 -838
  74. package/dist/local-inspection.d.ts +0 -9
  75. package/dist/local-inspection.d.ts.map +0 -1
  76. package/dist/local-inspection.js +0 -354
  77. package/dist/project-source.d.ts +0 -63
  78. package/dist/project-source.d.ts.map +0 -1
  79. package/dist/project-source.js +0 -682
  80. package/dist/workspace-snapshot.d.ts +0 -10
  81. package/dist/workspace-snapshot.d.ts.map +0 -1
  82. package/dist/workspace-snapshot.js +0 -81
@@ -1,537 +0,0 @@
1
- const sourceDirectoryHelp = [
2
- "Directory:",
3
- " Run from a Workbench project containing benchmark.yaml plus candidates/<name>/candidate.yaml.",
4
- " Candidate manifests declare their files with files.path, usually files beside candidate.yaml.",
5
- " Pass --dir DIR or pass benchmark.yaml, candidates/<name>, or candidates/<name>/candidate.yaml as SOURCE.",
6
- ];
7
- export const LOCAL_DEV_OPEN_LIFECYCLE_NOTE = "Keep this command running while using the local web view; Ctrl-C stops the server and the page will stop working.";
8
- const remoteWatchLifecycleNoteLines = [
9
- "Watching is client-side polling only.",
10
- "Stopping this command does not cancel the remote run.",
11
- ];
12
- export const REMOTE_WATCH_LIFECYCLE_NOTE = remoteWatchLifecycleNoteLines.join(" ");
13
- const localOpenLifecycleHelp = [
14
- "Lifecycle:",
15
- " workbench open starts a long-running local web server.",
16
- ` ${LOCAL_DEV_OPEN_LIFECYCLE_NOTE}`,
17
- ];
18
- const remoteWatchLifecycleHelp = [
19
- "Lifecycle:",
20
- ...remoteWatchLifecycleNoteLines.map((line) => ` ${line}`),
21
- ];
22
- const rootLines = [
23
- "Usage:",
24
- " workbench <command> [options]",
25
- "",
26
- ...sourceDirectoryHelp,
27
- "",
28
- "Project:",
29
- " workbench init [DIR] --skill NAME --agent ADAPTER [--from PATH] [--example] [--json]",
30
- " workbench init [DIR] --command NAME [--from PATH] [--example] [--json]",
31
- " workbench check [SOURCE] [--dir DIR] [--json]",
32
- " workbench adapters create PATH [--dir DIR] [--json]",
33
- " workbench adapters list [--dir DIR] [--json]",
34
- " workbench adapters inspect ID [--dir DIR] [--json]",
35
- " workbench adapters test ID|SOURCE [--dir DIR] [--request PATH] [--output DIR] [--json]",
36
- "",
37
- "Runs:",
38
- " workbench eval [SOURCE] [--dir DIR] [--candidate CANDIDATE_ID] [--runs RUNS|all] [--samples N] [--rerun] [--json]",
39
- " workbench eval --remote [SOURCE] [--dir DIR] [--benchmark OWNER/BENCHMARK] [--candidate CANDIDATE_ID] [--runs RUNS|all] [--samples N] [--rerun] [--watch] [--dry-run] [--json]",
40
- " workbench improve [SOURCE] [--dir DIR] [--from CANDIDATE_ID] [--runs RUN] [--budget N] [--samples N] [--rerun] [--json]",
41
- " workbench improve --remote [SOURCE] [--dir DIR] [--benchmark OWNER/BENCHMARK] [--base CANDIDATE_ID] [--runs RUN] [--budget N] [--samples N] [--rerun] [--watch] [--dry-run] [--json]",
42
- " workbench retry TARGET_ID [--dir DIR] [--remote] [--benchmark OWNER/BENCHMARK] [--watch] [--interval-ms N] [--timeout-ms N] [--json]",
43
- " workbench open [SOURCE|OWNER/BENCHMARK|RUN_ID|CANDIDATE_ID] [--dir DIR] [--remote] [--benchmark OWNER/BENCHMARK] [--run RUN_ID] [--host HOST] [--port N] [--no-open] [--json]",
44
- " workbench restore [--dir DIR] [--candidate CANDIDATE_ID] [--dry-run] [--yes] [--json]",
45
- "",
46
- "Local inspection:",
47
- " workbench runs list [--dir DIR] [--json]",
48
- " workbench runs show RUN_ID [--dir DIR] [--jobs] [--failures] [--json]",
49
- " workbench evaluations list [--dir DIR] [--json]",
50
- " workbench evaluations show EVALUATION_ID [--dir DIR] [--json]",
51
- " workbench executions trace --run RUN_ID --job JOB_ID [--dir DIR] [--json]",
52
- " workbench diagnose [RUN_OR_EVALUATION_ID] [--dir DIR] [--json]",
53
- " workbench candidates list [--dir DIR] [--json]",
54
- " workbench candidates show CANDIDATE_ID [--dir DIR] [--json]",
55
- " workbench candidates files [--dir DIR] [--candidate CANDIDATE_ID] [--json]",
56
- " workbench candidates preview --path PATH [--dir DIR] [--candidate CANDIDATE_ID] [--output PATH|-] [--json]",
57
- " # Installed-agent traces, not Workbench run execution traces:",
58
- " workbench traces collect [--providers codex,claude] [--since 30d] [--workspace DIR] [--limit N] [--json]",
59
- " workbench traces list [--providers codex,claude] [--since 30d] [--workspace DIR] [--limit N] [--json]",
60
- " workbench traces show TRACE_ID [--providers codex,claude] [--since 30d] [--workspace DIR] [--json]",
61
- "",
62
- "Remote:",
63
- " workbench login [--base-url URL] [--no-open] [--json]",
64
- " workbench logout [--json]",
65
- " workbench whoami [--dir DIR] [--json]",
66
- " workbench clone OWNER/BENCHMARK [DIR] [--dry-run] [--json]",
67
- " workbench pull [--dir DIR] [--dry-run] [--json]",
68
- " workbench push [SOURCE] [--dir DIR] [--visibility public|private] [--dry-run] [--force] [--json]",
69
- "",
70
- "Auth:",
71
- " workbench auth connect ADAPTER[/SLOT] [--dir DIR] [--method METHOD] [--profile PROFILE] [--profile-root DIR] [--local-only] [--json]",
72
- " workbench auth disconnect ADAPTER[/SLOT] [--profile PROFILE] [--local-only] [--json]",
73
- "",
74
- "Examples:",
75
- " workbench init --skill invoice-review --agent codex",
76
- " workbench eval candidates/current --samples 1",
77
- " workbench improve --budget 2 --samples 1",
78
- " workbench retry eval_local_123 --json",
79
- " workbench open --no-open --json",
80
- " workbench push",
81
- " workbench eval --remote candidates/current --benchmark openbench/invoice-review --watch",
82
- "",
83
- "Environment:",
84
- " WORKBENCH_API_URL sets the remote Workbench API base URL.",
85
- "",
86
- "Default API URL:",
87
- " https://v2.workbench.ai",
88
- ];
89
- export const rootUsage = rootLines.join("\n");
90
- function withSourceDirectoryHelp(lines) {
91
- return withHelpAfterUsage(lines, sourceDirectoryHelp);
92
- }
93
- function withLifecycleHelp(lines, lifecycleHelp) {
94
- return withHelpAfterUsage(lines, lifecycleHelp);
95
- }
96
- function withHelpAfterUsage(lines, helpLines) {
97
- const firstBlankIndex = lines.indexOf("");
98
- if (firstBlankIndex < 0) {
99
- return [...lines, "", ...helpLines];
100
- }
101
- return [
102
- ...lines.slice(0, firstBlankIndex),
103
- "",
104
- ...helpLines,
105
- "",
106
- ...lines.slice(firstBlankIndex + 1),
107
- ];
108
- }
109
- const commandHelp = Object.fromEntries(Object.entries({
110
- init: [
111
- "Usage:",
112
- " workbench init [DIR] --skill NAME --agent ADAPTER [--from PATH] [--example] [--json]",
113
- " workbench init [DIR] --command NAME [--from PATH] [--example] [--json]",
114
- "",
115
- "Scaffold a local Workbench project. benchmark.yaml selects an engine; the built-in workbench engine owns tasks, environment, and scoring under engine.with. candidates/<name>/candidate.yaml owns files.path plus optional prepare and run behavior. Candidate manifests own improvement behavior.",
116
- "",
117
- "Examples:",
118
- " workbench init --skill invoice-review --agent codex",
119
- " workbench init --command command-eval",
120
- ],
121
- check: withSourceDirectoryHelp([
122
- "Usage:",
123
- " workbench check [SOURCE] [--dir DIR] [--json]",
124
- "",
125
- "Validate benchmark.yaml, one candidate manifest.",
126
- "",
127
- "Examples:",
128
- " workbench check",
129
- " workbench check candidates/current --json",
130
- ]),
131
- eval: withSourceDirectoryHelp(withLifecycleHelp([
132
- "Usage:",
133
- " workbench eval [SOURCE] [--dir DIR] [--candidate CANDIDATE_ID] [--runs RUNS|all] [--samples N] [--rerun] [--json]",
134
- " workbench eval --remote [SOURCE] [--dir DIR] [--benchmark OWNER/BENCHMARK] [--candidate CANDIDATE_ID] [--runs RUNS|all] [--samples N] [--rerun] [--watch] [--dry-run] [--json]",
135
- "",
136
- "Ensure the selected candidate run has an evaluation for the current benchmark. Without --remote, execution writes local records. With --remote, Workbench starts or reuses a remote run against the configured remote or --benchmark target. Completed work is reused only when candidate, run configuration, source, adapters, benchmark, and samples match; use --rerun to intentionally spend again.",
137
- "",
138
- "Examples:",
139
- " workbench eval --samples 1",
140
- " workbench eval --remote candidates/current --samples 1 --watch --json",
141
- " workbench eval candidates/current --samples 2 --json",
142
- ], remoteWatchLifecycleHelp)),
143
- improve: withSourceDirectoryHelp(withLifecycleHelp([
144
- "Usage:",
145
- " workbench improve [SOURCE] [--dir DIR] [--from CANDIDATE_ID] [--runs RUN] [--budget N] [--samples N] [--rerun] [--json]",
146
- " workbench improve --remote [SOURCE] [--dir DIR] [--benchmark OWNER/BENCHMARK] [--base CANDIDATE_ID] [--runs RUN] [--budget N] [--samples N] [--rerun] [--watch] [--dry-run] [--json]",
147
- "",
148
- "Ensure a candidate improvement exists for the selected base, run, budget, and samples. Improve defaults to the evaluated active candidate when it belongs to the current benchmark fingerprint; otherwise it evaluates and uses the authored current candidate. Without --remote, execution writes local records. With --remote, Workbench starts or reuses remote work against the configured remote or --benchmark target. Completed work is reused only when base, run configuration, source, adapters, benchmark, budget, and samples match; use --rerun to intentionally spend again.",
149
- "",
150
- "Examples:",
151
- " workbench improve --budget 1 --samples 1",
152
- " workbench improve --remote candidates/current --budget 1 --samples 1 --watch --json",
153
- " workbench improve candidates/current --from candidate_123 --json",
154
- ], remoteWatchLifecycleHelp)),
155
- retry: withSourceDirectoryHelp(withLifecycleHelp([
156
- "Usage:",
157
- " workbench retry TARGET_ID [--dir DIR] [--json]",
158
- " workbench retry --remote TARGET_ID [--dir DIR] [--benchmark OWNER/BENCHMARK] [--watch] [--interval-ms N] [--timeout-ms N] [--json]",
159
- "",
160
- "Retry a failed run or evaluation by replaying its recorded candidate, configuration, sample count, and improve budget. Use --remote for remote records.",
161
- "",
162
- "Examples:",
163
- " workbench retry eval_local_123 --json",
164
- " workbench retry --remote run_123 --watch --json",
165
- " workbench retry run_local_123 --dir ./my-benchmark",
166
- ], remoteWatchLifecycleHelp)),
167
- open: withSourceDirectoryHelp(withLifecycleHelp([
168
- "Usage:",
169
- " workbench open [SOURCE] [--dir DIR] [--run RUN_ID] [--host HOST] [--port N] [--no-open] [--json]",
170
- " workbench open --remote [OWNER/BENCHMARK|RUN_ID|CANDIDATE_ID] [--dir DIR] [--benchmark OWNER/BENCHMARK] [--no-open] [--json]",
171
- "",
172
- "Start the local Workbench web view for the project and keep serving it until stopped. With --remote, print and optionally open the remote project URL instead.",
173
- "",
174
- "Examples:",
175
- " workbench open",
176
- " workbench open --remote --no-open --json",
177
- " workbench open --run eval_local_123 --port 4317 --no-open --json",
178
- ], localOpenLifecycleHelp)),
179
- restore: withSourceDirectoryHelp([
180
- "Usage:",
181
- " workbench restore [--dir DIR] [--candidate CANDIDATE_ID] [--dry-run] [--yes] [--json]",
182
- "",
183
- "Restore a local candidate snapshot into the candidate files directory.",
184
- "",
185
- "Examples:",
186
- " workbench restore --candidate candidate_123 --dry-run",
187
- " workbench restore --candidate candidate_123 --yes",
188
- ]),
189
- runs: [
190
- "Usage:",
191
- " workbench runs <command> [options]",
192
- "",
193
- "Inspect local run history.",
194
- "",
195
- "Commands:",
196
- " workbench runs list [--dir DIR] [--json]",
197
- " workbench runs show RUN_ID [--dir DIR] [--jobs] [--failures] [--json]",
198
- "",
199
- "Examples:",
200
- " workbench runs list --json",
201
- " workbench runs show eval_local_123 --json",
202
- ],
203
- "runs list": withSourceDirectoryHelp([
204
- "Usage:",
205
- " workbench runs list [--dir DIR] [--json]",
206
- "",
207
- "List local runs.",
208
- "",
209
- "Examples:",
210
- " workbench runs list",
211
- " workbench runs list --dir ./my-benchmark --json",
212
- ]),
213
- "runs show": withSourceDirectoryHelp([
214
- "Usage:",
215
- " workbench runs show RUN_ID [--dir DIR] [--jobs] [--failures] [--json]",
216
- "",
217
- "Show one local run record. Use --jobs for execution jobs and --failures for the generic failure diagnosis.",
218
- "",
219
- "Examples:",
220
- " workbench runs show eval_local_123",
221
- " workbench runs show eval_local_123 --failures --json",
222
- ]),
223
- evaluations: [
224
- "Usage:",
225
- " workbench evaluations <command> [options]",
226
- "",
227
- "Inspect local evaluation comparisons through the same read model used by the browser.",
228
- "",
229
- "Commands:",
230
- " workbench evaluations list [--dir DIR] [--json]",
231
- " workbench evaluations show EVALUATION_ID [--dir DIR] [--json]",
232
- "",
233
- "Examples:",
234
- " workbench evaluations list",
235
- " workbench evaluations show eval_local_123 --json",
236
- ],
237
- "evaluations list": withSourceDirectoryHelp([
238
- "Usage:",
239
- " workbench evaluations list [--dir DIR] [--json]",
240
- "",
241
- "List local evaluations with candidate, configuration, score, and run id.",
242
- "",
243
- "Examples:",
244
- " workbench evaluations list",
245
- " workbench evaluations list --json",
246
- ]),
247
- "evaluations show": withSourceDirectoryHelp([
248
- "Usage:",
249
- " workbench evaluations show EVALUATION_ID [--dir DIR] [--json]",
250
- "",
251
- "Show one local evaluation scorecard and its case summaries.",
252
- "",
253
- "Examples:",
254
- " workbench evaluations show eval_local_123",
255
- " workbench evaluations show eval_local_123 --json",
256
- ]),
257
- executions: [
258
- "Usage:",
259
- " workbench executions <command> [options]",
260
- "",
261
- "Inspect Workbench run execution artifacts. These are runtime traces tied to a Workbench run and job.",
262
- "",
263
- "Commands:",
264
- " workbench executions trace --run RUN_ID --job JOB_ID [--dir DIR] [--json]",
265
- "",
266
- "Examples:",
267
- " workbench executions trace --run run_local_123 --job job_123 --json",
268
- ],
269
- "executions trace": withSourceDirectoryHelp([
270
- "Usage:",
271
- " workbench executions trace --run RUN_ID --job JOB_ID [--dir DIR] [--json]",
272
- "",
273
- "Show the Workbench execution trace for a run job.",
274
- "",
275
- "Examples:",
276
- " workbench executions trace --run run_local_123 --job job_123",
277
- " workbench executions trace --run run_local_123 --job job_123 --json",
278
- ]),
279
- diagnose: withSourceDirectoryHelp([
280
- "Usage:",
281
- " workbench diagnose [RUN_OR_EVALUATION_ID] [--dir DIR] [--json]",
282
- "",
283
- "Summarize generic Workbench failure modes from runs, evaluations, samples, cases, and jobs.",
284
- "",
285
- "Examples:",
286
- " workbench diagnose",
287
- " workbench diagnose eval_local_123 --json",
288
- ]),
289
- candidates: [
290
- "Usage:",
291
- " workbench candidates <command> [options]",
292
- "",
293
- "Inspect local candidates.",
294
- "",
295
- "Commands:",
296
- " workbench candidates list [--dir DIR] [--json]",
297
- " workbench candidates show CANDIDATE_ID [--dir DIR] [--json]",
298
- " workbench candidates files [--dir DIR] [--candidate CANDIDATE_ID] [--json]",
299
- " workbench candidates preview --path PATH [--dir DIR] [--candidate CANDIDATE_ID] [--output PATH|-] [--json]",
300
- "",
301
- "Examples:",
302
- " workbench candidates list --json",
303
- " workbench candidates preview --candidate candidate_123 --path SKILL.md --output -",
304
- ],
305
- "candidates list": withSourceDirectoryHelp([
306
- "Usage:",
307
- " workbench candidates list [--dir DIR] [--json]",
308
- "",
309
- "List local candidates.",
310
- "",
311
- "Examples:",
312
- " workbench candidates list",
313
- " workbench candidates list --json",
314
- ]),
315
- "candidates show": withSourceDirectoryHelp([
316
- "Usage:",
317
- " workbench candidates show CANDIDATE_ID [--dir DIR] [--json]",
318
- "",
319
- "Show one local candidate.",
320
- "",
321
- "Examples:",
322
- " workbench candidates show candidate_123",
323
- " workbench candidates show candidate_123 --json",
324
- ]),
325
- "candidates files": withSourceDirectoryHelp([
326
- "Usage:",
327
- " workbench candidates files [--dir DIR] [--candidate CANDIDATE_ID] [--json]",
328
- "",
329
- "List files in a local candidate snapshot.",
330
- "",
331
- "Examples:",
332
- " workbench candidates files --candidate candidate_123",
333
- " workbench candidates files --candidate candidate_123 --json",
334
- ]),
335
- "candidates preview": withSourceDirectoryHelp([
336
- "Usage:",
337
- " workbench candidates preview --path PATH [--dir DIR] [--candidate CANDIDATE_ID] [--output PATH|-] [--json]",
338
- "",
339
- "Preview a file from a local candidate snapshot.",
340
- "",
341
- "Examples:",
342
- " workbench candidates preview --candidate candidate_123 --path SKILL.md",
343
- " workbench candidates preview --candidate candidate_123 --path SKILL.md --output -",
344
- ]),
345
- clone: [
346
- "Usage:",
347
- " workbench clone OWNER/BENCHMARK [DIR] [--dry-run] [--json]",
348
- "",
349
- "Clone remote source and runtime history into a local Workbench project and remember it as the remote.",
350
- "",
351
- "Examples:",
352
- " workbench clone openbench/invoice-review",
353
- " workbench clone openbench/invoice-review ./invoice-review --dry-run --json",
354
- ],
355
- pull: withSourceDirectoryHelp([
356
- "Usage:",
357
- " workbench pull [--dir DIR] [--dry-run] [--json]",
358
- "",
359
- "Pull source and runtime history from the remembered remote into the local project.",
360
- "",
361
- "Examples:",
362
- " workbench pull --dry-run",
363
- " workbench pull --json",
364
- ]),
365
- push: withSourceDirectoryHelp([
366
- "Usage:",
367
- " workbench push [SOURCE] [--dir DIR] [--visibility public|private] [--dry-run] [--force] [--json]",
368
- "",
369
- "Push local project source and runtime history to the remembered remote, or create one when the project has not been pushed before.",
370
- "",
371
- "Examples:",
372
- " workbench push --dry-run",
373
- " workbench push candidates/current --visibility private --json",
374
- ]),
375
- login: [
376
- "Usage:",
377
- " workbench login [--base-url URL] [--no-open] [--json]",
378
- "",
379
- "Authenticate this machine with Workbench Cloud.",
380
- "",
381
- "Examples:",
382
- " workbench login",
383
- " workbench login --no-open --json",
384
- ],
385
- logout: [
386
- "Usage:",
387
- " workbench logout [--json]",
388
- "",
389
- "Remove the stored Workbench Cloud access token.",
390
- "",
391
- "Examples:",
392
- " workbench logout",
393
- " workbench logout --json",
394
- ],
395
- whoami: withSourceDirectoryHelp([
396
- "Usage:",
397
- " workbench whoami [--dir DIR] [--json]",
398
- "",
399
- "Show the effective Workbench Cloud API target, login status, username, and required adapter auth status.",
400
- "",
401
- "Examples:",
402
- " workbench whoami",
403
- " workbench whoami --json",
404
- ]),
405
- adapters: withSourceDirectoryHelp([
406
- "Usage:",
407
- " workbench adapters create PATH [--dir DIR] [--json]",
408
- " workbench adapters list [--dir DIR] [--json]",
409
- " workbench adapters inspect ID [--dir DIR] [--json]",
410
- " workbench adapters test ID|SOURCE [--dir DIR] [--request PATH] [--output DIR] [--json]",
411
- "",
412
- "Create, list, inspect, and locally replay Workbench adapters. Adapter sources can be local paths, npm: package refs, or git: refs.",
413
- "",
414
- "Examples:",
415
- " workbench adapters list --json",
416
- " workbench adapters test codex --json",
417
- ]),
418
- "adapters create": withSourceDirectoryHelp([
419
- "Usage:",
420
- " workbench adapters create PATH [--dir DIR] [--json]",
421
- "",
422
- "Scaffold a benchmark-contained adapter source.",
423
- "",
424
- "Examples:",
425
- " workbench adapters create adapters/my-agent",
426
- " workbench adapters create adapters/my-agent --json",
427
- ]),
428
- "adapters list": withSourceDirectoryHelp([
429
- "Usage:",
430
- " workbench adapters list [--dir DIR] [--json]",
431
- "",
432
- "List default and project-declared adapters.",
433
- "",
434
- "Examples:",
435
- " workbench adapters list",
436
- " workbench adapters list --json",
437
- ]),
438
- "adapters inspect": withSourceDirectoryHelp([
439
- "Usage:",
440
- " workbench adapters inspect ID [--dir DIR] [--json]",
441
- "",
442
- "Show one adapter manifest and resolved source.",
443
- "",
444
- "Examples:",
445
- " workbench adapters inspect codex",
446
- " workbench adapters inspect adapters/my-agent --json",
447
- ]),
448
- "adapters test": withSourceDirectoryHelp([
449
- "Usage:",
450
- " workbench adapters test ID|SOURCE [--dir DIR] [--request PATH] [--output DIR] [--json]",
451
- "",
452
- "Validate an adapter manifest, or replay its command locally when --request is provided. Without --output, replay uses a temporary output directory.",
453
- "",
454
- "Examples:",
455
- " workbench adapters test codex --json",
456
- " workbench adapters test adapters/my-agent --request request.json --output out/adapter-test",
457
- ]),
458
- traces: [
459
- "Usage:",
460
- " workbench traces collect [--providers codex,claude] [--since 30d] [--workspace DIR] [--limit N] [--json]",
461
- " workbench traces list [--providers codex,claude] [--since 30d] [--workspace DIR] [--limit N] [--json]",
462
- " workbench traces show TRACE_ID [--providers codex,claude] [--since 30d] [--workspace DIR] [--json]",
463
- "",
464
- "Inspect local installed-agent traces without calling an LLM. These are not Workbench run execution traces; use workbench executions trace for runtime traces.",
465
- "",
466
- "Examples:",
467
- " workbench traces list --limit 10 --json",
468
- " workbench traces show codex:SESSION:TRACE --json",
469
- ],
470
- "traces collect": [
471
- "Usage:",
472
- " workbench traces collect [--providers codex,claude] [--since 30d] [--workspace DIR] [--limit N] [--json]",
473
- "",
474
- "Recover recent local Codex and Claude Code sessions to stdout without calling an LLM. --limit defaults to 3 per provider and output reports when matches were capped.",
475
- "",
476
- "Examples:",
477
- " workbench traces collect --limit 5 --json",
478
- " workbench traces collect --providers codex --workspace . --since 14d",
479
- ],
480
- "traces list": [
481
- "Usage:",
482
- " workbench traces list [--providers codex,claude] [--since 30d] [--workspace DIR] [--limit N] [--json]",
483
- "",
484
- "List recent local Codex and Claude Code sessions as compact trace rows with ids for follow-up inspection.",
485
- "",
486
- "Examples:",
487
- " workbench traces list --limit 10 --json",
488
- " workbench traces list --providers claude --workspace .",
489
- ],
490
- "traces show": [
491
- "Usage:",
492
- " workbench traces show TRACE_ID [--providers codex,claude] [--since 30d] [--workspace DIR] [--json]",
493
- "",
494
- "Show one selected local trace digest by exact id.",
495
- "",
496
- "Examples:",
497
- " workbench traces show codex:SESSION:TRACE --json",
498
- " workbench traces show claude:SESSION:TRACE --workspace .",
499
- ],
500
- auth: [
501
- "Usage:",
502
- " workbench auth <command> [options]",
503
- "",
504
- "Connect adapter auth for local and remote runs.",
505
- "",
506
- "Commands:",
507
- " workbench auth connect ADAPTER[/SLOT] [--dir DIR] [--method METHOD] [--profile PROFILE] [--profile-root DIR] [--local-only] [--json]",
508
- " workbench auth disconnect ADAPTER[/SLOT] [--profile PROFILE] [--local-only] [--json]",
509
- "",
510
- "Examples:",
511
- " workbench auth connect codex --method oauth --json",
512
- " workbench auth disconnect codex --local-only",
513
- ],
514
- "auth connect": [
515
- "Usage:",
516
- " workbench auth connect ADAPTER[/SLOT] [--dir DIR] [--method METHOD] [--profile PROFILE] [--profile-root DIR] [--local-only] [--json]",
517
- "",
518
- "Connect adapter auth using a manifest-supported method.",
519
- "",
520
- "Examples:",
521
- " workbench auth connect codex --method oauth --json",
522
- " workbench auth connect claude --method api-key --profile default --local-only",
523
- ],
524
- "auth disconnect": [
525
- "Usage:",
526
- " workbench auth disconnect ADAPTER[/SLOT] [--profile PROFILE] [--local-only] [--json]",
527
- "",
528
- "Disconnect adapter auth locally and, when logged in, in remote Workbench.",
529
- "",
530
- "Examples:",
531
- " workbench auth disconnect codex --local-only",
532
- " workbench auth disconnect claude --profile default --json",
533
- ],
534
- }).map(([key, lines]) => [key, lines.join("\n")]));
535
- export function commandUsage(commandPath) {
536
- return commandHelp[commandPath] ?? null;
537
- }
@@ -1,18 +0,0 @@
1
- import type { WorkbenchInspection } from "@workbench-ai/workbench-core";
2
- export interface LocalWorkbenchDevServer {
3
- url: string;
4
- close: () => Promise<void>;
5
- }
6
- export interface LocalWorkbenchDevServerOptions {
7
- workspace: string;
8
- host: string;
9
- port: number;
10
- assetsRoot?: string;
11
- }
12
- export interface LocalWorkbenchRequestContext {
13
- workspace: string;
14
- assetsRoot: string;
15
- inspection: WorkbenchInspection;
16
- }
17
- export declare function startLocalWorkbenchDevServer(options: LocalWorkbenchDevServerOptions): Promise<LocalWorkbenchDevServer>;
18
- //# sourceMappingURL=dev-open-server.d.ts.map
@@ -1 +0,0 @@
1
- {"version":3,"file":"dev-open-server.d.ts","sourceRoot":"","sources":["../src/dev-open-server.ts"],"names":[],"mappings":"AAKA,OAAO,KAAK,EAAE,mBAAmB,EAAE,MAAM,8BAA8B,CAAC;AAOxE,MAAM,WAAW,uBAAuB;IACtC,GAAG,EAAE,MAAM,CAAC;IACZ,KAAK,EAAE,MAAM,OAAO,CAAC,IAAI,CAAC,CAAC;CAC5B;AAED,MAAM,WAAW,8BAA8B;IAC7C,SAAS,EAAE,MAAM,CAAC;IAClB,IAAI,EAAE,MAAM,CAAC;IACb,IAAI,EAAE,MAAM,CAAC;IACb,UAAU,CAAC,EAAE,MAAM,CAAC;CACrB;AAWD,MAAM,WAAW,4BAA4B;IAC3C,SAAS,EAAE,MAAM,CAAC;IAClB,UAAU,EAAE,MAAM,CAAC;IACnB,UAAU,EAAE,mBAAmB,CAAC;CACjC;AAID,wBAAsB,4BAA4B,CAChD,OAAO,EAAE,8BAA8B,GACtC,OAAO,CAAC,uBAAuB,CAAC,CA4ClC"}