npm - @workbench-ai/workbench - Versions diffs - 0.0.49 → 0.0.51 - Mend

@workbench-ai/workbench 0.0.49 → 0.0.51

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (26)

package/dist/adapter-project.js +3 -3
package/dist/benchmark-fingerprint.d.ts +1 -1
package/dist/benchmark-fingerprint.d.ts.map +1 -1
package/dist/benchmark-fingerprint.js +4 -6
package/dist/command-model.d.ts.map +1 -1
package/dist/command-model.js +95 -453
package/dist/dev-open/client.css +42 -43
package/dist/dev-open/client.js +145 -145
package/dist/dev-open-server.d.ts +12 -22
package/dist/dev-open-server.d.ts.map +1 -1
package/dist/dev-open-server.js +82 -42
package/dist/index.d.ts.map +1 -1
package/dist/index.js +1758 -1245
package/dist/init-scaffold.d.ts +4 -4
package/dist/init-scaffold.d.ts.map +1 -1
package/dist/init-scaffold.js +2 -2
package/dist/init-template-pack.d.ts +4 -4
package/dist/init-template-pack.d.ts.map +1 -1
package/dist/init-template-pack.js +47 -59
package/dist/local-archive.d.ts +15 -11
package/dist/local-archive.d.ts.map +1 -1
package/dist/local-archive.js +325 -83
package/dist/project-source.d.ts +14 -17
package/dist/project-source.d.ts.map +1 -1
package/dist/project-source.js +80 -151
package/package.json +4 -4

package/dist/command-model.js CHANGED

@@ -1,13 +1,13 @@
 const sourceDirectoryHelp = [
     "Directory:",
-    "  Run from a Workbench project containing benchmark.yaml plus subjects/<name>/subject.yaml.",
-    "  Subject manifests declare their files with files.path, usually files beside subject.yaml.",
-    "  Pass --dir DIR or pass benchmark.yaml, subjects/<name>, or subjects/<name>/subject.yaml as SOURCE.",
+    "  Run from a Workbench project containing benchmark.yaml plus candidates/<name>/candidate.yaml.",
+    "  Candidate manifests declare their files with files.path, usually files beside candidate.yaml.",
+    "  Pass --dir DIR or pass benchmark.yaml, candidates/<name>, or candidates/<name>/candidate.yaml as SOURCE.",
 ];
 export const LOCAL_DEV_OPEN_LIFECYCLE_NOTE = "Keep this command running while using the local web view; Ctrl-C stops the server and the page will stop working.";
 const hostedWatchLifecycleNoteLines = [
     "Watching is client-side polling only.",
-    "Stopping this command does not cancel the hosted run; use workbench cloud runs cancel RUN_ID to cancel it.",
+    "Stopping this command does not cancel the hosted run.",
 ];
 export const HOSTED_WATCH_LIFECYCLE_NOTE = hostedWatchLifecycleNoteLines.join(" ");
 const localOpenLifecycleHelp = [
@@ -34,45 +34,31 @@ const rootLines = [
     "  workbench adapters inspect ID [--dir DIR] [--json]",
     "  workbench adapters test ID|SOURCE [--dir DIR] [--request PATH] [--output DIR] [--json]",
     "",
-    "Local runs:",
-    "  workbench eval [SOURCE] [--dir DIR] [--subject ID] [--samples N] [--json]",
-    "  workbench improve [SOURCE] [--dir DIR] [--from SUBJECT_ID] [--optimizer OPTIMIZER_YAML] [--budget N] [--samples N] [--json]",
-    "  workbench open [SOURCE] [--dir DIR] [--run RUN_ID] [--host HOST] [--port N] [--no-open] [--json]",
-    "  workbench restore [--dir DIR] [--subject ID] [--dry-run] [--yes] [--json]",
+    "Runs:",
+    "  workbench eval [SOURCE] [--dir DIR] [--hosted] [--benchmark OWNER/BENCHMARK] [--candidate CANDIDATE_ID] [--base CANDIDATE_ID] [--runs RUNS|all] [--samples N] [--rerun] [--watch] [--dry-run] [--json]",
+    "  workbench improve [SOURCE] [--dir DIR] [--hosted] [--benchmark OWNER/BENCHMARK] [--from CANDIDATE_ID] [--base CANDIDATE_ID] [--runs RUN] [--budget N] [--samples N] [--rerun] [--watch] [--dry-run] [--json]",
+    "  workbench retry TARGET_ID [--dir DIR] [--hosted] [--benchmark OWNER/BENCHMARK] [--watch] [--interval-ms N] [--timeout-ms N] [--json]",
+    "  workbench open [SOURCE|OWNER/BENCHMARK|RUN_ID|CANDIDATE_ID] [--dir DIR] [--hosted] [--benchmark OWNER/BENCHMARK] [--run RUN_ID] [--host HOST] [--port N] [--no-open] [--json]",
+    "  workbench restore [--dir DIR] [--candidate CANDIDATE_ID] [--dry-run] [--yes] [--json]",
     "",
     "Local inspection:",
     "  workbench runs list [--dir DIR] [--json]",
     "  workbench runs show RUN_ID [--dir DIR] [--json]",
-    "  workbench subjects list [--dir DIR] [--json]",
-    "  workbench subjects show SUBJECT_ID [--dir DIR] [--json]",
-    "  workbench subjects files [--dir DIR] [--subject ID] [--json]",
-    "  workbench subjects preview --path PATH [--dir DIR] [--subject ID] [--output PATH|-] [--json]",
+    "  workbench candidates list [--dir DIR] [--json]",
+    "  workbench candidates show CANDIDATE_ID [--dir DIR] [--json]",
+    "  workbench candidates files [--dir DIR] [--candidate CANDIDATE_ID] [--json]",
+    "  workbench candidates preview --path PATH [--dir DIR] [--candidate CANDIDATE_ID] [--output PATH|-] [--json]",
     "  workbench traces collect [--providers codex,claude] [--since 30d] [--workspace DIR] [--limit N] [--json]",
     "  workbench traces list [--providers codex,claude] [--since 30d] [--workspace DIR] [--limit N] [--json]",
     "  workbench traces show TRACE_ID [--providers codex,claude] [--since 30d] [--workspace DIR] [--json]",
     "",
-    "Remote sync:",
+    "Remote:",
     "  workbench login [--base-url URL] [--no-open] [--json]",
     "  workbench logout [--json]",
     "  workbench whoami [--dir DIR] [--json]",
-    "  workbench clone OWNER/BENCHMARK[@REF] [DIR] [--dry-run] [--json]",
-    "  workbench remote show [--dir DIR] [--json]",
-    "  workbench remote add origin OWNER/BENCHMARK[@REF] [--dir DIR] [--json]",
-    "  workbench remote set-url origin OWNER/BENCHMARK[@REF] [--dir DIR] [--json]",
-    "  workbench remote remove origin [--dir DIR] [--json]",
-    "  workbench fetch [--dir DIR] [--json]",
+    "  workbench clone OWNER/BENCHMARK [DIR] [--dry-run] [--json]",
     "  workbench pull [--dir DIR] [--dry-run] [--json]",
-    "  workbench push [SOURCE] [--dir DIR] [--tag TAG] [--visibility public|private] [--dry-run] [--json]",
-    "",
-    "Hosted runs and resources:",
-    "  workbench cloud eval [SOURCE] [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--base SUBJECT_ID] [--samples N] [--watch] [--dry-run] [--json]",
-    "  workbench cloud improve [SOURCE] [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--base SUBJECT_ID] [--optimizer OPTIMIZER_YAML] [--budget N] [--samples N] [--watch] [--dry-run] [--json]",
-    "  workbench cloud open [OWNER/BENCHMARK[@REF]|RUN_ID|SUBJECT_ID] [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--no-open] [--json]",
-    "  workbench cloud watch RUN_ID [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--interval-ms N] [--timeout-ms N] [--json]",
-    "  workbench cloud logs RUN_ID [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--json]",
-    "  workbench cloud star OWNER/BENCHMARK [--json]",
-    "  workbench cloud unstar OWNER/BENCHMARK [--json]",
-    "  workbench cloud benchmarks|runs|subjects <command> [options]",
+    "  workbench push [SOURCE] [--dir DIR] [--visibility public|private] [--dry-run] [--json]",
     "",
     "Auth:",
     "  workbench auth connect ADAPTER[/SLOT] [--dir DIR] [--method METHOD] [--profile PROFILE] [--profile-root DIR] [--local-only] [--json]",
@@ -80,11 +66,12 @@ const rootLines = [
     "",
     "Examples:",
     "  workbench init --skill invoice-review --agent codex",
-    "  workbench eval subjects/codex --samples 1",
+    "  workbench eval candidates/current --samples 1",
     "  workbench improve --budget 2 --samples 1",
+    "  workbench retry eval_local_123 --json",
     "  workbench open --no-open --json",
-    "  workbench push --tag v1",
-    "  workbench cloud eval subjects/codex --benchmark openbench/invoice-review@v1 --watch",
+    "  workbench push",
+    "  workbench eval --hosted candidates/current --benchmark openbench/invoice-review --watch",
     "",
     "Environment:",
     "  WORKBENCH_API_URL sets the hosted Workbench API base URL.",
@@ -118,7 +105,7 @@ const commandHelp = Object.fromEntries(Object.entries({
         "  workbench init [DIR] --skill NAME --agent ADAPTER [--from PATH] [--example] [--json]",
         "  workbench init [DIR] --command NAME [--from PATH] [--example] [--json]",
         "",
-        "Scaffold a local Workbench project. benchmark.yaml selects an engine; the built-in workbench engine owns tasks, environment, and scoring under engine.with. subjects/<name>/subject.yaml owns files.path plus optional prepare and run behavior. optimizers/<name>.yaml owns improvement behavior.",
+        "Scaffold a local Workbench project. benchmark.yaml selects an engine; the built-in workbench engine owns tasks, environment, and scoring under engine.with. candidates/<name>/candidate.yaml owns files.path plus optional prepare and run behavior. Candidate manifests own improvement behavior.",
         "",
         "Examples:",
         "  workbench init --skill invoice-review --agent codex",
@@ -128,51 +115,69 @@ const commandHelp = Object.fromEntries(Object.entries({
         "Usage:",
         "  workbench check [SOURCE] [--dir DIR] [--json]",
         "",
-        "Validate benchmark.yaml, one subject manifest, and an optional optimizer manifest.",
+        "Validate benchmark.yaml, one candidate manifest.",
         "",
         "Examples:",
         "  workbench check",
-        "  workbench check subjects/codex --json",
+        "  workbench check candidates/current --json",
     ]),
-    eval: withSourceDirectoryHelp([
+    eval: withSourceDirectoryHelp(withLifecycleHelp([
         "Usage:",
-        "  workbench eval [SOURCE] [--dir DIR] [--subject ID] [--samples N] [--json]",
+        "  workbench eval [SOURCE] [--dir DIR] [--candidate CANDIDATE_ID] [--runs RUNS|all] [--samples N] [--rerun] [--json]",
+        "  workbench eval --hosted [SOURCE] [--dir DIR] [--benchmark OWNER/BENCHMARK] [--base CANDIDATE_ID] [--runs RUNS|all] [--samples N] [--rerun] [--watch] [--dry-run] [--json]",
         "",
-        "Run the selected local subject against the current benchmark and record attempts, results, traces, artifacts, and a run record under .workbench/runtime.",
+        "Ensure the selected candidate run has an evaluation for the current benchmark. Without --hosted, execution writes local records. With --hosted, Workbench starts or reuses a hosted run against the configured remote or --benchmark target. Completed work is reused only when candidate, run configuration, source, adapters, benchmark, and samples match; use --rerun to intentionally spend again.",
         "",
         "Examples:",
         "  workbench eval --samples 1",
-        "  workbench eval subjects/codex --samples 2 --json",
-    ]),
-    improve: withSourceDirectoryHelp([
+        "  workbench eval --hosted candidates/current --samples 1 --watch --json",
+        "  workbench eval candidates/current --samples 2 --json",
+    ], hostedWatchLifecycleHelp)),
+    improve: withSourceDirectoryHelp(withLifecycleHelp([
         "Usage:",
-        "  workbench improve [SOURCE] [--dir DIR] [--from SUBJECT_ID] [--optimizer OPTIMIZER_YAML] [--budget N] [--samples N] [--json]",
+        "  workbench improve [SOURCE] [--dir DIR] [--from CANDIDATE_ID] [--runs RUN] [--budget N] [--samples N] [--rerun] [--json]",
+        "  workbench improve --hosted [SOURCE] [--dir DIR] [--benchmark OWNER/BENCHMARK] [--base CANDIDATE_ID] [--runs RUN] [--budget N] [--samples N] [--rerun] [--watch] [--dry-run] [--json]",
         "",
-        "Run local subject improvement. By default, Workbench improves the current subject. If it has not been evaluated yet, Workbench evaluates it first. Use --from to improve an explicit subject id.",
+        "Ensure a candidate improvement exists for the selected base, run, budget, and samples. Without --hosted, execution writes local records. With --hosted, Workbench starts or reuses hosted work against the configured remote or --benchmark target. Completed work is reused only when base, run configuration, source, adapters, benchmark, budget, and samples match; use --rerun to intentionally spend again.",
         "",
         "Examples:",
         "  workbench improve --budget 1 --samples 1",
-        "  workbench improve subjects/codex --from subj_123 --optimizer optimizers/codex.yaml --json",
-    ]),
+        "  workbench improve --hosted candidates/current --budget 1 --samples 1 --watch --json",
+        "  workbench improve candidates/current --from candidate_123 --json",
+    ], hostedWatchLifecycleHelp)),
+    retry: withSourceDirectoryHelp(withLifecycleHelp([
+        "Usage:",
+        "  workbench retry TARGET_ID [--dir DIR] [--json]",
+        "  workbench retry --hosted TARGET_ID [--dir DIR] [--benchmark OWNER/BENCHMARK] [--watch] [--interval-ms N] [--timeout-ms N] [--json]",
+        "",
+        "Retry a failed run or evaluation by replaying its recorded candidate, configuration, sample count, and improve budget. Use --hosted for hosted records.",
+        "",
+        "Examples:",
+        "  workbench retry eval_local_123 --json",
+        "  workbench retry --hosted run_123 --watch --json",
+        "  workbench retry run_local_123 --dir ./my-benchmark",
+    ], hostedWatchLifecycleHelp)),
     open: withSourceDirectoryHelp(withLifecycleHelp([
         "Usage:",
         "  workbench open [SOURCE] [--dir DIR] [--run RUN_ID] [--host HOST] [--port N] [--no-open] [--json]",
+        "  workbench open --hosted [OWNER/BENCHMARK|RUN_ID|CANDIDATE_ID] [--dir DIR] [--benchmark OWNER/BENCHMARK] [--no-open] [--json]",
         "",
-        "Start the local Workbench web view for the project and keep serving it until stopped. When a run is supplied, open directly to that run. Without --run, Workbench opens the latest run when one exists.",
+        "Start the local Workbench web view for the project and keep serving it until stopped. With --hosted, print and optionally open the hosted project URL instead.",
         "",
         "Examples:",
         "  workbench open",
+        "  workbench open --hosted --no-open --json",
         "  workbench open --run eval_local_123 --port 4317 --no-open --json",
     ], localOpenLifecycleHelp)),
     restore: withSourceDirectoryHelp([
         "Usage:",
-        "  workbench restore [--dir DIR] [--subject ID] [--dry-run] [--yes] [--json]",
+        "  workbench restore [--dir DIR] [--candidate CANDIDATE_ID] [--dry-run] [--yes] [--json]",
         "",
-        "Restore a local subject snapshot into the subject files directory.",
+        "Restore a local candidate snapshot into the candidate files directory.",
         "",
         "Examples:",
-        "  workbench restore --subject subj_123 --dry-run",
-        "  workbench restore --subject subj_123 --yes",
+        "  workbench restore --candidate candidate_123 --dry-run",
+        "  workbench restore --candidate candidate_123 --yes",
     ]),
     runs: [
         "Usage:",
@@ -208,140 +213,77 @@ const commandHelp = Object.fromEntries(Object.entries({
         "  workbench runs show eval_local_123",
         "  workbench runs show eval_local_123 --json",
     ]),
-    subjects: [
+    candidates: [
         "Usage:",
-        "  workbench subjects <command> [options]",
+        "  workbench candidates <command> [options]",
         "",
-        "Inspect local subjects.",
+        "Inspect local candidates.",
         "",
         "Commands:",
-        "  workbench subjects list [--dir DIR] [--json]",
-        "  workbench subjects show SUBJECT_ID [--dir DIR] [--json]",
-        "  workbench subjects files [--dir DIR] [--subject ID] [--json]",
-        "  workbench subjects preview --path PATH [--dir DIR] [--subject ID] [--output PATH|-] [--json]",
+        "  workbench candidates list [--dir DIR] [--json]",
+        "  workbench candidates show CANDIDATE_ID [--dir DIR] [--json]",
+        "  workbench candidates files [--dir DIR] [--candidate CANDIDATE_ID] [--json]",
+        "  workbench candidates preview --path PATH [--dir DIR] [--candidate CANDIDATE_ID] [--output PATH|-] [--json]",
         "",
         "Examples:",
-        "  workbench subjects list --json",
-        "  workbench subjects preview --subject subj_123 --path SKILL.md --output -",
+        "  workbench candidates list --json",
+        "  workbench candidates preview --candidate candidate_123 --path SKILL.md --output -",
     ],
-    "subjects list": withSourceDirectoryHelp([
+    "candidates list": withSourceDirectoryHelp([
         "Usage:",
-        "  workbench subjects list [--dir DIR] [--json]",
+        "  workbench candidates list [--dir DIR] [--json]",
         "",
-        "List local subjects.",
+        "List local candidates.",
         "",
         "Examples:",
-        "  workbench subjects list",
-        "  workbench subjects list --json",
+        "  workbench candidates list",
+        "  workbench candidates list --json",
     ]),
-    "subjects show": withSourceDirectoryHelp([
+    "candidates show": withSourceDirectoryHelp([
         "Usage:",
-        "  workbench subjects show SUBJECT_ID [--dir DIR] [--json]",
+        "  workbench candidates show CANDIDATE_ID [--dir DIR] [--json]",
         "",
-        "Show one local subject.",
+        "Show one local candidate.",
         "",
         "Examples:",
-        "  workbench subjects show subj_123",
-        "  workbench subjects show subj_123 --json",
+        "  workbench candidates show candidate_123",
+        "  workbench candidates show candidate_123 --json",
     ]),
-    "subjects files": withSourceDirectoryHelp([
+    "candidates files": withSourceDirectoryHelp([
         "Usage:",
-        "  workbench subjects files [--dir DIR] [--subject ID] [--json]",
+        "  workbench candidates files [--dir DIR] [--candidate CANDIDATE_ID] [--json]",
         "",
-        "List files in a local subject snapshot.",
+        "List files in a local candidate snapshot.",
         "",
         "Examples:",
-        "  workbench subjects files --subject subj_123",
-        "  workbench subjects files --subject subj_123 --json",
+        "  workbench candidates files --candidate candidate_123",
+        "  workbench candidates files --candidate candidate_123 --json",
     ]),
-    "subjects preview": withSourceDirectoryHelp([
+    "candidates preview": withSourceDirectoryHelp([
         "Usage:",
-        "  workbench subjects preview --path PATH [--dir DIR] [--subject ID] [--output PATH|-] [--json]",
+        "  workbench candidates preview --path PATH [--dir DIR] [--candidate CANDIDATE_ID] [--output PATH|-] [--json]",
         "",
-        "Preview a file from a local subject snapshot.",
+        "Preview a file from a local candidate snapshot.",
         "",
         "Examples:",
-        "  workbench subjects preview --subject subj_123 --path SKILL.md",
-        "  workbench subjects preview --subject subj_123 --path SKILL.md --output -",
+        "  workbench candidates preview --candidate candidate_123 --path SKILL.md",
+        "  workbench candidates preview --candidate candidate_123 --path SKILL.md --output -",
     ]),
     clone: [
         "Usage:",
-        "  workbench clone OWNER/BENCHMARK[@REF] [DIR] [--dry-run] [--json]",
+        "  workbench clone OWNER/BENCHMARK [DIR] [--dry-run] [--json]",
         "",
-        "Download a hosted benchmark project into a local Workbench project and write .workbench/origin.json.",
+        "Clone hosted source and runtime history into a local Workbench project and remember it as the remote.",
         "",
         "Examples:",
         "  workbench clone openbench/invoice-review",
-        "  workbench clone openbench/invoice-review@v1 ./invoice-review --dry-run --json",
+        "  workbench clone openbench/invoice-review ./invoice-review --dry-run --json",
     ],
-    remote: withSourceDirectoryHelp([
-        "Usage:",
-        "  workbench remote show [--dir DIR] [--json]",
-        "  workbench remote add origin OWNER/BENCHMARK[@REF] [--dir DIR] [--json]",
-        "  workbench remote set-url origin OWNER/BENCHMARK[@REF] [--dir DIR] [--json]",
-        "  workbench remote remove origin [--dir DIR] [--json]",
-        "",
-        "Manage the project origin used by fetch, pull, and push.",
-        "",
-        "Examples:",
-        "  workbench remote show --json",
-        "  workbench remote add origin openbench/invoice-review@v1",
-    ]),
-    "remote show": withSourceDirectoryHelp([
-        "Usage:",
-        "  workbench remote show [--dir DIR] [--json]",
-        "",
-        "Show the configured origin.",
-        "",
-        "Examples:",
-        "  workbench remote show",
-        "  workbench remote show --json",
-    ]),
-    "remote add": withSourceDirectoryHelp([
-        "Usage:",
-        "  workbench remote add origin OWNER/BENCHMARK[@REF] [--dir DIR] [--json]",
-        "",
-        "Set the project origin.",
-        "",
-        "Examples:",
-        "  workbench remote add origin openbench/invoice-review@v1",
-        "  workbench remote add origin openbench/invoice-review --json",
-    ]),
-    "remote set-url": withSourceDirectoryHelp([
-        "Usage:",
-        "  workbench remote set-url origin OWNER/BENCHMARK[@REF] [--dir DIR] [--json]",
-        "",
-        "Replace the project origin.",
-        "",
-        "Examples:",
-        "  workbench remote set-url origin openbench/invoice-review@v2",
-        "  workbench remote set-url origin openbench/invoice-review@v2 --json",
-    ]),
-    "remote remove": withSourceDirectoryHelp([
-        "Usage:",
-        "  workbench remote remove origin [--dir DIR] [--json]",
-        "",
-        "Remove the project origin.",
-        "",
-        "Examples:",
-        "  workbench remote remove origin",
-        "  workbench remote remove origin --json",
-    ]),
-    fetch: withSourceDirectoryHelp([
-        "Usage:",
-        "  workbench fetch [--dir DIR] [--json]",
-        "",
-        "Download remote source into .workbench/fetch without changing project files.",
-        "",
-        "Examples:",
-        "  workbench fetch",
-        "  workbench fetch --json",
-    ]),
     pull: withSourceDirectoryHelp([
         "Usage:",
         "  workbench pull [--dir DIR] [--dry-run] [--json]",
         "",
-        "Update managed project source files from the configured origin.",
+        "Pull source and runtime history from the remembered remote into the local project.",
         "",
         "Examples:",
         "  workbench pull --dry-run",
@@ -349,13 +291,13 @@ const commandHelp = Object.fromEntries(Object.entries({
     ]),
     push: withSourceDirectoryHelp([
         "Usage:",
-        "  workbench push [SOURCE] [--dir DIR] [--tag TAG] [--visibility public|private] [--dry-run] [--json]",
+        "  workbench push [SOURCE] [--dir DIR] [--visibility public|private] [--dry-run] [--json]",
         "",
-        "Create or update the hosted benchmark version from local project source and write .workbench/origin.json.",
+        "Push local project source and runtime history to the remembered remote, or create one when the project has not been pushed before.",
         "",
         "Examples:",
-        "  workbench push --tag v1 --dry-run",
-        "  workbench push subjects/codex --visibility private --json",
+        "  workbench push --dry-run",
+        "  workbench push candidates/current --visibility private --json",
     ]),
     login: [
         "Usage:",
@@ -516,307 +458,7 @@ const commandHelp = Object.fromEntries(Object.entries({
         "  workbench auth disconnect codex --local-only",
         "  workbench auth disconnect claude --profile default --json",
     ],
-    cloud: [
-        "Usage:",
-        "  workbench cloud <command> [options]",
-        "",
-        "Hosted Workbench Cloud execution and resource commands.",
-        "",
-        "Commands:",
-        "  workbench cloud eval [SOURCE] [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--base SUBJECT_ID] [--samples N] [--watch] [--dry-run] [--json]",
-        "  workbench cloud improve [SOURCE] [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--base SUBJECT_ID] [--optimizer OPTIMIZER_YAML] [--budget N] [--samples N] [--watch] [--dry-run] [--json]",
-        "  workbench cloud open [OWNER/BENCHMARK[@REF]|RUN_ID|SUBJECT_ID] [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--no-open] [--json]",
-        "  workbench cloud watch RUN_ID [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--interval-ms N] [--timeout-ms N] [--json]",
-        "  workbench cloud logs RUN_ID [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--json]",
-        "  workbench cloud star OWNER/BENCHMARK [--json]",
-        "  workbench cloud unstar OWNER/BENCHMARK [--json]",
-        "  workbench cloud benchmarks|runs|subjects <command> [options]",
-        "",
-        "Examples:",
-        "  workbench cloud eval subjects/codex --benchmark openbench/invoice-review@v1 --dry-run --json",
-        "  workbench cloud runs list --benchmark openbench/invoice-review --json",
-    ],
-    "cloud star": [
-        "Usage:",
-        "  workbench cloud star OWNER/BENCHMARK [--json]",
-        "",
-        "Star a hosted benchmark.",
-        "",
-        "Examples:",
-        "  workbench cloud star openbench/invoice-review",
-        "  workbench cloud star openbench/invoice-review --json",
-    ],
-    "cloud unstar": [
-        "Usage:",
-        "  workbench cloud unstar OWNER/BENCHMARK [--json]",
-        "",
-        "Remove your star from a hosted benchmark.",
-        "",
-        "Examples:",
-        "  workbench cloud unstar openbench/invoice-review",
-        "  workbench cloud unstar openbench/invoice-review --json",
-    ],
-    "cloud eval": withSourceDirectoryHelp(withLifecycleHelp([
-        "Usage:",
-        "  workbench cloud eval [SOURCE] [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--base SUBJECT_ID] [--samples N] [--watch] [--dry-run] [--json]",
-        "",
-        "Submit subject files to Workbench Cloud and run hosted evaluation.",
-        "",
-        "Examples:",
-        "  workbench cloud eval subjects/codex --benchmark openbench/invoice-review@v1 --dry-run --json",
-        "  workbench cloud eval --benchmark openbench/invoice-review --watch",
-    ], hostedWatchLifecycleHelp)),
-    "cloud improve": withSourceDirectoryHelp(withLifecycleHelp([
-        "Usage:",
-        "  workbench cloud improve [SOURCE] [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--base SUBJECT_ID] [--optimizer OPTIMIZER_YAML] [--budget N] [--samples N] [--watch] [--dry-run] [--json]",
-        "",
-        "Run hosted subject improvement.",
-        "",
-        "Examples:",
-        "  workbench cloud improve --optimizer optimizers/codex.yaml --benchmark openbench/invoice-review --dry-run",
-        "  workbench cloud improve subjects/codex --optimizer optimizers/codex.yaml --watch --json",
-    ], hostedWatchLifecycleHelp)),
-    "cloud open": [
-        "Usage:",
-        "  workbench cloud open [OWNER/BENCHMARK[@REF]|RUN_ID|SUBJECT_ID] [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--no-open] [--json]",
-        "",
-        "Print and open the hosted Workbench URL.",
-        "",
-        "Examples:",
-        "  workbench cloud open openbench/invoice-review --no-open",
-        "  workbench cloud open run_123 --benchmark openbench/invoice-review --json",
-    ],
-    "cloud watch": withSourceDirectoryHelp(withLifecycleHelp([
-        "Usage:",
-        "  workbench cloud watch RUN_ID [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--interval-ms N] [--timeout-ms N] [--json]",
-        "",
-        "Poll a hosted run until it finishes.",
-        "",
-        "Examples:",
-        "  workbench cloud watch run_123 --benchmark openbench/invoice-review",
-        "  workbench cloud watch run_123 --interval-ms 5000 --timeout-ms 600000 --json",
-    ], hostedWatchLifecycleHelp)),
-    "cloud logs": withSourceDirectoryHelp([
-        "Usage:",
-        "  workbench cloud logs RUN_ID [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--json]",
-        "",
-        "Show hosted run job statuses and errors.",
-        "",
-        "Examples:",
-        "  workbench cloud logs run_123 --benchmark openbench/invoice-review",
-        "  workbench cloud logs run_123 --json",
-    ]),
-    "cloud benchmarks": [
-        "Usage:",
-        "  workbench cloud benchmarks <command> [options]",
-        "",
-        "Hosted benchmark resource commands.",
-        "",
-        "Commands:",
-        "  workbench cloud benchmarks list [--json]",
-        "  workbench cloud benchmarks show OWNER/BENCHMARK [--json]",
-        "  workbench cloud benchmarks versions OWNER/BENCHMARK [--json]",
-        "  workbench cloud benchmarks starred [--json]",
-        "  workbench cloud benchmarks delete OWNER/BENCHMARK [--dir DIR] [--dry-run] [--json]",
-        "",
-        "Examples:",
-        "  workbench cloud benchmarks list --json",
-        "  workbench cloud benchmarks show openbench/invoice-review",
-    ],
-    "cloud runs": [
-        "Usage:",
-        "  workbench cloud runs <command> [options]",
-        "",
-        "Hosted run resource commands.",
-        "",
-        "Commands:",
-        "  workbench cloud runs list [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--json]",
-        "  workbench cloud runs show RUN_ID [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--json]",
-        "  workbench cloud runs cancel RUN_ID [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--json]",
-        "",
-        "Examples:",
-        "  workbench cloud runs list --benchmark openbench/invoice-review --json",
-        "  workbench cloud runs show run_123 --benchmark openbench/invoice-review",
-    ],
-    "cloud subjects": [
-        "Usage:",
-        "  workbench cloud subjects <command> [options]",
-        "",
-        "Hosted subject resource commands.",
-        "",
-        "Commands:",
-        "  workbench cloud subjects list [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--json]",
-        "  workbench cloud subjects show SUBJECT_ID [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--json]",
-        "  workbench cloud subjects files SUBJECT_ID [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--json]",
-        "  workbench cloud subjects preview SUBJECT_ID --path PATH [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--output PATH|-] [--json]",
-        "  workbench cloud subjects pull SUBJECT_ID [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--out DIR] [--json]",
-        "  workbench cloud subjects publish SUBJECT_ID [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--json]",
-        "  workbench cloud subjects unpublish SUBJECT_ID [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--json]",
-        "",
-        "Examples:",
-        "  workbench cloud subjects list --benchmark openbench/invoice-review --json",
-        "  workbench cloud subjects preview subj_123 --path SKILL.md --output -",
-    ],
 }).map(([key, lines]) => [key, lines.join("\n")]));
 export function commandUsage(commandPath) {
-    return commandHelp[commandPath] ?? cloudNestedCommandUsage(commandPath);
-}
-const hostedCommandHelp = Object.fromEntries(Object.entries({
-    "benchmarks list": [
-        "Usage:",
-        "  workbench cloud benchmarks list [--json]",
-        "",
-        "List public hosted benchmarks.",
-        "",
-        "Examples:",
-        "  workbench cloud benchmarks list",
-        "  workbench cloud benchmarks list --json",
-    ],
-    "benchmarks show": [
-        "Usage:",
-        "  workbench cloud benchmarks show OWNER/BENCHMARK [--json]",
-        "",
-        "Show one hosted benchmark.",
-        "",
-        "Examples:",
-        "  workbench cloud benchmarks show openbench/invoice-review",
-        "  workbench cloud benchmarks show openbench/invoice-review --json",
-    ],
-    "benchmarks versions": [
-        "Usage:",
-        "  workbench cloud benchmarks versions OWNER/BENCHMARK [--json]",
-        "",
-        "List hosted benchmark versions.",
-        "",
-        "Examples:",
-        "  workbench cloud benchmarks versions openbench/invoice-review",
-        "  workbench cloud benchmarks versions openbench/invoice-review --json",
-    ],
-    "benchmarks starred": [
-        "Usage:",
-        "  workbench cloud benchmarks starred [--json]",
-        "",
-        "List benchmarks starred by the current user.",
-        "",
-        "Examples:",
-        "  workbench cloud benchmarks starred",
-        "  workbench cloud benchmarks starred --json",
-    ],
-    "benchmarks delete": [
-        "Usage:",
-        "  workbench cloud benchmarks delete OWNER/BENCHMARK [--dir DIR] [--dry-run] [--json]",
-        "",
-        "Delete a hosted benchmark project that you own.",
-        "",
-        "Examples:",
-        "  workbench cloud benchmarks delete alice/invoice-review --dry-run",
-        "  workbench cloud benchmarks delete alice/invoice-review --json",
-    ],
-    "runs list": [
-        "Usage:",
-        "  workbench cloud runs list [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--json]",
-        "",
-        "List hosted runs.",
-        "",
-        "Examples:",
-        "  workbench cloud runs list --benchmark openbench/invoice-review",
-        "  workbench cloud runs list --benchmark openbench/invoice-review --json",
-    ],
-    "runs show": [
-        "Usage:",
-        "  workbench cloud runs show RUN_ID [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--json]",
-        "",
-        "Show one hosted run.",
-        "",
-        "Examples:",
-        "  workbench cloud runs show run_123 --benchmark openbench/invoice-review",
-        "  workbench cloud runs show run_123 --json",
-    ],
-    "runs cancel": [
-        "Usage:",
-        "  workbench cloud runs cancel RUN_ID [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--json]",
-        "",
-        "Cancel a hosted run.",
-        "",
-        "Examples:",
-        "  workbench cloud runs cancel run_123 --benchmark openbench/invoice-review",
-        "  workbench cloud runs cancel run_123 --json",
-    ],
-    "subjects list": [
-        "Usage:",
-        "  workbench cloud subjects list [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--json]",
-        "",
-        "List hosted subjects.",
-        "",
-        "Examples:",
-        "  workbench cloud subjects list --benchmark openbench/invoice-review",
-        "  workbench cloud subjects list --json",
-    ],
-    "subjects show": [
-        "Usage:",
-        "  workbench cloud subjects show SUBJECT_ID [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--json]",
-        "",
-        "Show one hosted subject.",
-        "",
-        "Examples:",
-        "  workbench cloud subjects show subj_123 --benchmark openbench/invoice-review",
-        "  workbench cloud subjects show subj_123 --json",
-    ],
-    "subjects files": [
-        "Usage:",
-        "  workbench cloud subjects files SUBJECT_ID [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--json]",
-        "",
-        "List files in a hosted subject snapshot.",
-        "",
-        "Examples:",
-        "  workbench cloud subjects files subj_123 --benchmark openbench/invoice-review",
-        "  workbench cloud subjects files subj_123 --json",
-    ],
-    "subjects preview": [
-        "Usage:",
-        "  workbench cloud subjects preview SUBJECT_ID --path PATH [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--output PATH|-] [--json]",
-        "",
-        "Preview a file from a hosted subject snapshot.",
-        "",
-        "Examples:",
-        "  workbench cloud subjects preview subj_123 --path SKILL.md --output -",
-        "  workbench cloud subjects preview subj_123 --path SKILL.md --benchmark openbench/invoice-review",
-    ],
-    "subjects pull": [
-        "Usage:",
-        "  workbench cloud subjects pull SUBJECT_ID [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--out DIR] [--json]",
-        "",
-        "Download hosted subject files.",
-        "",
-        "Examples:",
-        "  workbench cloud subjects pull subj_123 --out ./subject-files",
-        "  workbench cloud subjects pull subj_123 --benchmark openbench/invoice-review --json",
-    ],
-    "subjects publish": [
-        "Usage:",
-        "  workbench cloud subjects publish SUBJECT_ID [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--json]",
-        "",
-        "Make a hosted subject public.",
-        "",
-        "Examples:",
-        "  workbench cloud subjects publish subj_123 --benchmark openbench/invoice-review",
-        "  workbench cloud subjects publish subj_123 --json",
-    ],
-    "subjects unpublish": [
-        "Usage:",
-        "  workbench cloud subjects unpublish SUBJECT_ID [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--json]",
-        "",
-        "Make a hosted subject private.",
-        "",
-        "Examples:",
-        "  workbench cloud subjects unpublish subj_123 --benchmark openbench/invoice-review",
-        "  workbench cloud subjects unpublish subj_123 --json",
-    ],
-}).map(([key, lines]) => [key, lines.join("\n")]));
-function cloudNestedCommandUsage(commandPath) {
-    if (!commandPath.startsWith("cloud ")) {
-        return null;
-    }
-    const withoutCloud = commandPath.slice("cloud ".length);
-    return hostedCommandHelp[withoutCloud] ?? null;
+    return commandHelp[commandPath] ?? null;
 }