npm - @workbench-ai/workbench - Versions diffs - 0.0.48 → 0.0.50 - Mend

@workbench-ai/workbench 0.0.48 → 0.0.50

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (26)

package/dist/adapter-project.js +3 -3
package/dist/benchmark-fingerprint.d.ts +1 -1
package/dist/benchmark-fingerprint.d.ts.map +1 -1
package/dist/benchmark-fingerprint.js +4 -6
package/dist/command-model.d.ts.map +1 -1
package/dist/command-model.js +144 -119
package/dist/dev-open/client.css +48 -11
package/dist/dev-open/client.js +149 -149
package/dist/dev-open-server.d.ts +9 -22
package/dist/dev-open-server.d.ts.map +1 -1
package/dist/dev-open-server.js +42 -38
package/dist/index.d.ts.map +1 -1
package/dist/index.js +1472 -505
package/dist/init-scaffold.d.ts +4 -4
package/dist/init-scaffold.d.ts.map +1 -1
package/dist/init-scaffold.js +2 -2
package/dist/init-template-pack.d.ts +4 -4
package/dist/init-template-pack.d.ts.map +1 -1
package/dist/init-template-pack.js +47 -59
package/dist/local-archive.d.ts +11 -11
package/dist/local-archive.d.ts.map +1 -1
package/dist/local-archive.js +87 -74
package/dist/project-source.d.ts +14 -17
package/dist/project-source.d.ts.map +1 -1
package/dist/project-source.js +80 -151
package/package.json +4 -4

package/dist/adapter-project.js CHANGED Viewed

@@ -55,7 +55,7 @@ export async function resolveWorkbenchAdaptersForProject(dir, spec) {
                 discovered = true;
                 continue;
             }
-            throw new Error(`Adapter ${id} is referenced by benchmark/subject/optimizer YAML but is not installed. List its source under adapters in the YAML file that uses it.`);
+            throw new Error(`Adapter ${id} is referenced by benchmark/candidate YAML but is not installed. List its source under adapters in the YAML file that uses it.`);
         }
     }
     assertWorkbenchAdapterOperationSupport(rootAdapterOperationRequirements(spec), [...adapters.values()].map((adapter) => adapter.manifest));
@@ -258,8 +258,8 @@ function rootAdapterOperationRequirements(spec) {
     return [
         { invocation: engineResolveInvocationForSpec(spec), operation: "engine.resolve" },
         { invocation: spec.engineRun, operation: "engine.run" },
-        ...(spec.improve ? [{ invocation: spec.improve, operation: "optimizer.improve" }] : []),
-        { invocation: spec.run, operation: "subject.run" },
+        ...(spec.improve ? [{ invocation: spec.improve, operation: "candidate.improve" }] : []),
+        { invocation: spec.run, operation: "candidate.run" },
     ];
 }
 function rootAdapterInvocations(spec) {

package/dist/benchmark-fingerprint.d.ts CHANGED Viewed

@@ -1,6 +1,6 @@
 import type { SurfaceSnapshotFile } from "@workbench-ai/workbench-core";
 import type { LocalProjectSource } from "./project-source.js";
 export declare function localBenchmarkFingerprint(project: LocalProjectSource): string;
-export declare function localSubjectFingerprint(project: LocalProjectSource): string;
+export declare function localCandidateFingerprint(project: LocalProjectSource): string;
 export declare function benchmarkFingerprintForFiles(files: readonly SurfaceSnapshotFile[]): string;
 //# sourceMappingURL=benchmark-fingerprint.d.ts.map

package/dist/benchmark-fingerprint.d.ts.map CHANGED Viewed

	@@ -1 +1 @@
1	- {"version":3,"file":"benchmark-fingerprint.d.ts","sourceRoot":"","sources":["../src/benchmark-fingerprint.ts"],"names":[],"mappings":"AAEA,OAAO,KAAK,EAAE,mBAAmB,EAAE,MAAM,8BAA8B,CAAC;AAExE,OAAO,KAAK,EAAE,kBAAkB,EAAE,MAAM,qBAAqB,CAAC;AAE9D,wBAAgB,yBAAyB,CAAC,OAAO,EAAE,kBAAkB,GAAG,MAAM,CAO7E;AAED,wBAAgB,uBAAuB,CAAC,OAAO,EAAE,kBAAkB,GAAG,MAAM,CAQ3E;AAED,wBAAgB,4BAA4B,CAC1C,KAAK,EAAE,SAAS,mBAAmB,EAAE,GACpC,MAAM,CAgBR"}
1	+ {"version":3,"file":"benchmark-fingerprint.d.ts","sourceRoot":"","sources":["../src/benchmark-fingerprint.ts"],"names":[],"mappings":"AAEA,OAAO,KAAK,EAAE,mBAAmB,EAAE,MAAM,8BAA8B,CAAC;AAExE,OAAO,KAAK,EAAE,kBAAkB,EAAE,MAAM,qBAAqB,CAAC;AAE9D,wBAAgB,yBAAyB,CAAC,OAAO,EAAE,kBAAkB,GAAG,MAAM,CAO7E;AAED,wBAAgB,yBAAyB,CAAC,OAAO,EAAE,kBAAkB,GAAG,MAAM,CAM7E;AAED,wBAAgB,4BAA4B,CAC1C,KAAK,EAAE,SAAS,mBAAmB,EAAE,GACpC,MAAM,CAgBR"}

package/dist/benchmark-fingerprint.js CHANGED Viewed

@@ -7,13 +7,11 @@ export function localBenchmarkFingerprint(project) {
         ...benchmarkAdapterFiles(project),
     ]);
 }
-export function localSubjectFingerprint(project) {
+export function localCandidateFingerprint(project) {
     const hash = createHash("sha256");
-    hash.update("workbench-subject-v1\0");
-    hash.update(project.subjectSource);
-    hash.update("\0runner\0");
-    hash.update(JSON.stringify(project.spec.run));
-    hashSurfaceFiles(hash, project.subjectFiles);
+    hash.update("workbench-candidate-v1\0");
+    hash.update(project.candidateSource);
+    hashSurfaceFiles(hash, project.candidateFiles);
     return hash.digest("hex");
 }
 export function benchmarkFingerprintForFiles(files) {

package/dist/command-model.d.ts.map CHANGED Viewed

	@@ -1 +1 @@
1	- {"version":3,"file":"command-model.d.ts","sourceRoot":"","sources":["../src/command-model.ts"],"names":[],"mappings":"AAOA,eAAO,MAAM,6BAA6B,sHAC2E,CAAC;AAOtH,eAAO,MAAM,2BAA2B,QAA0C,CAAC;AAuFnF,eAAO,MAAM,SAAS,QAAuB,CAAC;AA8jB9C,wBAAgB,YAAY,CAAC,WAAW,EAAE,MAAM,GAAG,MAAM,GAAG,IAAI,CAE/D"}
1	+ {"version":3,"file":"command-model.d.ts","sourceRoot":"","sources":["../src/command-model.ts"],"names":[],"mappings":"AAOA,eAAO,MAAM,6BAA6B,sHAC2E,CAAC;AAOtH,eAAO,MAAM,2BAA2B,QAA0C,CAAC;AA0FnF,eAAO,MAAM,SAAS,QAAuB,CAAC;AAolB9C,wBAAgB,YAAY,CAAC,WAAW,EAAE,MAAM,GAAG,MAAM,GAAG,IAAI,CAE/D"}

package/dist/command-model.js CHANGED Viewed

@@ -1,8 +1,8 @@
 const sourceDirectoryHelp = [
     "Directory:",
-    "  Run from a Workbench project containing benchmark.yaml plus subjects/<name>/subject.yaml.",
-    "  Subject manifests declare their files with files.path, usually files beside subject.yaml.",
-    "  Pass --dir DIR or pass benchmark.yaml, subjects/<name>, or subjects/<name>/subject.yaml as SOURCE.",
+    "  Run from a Workbench project containing benchmark.yaml plus candidates/<name>/candidate.yaml.",
+    "  Candidate manifests declare their files with files.path, usually files beside candidate.yaml.",
+    "  Pass --dir DIR or pass benchmark.yaml, candidates/<name>, or candidates/<name>/candidate.yaml as SOURCE.",
 ];
 export const LOCAL_DEV_OPEN_LIFECYCLE_NOTE = "Keep this command running while using the local web view; Ctrl-C stops the server and the page will stop working.";
 const hostedWatchLifecycleNoteLines = [
@@ -35,18 +35,19 @@ const rootLines = [
     "  workbench adapters test ID|SOURCE [--dir DIR] [--request PATH] [--output DIR] [--json]",
     "",
     "Local runs:",
-    "  workbench eval [SOURCE] [--dir DIR] [--subject ID] [--samples N] [--json]",
-    "  workbench improve [SOURCE] [--dir DIR] [--from SUBJECT_ID] [--optimizer OPTIMIZER_YAML] [--budget N] [--samples N] [--json]",
+    "  workbench eval [SOURCE] [--dir DIR] [--candidate CANDIDATE_ID] [--runs RUNS|all] [--samples N] [--rerun] [--json]",
+    "  workbench improve [SOURCE] [--dir DIR] [--from CANDIDATE_ID] [--runs RUN] [--budget N] [--samples N] [--rerun] [--json]",
+    "  workbench retry TARGET_ID [--dir DIR] [--json]",
     "  workbench open [SOURCE] [--dir DIR] [--run RUN_ID] [--host HOST] [--port N] [--no-open] [--json]",
-    "  workbench restore [--dir DIR] [--subject ID] [--dry-run] [--yes] [--json]",
+    "  workbench restore [--dir DIR] [--candidate CANDIDATE_ID] [--dry-run] [--yes] [--json]",
     "",
     "Local inspection:",
     "  workbench runs list [--dir DIR] [--json]",
     "  workbench runs show RUN_ID [--dir DIR] [--json]",
-    "  workbench subjects list [--dir DIR] [--json]",
-    "  workbench subjects show SUBJECT_ID [--dir DIR] [--json]",
-    "  workbench subjects files [--dir DIR] [--subject ID] [--json]",
-    "  workbench subjects preview --path PATH [--dir DIR] [--subject ID] [--output PATH|-] [--json]",
+    "  workbench candidates list [--dir DIR] [--json]",
+    "  workbench candidates show CANDIDATE_ID [--dir DIR] [--json]",
+    "  workbench candidates files [--dir DIR] [--candidate CANDIDATE_ID] [--json]",
+    "  workbench candidates preview --path PATH [--dir DIR] [--candidate CANDIDATE_ID] [--output PATH|-] [--json]",
     "  workbench traces collect [--providers codex,claude] [--since 30d] [--workspace DIR] [--limit N] [--json]",
     "  workbench traces list [--providers codex,claude] [--since 30d] [--workspace DIR] [--limit N] [--json]",
     "  workbench traces show TRACE_ID [--providers codex,claude] [--since 30d] [--workspace DIR] [--json]",
@@ -65,14 +66,15 @@ const rootLines = [
     "  workbench push [SOURCE] [--dir DIR] [--tag TAG] [--visibility public|private] [--dry-run] [--json]",
     "",
     "Hosted runs and resources:",
-    "  workbench cloud eval [SOURCE] [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--base SUBJECT_ID] [--samples N] [--watch] [--dry-run] [--json]",
-    "  workbench cloud improve [SOURCE] [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--base SUBJECT_ID] [--optimizer OPTIMIZER_YAML] [--budget N] [--samples N] [--watch] [--dry-run] [--json]",
-    "  workbench cloud open [OWNER/BENCHMARK[@REF]|RUN_ID|SUBJECT_ID] [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--no-open] [--json]",
+    "  workbench cloud eval [SOURCE] [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--base CANDIDATE_ID] [--runs RUNS|all] [--samples N] [--rerun] [--watch] [--dry-run] [--json]",
+    "  workbench cloud improve [SOURCE] [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--base CANDIDATE_ID] [--runs RUN] [--budget N] [--samples N] [--rerun] [--watch] [--dry-run] [--json]",
+    "  workbench cloud retry TARGET_ID [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--watch] [--interval-ms N] [--timeout-ms N] [--json]",
+    "  workbench cloud open [OWNER/BENCHMARK[@REF]|RUN_ID|CANDIDATE_ID] [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--no-open] [--json]",
     "  workbench cloud watch RUN_ID [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--interval-ms N] [--timeout-ms N] [--json]",
     "  workbench cloud logs RUN_ID [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--json]",
     "  workbench cloud star OWNER/BENCHMARK [--json]",
     "  workbench cloud unstar OWNER/BENCHMARK [--json]",
-    "  workbench cloud benchmarks|runs|subjects <command> [options]",
+    "  workbench cloud benchmarks|runs|candidates <command> [options]",
     "",
     "Auth:",
     "  workbench auth connect ADAPTER[/SLOT] [--dir DIR] [--method METHOD] [--profile PROFILE] [--profile-root DIR] [--local-only] [--json]",
@@ -80,11 +82,12 @@ const rootLines = [
     "",
     "Examples:",
     "  workbench init --skill invoice-review --agent codex",
-    "  workbench eval subjects/codex --samples 1",
+    "  workbench eval candidates/current --samples 1",
     "  workbench improve --budget 2 --samples 1",
+    "  workbench retry eval_local_123 --json",
     "  workbench open --no-open --json",
     "  workbench push --tag v1",
-    "  workbench cloud eval subjects/codex --benchmark openbench/invoice-review@v1 --watch",
+    "  workbench cloud eval candidates/current --benchmark openbench/invoice-review@v1 --watch",
     "",
     "Environment:",
     "  WORKBENCH_API_URL sets the hosted Workbench API base URL.",
@@ -118,7 +121,7 @@ const commandHelp = Object.fromEntries(Object.entries({
         "  workbench init [DIR] --skill NAME --agent ADAPTER [--from PATH] [--example] [--json]",
         "  workbench init [DIR] --command NAME [--from PATH] [--example] [--json]",
         "",
-        "Scaffold a local Workbench project. benchmark.yaml selects an engine; the built-in workbench engine owns tasks, environment, and scoring under engine.with. subjects/<name>/subject.yaml owns files.path plus optional prepare and run behavior. optimizers/<name>.yaml owns improvement behavior.",
+        "Scaffold a local Workbench project. benchmark.yaml selects an engine; the built-in workbench engine owns tasks, environment, and scoring under engine.with. candidates/<name>/candidate.yaml owns files.path plus optional prepare and run behavior. Candidate manifests own improvement behavior.",
         "",
         "Examples:",
         "  workbench init --skill invoice-review --agent codex",
@@ -128,31 +131,41 @@ const commandHelp = Object.fromEntries(Object.entries({
         "Usage:",
         "  workbench check [SOURCE] [--dir DIR] [--json]",
         "",
-        "Validate benchmark.yaml, one subject manifest, and an optional optimizer manifest.",
+        "Validate benchmark.yaml, one candidate manifest.",
         "",
         "Examples:",
         "  workbench check",
-        "  workbench check subjects/codex --json",
+        "  workbench check candidates/current --json",
     ]),
     eval: withSourceDirectoryHelp([
         "Usage:",
-        "  workbench eval [SOURCE] [--dir DIR] [--subject ID] [--samples N] [--json]",
+        "  workbench eval [SOURCE] [--dir DIR] [--candidate CANDIDATE_ID] [--runs RUNS|all] [--samples N] [--rerun] [--json]",
         "",
-        "Run the selected local subject against the current benchmark and record attempts, results, traces, artifacts, and a run record under .workbench/runtime.",
+        "Ensure the selected local candidate run has an evaluation for the current benchmark. Completed work is reused only when candidate, run configuration, source, adapters, benchmark, and samples match; use --rerun to intentionally spend again.",
         "",
         "Examples:",
         "  workbench eval --samples 1",
-        "  workbench eval subjects/codex --samples 2 --json",
+        "  workbench eval candidates/current --samples 2 --json",
     ]),
     improve: withSourceDirectoryHelp([
         "Usage:",
-        "  workbench improve [SOURCE] [--dir DIR] [--from SUBJECT_ID] [--optimizer OPTIMIZER_YAML] [--budget N] [--samples N] [--json]",
+        "  workbench improve [SOURCE] [--dir DIR] [--from CANDIDATE_ID] [--runs RUN] [--budget N] [--samples N] [--rerun] [--json]",
         "",
-        "Run local subject improvement. By default, Workbench improves the current subject. If it has not been evaluated yet, Workbench evaluates it first. Use --from to improve an explicit subject id.",
+        "Ensure a local candidate improvement exists for the selected base, run, budget, and samples. Completed work is reused only when base, run configuration, source, adapters, benchmark, budget, and samples match; use --rerun to intentionally spend again.",
         "",
         "Examples:",
         "  workbench improve --budget 1 --samples 1",
-        "  workbench improve subjects/codex --from subj_123 --optimizer optimizers/codex.yaml --json",
+        "  workbench improve candidates/current --from candidate_123 --json",
+    ]),
+    retry: withSourceDirectoryHelp([
+        "Usage:",
+        "  workbench retry TARGET_ID [--dir DIR] [--json]",
+        "",
+        "Retry a failed local run or evaluation by replaying its recorded candidate, configuration, sample count, and improve budget.",
+        "",
+        "Examples:",
+        "  workbench retry eval_local_123 --json",
+        "  workbench retry run_local_123 --dir ./my-benchmark",
     ]),
     open: withSourceDirectoryHelp(withLifecycleHelp([
         "Usage:",
@@ -166,13 +179,13 @@ const commandHelp = Object.fromEntries(Object.entries({
     ], localOpenLifecycleHelp)),
     restore: withSourceDirectoryHelp([
         "Usage:",
-        "  workbench restore [--dir DIR] [--subject ID] [--dry-run] [--yes] [--json]",
+        "  workbench restore [--dir DIR] [--candidate CANDIDATE_ID] [--dry-run] [--yes] [--json]",
         "",
-        "Restore a local subject snapshot into the subject files directory.",
+        "Restore a local candidate snapshot into the candidate files directory.",
         "",
         "Examples:",
-        "  workbench restore --subject subj_123 --dry-run",
-        "  workbench restore --subject subj_123 --yes",
+        "  workbench restore --candidate candidate_123 --dry-run",
+        "  workbench restore --candidate candidate_123 --yes",
     ]),
     runs: [
         "Usage:",
@@ -208,61 +221,61 @@ const commandHelp = Object.fromEntries(Object.entries({
         "  workbench runs show eval_local_123",
         "  workbench runs show eval_local_123 --json",
     ]),
-    subjects: [
+    candidates: [
         "Usage:",
-        "  workbench subjects <command> [options]",
+        "  workbench candidates <command> [options]",
         "",
-        "Inspect local subjects.",
+        "Inspect local candidates.",
         "",
         "Commands:",
-        "  workbench subjects list [--dir DIR] [--json]",
-        "  workbench subjects show SUBJECT_ID [--dir DIR] [--json]",
-        "  workbench subjects files [--dir DIR] [--subject ID] [--json]",
-        "  workbench subjects preview --path PATH [--dir DIR] [--subject ID] [--output PATH|-] [--json]",
+        "  workbench candidates list [--dir DIR] [--json]",
+        "  workbench candidates show CANDIDATE_ID [--dir DIR] [--json]",
+        "  workbench candidates files [--dir DIR] [--candidate CANDIDATE_ID] [--json]",
+        "  workbench candidates preview --path PATH [--dir DIR] [--candidate CANDIDATE_ID] [--output PATH|-] [--json]",
         "",
         "Examples:",
-        "  workbench subjects list --json",
-        "  workbench subjects preview --subject subj_123 --path SKILL.md --output -",
+        "  workbench candidates list --json",
+        "  workbench candidates preview --candidate candidate_123 --path SKILL.md --output -",
     ],
-    "subjects list": withSourceDirectoryHelp([
+    "candidates list": withSourceDirectoryHelp([
         "Usage:",
-        "  workbench subjects list [--dir DIR] [--json]",
+        "  workbench candidates list [--dir DIR] [--json]",
         "",
-        "List local subjects.",
+        "List local candidates.",
         "",
         "Examples:",
-        "  workbench subjects list",
-        "  workbench subjects list --json",
+        "  workbench candidates list",
+        "  workbench candidates list --json",
     ]),
-    "subjects show": withSourceDirectoryHelp([
+    "candidates show": withSourceDirectoryHelp([
         "Usage:",
-        "  workbench subjects show SUBJECT_ID [--dir DIR] [--json]",
+        "  workbench candidates show CANDIDATE_ID [--dir DIR] [--json]",
         "",
-        "Show one local subject.",
+        "Show one local candidate.",
         "",
         "Examples:",
-        "  workbench subjects show subj_123",
-        "  workbench subjects show subj_123 --json",
+        "  workbench candidates show candidate_123",
+        "  workbench candidates show candidate_123 --json",
     ]),
-    "subjects files": withSourceDirectoryHelp([
+    "candidates files": withSourceDirectoryHelp([
         "Usage:",
-        "  workbench subjects files [--dir DIR] [--subject ID] [--json]",
+        "  workbench candidates files [--dir DIR] [--candidate CANDIDATE_ID] [--json]",
         "",
-        "List files in a local subject snapshot.",
+        "List files in a local candidate snapshot.",
         "",
         "Examples:",
-        "  workbench subjects files --subject subj_123",
-        "  workbench subjects files --subject subj_123 --json",
+        "  workbench candidates files --candidate candidate_123",
+        "  workbench candidates files --candidate candidate_123 --json",
     ]),
-    "subjects preview": withSourceDirectoryHelp([
+    "candidates preview": withSourceDirectoryHelp([
         "Usage:",
-        "  workbench subjects preview --path PATH [--dir DIR] [--subject ID] [--output PATH|-] [--json]",
+        "  workbench candidates preview --path PATH [--dir DIR] [--candidate CANDIDATE_ID] [--output PATH|-] [--json]",
         "",
-        "Preview a file from a local subject snapshot.",
+        "Preview a file from a local candidate snapshot.",
         "",
         "Examples:",
-        "  workbench subjects preview --subject subj_123 --path SKILL.md",
-        "  workbench subjects preview --subject subj_123 --path SKILL.md --output -",
+        "  workbench candidates preview --candidate candidate_123 --path SKILL.md",
+        "  workbench candidates preview --candidate candidate_123 --path SKILL.md --output -",
     ]),
     clone: [
         "Usage:",
@@ -355,7 +368,7 @@ const commandHelp = Object.fromEntries(Object.entries({
         "",
         "Examples:",
         "  workbench push --tag v1 --dry-run",
-        "  workbench push subjects/codex --visibility private --json",
+        "  workbench push candidates/current --visibility private --json",
     ]),
     login: [
         "Usage:",
@@ -523,17 +536,19 @@ const commandHelp = Object.fromEntries(Object.entries({
         "Hosted Workbench Cloud execution and resource commands.",
         "",
         "Commands:",
-        "  workbench cloud eval [SOURCE] [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--base SUBJECT_ID] [--samples N] [--watch] [--dry-run] [--json]",
-        "  workbench cloud improve [SOURCE] [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--base SUBJECT_ID] [--optimizer OPTIMIZER_YAML] [--budget N] [--samples N] [--watch] [--dry-run] [--json]",
-        "  workbench cloud open [OWNER/BENCHMARK[@REF]|RUN_ID|SUBJECT_ID] [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--no-open] [--json]",
+        "  workbench cloud eval [SOURCE] [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--base CANDIDATE_ID] [--runs RUNS|all] [--samples N] [--rerun] [--watch] [--dry-run] [--json]",
+        "  workbench cloud improve [SOURCE] [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--base CANDIDATE_ID] [--runs RUN] [--budget N] [--samples N] [--rerun] [--watch] [--dry-run] [--json]",
+        "  workbench cloud retry TARGET_ID [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--watch] [--interval-ms N] [--timeout-ms N] [--json]",
+        "  workbench cloud open [OWNER/BENCHMARK[@REF]|RUN_ID|CANDIDATE_ID] [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--no-open] [--json]",
         "  workbench cloud watch RUN_ID [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--interval-ms N] [--timeout-ms N] [--json]",
         "  workbench cloud logs RUN_ID [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--json]",
         "  workbench cloud star OWNER/BENCHMARK [--json]",
         "  workbench cloud unstar OWNER/BENCHMARK [--json]",
-        "  workbench cloud benchmarks|runs|subjects <command> [options]",
+        "  workbench cloud benchmarks|runs|candidates <command> [options]",
         "",
         "Examples:",
-        "  workbench cloud eval subjects/codex --benchmark openbench/invoice-review@v1 --dry-run --json",
+        "  workbench cloud eval candidates/current --benchmark openbench/invoice-review@v1 --dry-run --json",
+        "  workbench cloud retry run_123 --benchmark openbench/invoice-review --watch",
         "  workbench cloud runs list --benchmark openbench/invoice-review --json",
     ],
     "cloud star": [
@@ -558,27 +573,37 @@ const commandHelp = Object.fromEntries(Object.entries({
     ],
     "cloud eval": withSourceDirectoryHelp(withLifecycleHelp([
         "Usage:",
-        "  workbench cloud eval [SOURCE] [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--base SUBJECT_ID] [--samples N] [--watch] [--dry-run] [--json]",
+        "  workbench cloud eval [SOURCE] [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--base CANDIDATE_ID] [--runs RUNS|all] [--samples N] [--rerun] [--watch] [--dry-run] [--json]",
         "",
-        "Submit subject files to Workbench Cloud and run hosted evaluation.",
+        "Ensure a hosted evaluation exists for the selected candidate run. Completed hosted work is reused only when candidate, run configuration, source, adapters, benchmark, and samples match; use --rerun to intentionally spend again.",
         "",
         "Examples:",
-        "  workbench cloud eval subjects/codex --benchmark openbench/invoice-review@v1 --dry-run --json",
+        "  workbench cloud eval candidates/current --benchmark openbench/invoice-review@v1 --dry-run --json",
         "  workbench cloud eval --benchmark openbench/invoice-review --watch",
     ], hostedWatchLifecycleHelp)),
     "cloud improve": withSourceDirectoryHelp(withLifecycleHelp([
         "Usage:",
-        "  workbench cloud improve [SOURCE] [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--base SUBJECT_ID] [--optimizer OPTIMIZER_YAML] [--budget N] [--samples N] [--watch] [--dry-run] [--json]",
+        "  workbench cloud improve [SOURCE] [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--base CANDIDATE_ID] [--runs RUN] [--budget N] [--samples N] [--rerun] [--watch] [--dry-run] [--json]",
+        "",
+        "Ensure a hosted candidate improvement exists for the selected base, run, budget, and samples. Completed work is reused only when base, run configuration, source, adapters, benchmark, budget, and samples match; use --rerun to intentionally spend again.",
+        "",
+        "Examples:",
+        "  workbench cloud improve --benchmark openbench/invoice-review --dry-run",
+        "  workbench cloud improve candidates/current --watch --json",
+    ], hostedWatchLifecycleHelp)),
+    "cloud retry": withSourceDirectoryHelp(withLifecycleHelp([
+        "Usage:",
+        "  workbench cloud retry TARGET_ID [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--watch] [--interval-ms N] [--timeout-ms N] [--json]",
         "",
-        "Run hosted subject improvement.",
+        "Retry a failed hosted run or evaluation by replaying its recorded candidate, configuration, sample count, and improve budget.",
         "",
         "Examples:",
-        "  workbench cloud improve --optimizer optimizers/codex.yaml --benchmark openbench/invoice-review --dry-run",
-        "  workbench cloud improve subjects/codex --optimizer optimizers/codex.yaml --watch --json",
+        "  workbench cloud retry run_123 --benchmark openbench/invoice-review --watch",
+        "  workbench cloud retry eval_123 --json",
     ], hostedWatchLifecycleHelp)),
     "cloud open": [
         "Usage:",
-        "  workbench cloud open [OWNER/BENCHMARK[@REF]|RUN_ID|SUBJECT_ID] [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--no-open] [--json]",
+        "  workbench cloud open [OWNER/BENCHMARK[@REF]|RUN_ID|CANDIDATE_ID] [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--no-open] [--json]",
         "",
         "Print and open the hosted Workbench URL.",
         "",
@@ -638,24 +663,24 @@ const commandHelp = Object.fromEntries(Object.entries({
         "  workbench cloud runs list --benchmark openbench/invoice-review --json",
         "  workbench cloud runs show run_123 --benchmark openbench/invoice-review",
     ],
-    "cloud subjects": [
+    "cloud candidates": [
         "Usage:",
-        "  workbench cloud subjects <command> [options]",
+        "  workbench cloud candidates <command> [options]",
         "",
-        "Hosted subject resource commands.",
+        "Hosted candidate resource commands.",
         "",
         "Commands:",
-        "  workbench cloud subjects list [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--json]",
-        "  workbench cloud subjects show SUBJECT_ID [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--json]",
-        "  workbench cloud subjects files SUBJECT_ID [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--json]",
-        "  workbench cloud subjects preview SUBJECT_ID --path PATH [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--output PATH|-] [--json]",
-        "  workbench cloud subjects pull SUBJECT_ID [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--out DIR] [--json]",
-        "  workbench cloud subjects publish SUBJECT_ID [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--json]",
-        "  workbench cloud subjects unpublish SUBJECT_ID [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--json]",
+        "  workbench cloud candidates list [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--json]",
+        "  workbench cloud candidates show CANDIDATE_ID [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--json]",
+        "  workbench cloud candidates files CANDIDATE_ID [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--json]",
+        "  workbench cloud candidates preview CANDIDATE_ID --path PATH [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--output PATH|-] [--json]",
+        "  workbench cloud candidates pull CANDIDATE_ID [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--out DIR] [--json]",
+        "  workbench cloud candidates publish CANDIDATE_ID [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--json]",
+        "  workbench cloud candidates unpublish CANDIDATE_ID [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--json]",
         "",
         "Examples:",
-        "  workbench cloud subjects list --benchmark openbench/invoice-review --json",
-        "  workbench cloud subjects preview subj_123 --path SKILL.md --output -",
+        "  workbench cloud candidates list --benchmark openbench/invoice-review --json",
+        "  workbench cloud candidates preview candidate_123 --path SKILL.md --output -",
     ],
 }).map(([key, lines]) => [key, lines.join("\n")]));
 export function commandUsage(commandPath) {
@@ -742,75 +767,75 @@ const hostedCommandHelp = Object.fromEntries(Object.entries({
         "  workbench cloud runs cancel run_123 --benchmark openbench/invoice-review",
         "  workbench cloud runs cancel run_123 --json",
     ],
-    "subjects list": [
+    "candidates list": [
         "Usage:",
-        "  workbench cloud subjects list [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--json]",
+        "  workbench cloud candidates list [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--json]",
         "",
-        "List hosted subjects.",
+        "List hosted candidates.",
         "",
         "Examples:",
-        "  workbench cloud subjects list --benchmark openbench/invoice-review",
-        "  workbench cloud subjects list --json",
+        "  workbench cloud candidates list --benchmark openbench/invoice-review",
+        "  workbench cloud candidates list --json",
     ],
-    "subjects show": [
+    "candidates show": [
         "Usage:",
-        "  workbench cloud subjects show SUBJECT_ID [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--json]",
+        "  workbench cloud candidates show CANDIDATE_ID [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--json]",
         "",
-        "Show one hosted subject.",
+        "Show one hosted candidate.",
         "",
         "Examples:",
-        "  workbench cloud subjects show subj_123 --benchmark openbench/invoice-review",
-        "  workbench cloud subjects show subj_123 --json",
+        "  workbench cloud candidates show candidate_123 --benchmark openbench/invoice-review",
+        "  workbench cloud candidates show candidate_123 --json",
     ],
-    "subjects files": [
+    "candidates files": [
         "Usage:",
-        "  workbench cloud subjects files SUBJECT_ID [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--json]",
+        "  workbench cloud candidates files CANDIDATE_ID [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--json]",
         "",
-        "List files in a hosted subject snapshot.",
+        "List files in a hosted candidate snapshot.",
         "",
         "Examples:",
-        "  workbench cloud subjects files subj_123 --benchmark openbench/invoice-review",
-        "  workbench cloud subjects files subj_123 --json",
+        "  workbench cloud candidates files candidate_123 --benchmark openbench/invoice-review",
+        "  workbench cloud candidates files candidate_123 --json",
     ],
-    "subjects preview": [
+    "candidates preview": [
         "Usage:",
-        "  workbench cloud subjects preview SUBJECT_ID --path PATH [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--output PATH|-] [--json]",
+        "  workbench cloud candidates preview CANDIDATE_ID --path PATH [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--output PATH|-] [--json]",
         "",
-        "Preview a file from a hosted subject snapshot.",
+        "Preview a file from a hosted candidate snapshot.",
         "",
         "Examples:",
-        "  workbench cloud subjects preview subj_123 --path SKILL.md --output -",
-        "  workbench cloud subjects preview subj_123 --path SKILL.md --benchmark openbench/invoice-review",
+        "  workbench cloud candidates preview candidate_123 --path SKILL.md --output -",
+        "  workbench cloud candidates preview candidate_123 --path SKILL.md --benchmark openbench/invoice-review",
     ],
-    "subjects pull": [
+    "candidates pull": [
         "Usage:",
-        "  workbench cloud subjects pull SUBJECT_ID [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--out DIR] [--json]",
+        "  workbench cloud candidates pull CANDIDATE_ID [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--out DIR] [--json]",
         "",
-        "Download hosted subject files.",
+        "Download hosted candidate files.",
         "",
         "Examples:",
-        "  workbench cloud subjects pull subj_123 --out ./subject-files",
-        "  workbench cloud subjects pull subj_123 --benchmark openbench/invoice-review --json",
+        "  workbench cloud candidates pull candidate_123 --out ./candidate-files",
+        "  workbench cloud candidates pull candidate_123 --benchmark openbench/invoice-review --json",
     ],
-    "subjects publish": [
+    "candidates publish": [
         "Usage:",
-        "  workbench cloud subjects publish SUBJECT_ID [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--json]",
+        "  workbench cloud candidates publish CANDIDATE_ID [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--json]",
         "",
-        "Make a hosted subject public.",
+        "Make a hosted candidate public.",
         "",
         "Examples:",
-        "  workbench cloud subjects publish subj_123 --benchmark openbench/invoice-review",
-        "  workbench cloud subjects publish subj_123 --json",
+        "  workbench cloud candidates publish candidate_123 --benchmark openbench/invoice-review",
+        "  workbench cloud candidates publish candidate_123 --json",
     ],
-    "subjects unpublish": [
+    "candidates unpublish": [
         "Usage:",
-        "  workbench cloud subjects unpublish SUBJECT_ID [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--json]",
+        "  workbench cloud candidates unpublish CANDIDATE_ID [--dir DIR] [--benchmark OWNER/BENCHMARK[@REF]] [--json]",
         "",
-        "Make a hosted subject private.",
+        "Make a hosted candidate private.",
         "",
         "Examples:",
-        "  workbench cloud subjects unpublish subj_123 --benchmark openbench/invoice-review",
-        "  workbench cloud subjects unpublish subj_123 --json",
+        "  workbench cloud candidates unpublish candidate_123 --benchmark openbench/invoice-review",
+        "  workbench cloud candidates unpublish candidate_123 --json",
     ],
 }).map(([key, lines]) => [key, lines.join("\n")]));
 function cloudNestedCommandUsage(commandPath) {