@workbench-ai/workbench-core 0.0.66 → 0.0.68
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/execution-graph.d.ts +4 -3
- package/dist/execution-graph.d.ts.map +1 -1
- package/dist/execution-graph.js +15 -14
- package/dist/execution-jobs.d.ts +5 -20
- package/dist/execution-jobs.d.ts.map +1 -1
- package/dist/execution-jobs.js +7 -91
- package/dist/execution-outputs.d.ts +2 -2
- package/dist/execution-outputs.d.ts.map +1 -1
- package/dist/execution-outputs.js +10 -10
- package/dist/execution-runtime-types.d.ts +1 -1
- package/dist/execution-runtime-types.d.ts.map +1 -1
- package/dist/execution-scheduler.d.ts.map +1 -1
- package/dist/execution-scheduler.js +4 -1
- package/dist/execution-traces.js +1 -1
- package/dist/generic-spec.d.ts +29 -29
- package/dist/generic-spec.d.ts.map +1 -1
- package/dist/generic-spec.js +94 -92
- package/dist/index.d.ts +325 -220
- package/dist/index.d.ts.map +1 -1
- package/dist/index.js +5784 -3856
- package/dist/runtime-dockerfile.d.ts +1 -1
- package/dist/runtime-dockerfile.d.ts.map +1 -1
- package/dist/runtime-dockerfile.js +4 -4
- package/dist/runtime-utils.d.ts +1 -1
- package/dist/runtime-utils.d.ts.map +1 -1
- package/dist/runtime-utils.js +3 -3
- package/dist/sandbox-backends/docker.js +7 -5
- package/dist/sandbox-inputs.js +3 -3
- package/dist/sandbox-plane.d.ts.map +1 -1
- package/dist/sandbox-plane.js +13 -9
- package/dist/skill-patch.d.ts +8 -0
- package/dist/skill-patch.d.ts.map +1 -0
- package/dist/{candidate-patch.js → skill-patch.js} +5 -5
- package/package.json +3 -3
- package/worker/sandbox-adapter-runner.cjs +2 -2
- package/dist/candidate-patch.d.ts +0 -8
- package/dist/candidate-patch.d.ts.map +0 -1
- package/dist/execution-evidence.d.ts +0 -22
- package/dist/execution-evidence.d.ts.map +0 -1
- package/dist/execution-evidence.js +0 -302
- package/dist/inspection.d.ts +0 -111
- package/dist/inspection.d.ts.map +0 -1
- package/dist/inspection.js +0 -217
package/dist/index.d.ts
CHANGED
|
@@ -1,220 +1,104 @@
|
|
|
1
|
-
import type {
|
|
2
|
-
import { type WorkbenchAdapterOperationExecutor
|
|
3
|
-
import
|
|
1
|
+
import type { Json, RemoteWorkbenchJob, SurfaceSnapshotFile, WorkbenchArtifact, WorkbenchAutomationReadiness, WorkbenchSkillPatch, WorkbenchComparison, WorkbenchEvalSnapshot, WorkbenchExecutionSpec, WorkbenchInspectionSnapshot, WorkbenchJob, WorkbenchObjectPack, WorkbenchProjectState, WorkbenchRemote, WorkbenchRun, WorkbenchRunKind, WorkbenchAgent, WorkbenchSkillBundleSnapshot, WorkbenchSkillSource, WorkbenchStatus, WorkbenchTrace, WorkbenchVersion, UsageSummary } from "@workbench-ai/workbench-contract";
|
|
2
|
+
import { type WorkbenchAdapterOperationExecutor } from "@workbench-ai/workbench-protocol";
|
|
3
|
+
import type { WorkbenchAdapterAuthBundle, WorkbenchAdapterAuthTarget } from "./adapter-auth.ts";
|
|
4
|
+
import { type SandboxExecutionFileStore, type SandboxPlane } from "./sandbox-plane.ts";
|
|
4
5
|
import type { WorkbenchExecutionRuntimeInput } from "./execution-runtime-types.ts";
|
|
5
|
-
|
|
6
|
-
|
|
7
|
-
export { BENCHMARK_SPEC_FILE, CANDIDATE_SPEC_FILE, DEFAULT_EXECUTION_RESOURCES, engineCasePrivateFiles, engineCaseFilesForRuntimeInput, engineCasePublicFiles, engineResolveInvocationForSpec, engineResolveBindingForSpec, engineResolveBindingForSourceYaml, isWorkbenchCandidateManifestPath, parseWorkbenchSourceFiles, resolveEngineCaseExecutionConfig, resolveWorkbenchResolvedSourceYaml, resolveWorkbenchSourceFiles, runtimeNetwork, runtimeResources, serializeWorkbenchResolvedSourceYaml, validateWorkbenchResolvedSourceYaml, type AuthoredBenchmarkSpec, type WorkbenchCandidateImproveSpec, type WorkbenchCandidateManifestSpec, type WorkbenchCandidateRunSpec, type WorkbenchCaseSelector, type WorkbenchSelectionSpec, type GenericRunSpec, type GenericEngineCaseSpec, type WorkbenchEngineCase, type WorkbenchResolvedSource, } from "./generic-spec.ts";
|
|
8
|
-
export { composeRuntimeDockerfileWithAdapterInstallers, type WorkbenchRuntimeAdapterInstaller, type WorkbenchRuntimeAdapterInstallerFile, } from "./runtime-dockerfile.ts";
|
|
9
|
-
export { adapterCommandName, cloneWorkbenchAdapterManifest, collectWorkbenchAdapterAuthRequirements, collectWorkbenchAdapterInvocations, parseWorkbenchAdapterManifest, workbenchAdapterManifestRequiresAuth, workbenchAdapterManifestSupportsOperation, workbenchAdapterOperationCommand, workbenchAdapterOperationExecutor, withDefaultWorkbenchAdapterAuth, withDefaultWorkbenchAdapterAuthProfiles, type WorkbenchPrimitiveAdapterOperation, type WorkbenchAdapterOperation, type WorkbenchAdapterOperationExecutor, type WorkbenchAdapterOperationManifest, type WorkbenchAdapterSlotManifest, type WorkbenchAdapterAuthRequirement, type WorkbenchAdapterAuthManifest, type WorkbenchAdapterAuthMethodManifest, type WorkbenchAdapterInvocationLike, type WorkbenchAdapterManifest, } from "@workbench-ai/workbench-protocol";
|
|
10
|
-
export { adapterAuthEnv, createWorkbenchAdapterAuthBundle, defaultWorkbenchAdapterAuthStoreRoot, localWorkbenchAdapterAuthStore, normalizeWorkbenchAdapterAuthTarget, parseWorkbenchAdapterAuthTarget, sanitizeWorkbenchAdapterAuthBundle, type WorkbenchAdapterAuthBundle, type WorkbenchAdapterAuthEnvVar, type WorkbenchAdapterAuthFile, type WorkbenchAdapterAuthStatus, type WorkbenchAdapterAuthStatusRecord, type WorkbenchAdapterAuthStore, type WorkbenchAdapterAuthTarget, } from "./adapter-auth.ts";
|
|
6
|
+
export type { Json, RemoteWorkbenchJob, SurfaceSnapshotFile, WorkbenchArtifact, WorkbenchAutomationReadiness, WorkbenchComparison, WorkbenchComparisonCell, WorkbenchEvalSnapshot, WorkbenchExecutionResult, WorkbenchExecutionSpec, WorkbenchFileSurface, WorkbenchInspectionFileContent, WorkbenchInspectionFileOwnerKind, WorkbenchInspectionSnapshot, WorkbenchJob, WorkbenchLineageEdge, WorkbenchObjectPack, WorkbenchProjectState, WorkbenchRefs, WorkbenchRemote, WorkbenchRun, WorkbenchAgent, WorkbenchSkillBundleSnapshot, WorkbenchSkillInclude, WorkbenchSkillSource, WorkbenchStatus, WorkbenchTrace, WorkbenchVersion, } from "@workbench-ai/workbench-contract";
|
|
7
|
+
export { workbenchInspectionFileContent, workbenchInspectionFileContentUnavailableReason, workbenchInspectionFileManifest, } from "@workbench-ai/workbench-contract";
|
|
11
8
|
export type { WorkbenchExecutionRuntimeInput, WorkbenchWorkloadStepCommand, } from "./execution-runtime-types.ts";
|
|
12
|
-
export {
|
|
13
|
-
export {
|
|
14
|
-
export {
|
|
15
|
-
export { persistWorkbenchAdapterAuthUpdates, } from "./adapter-auth-updates.ts";
|
|
16
|
-
export { resolveSandboxTemplateImage, } from "./sandbox-backends/template-images.ts";
|
|
17
|
-
export { readOutputTraceFiles, workbenchTraceExecutionDirectory, workbenchTraceRunDirectory, workbenchTraceRunDirectoryName, } from "./trace-files.ts";
|
|
18
|
-
export { assertWorkbenchAdapterOperationSupport, assertWorkbenchAdapterOperationResultOk, collectWorkbenchAdapterOperationIssues, collectWorkbenchAdapterOperationRequirements, ensureWorkbenchAdapterOutputDir, WORKBENCH_ADAPTER_RESULT_FILE, normalizeWorkbenchAdapterOperationRequest, normalizeWorkbenchAdapterOperationResult, readWorkbenchAdapterOperationRequest, readWorkbenchAdapterOperationResult, workbenchAdapterOperationResultPath, writeWorkbenchAdapterOperationResult, type WorkbenchAdapterOperationRequest, type WorkbenchAdapterOperationResult, type WorkbenchAdapterOperationResultValue, type WorkbenchAdapterOperationRequirement, type WorkbenchEngineResolveResult, type WorkbenchEngineCaseSpec, } from "@workbench-ai/workbench-protocol";
|
|
19
|
-
export { applyWorkbenchCandidatePatch, type ApplyWorkbenchCandidatePatchInput, } from "./candidate-patch.ts";
|
|
20
|
-
export { createWorkbenchSandboxFileStore, createSandboxAdapterRequest, executionResultFromCompletedSandboxJob, isSurfaceSnapshotFile, materializeWorkbenchSandboxInput, readWorkbenchExecutionSpec, sanitizeWorkbenchExecutionJobForSandbox, } from "./sandbox-inputs.ts";
|
|
21
|
-
export { compileWorkbenchExecutionGraph, type CompileExecutionGraphInput, type WorkbenchExecutionGraph, type WorkbenchExecutionGraphNode, } from "./execution-graph.ts";
|
|
22
|
-
export { createBaselineCandidateExecution, createBaselineCandidateJob, createWorkbenchExecutionJob, expectedWorkbenchRunJobCount, engineCaseForCase, engineCaseIds, attemptJobCountForRunSpec, workbenchExecutionJobPurpose, MAX_WORKBENCH_RUN_BUDGET, planWorkbenchExecutionJobsForPurpose, validateWorkbenchRunEnvelope, workbenchExecutionJobId, type WorkbenchRunWorkflow, } from "./execution-jobs.ts";
|
|
9
|
+
export { attachSandboxMetadataToJob, createSandboxAdapterRequest, createWorkbenchSandboxFileStore, executionResultFromCompletedSandboxJob, isSurfaceSnapshotFile, readWorkbenchExecutionSpec, } from "./sandbox-inputs.ts";
|
|
10
|
+
export { createWorkbenchExecutionCapability, createWorkbenchSandboxAllocation, collectExecutionCapabilityScopeIssues, collectSandboxAllocationScopeIssues, collectSandboxHandleScopeIssues, assertSandboxBackendSupportsNetworkPolicy, executeValidatedSandboxExecution, type SandboxBackendCapabilities, type SandboxBackendDescriptor, type SandboxCreateRequest, type SandboxEnvironmentImage, type SandboxExecRequest, type SandboxExecutionFileStore, type SandboxHandle, type SandboxMaterializedInput, type SandboxPlane, } from "./sandbox-plane.ts";
|
|
11
|
+
export { createDockerSandboxBackendDescriptor, createDockerSandboxPlane, DOCKER_SANDBOX_BACKEND, } from "./sandbox-backends/index.ts";
|
|
23
12
|
export { addCapacity, capacityFits, runWorkbenchExecutionDag, subtractCapacity, workbenchJobDependencies, workbenchJobHostCost, workbenchJobResources, type WorkbenchExecutionDagCapacity, type WorkbenchExecutionDagResult, type WorkbenchExecutionDagRunInput, } from "./execution-scheduler.ts";
|
|
24
|
-
export {
|
|
25
|
-
export {
|
|
26
|
-
export {
|
|
27
|
-
export {
|
|
28
|
-
export {
|
|
29
|
-
export {
|
|
30
|
-
export {
|
|
31
|
-
export
|
|
32
|
-
export
|
|
33
|
-
export
|
|
34
|
-
export declare
|
|
35
|
-
|
|
36
|
-
|
|
37
|
-
|
|
38
|
-
|
|
39
|
-
|
|
40
|
-
|
|
41
|
-
|
|
42
|
-
|
|
43
|
-
|
|
44
|
-
|
|
45
|
-
|
|
46
|
-
|
|
47
|
-
|
|
48
|
-
|
|
49
|
-
|
|
50
|
-
|
|
51
|
-
|
|
52
|
-
|
|
53
|
-
|
|
54
|
-
|
|
55
|
-
|
|
56
|
-
|
|
57
|
-
|
|
58
|
-
|
|
59
|
-
|
|
60
|
-
|
|
61
|
-
|
|
62
|
-
|
|
63
|
-
|
|
64
|
-
|
|
65
|
-
export
|
|
66
|
-
|
|
67
|
-
|
|
68
|
-
|
|
69
|
-
|
|
70
|
-
|
|
71
|
-
|
|
72
|
-
|
|
73
|
-
|
|
74
|
-
|
|
75
|
-
|
|
76
|
-
|
|
77
|
-
completedJobCount: number;
|
|
78
|
-
failedJobCount: number;
|
|
79
|
-
}
|
|
80
|
-
export interface WorkbenchRunWorkload {
|
|
81
|
-
job: RemoteWorkbenchJob;
|
|
82
|
-
spec: GenericRunSpec;
|
|
83
|
-
candidateId: string;
|
|
84
|
-
attemptIndex: number;
|
|
85
|
-
sampleIndex: number;
|
|
13
|
+
export { createWorkbenchExecutionJob, planWorkbenchExecutionJobsForPurpose, workbenchExecutionJobId, } from "./execution-jobs.ts";
|
|
14
|
+
export { applyWorkbenchSkillPatch, } from "./skill-patch.ts";
|
|
15
|
+
export { asRuntimeRecord, importNodeModule, jsonRecord, nodeBuiltin, normalizeRelativePath, normalizeRuntimeRegistry, normalizeWorkbenchWorkerId, quoteShellArg, readSurfaceFiles, resolveDockerRuntimeImageRef, resolveWorkbenchWorkerId, writeSurfaceFiles, } from "./runtime-utils.ts";
|
|
16
|
+
export { assignUsageRole, extractExecutionUsageFromTrace, mergeUsageSummaries, normalizeUsageSummary, } from "./execution-usage.ts";
|
|
17
|
+
export { composeRuntimeDockerfileWithAdapterInstallers, type WorkbenchRuntimeAdapterInstaller, } from "./runtime-dockerfile.ts";
|
|
18
|
+
export { readOutputTraceFiles, workbenchTraceExecutionDirectory, workbenchTraceRunDirectory, workbenchTraceRunDirectoryName, } from "./trace-files.ts";
|
|
19
|
+
export { createWorkbenchProgressStdoutParser, publishWorkbenchProgressStdoutEnvelope, type WorkbenchExecutionEventPublisher, type WorkbenchExecutionProgressTarget, } from "./execution-events.ts";
|
|
20
|
+
export { persistWorkbenchAdapterAuthUpdates, } from "./adapter-auth-updates.ts";
|
|
21
|
+
export { adapterAuthEnv, createWorkbenchAdapterAuthBundle, defaultWorkbenchAdapterAuthStoreRoot, localWorkbenchAdapterAuthStore, normalizeWorkbenchAdapterAuthTarget, parseWorkbenchAdapterAuthTarget, sanitizeWorkbenchAdapterAuthBundle, type WorkbenchAdapterAuthBundle, type WorkbenchAdapterAuthEnvVar, type WorkbenchAdapterAuthFile, type WorkbenchAdapterAuthStatus, type WorkbenchAdapterAuthStatusRecord, type WorkbenchAdapterAuthStore, type WorkbenchAdapterAuthTarget, } from "./adapter-auth.ts";
|
|
22
|
+
export { mergeWorkbenchExecutionTracesByJob, } from "./execution-traces.ts";
|
|
23
|
+
export declare class WorkbenchUserError extends Error {
|
|
24
|
+
constructor(message: string);
|
|
25
|
+
}
|
|
26
|
+
export interface WorkbenchCommandOptions {
|
|
27
|
+
dir?: string;
|
|
28
|
+
authToken?: string;
|
|
29
|
+
}
|
|
30
|
+
export interface WorkbenchEvalOptions extends WorkbenchCommandOptions {
|
|
31
|
+
version?: string;
|
|
32
|
+
skill?: string;
|
|
33
|
+
agent?: string;
|
|
34
|
+
samples?: number;
|
|
35
|
+
kind?: WorkbenchRunKind;
|
|
36
|
+
parentRunId?: string;
|
|
37
|
+
caseIds?: readonly string[];
|
|
38
|
+
selectedSamples?: readonly WorkbenchCaseSampleSelection[];
|
|
39
|
+
rerun?: boolean;
|
|
40
|
+
}
|
|
41
|
+
export interface WorkbenchStateEvalOptions {
|
|
42
|
+
authToken?: string;
|
|
43
|
+
version?: string;
|
|
44
|
+
evalHash?: string;
|
|
45
|
+
skill?: string;
|
|
46
|
+
agent?: string;
|
|
47
|
+
samples?: number;
|
|
48
|
+
kind?: WorkbenchRunKind;
|
|
49
|
+
parentRunId?: string;
|
|
50
|
+
caseIds?: readonly string[];
|
|
51
|
+
selectedSamples?: readonly WorkbenchCaseSampleSelection[];
|
|
52
|
+
rerun?: boolean;
|
|
53
|
+
}
|
|
54
|
+
export interface WorkbenchStateImproveOptions {
|
|
55
|
+
authToken?: string;
|
|
56
|
+
version?: string;
|
|
57
|
+
evalHash?: string;
|
|
58
|
+
skill?: string;
|
|
59
|
+
agent?: string;
|
|
60
|
+
budget?: number;
|
|
61
|
+
samples?: number;
|
|
62
|
+
parentRunId?: string;
|
|
63
|
+
evidenceTraceIds?: readonly string[];
|
|
64
|
+
}
|
|
65
|
+
export interface WorkbenchCaseSampleSelection {
|
|
86
66
|
caseId: string;
|
|
87
|
-
|
|
88
|
-
|
|
89
|
-
|
|
90
|
-
|
|
91
|
-
|
|
92
|
-
|
|
93
|
-
|
|
94
|
-
|
|
95
|
-
|
|
96
|
-
|
|
97
|
-
|
|
98
|
-
|
|
99
|
-
|
|
100
|
-
|
|
101
|
-
|
|
102
|
-
|
|
103
|
-
|
|
104
|
-
|
|
105
|
-
|
|
106
|
-
|
|
107
|
-
|
|
108
|
-
|
|
109
|
-
|
|
110
|
-
|
|
111
|
-
|
|
112
|
-
|
|
113
|
-
|
|
114
|
-
|
|
115
|
-
|
|
116
|
-
|
|
117
|
-
|
|
118
|
-
|
|
119
|
-
|
|
120
|
-
cases?: RemoteWorkbenchFileInput[];
|
|
121
|
-
}): AuthoredWorkbenchSourceDocument;
|
|
122
|
-
export declare function materializeWorkbenchRunResult(args: {
|
|
123
|
-
runId: string;
|
|
124
|
-
benchmarkFingerprint: string;
|
|
125
|
-
sourceYaml?: string;
|
|
126
|
-
benchmarkSourceFiles?: readonly SurfaceSnapshotFile[];
|
|
127
|
-
candidateFingerprint?: string;
|
|
128
|
-
candidateSourceFiles?: readonly SurfaceSnapshotFile[];
|
|
129
|
-
startedAt: string;
|
|
130
|
-
spec: GenericRunSpec;
|
|
131
|
-
jobs: readonly RemoteWorkbenchJob[];
|
|
132
|
-
previousCandidate?: CandidateRecord | null;
|
|
133
|
-
existingCandidateCount: number;
|
|
134
|
-
selection?: {
|
|
135
|
-
metric: string;
|
|
136
|
-
caseIds?: readonly string[];
|
|
137
|
-
label?: string;
|
|
138
|
-
};
|
|
139
|
-
}): WorkbenchRunMaterialization;
|
|
140
|
-
export declare function evaluationScorecardId(runId: string, candidateId: string): string;
|
|
141
|
-
export declare function selectExecutionOutputFilesForInspection(args: {
|
|
142
|
-
purpose: string | null | undefined;
|
|
143
|
-
files: readonly SurfaceSnapshotFile[];
|
|
144
|
-
output?: Record<string, unknown> | null | undefined;
|
|
145
|
-
}): SurfaceSnapshotFile[];
|
|
146
|
-
export declare function isWorkbenchInternalOutputPath(filePath: string): boolean;
|
|
147
|
-
export declare function isGeneratedExecutionOutputPath(filePath: string): boolean;
|
|
148
|
-
export declare function createOptimizerTraceInputFiles(args: {
|
|
149
|
-
jobs: readonly RemoteWorkbenchJob[];
|
|
150
|
-
}): SurfaceSnapshotFile[];
|
|
151
|
-
export interface WorkbenchSelectionPolicy {
|
|
152
|
-
metric: string;
|
|
153
|
-
selector: WorkbenchCaseSelector;
|
|
154
|
-
}
|
|
155
|
-
export declare function workbenchImproveOptimizeSelector(spec: GenericRunSpec): WorkbenchCaseSelector;
|
|
156
|
-
export declare function workbenchImproveSelectionPolicy(spec: GenericRunSpec): WorkbenchSelectionPolicy;
|
|
157
|
-
export declare function workbenchEngineCaseIdsForSelector(engineCases: readonly WorkbenchEngineCase[], selector: WorkbenchCaseSelector): string[];
|
|
158
|
-
export declare function workbenchEngineCaseIdsForImproveEvaluation(args: {
|
|
159
|
-
spec: GenericRunSpec;
|
|
160
|
-
engineCases: readonly WorkbenchEngineCase[];
|
|
161
|
-
}): string[];
|
|
162
|
-
export declare function filterOptimizerTraceJobsForCaseIds(jobs: readonly RemoteWorkbenchJob[], caseIds: readonly string[]): RemoteWorkbenchJob[];
|
|
163
|
-
export declare function formatWorkbenchCaseSelector(selector: WorkbenchCaseSelector): string;
|
|
164
|
-
export declare function formatWorkbenchSelectionPolicy(policy: WorkbenchSelectionPolicy): string;
|
|
165
|
-
export declare function workbenchCaseSelectorUsesAllCases(selector: WorkbenchCaseSelector): boolean;
|
|
166
|
-
export declare function evaluationMeanMetrics(evaluation: Pick<EvaluationRecord, "metrics"> | null | undefined): Record<string, number> | undefined;
|
|
167
|
-
export declare function candidateRecordWithoutDerivedFields(candidate: CandidateRecord): CandidateRecord;
|
|
168
|
-
export declare function candidateSummaryFromRecord(candidate: CandidateRecord): CandidateSummary;
|
|
169
|
-
export declare function workbenchRunExecutionFingerprint(args: {
|
|
170
|
-
sourceYaml?: string | null;
|
|
171
|
-
adapterFiles?: readonly SurfaceSnapshotFile[];
|
|
172
|
-
specVersionId?: string | null;
|
|
173
|
-
environmentVersionId?: string | null;
|
|
174
|
-
}): string;
|
|
175
|
-
export interface WorkbenchProjectSourceFilesInput {
|
|
176
|
-
specSource?: string;
|
|
177
|
-
specFiles?: readonly SurfaceSnapshotFile[];
|
|
178
|
-
candidateFilesPath: string;
|
|
179
|
-
candidateFiles: readonly SurfaceSnapshotFile[];
|
|
180
|
-
engineResolveFilesPath: string;
|
|
181
|
-
engineResolveFiles: readonly SurfaceSnapshotFile[];
|
|
182
|
-
adapterFiles?: readonly SurfaceSnapshotFile[];
|
|
183
|
-
dockerfilePath?: string;
|
|
184
|
-
dockerfile?: string | null;
|
|
185
|
-
dockerfiles?: readonly SurfaceSnapshotFile[];
|
|
186
|
-
}
|
|
187
|
-
export declare function buildWorkbenchProjectSourceFiles(input: WorkbenchProjectSourceFilesInput): SurfaceSnapshotFile[];
|
|
188
|
-
export declare function readWorkbenchSpecDockerfilePath(spec: {
|
|
189
|
-
environment: {
|
|
190
|
-
dockerfile?: unknown;
|
|
67
|
+
sample: number;
|
|
68
|
+
}
|
|
69
|
+
export interface WorkbenchCheckResult {
|
|
70
|
+
ok: true;
|
|
71
|
+
status: WorkbenchStatus;
|
|
72
|
+
cases: number;
|
|
73
|
+
skills: number;
|
|
74
|
+
agents: number;
|
|
75
|
+
plan: {
|
|
76
|
+
source: {
|
|
77
|
+
skillFiles: number;
|
|
78
|
+
evalFiles: number;
|
|
79
|
+
caseCount: number;
|
|
80
|
+
smokeCaseCount: number;
|
|
81
|
+
};
|
|
82
|
+
skills: Array<{
|
|
83
|
+
name: string;
|
|
84
|
+
bundleHash: string;
|
|
85
|
+
includedSkillCount: number;
|
|
86
|
+
fileCount: number;
|
|
87
|
+
}>;
|
|
88
|
+
agents: Array<{
|
|
89
|
+
name: string;
|
|
90
|
+
adapter: string;
|
|
91
|
+
model?: string;
|
|
92
|
+
providerBacked: boolean;
|
|
93
|
+
executionMode: "local-command" | "provider-backed";
|
|
94
|
+
network: WorkbenchExecutionSpec["policy"]["network"];
|
|
95
|
+
resources: WorkbenchExecutionSpec["policy"]["resources"];
|
|
96
|
+
image: string;
|
|
97
|
+
auth?: "local-adapter-auth";
|
|
98
|
+
}>;
|
|
99
|
+
readiness: WorkbenchAutomationReadiness;
|
|
191
100
|
};
|
|
192
|
-
}
|
|
193
|
-
export declare function isCandidateSourceFilePath(filePath: string): boolean;
|
|
194
|
-
export declare function filterCandidateSourceFiles(files: readonly SurfaceSnapshotFile[]): SurfaceSnapshotFile[];
|
|
195
|
-
export declare function normalizeSurfaceFiles(files: RemoteWorkbenchFileInput[]): SurfaceSnapshotFile[];
|
|
196
|
-
export declare function filterSurfaceFilesByInclude<T extends {
|
|
197
|
-
path: string;
|
|
198
|
-
}>(files: readonly T[], include: readonly string[] | undefined): T[];
|
|
199
|
-
export declare function summarizeCandidateFiles(files: readonly SurfaceSnapshotFile[], changedPaths?: readonly string[]): CandidateFileSummary[];
|
|
200
|
-
export declare function createCandidateFilePreview(args: {
|
|
201
|
-
files: readonly SurfaceSnapshotFile[];
|
|
202
|
-
path: string;
|
|
203
|
-
view: "diff" | "raw" | "rendered";
|
|
204
|
-
}): CandidateFilePreview;
|
|
205
|
-
export declare function createCaseReview(args: {
|
|
206
|
-
candidate: CandidateRecord;
|
|
207
|
-
caseId: string;
|
|
208
|
-
executions?: CandidateCaseExecutionRef[];
|
|
209
|
-
}): CandidateCaseReview;
|
|
210
|
-
export declare function createWorkbenchRunWorkload(args: {
|
|
211
|
-
job: RemoteWorkbenchJob;
|
|
212
|
-
spec: GenericRunSpec;
|
|
213
|
-
baseFiles: readonly SurfaceSnapshotFile[];
|
|
214
|
-
engineResolveFiles: readonly SurfaceSnapshotFile[];
|
|
215
|
-
engineCases: readonly WorkbenchEngineCase[];
|
|
216
|
-
traceFiles?: readonly SurfaceSnapshotFile[];
|
|
217
|
-
}): WorkbenchRunWorkload;
|
|
101
|
+
}
|
|
218
102
|
export interface WorkbenchExecutionJobOptions {
|
|
219
103
|
sandboxBackend: string;
|
|
220
104
|
loadLocalAdapterAuthProfiles?: boolean;
|
|
@@ -222,13 +106,234 @@ export interface WorkbenchExecutionJobOptions {
|
|
|
222
106
|
createSandboxPlaneForBackend?: (backend: string, args: WorkbenchExecutionRuntimeInput, startedAt: string, fileStore: SandboxExecutionFileStore) => SandboxPlane;
|
|
223
107
|
}
|
|
224
108
|
export declare function executeWorkbenchExecutionJob(args: WorkbenchExecutionRuntimeInput, options: WorkbenchExecutionJobOptions): Promise<RemoteWorkbenchJob>;
|
|
225
|
-
export declare function
|
|
109
|
+
export declare function requiredWorkbenchAdapterAuthTargetsForRuntimeInput(args: Pick<WorkbenchExecutionRuntimeInput, "job" | "adapterManifests" | "runtimeControlOperation" | "spec">): WorkbenchAdapterAuthTarget[];
|
|
226
110
|
export declare function workbenchExecutionPurpose(job: RemoteWorkbenchJob): WorkbenchExecutionSpec["purpose"] | null;
|
|
227
|
-
export declare function
|
|
228
|
-
export declare function
|
|
229
|
-
export declare function
|
|
230
|
-
export declare function
|
|
231
|
-
export
|
|
232
|
-
|
|
233
|
-
|
|
111
|
+
export declare function workbenchExecutionExecutorForRuntimeInput(args: Pick<WorkbenchExecutionRuntimeInput, "job" | "adapterManifests" | "runtimeControlOperation">): WorkbenchAdapterOperationExecutor;
|
|
112
|
+
export declare function executeAdapterInCurrentRuntime(args: WorkbenchExecutionRuntimeInput, execution: WorkbenchExecutionSpec, startedAt: string): Promise<RemoteWorkbenchJob>;
|
|
113
|
+
export declare function executeRuntimeControlOperationSequenceInCurrentRuntime(args: WorkbenchExecutionRuntimeInput, execution: WorkbenchExecutionSpec, startedAt: string): Promise<RemoteWorkbenchJob>;
|
|
114
|
+
export declare function isWorkbenchInternalOutputPath(filePath: string): boolean;
|
|
115
|
+
export interface WorkbenchImproveOptions extends WorkbenchCommandOptions {
|
|
116
|
+
version?: string;
|
|
117
|
+
skill?: string;
|
|
118
|
+
agent?: string;
|
|
119
|
+
budget?: number;
|
|
120
|
+
samples?: number;
|
|
121
|
+
parentRunId?: string;
|
|
122
|
+
evidenceTraceIds?: readonly string[];
|
|
123
|
+
}
|
|
124
|
+
export interface WorkbenchImproveResult {
|
|
125
|
+
run: WorkbenchRun;
|
|
126
|
+
version: WorkbenchVersion;
|
|
127
|
+
switched: boolean;
|
|
128
|
+
promoted: boolean;
|
|
129
|
+
promotionReason: string;
|
|
130
|
+
incumbentRunId?: string;
|
|
131
|
+
incumbentScore?: number;
|
|
132
|
+
outputScore?: number;
|
|
133
|
+
}
|
|
134
|
+
export interface WorkbenchCompareOptions extends WorkbenchCommandOptions {
|
|
135
|
+
versions?: string;
|
|
136
|
+
skills?: string;
|
|
137
|
+
agents?: string;
|
|
138
|
+
}
|
|
139
|
+
export interface WorkbenchRemoteOptions extends WorkbenchCommandOptions {
|
|
140
|
+
remote?: string;
|
|
141
|
+
authToken?: string;
|
|
142
|
+
}
|
|
143
|
+
export interface WorkbenchPublishOptions extends WorkbenchCommandOptions {
|
|
144
|
+
version?: string;
|
|
145
|
+
remote?: string;
|
|
146
|
+
visibility?: "private" | "public";
|
|
147
|
+
authToken?: string;
|
|
148
|
+
}
|
|
149
|
+
export interface WorkbenchPublishResult {
|
|
150
|
+
remote: WorkbenchRemote;
|
|
151
|
+
version: WorkbenchVersion;
|
|
152
|
+
visibility: "private" | "public";
|
|
153
|
+
installUrl: string;
|
|
154
|
+
pinnedInstallUrl: string;
|
|
155
|
+
}
|
|
156
|
+
export interface WorkbenchDiffEntry {
|
|
157
|
+
path: string;
|
|
158
|
+
status: "added" | "removed" | "modified";
|
|
159
|
+
before?: string;
|
|
160
|
+
after?: string;
|
|
161
|
+
}
|
|
162
|
+
export interface WorkbenchCaseRecord {
|
|
163
|
+
id: string;
|
|
164
|
+
path: string;
|
|
165
|
+
content: string;
|
|
166
|
+
}
|
|
167
|
+
export interface WorkbenchQueuedSkillEvalJobInput {
|
|
168
|
+
kind: "workbench.skill.eval.job.v1";
|
|
169
|
+
ownerUserId?: string;
|
|
170
|
+
skillId?: string;
|
|
171
|
+
runId: string;
|
|
172
|
+
jobId: string;
|
|
173
|
+
artifactId?: string;
|
|
174
|
+
traceId?: string;
|
|
175
|
+
versionId: string;
|
|
176
|
+
evalHash: string;
|
|
177
|
+
agentName: string;
|
|
178
|
+
caseId: string;
|
|
179
|
+
sample: number;
|
|
180
|
+
state: WorkbenchProjectState;
|
|
181
|
+
adapterAuthProfiles?: readonly WorkbenchAdapterAuthBundle[];
|
|
182
|
+
}
|
|
183
|
+
export interface WorkbenchEvalCaseRuntime extends WorkbenchCaseRecord {
|
|
184
|
+
files: SurfaceSnapshotFile[];
|
|
185
|
+
command?: string;
|
|
186
|
+
smoke?: boolean;
|
|
187
|
+
}
|
|
188
|
+
export interface WorkbenchSkillEvalRuntimeInputArgs {
|
|
189
|
+
ownerUserId: string;
|
|
190
|
+
projectId: string;
|
|
191
|
+
runId: string;
|
|
192
|
+
jobId: string;
|
|
193
|
+
versionId: string;
|
|
194
|
+
evalHash: string;
|
|
195
|
+
evalSnapshot: WorkbenchEvalSnapshot;
|
|
196
|
+
skillName?: string;
|
|
197
|
+
skillBundleHash?: string;
|
|
198
|
+
agent: WorkbenchAgent;
|
|
199
|
+
versionFiles: readonly SurfaceSnapshotFile[];
|
|
200
|
+
runtimeCase: WorkbenchEvalCaseRuntime;
|
|
201
|
+
sample: number;
|
|
202
|
+
createdAt?: string;
|
|
203
|
+
attempt?: number;
|
|
204
|
+
environmentDockerfile?: string;
|
|
205
|
+
environmentImageRef?: string;
|
|
206
|
+
}
|
|
207
|
+
export interface WorkbenchSkillImproveRuntimeInputArgs {
|
|
208
|
+
ownerUserId: string;
|
|
209
|
+
projectId: string;
|
|
210
|
+
runId: string;
|
|
211
|
+
jobId: string;
|
|
212
|
+
baseVersionId: string;
|
|
213
|
+
evalHash: string;
|
|
214
|
+
skillName?: string;
|
|
215
|
+
skillBundleHash?: string;
|
|
216
|
+
agent: WorkbenchAgent;
|
|
217
|
+
baseFiles: readonly SurfaceSnapshotFile[];
|
|
218
|
+
traces: readonly WorkbenchTrace[];
|
|
219
|
+
createdAt?: string;
|
|
220
|
+
attempt?: number;
|
|
221
|
+
environmentDockerfile?: string;
|
|
222
|
+
environmentImageRef?: string;
|
|
223
|
+
}
|
|
224
|
+
export interface WorkbenchSkillImprovementPatchApplication {
|
|
225
|
+
state: WorkbenchProjectState;
|
|
226
|
+
version: WorkbenchVersion;
|
|
227
|
+
created: boolean;
|
|
228
|
+
}
|
|
229
|
+
export declare function initWorkbenchSkill(options?: WorkbenchCommandOptions): Promise<WorkbenchStatus>;
|
|
230
|
+
export declare function workbenchStatus(options?: WorkbenchCommandOptions): Promise<WorkbenchStatus>;
|
|
231
|
+
export declare function checkWorkbenchSkill(options?: WorkbenchCommandOptions): Promise<WorkbenchCheckResult>;
|
|
232
|
+
export declare function listWorkbenchVersions(options?: WorkbenchCommandOptions): Promise<WorkbenchVersion[]>;
|
|
233
|
+
export declare function evalWorkbenchSkill(options?: WorkbenchEvalOptions): Promise<WorkbenchRun[]>;
|
|
234
|
+
export declare function evalWorkbenchProjectState(state: WorkbenchProjectState, options?: WorkbenchStateEvalOptions): Promise<{
|
|
235
|
+
state: WorkbenchProjectState;
|
|
236
|
+
runs: WorkbenchRun[];
|
|
237
|
+
}>;
|
|
238
|
+
export declare function improveWorkbenchProjectState(state: WorkbenchProjectState, options?: WorkbenchStateImproveOptions): Promise<{
|
|
239
|
+
state: WorkbenchProjectState;
|
|
240
|
+
runs: WorkbenchRun[];
|
|
241
|
+
}>;
|
|
242
|
+
export declare function listWorkbenchProjectStateEvalCases(state: WorkbenchProjectState): Promise<WorkbenchCaseRecord[]>;
|
|
243
|
+
export declare function listWorkbenchProjectStateEvalRuntimeCases(state: WorkbenchProjectState, evalHash?: string): Promise<WorkbenchEvalCaseRuntime[]>;
|
|
244
|
+
export declare function createWorkbenchSkillEvalRuntimeInput(args: WorkbenchSkillEvalRuntimeInputArgs): WorkbenchExecutionRuntimeInput;
|
|
245
|
+
export declare function createWorkbenchSkillImproveRuntimeInput(args: WorkbenchSkillImproveRuntimeInputArgs): WorkbenchExecutionRuntimeInput;
|
|
246
|
+
export declare function workbenchImprovementEvidenceFromTraces(traces: readonly WorkbenchTrace[]): string[];
|
|
247
|
+
export declare function workbenchImprovementEvidenceTraces(traces: readonly WorkbenchTrace[]): WorkbenchTrace[];
|
|
248
|
+
export declare function workbenchImprovementEvidenceTracesForVersion(state: WorkbenchProjectState, options: {
|
|
249
|
+
versionId: string;
|
|
250
|
+
skillName: string;
|
|
251
|
+
agent: WorkbenchAgent;
|
|
252
|
+
traceIds?: readonly string[];
|
|
253
|
+
}): WorkbenchTrace[];
|
|
254
|
+
export declare function workbenchSkillImproveCanUseQueuedAdapter(agent: WorkbenchAgent): boolean;
|
|
255
|
+
export declare function workbenchSkillImproveAdapterRequirementMessage(agent: WorkbenchAgent): string;
|
|
256
|
+
export declare function readWorkbenchSkillImprovementPatchFromRemoteJob(remoteJob: RemoteWorkbenchJob): WorkbenchSkillPatch | null;
|
|
257
|
+
export declare function applyWorkbenchSkillImprovementPatch(state: WorkbenchProjectState, args: {
|
|
258
|
+
baseVersionId: string;
|
|
259
|
+
agent: WorkbenchAgent;
|
|
260
|
+
patch: WorkbenchSkillPatch;
|
|
261
|
+
runId?: string;
|
|
262
|
+
createdAt?: string;
|
|
263
|
+
}): WorkbenchSkillImprovementPatchApplication;
|
|
264
|
+
export declare function decideWorkbenchImprovementPromotion(run: WorkbenchRun, incumbentRun: WorkbenchRun | undefined): {
|
|
265
|
+
promoted: boolean;
|
|
266
|
+
reason: string;
|
|
267
|
+
};
|
|
268
|
+
export declare function normalizeWorkbenchSkillEvalEnvironmentDockerfile(source: string | undefined): string | undefined;
|
|
269
|
+
export interface WorkbenchVersionRuntimeSnapshot {
|
|
270
|
+
evalSnapshot: WorkbenchEvalSnapshot;
|
|
271
|
+
cases: WorkbenchEvalCaseRuntime[];
|
|
272
|
+
agents: WorkbenchAgent[];
|
|
273
|
+
selectedAgents: WorkbenchAgent[];
|
|
274
|
+
defaultAgent?: string;
|
|
275
|
+
skillSources: WorkbenchSkillSource[];
|
|
276
|
+
skillBundles: WorkbenchSkillBundleSnapshot[];
|
|
277
|
+
defaultSkill?: string;
|
|
278
|
+
environmentDockerfile?: string;
|
|
279
|
+
}
|
|
280
|
+
export declare function createWorkbenchVersionRuntimeSnapshot(version: WorkbenchVersion, options?: {
|
|
281
|
+
skill?: string;
|
|
282
|
+
agent?: string;
|
|
283
|
+
evalHash?: string;
|
|
284
|
+
authToken?: string;
|
|
285
|
+
}): Promise<WorkbenchVersionRuntimeSnapshot>;
|
|
286
|
+
export declare function executeQueuedWorkbenchSkillEvalJob(input: WorkbenchQueuedSkillEvalJobInput): Promise<{
|
|
287
|
+
run: WorkbenchRun;
|
|
288
|
+
job: WorkbenchJob;
|
|
289
|
+
artifact: WorkbenchArtifact;
|
|
290
|
+
trace: WorkbenchTrace;
|
|
291
|
+
}>;
|
|
292
|
+
export declare function improveWorkbenchSkill(options?: WorkbenchImproveOptions): Promise<WorkbenchImproveResult>;
|
|
293
|
+
export declare function compareWorkbench(options?: WorkbenchCompareOptions): Promise<WorkbenchComparison>;
|
|
294
|
+
export declare function switchWorkbenchVersion(versionRef: string, options?: WorkbenchCommandOptions): Promise<WorkbenchVersion>;
|
|
295
|
+
export declare function diffWorkbenchVersions(range: string, options?: WorkbenchCommandOptions): Promise<WorkbenchDiffEntry[]>;
|
|
296
|
+
export declare function showWorkbenchRef(ref: string, options?: WorkbenchCommandOptions): Promise<unknown>;
|
|
297
|
+
export declare function filesForWorkbenchRef(ref: string, options?: WorkbenchCommandOptions): Promise<SurfaceSnapshotFile[]>;
|
|
298
|
+
export declare function listWorkbenchCases(options?: WorkbenchCommandOptions): Promise<WorkbenchCaseRecord[]>;
|
|
299
|
+
export declare function showWorkbenchCase(caseId: string, options?: WorkbenchCommandOptions): Promise<WorkbenchCaseRecord>;
|
|
300
|
+
export declare function addWorkbenchCase(options?: WorkbenchCommandOptions & {
|
|
301
|
+
fromTraceId?: string;
|
|
302
|
+
}): Promise<WorkbenchCaseRecord>;
|
|
303
|
+
export declare function removeWorkbenchCase(caseId: string, options?: WorkbenchCommandOptions): Promise<{
|
|
304
|
+
removed: string;
|
|
305
|
+
}>;
|
|
306
|
+
export declare function listWorkbenchAgents(options?: WorkbenchCommandOptions): Promise<WorkbenchAgent[]>;
|
|
307
|
+
export declare function addWorkbenchAgent(input: WorkbenchCommandOptions & {
|
|
308
|
+
name: string;
|
|
309
|
+
adapter: string;
|
|
310
|
+
model?: string;
|
|
311
|
+
config?: Record<string, Json>;
|
|
312
|
+
}): Promise<WorkbenchAgent>;
|
|
313
|
+
export declare function removeWorkbenchAgent(name: string, options?: WorkbenchCommandOptions): Promise<{
|
|
314
|
+
removed: string;
|
|
315
|
+
}>;
|
|
316
|
+
export declare function setDefaultWorkbenchAgent(name: string, options?: WorkbenchCommandOptions): Promise<WorkbenchAgent>;
|
|
317
|
+
export declare function addWorkbenchRemote(name: string, url: string, options?: WorkbenchCommandOptions): Promise<WorkbenchRemote>;
|
|
318
|
+
export declare function listWorkbenchRemotes(options?: WorkbenchCommandOptions): Promise<WorkbenchRemote[]>;
|
|
319
|
+
export declare function syncWorkbenchRemote(options?: WorkbenchRemoteOptions): Promise<{
|
|
320
|
+
remote: WorkbenchRemote;
|
|
321
|
+
pushed: number;
|
|
322
|
+
pulled: number;
|
|
323
|
+
}>;
|
|
324
|
+
export declare function publishWorkbenchVersion(options?: WorkbenchPublishOptions): Promise<WorkbenchPublishResult>;
|
|
325
|
+
export declare function createWorkbenchInspectionSnapshot(options?: WorkbenchCommandOptions): Promise<WorkbenchInspectionSnapshot>;
|
|
326
|
+
export declare function exportObjectPack(state: WorkbenchProjectState): WorkbenchObjectPack;
|
|
327
|
+
interface ImportObjectPackOptions {
|
|
328
|
+
refs?: "merge" | "none";
|
|
329
|
+
}
|
|
330
|
+
export declare function importObjectPack(state: WorkbenchProjectState, pack: WorkbenchObjectPack, options?: ImportObjectPackOptions): void;
|
|
331
|
+
export declare function hashJson(value: unknown): string;
|
|
332
|
+
export declare function hashFiles(files: readonly SurfaceSnapshotFile[]): string;
|
|
333
|
+
export declare function readWorkbenchSkillRunOutputScore(output: unknown): number;
|
|
334
|
+
export declare function readWorkbenchSkillRunOutputUsage(output: unknown): UsageSummary | undefined;
|
|
335
|
+
export declare function readWorkbenchSkillTraceResultsCostUsd(results: readonly unknown[]): number | undefined;
|
|
336
|
+
export declare function readWorkbenchSkillUsageCostUsd(usage: UsageSummary | undefined): number | undefined;
|
|
337
|
+
export declare function isDefaultWorkbenchSkillEvalEnvironmentDockerfile(source: string): boolean;
|
|
338
|
+
export declare function automationReadinessForRuns(runs: readonly WorkbenchRun[], jobs: readonly WorkbenchJob[]): WorkbenchAutomationReadiness;
|
|
234
339
|
//# sourceMappingURL=index.d.ts.map
|