@aztec/prover-client 0.66.0 → 0.67.1-devnet
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dest/block_builder/light.d.ts +4 -3
- package/dest/block_builder/light.d.ts.map +1 -1
- package/dest/block_builder/light.js +30 -20
- package/dest/index.d.ts +0 -1
- package/dest/index.d.ts.map +1 -1
- package/dest/index.js +1 -2
- package/dest/mocks/fixtures.d.ts +3 -3
- package/dest/mocks/fixtures.d.ts.map +1 -1
- package/dest/mocks/fixtures.js +2 -2
- package/dest/mocks/test_context.d.ts +10 -9
- package/dest/mocks/test_context.d.ts.map +1 -1
- package/dest/mocks/test_context.js +24 -13
- package/dest/orchestrator/block-building-helpers.d.ts +10 -6
- package/dest/orchestrator/block-building-helpers.d.ts.map +1 -1
- package/dest/orchestrator/block-building-helpers.js +27 -16
- package/dest/orchestrator/block-proving-state.d.ts +6 -5
- package/dest/orchestrator/block-proving-state.d.ts.map +1 -1
- package/dest/orchestrator/block-proving-state.js +16 -8
- package/dest/orchestrator/epoch-proving-state.d.ts +1 -1
- package/dest/orchestrator/epoch-proving-state.d.ts.map +1 -1
- package/dest/orchestrator/epoch-proving-state.js +3 -3
- package/dest/orchestrator/orchestrator.d.ts +11 -8
- package/dest/orchestrator/orchestrator.d.ts.map +1 -1
- package/dest/orchestrator/orchestrator.js +94 -58
- package/dest/orchestrator/orchestrator_metrics.d.ts.map +1 -1
- package/dest/orchestrator/orchestrator_metrics.js +2 -5
- package/dest/prover-agent/memory-proving-queue.d.ts +2 -1
- package/dest/prover-agent/memory-proving-queue.d.ts.map +1 -1
- package/dest/prover-agent/memory-proving-queue.js +241 -224
- package/dest/prover-agent/prover-agent.d.ts +11 -2
- package/dest/prover-agent/prover-agent.d.ts.map +1 -1
- package/dest/prover-agent/prover-agent.js +187 -160
- package/dest/prover-client/prover-client.d.ts +2 -3
- package/dest/prover-client/prover-client.d.ts.map +1 -1
- package/dest/prover-client/prover-client.js +6 -9
- package/dest/proving_broker/broker_prover_facade.d.ts +26 -0
- package/dest/proving_broker/broker_prover_facade.d.ts.map +1 -0
- package/dest/proving_broker/broker_prover_facade.js +107 -0
- package/dest/proving_broker/proving_agent.d.ts +4 -3
- package/dest/proving_broker/proving_agent.d.ts.map +1 -1
- package/dest/proving_broker/proving_agent.js +74 -65
- package/dest/proving_broker/proving_broker.d.ts +27 -7
- package/dest/proving_broker/proving_broker.d.ts.map +1 -1
- package/dest/proving_broker/proving_broker.js +405 -258
- package/dest/proving_broker/proving_broker_database/persisted.d.ts.map +1 -1
- package/dest/proving_broker/proving_broker_database/persisted.js +4 -8
- package/dest/proving_broker/proving_broker_instrumentation.d.ts.map +1 -1
- package/dest/proving_broker/proving_broker_instrumentation.js +2 -8
- package/dest/proving_broker/proving_job_controller.d.ts +2 -1
- package/dest/proving_broker/proving_job_controller.d.ts.map +1 -1
- package/dest/proving_broker/proving_job_controller.js +15 -14
- package/dest/proving_broker/rpc.js +2 -2
- package/dest/test/mock_prover.d.ts +6 -6
- package/dest/test/mock_prover.d.ts.map +1 -1
- package/dest/test/mock_prover.js +5 -5
- package/package.json +18 -13
- package/src/block_builder/light.ts +31 -22
- package/src/index.ts +0 -1
- package/src/mocks/fixtures.ts +4 -4
- package/src/mocks/test_context.ts +39 -24
- package/src/orchestrator/block-building-helpers.ts +33 -20
- package/src/orchestrator/block-proving-state.ts +17 -6
- package/src/orchestrator/epoch-proving-state.ts +0 -2
- package/src/orchestrator/orchestrator.ts +111 -62
- package/src/orchestrator/orchestrator_metrics.ts +1 -11
- package/src/prover-agent/memory-proving-queue.ts +12 -7
- package/src/prover-agent/prover-agent.ts +67 -48
- package/src/prover-client/prover-client.ts +5 -12
- package/src/proving_broker/{caching_broker_facade.ts → broker_prover_facade.ts} +62 -85
- package/src/proving_broker/proving_agent.ts +74 -78
- package/src/proving_broker/proving_broker.ts +240 -73
- package/src/proving_broker/proving_broker_database/persisted.ts +2 -8
- package/src/proving_broker/proving_broker_instrumentation.ts +0 -7
- package/src/proving_broker/proving_job_controller.ts +13 -12
- package/src/proving_broker/rpc.ts +1 -1
- package/src/test/mock_prover.ts +7 -3
- package/dest/proving_broker/caching_broker_facade.d.ts +0 -30
- package/dest/proving_broker/caching_broker_facade.d.ts.map +0 -1
- package/dest/proving_broker/caching_broker_facade.js +0 -150
- package/dest/proving_broker/prover_cache/memory.d.ts +0 -9
- package/dest/proving_broker/prover_cache/memory.d.ts.map +0 -1
- package/dest/proving_broker/prover_cache/memory.js +0 -16
- package/src/proving_broker/prover_cache/memory.ts +0 -20
|
@@ -1,284 +1,433 @@
|
|
|
1
|
+
import { __esDecorate, __runInitializers } from "tslib";
|
|
1
2
|
import { ProvingRequestType, } from '@aztec/circuit-types';
|
|
2
|
-
import {
|
|
3
|
+
import { asyncPool } from '@aztec/foundation/async-pool';
|
|
4
|
+
import { createLogger } from '@aztec/foundation/log';
|
|
3
5
|
import { RunningPromise, promiseWithResolvers } from '@aztec/foundation/promise';
|
|
4
6
|
import { PriorityMemoryQueue } from '@aztec/foundation/queue';
|
|
5
7
|
import { Timer } from '@aztec/foundation/timer';
|
|
8
|
+
import { trackSpan } from '@aztec/telemetry-client';
|
|
6
9
|
import assert from 'assert';
|
|
7
10
|
import { ProvingBrokerInstrumentation } from './proving_broker_instrumentation.js';
|
|
8
11
|
/**
|
|
9
12
|
* A broker that manages proof requests and distributes them to workers based on their priority.
|
|
10
13
|
* It takes a backend that is responsible for storing and retrieving proof requests and results.
|
|
11
14
|
*/
|
|
12
|
-
|
|
13
|
-
|
|
14
|
-
|
|
15
|
-
|
|
16
|
-
|
|
17
|
-
|
|
18
|
-
|
|
19
|
-
|
|
20
|
-
|
|
21
|
-
|
|
22
|
-
|
|
23
|
-
|
|
24
|
-
|
|
25
|
-
|
|
26
|
-
|
|
27
|
-
|
|
28
|
-
|
|
29
|
-
|
|
30
|
-
|
|
31
|
-
|
|
32
|
-
|
|
33
|
-
|
|
34
|
-
|
|
35
|
-
|
|
36
|
-
|
|
37
|
-
|
|
38
|
-
|
|
39
|
-
|
|
40
|
-
|
|
41
|
-
|
|
42
|
-
|
|
43
|
-
|
|
44
|
-
|
|
45
|
-
|
|
46
|
-
|
|
47
|
-
|
|
48
|
-
|
|
49
|
-
|
|
50
|
-
|
|
51
|
-
|
|
52
|
-
|
|
53
|
-
|
|
54
|
-
|
|
55
|
-
|
|
15
|
+
let ProvingBroker = (() => {
|
|
16
|
+
var _a;
|
|
17
|
+
let _instanceExtraInitializers = [];
|
|
18
|
+
let _cleanupPass_decorators;
|
|
19
|
+
return _a = class ProvingBroker {
|
|
20
|
+
constructor(database, client, { jobTimeoutMs = 30000, timeoutIntervalMs = 10000, maxRetries = 3, maxEpochsToKeepResultsFor = 1, maxParallelCleanUps = 20, } = {}, logger = createLogger('prover-client:proving-broker')) {
|
|
21
|
+
this.database = (__runInitializers(this, _instanceExtraInitializers), database);
|
|
22
|
+
this.logger = logger;
|
|
23
|
+
this.queues = {
|
|
24
|
+
[ProvingRequestType.PUBLIC_VM]: new PriorityMemoryQueue(provingJobComparator),
|
|
25
|
+
[ProvingRequestType.TUBE_PROOF]: new PriorityMemoryQueue(provingJobComparator),
|
|
26
|
+
[ProvingRequestType.PRIVATE_KERNEL_EMPTY]: new PriorityMemoryQueue(provingJobComparator),
|
|
27
|
+
[ProvingRequestType.PRIVATE_BASE_ROLLUP]: new PriorityMemoryQueue(provingJobComparator),
|
|
28
|
+
[ProvingRequestType.PUBLIC_BASE_ROLLUP]: new PriorityMemoryQueue(provingJobComparator),
|
|
29
|
+
[ProvingRequestType.MERGE_ROLLUP]: new PriorityMemoryQueue(provingJobComparator),
|
|
30
|
+
[ProvingRequestType.ROOT_ROLLUP]: new PriorityMemoryQueue(provingJobComparator),
|
|
31
|
+
[ProvingRequestType.BLOCK_MERGE_ROLLUP]: new PriorityMemoryQueue(provingJobComparator),
|
|
32
|
+
[ProvingRequestType.BLOCK_ROOT_ROLLUP]: new PriorityMemoryQueue(provingJobComparator),
|
|
33
|
+
[ProvingRequestType.EMPTY_BLOCK_ROOT_ROLLUP]: new PriorityMemoryQueue(provingJobComparator),
|
|
34
|
+
[ProvingRequestType.BASE_PARITY]: new PriorityMemoryQueue(provingJobComparator),
|
|
35
|
+
[ProvingRequestType.ROOT_PARITY]: new PriorityMemoryQueue(provingJobComparator),
|
|
36
|
+
};
|
|
37
|
+
// holds a copy of the database in memory in order to quickly fulfill requests
|
|
38
|
+
// this is fine because this broker is the only one that can modify the database
|
|
39
|
+
this.jobsCache = new Map();
|
|
40
|
+
// as above, but for results
|
|
41
|
+
this.resultsCache = new Map();
|
|
42
|
+
// tracks when each job was enqueued
|
|
43
|
+
this.enqueuedAt = new Map();
|
|
44
|
+
// keeps track of which jobs are currently being processed
|
|
45
|
+
// in the event of a crash this information is lost, but that's ok
|
|
46
|
+
// the next time the broker starts it will recreate jobsCache and still
|
|
47
|
+
// accept results from the workers
|
|
48
|
+
this.inProgress = new Map();
|
|
49
|
+
// keep track of which proving job has been retried
|
|
50
|
+
this.retries = new Map();
|
|
51
|
+
// a map of promises that will be resolved when a job is settled
|
|
52
|
+
this.promises = new Map();
|
|
53
|
+
this.msTimeSource = () => Date.now();
|
|
54
|
+
/**
|
|
55
|
+
* The broker keeps track of the highest epoch it has seen.
|
|
56
|
+
* This information is used for garbage collection: once it reaches the next epoch, it can start pruning the database of old state.
|
|
57
|
+
* This clean up pass is only done against _settled_ jobs. This pass will not cancel jobs that are in-progress or in-queue.
|
|
58
|
+
* It is a client responsibility to cancel jobs if they are no longer necessary.
|
|
59
|
+
* Example:
|
|
60
|
+
* proving epoch 11 - the broker will wipe all settled jobs for epochs 9 and lower
|
|
61
|
+
* finished proving epoch 11 and got first job for epoch 12 -> the broker will wipe all settled jobs for epochs 10 and lower
|
|
62
|
+
* reorged back to end of epoch 10 -> epoch 11 is skipped and epoch 12 starts -> the broker will wipe all settled jobs for epochs 10 and lower
|
|
63
|
+
*/
|
|
64
|
+
this.epochHeight = 0;
|
|
65
|
+
this.maxEpochsToKeepResultsFor = 1;
|
|
66
|
+
this.measureQueueDepth = (type) => {
|
|
67
|
+
return this.queues[type].length();
|
|
68
|
+
};
|
|
69
|
+
this.countActiveJobs = (type) => {
|
|
70
|
+
let count = 0;
|
|
71
|
+
for (const { id } of this.inProgress.values()) {
|
|
72
|
+
const job = this.jobsCache.get(id);
|
|
73
|
+
if (job?.type === type) {
|
|
74
|
+
count++;
|
|
75
|
+
}
|
|
76
|
+
}
|
|
77
|
+
return count;
|
|
78
|
+
};
|
|
79
|
+
this.tracer = client.getTracer('ProvingBroker');
|
|
80
|
+
this.instrumentation = new ProvingBrokerInstrumentation(client);
|
|
81
|
+
this.cleanupPromise = new RunningPromise(this.cleanupPass.bind(this), this.logger, timeoutIntervalMs);
|
|
82
|
+
this.jobTimeoutMs = jobTimeoutMs;
|
|
83
|
+
this.maxRetries = maxRetries;
|
|
84
|
+
this.maxEpochsToKeepResultsFor = maxEpochsToKeepResultsFor;
|
|
85
|
+
this.maxParallelCleanUps = maxParallelCleanUps;
|
|
86
|
+
}
|
|
87
|
+
start() {
|
|
88
|
+
for (const [item, result] of this.database.allProvingJobs()) {
|
|
89
|
+
this.logger.info(`Restoring proving job id=${item.id} settled=${!!result}`, {
|
|
90
|
+
provingJobId: item.id,
|
|
91
|
+
status: result ? result.status : 'pending',
|
|
92
|
+
});
|
|
93
|
+
this.jobsCache.set(item.id, item);
|
|
94
|
+
this.promises.set(item.id, promiseWithResolvers());
|
|
95
|
+
if (result) {
|
|
96
|
+
this.promises.get(item.id).resolve(result);
|
|
97
|
+
this.resultsCache.set(item.id, result);
|
|
98
|
+
}
|
|
99
|
+
else {
|
|
100
|
+
this.enqueueJobInternal(item);
|
|
101
|
+
}
|
|
56
102
|
}
|
|
103
|
+
this.cleanupPromise.start();
|
|
104
|
+
this.instrumentation.monitorQueueDepth(this.measureQueueDepth);
|
|
105
|
+
this.instrumentation.monitorActiveJobs(this.countActiveJobs);
|
|
106
|
+
return Promise.resolve();
|
|
57
107
|
}
|
|
58
|
-
|
|
59
|
-
|
|
60
|
-
|
|
61
|
-
|
|
62
|
-
|
|
108
|
+
async stop() {
|
|
109
|
+
await this.cleanupPromise.stop();
|
|
110
|
+
}
|
|
111
|
+
async enqueueProvingJob(job) {
|
|
112
|
+
if (this.jobsCache.has(job.id)) {
|
|
113
|
+
const existing = this.jobsCache.get(job.id);
|
|
114
|
+
assert.deepStrictEqual(job, existing, 'Duplicate proving job ID');
|
|
115
|
+
this.logger.debug(`Duplicate proving job id=${job.id} epochNumber=${job.epochNumber}. Ignoring`, {
|
|
116
|
+
provingJobId: job.id,
|
|
117
|
+
});
|
|
118
|
+
return;
|
|
119
|
+
}
|
|
120
|
+
if (this.isJobStale(job)) {
|
|
121
|
+
this.logger.warn(`Tried enqueueing stale proving job id=${job.id} epochNumber=${job.epochNumber}`, {
|
|
122
|
+
provingJobId: job.id,
|
|
123
|
+
});
|
|
124
|
+
throw new Error(`Epoch too old: job epoch ${job.epochNumber}, current epoch: ${this.epochHeight}`);
|
|
125
|
+
}
|
|
126
|
+
this.logger.info(`New proving job id=${job.id} epochNumber=${job.epochNumber}`, { provingJobId: job.id });
|
|
127
|
+
try {
|
|
128
|
+
// do this first so it acts as a "lock". If this job is enqueued again while we're saving it the if at the top will catch it.
|
|
129
|
+
this.jobsCache.set(job.id, job);
|
|
130
|
+
await this.database.addProvingJob(job);
|
|
131
|
+
this.enqueueJobInternal(job);
|
|
132
|
+
}
|
|
133
|
+
catch (err) {
|
|
134
|
+
this.logger.error(`Failed to save proving job id=${job.id}: ${err}`, err, { provingJobId: job.id });
|
|
135
|
+
this.jobsCache.delete(job.id);
|
|
136
|
+
throw err;
|
|
137
|
+
}
|
|
138
|
+
}
|
|
139
|
+
waitForJobToSettle(id) {
|
|
140
|
+
const promiseWithResolvers = this.promises.get(id);
|
|
141
|
+
if (!promiseWithResolvers) {
|
|
142
|
+
this.logger.warn(`Job id=${id} not found`, { provingJobId: id });
|
|
143
|
+
return Promise.resolve({ status: 'rejected', reason: `Job ${id} not found` });
|
|
144
|
+
}
|
|
145
|
+
return promiseWithResolvers.promise;
|
|
146
|
+
}
|
|
147
|
+
async cancelProvingJob(id) {
|
|
148
|
+
if (!this.jobsCache.has(id)) {
|
|
149
|
+
this.logger.warn(`Can't cancel a job that doesn't exist id=${id}`, { provingJobId: id });
|
|
150
|
+
return;
|
|
151
|
+
}
|
|
152
|
+
// notify listeners of the cancellation
|
|
153
|
+
if (!this.resultsCache.has(id)) {
|
|
154
|
+
this.logger.info(`Cancelling job id=${id}`, { provingJobId: id });
|
|
155
|
+
await this.reportProvingJobError(id, 'Aborted', false);
|
|
156
|
+
}
|
|
157
|
+
}
|
|
158
|
+
async cleanUpProvingJobState(id) {
|
|
159
|
+
if (!this.jobsCache.has(id)) {
|
|
160
|
+
this.logger.warn(`Can't clean up a job that doesn't exist id=${id}`, { provingJobId: id });
|
|
161
|
+
return;
|
|
162
|
+
}
|
|
163
|
+
if (!this.resultsCache.has(id)) {
|
|
164
|
+
this.logger.warn(`Can't cleanup busy proving job: id=${id}`, { provingJobId: id });
|
|
165
|
+
return;
|
|
166
|
+
}
|
|
167
|
+
this.logger.debug(`Cleaning up state for job id=${id}`, { provingJobId: id });
|
|
168
|
+
await this.database.deleteProvingJobAndResult(id);
|
|
169
|
+
this.jobsCache.delete(id);
|
|
170
|
+
this.promises.delete(id);
|
|
171
|
+
this.resultsCache.delete(id);
|
|
172
|
+
this.inProgress.delete(id);
|
|
173
|
+
this.retries.delete(id);
|
|
174
|
+
}
|
|
175
|
+
getProvingJobStatus(id) {
|
|
176
|
+
const result = this.resultsCache.get(id);
|
|
177
|
+
if (result) {
|
|
178
|
+
return Promise.resolve(result);
|
|
179
|
+
}
|
|
180
|
+
else {
|
|
181
|
+
// no result yet, check if we know the item
|
|
182
|
+
const item = this.jobsCache.get(id);
|
|
183
|
+
if (!item) {
|
|
184
|
+
this.logger.warn(`Proving job id=${id} not found`, { provingJobId: id });
|
|
185
|
+
return Promise.resolve({ status: 'not-found' });
|
|
186
|
+
}
|
|
187
|
+
return Promise.resolve({ status: this.inProgress.has(id) ? 'in-progress' : 'in-queue' });
|
|
188
|
+
}
|
|
189
|
+
}
|
|
190
|
+
// eslint-disable-next-line require-await
|
|
191
|
+
async getProvingJob(filter = { allowList: [] }) {
|
|
192
|
+
const allowedProofs = Array.isArray(filter.allowList) && filter.allowList.length > 0
|
|
193
|
+
? [...filter.allowList]
|
|
194
|
+
: Object.values(ProvingRequestType).filter((x) => typeof x === 'number');
|
|
195
|
+
allowedProofs.sort(proofTypeComparator);
|
|
196
|
+
for (const proofType of allowedProofs) {
|
|
197
|
+
const queue = this.queues[proofType];
|
|
198
|
+
let enqueuedJob;
|
|
199
|
+
// exhaust the queue and make sure we're not sending a job that's already in progress
|
|
200
|
+
// or has already been completed
|
|
201
|
+
// this can happen if the broker crashes and restarts
|
|
202
|
+
// it's possible agents will report progress or results for jobs that are in the queue (after the restart)
|
|
203
|
+
while ((enqueuedJob = queue.getImmediate())) {
|
|
204
|
+
const job = this.jobsCache.get(enqueuedJob.id);
|
|
205
|
+
if (job && !this.inProgress.has(enqueuedJob.id) && !this.resultsCache.has(enqueuedJob.id)) {
|
|
206
|
+
const time = this.msTimeSource();
|
|
207
|
+
this.inProgress.set(job.id, {
|
|
208
|
+
id: job.id,
|
|
209
|
+
startedAt: time,
|
|
210
|
+
lastUpdatedAt: time,
|
|
211
|
+
});
|
|
212
|
+
const enqueuedAt = this.enqueuedAt.get(job.id);
|
|
213
|
+
if (enqueuedAt) {
|
|
214
|
+
this.instrumentation.recordJobWait(job.type, enqueuedAt);
|
|
215
|
+
}
|
|
216
|
+
return { job, time };
|
|
217
|
+
}
|
|
218
|
+
}
|
|
219
|
+
}
|
|
220
|
+
return undefined;
|
|
221
|
+
}
|
|
222
|
+
async reportProvingJobError(id, err, retry = false) {
|
|
223
|
+
const info = this.inProgress.get(id);
|
|
63
224
|
const item = this.jobsCache.get(id);
|
|
225
|
+
const retries = this.retries.get(id) ?? 0;
|
|
64
226
|
if (!item) {
|
|
65
|
-
this.logger.warn(`
|
|
66
|
-
|
|
67
|
-
|
|
227
|
+
this.logger.warn(`Can't set error on unknown proving job id=${id} err=${err}`, { provingJoId: id });
|
|
228
|
+
return;
|
|
229
|
+
}
|
|
230
|
+
if (!info) {
|
|
231
|
+
this.logger.warn(`Proving job id=${id} type=${ProvingRequestType[item.type]} not in the in-progress set`, {
|
|
232
|
+
provingJobId: id,
|
|
233
|
+
});
|
|
68
234
|
}
|
|
69
|
-
|
|
70
|
-
if (msSinceLastUpdate >= this.jobTimeoutMs) {
|
|
71
|
-
this.logger.warn(`Proving job id=${id} timed out. Adding it back to the queue.`);
|
|
235
|
+
else {
|
|
72
236
|
this.inProgress.delete(id);
|
|
237
|
+
}
|
|
238
|
+
if (this.resultsCache.has(id)) {
|
|
239
|
+
this.logger.warn(`Proving job id=${id} is already settled, ignoring err=${err}`, {
|
|
240
|
+
provingJobId: id,
|
|
241
|
+
});
|
|
242
|
+
return;
|
|
243
|
+
}
|
|
244
|
+
if (retry && retries + 1 < this.maxRetries && !this.isJobStale(item)) {
|
|
245
|
+
this.logger.info(`Retrying proving job id=${id} type=${ProvingRequestType[item.type]} retry=${retries + 1} err=${err}`, {
|
|
246
|
+
provingJobId: id,
|
|
247
|
+
});
|
|
248
|
+
this.retries.set(id, retries + 1);
|
|
73
249
|
this.enqueueJobInternal(item);
|
|
74
|
-
this.instrumentation.
|
|
250
|
+
this.instrumentation.incRetriedJobs(item.type);
|
|
251
|
+
return;
|
|
252
|
+
}
|
|
253
|
+
this.logger.info(`Marking proving job as failed id=${id} type=${ProvingRequestType[item.type]} totalAttempts=${retries + 1} err=${err}`, {
|
|
254
|
+
provingJobId: id,
|
|
255
|
+
});
|
|
256
|
+
// save the result to the cache and notify clients of the job status
|
|
257
|
+
// this should work even if our database breaks because the result is cached in memory
|
|
258
|
+
const result = { status: 'rejected', reason: String(err) };
|
|
259
|
+
this.resultsCache.set(id, result);
|
|
260
|
+
this.promises.get(id).resolve(result);
|
|
261
|
+
this.instrumentation.incRejectedJobs(item.type);
|
|
262
|
+
if (info) {
|
|
263
|
+
const duration = this.msTimeSource() - info.startedAt;
|
|
264
|
+
this.instrumentation.recordJobDuration(item.type, duration);
|
|
265
|
+
}
|
|
266
|
+
try {
|
|
267
|
+
await this.database.setProvingJobError(id, err);
|
|
268
|
+
}
|
|
269
|
+
catch (saveErr) {
|
|
270
|
+
this.logger.error(`Failed to save proving job error status id=${id} jobErr=${err}`, saveErr, {
|
|
271
|
+
provingJobId: id,
|
|
272
|
+
});
|
|
273
|
+
throw saveErr;
|
|
75
274
|
}
|
|
76
275
|
}
|
|
77
|
-
|
|
78
|
-
|
|
79
|
-
|
|
80
|
-
|
|
81
|
-
|
|
82
|
-
|
|
83
|
-
|
|
84
|
-
|
|
85
|
-
|
|
86
|
-
|
|
87
|
-
|
|
88
|
-
|
|
89
|
-
|
|
90
|
-
|
|
276
|
+
reportProvingJobProgress(id, startedAt, filter) {
|
|
277
|
+
const job = this.jobsCache.get(id);
|
|
278
|
+
if (!job) {
|
|
279
|
+
this.logger.warn(`Proving job id=${id} does not exist`, { provingJobId: id });
|
|
280
|
+
return filter ? this.getProvingJob(filter) : Promise.resolve(undefined);
|
|
281
|
+
}
|
|
282
|
+
if (this.resultsCache.has(id)) {
|
|
283
|
+
this.logger.warn(`Proving job id=${id} has already been completed`, { provingJobId: id });
|
|
284
|
+
return filter ? this.getProvingJob(filter) : Promise.resolve(undefined);
|
|
285
|
+
}
|
|
286
|
+
const metadata = this.inProgress.get(id);
|
|
287
|
+
const now = this.msTimeSource();
|
|
288
|
+
if (!metadata) {
|
|
289
|
+
this.logger.warn(`Proving job id=${id} type=${ProvingRequestType[job.type]} not found in the in-progress cache, adding it`, { provingJobId: id });
|
|
290
|
+
// the queue will still contain the item at this point!
|
|
291
|
+
// we need to be careful when popping off the queue to make sure we're not sending
|
|
292
|
+
// a job that's already in progress
|
|
293
|
+
this.inProgress.set(id, {
|
|
294
|
+
id,
|
|
295
|
+
startedAt,
|
|
296
|
+
lastUpdatedAt: this.msTimeSource(),
|
|
297
|
+
});
|
|
298
|
+
return Promise.resolve(undefined);
|
|
299
|
+
}
|
|
300
|
+
else if (startedAt <= metadata.startedAt) {
|
|
301
|
+
if (startedAt < metadata.startedAt) {
|
|
302
|
+
this.logger.info(`Proving job id=${id} type=${ProvingRequestType[job.type]} startedAt=${startedAt} older agent has taken job`, { provingJobId: id });
|
|
303
|
+
}
|
|
304
|
+
else {
|
|
305
|
+
this.logger.debug(`Proving job id=${id} type=${ProvingRequestType[job.type]} heartbeat`, { provingJobId: id });
|
|
306
|
+
}
|
|
307
|
+
metadata.startedAt = startedAt;
|
|
308
|
+
metadata.lastUpdatedAt = now;
|
|
309
|
+
return Promise.resolve(undefined);
|
|
310
|
+
}
|
|
311
|
+
else if (filter) {
|
|
312
|
+
this.logger.warn(`Proving job id=${id} type=${ProvingRequestType[job.type]} already being worked on by another agent. Sending new one`, { provingJobId: id });
|
|
313
|
+
return this.getProvingJob(filter);
|
|
314
|
+
}
|
|
315
|
+
else {
|
|
316
|
+
return Promise.resolve(undefined);
|
|
317
|
+
}
|
|
91
318
|
}
|
|
92
|
-
|
|
93
|
-
this.
|
|
94
|
-
this.
|
|
319
|
+
async reportProvingJobSuccess(id, value) {
|
|
320
|
+
const info = this.inProgress.get(id);
|
|
321
|
+
const item = this.jobsCache.get(id);
|
|
322
|
+
const retries = this.retries.get(id) ?? 0;
|
|
323
|
+
if (!item) {
|
|
324
|
+
this.logger.warn(`Proving job id=${id} not found`, { provingJobId: id });
|
|
325
|
+
return;
|
|
326
|
+
}
|
|
327
|
+
if (!info) {
|
|
328
|
+
this.logger.warn(`Proving job id=${id} type=${ProvingRequestType[item.type]} not in the in-progress set`, {
|
|
329
|
+
provingJobId: id,
|
|
330
|
+
});
|
|
331
|
+
}
|
|
332
|
+
else {
|
|
333
|
+
this.inProgress.delete(id);
|
|
334
|
+
}
|
|
335
|
+
if (this.resultsCache.has(id)) {
|
|
336
|
+
this.logger.warn(`Proving job id=${id} already settled, ignoring result`, { provingJobId: id });
|
|
337
|
+
return;
|
|
338
|
+
}
|
|
339
|
+
this.logger.info(`Proving job complete id=${id} type=${ProvingRequestType[item.type]} totalAttempts=${retries + 1}`, { provingJobId: id });
|
|
340
|
+
// save result to our local cache and notify clients
|
|
341
|
+
// if save to database fails, that's ok because we have the result in memory
|
|
342
|
+
// if the broker crashes and needs the result again, we're covered because we can just recompute it
|
|
343
|
+
const result = { status: 'fulfilled', value };
|
|
344
|
+
this.resultsCache.set(id, result);
|
|
345
|
+
this.promises.get(id).resolve(result);
|
|
346
|
+
this.instrumentation.incResolvedJobs(item.type);
|
|
347
|
+
if (info) {
|
|
348
|
+
const duration = this.msTimeSource() - info.startedAt;
|
|
349
|
+
this.instrumentation.recordJobDuration(item.type, duration);
|
|
350
|
+
}
|
|
351
|
+
try {
|
|
352
|
+
await this.database.setProvingJobResult(id, value);
|
|
353
|
+
}
|
|
354
|
+
catch (saveErr) {
|
|
355
|
+
this.logger.error(`Failed to save proving job result id=${id}`, saveErr, {
|
|
356
|
+
provingJobId: id,
|
|
357
|
+
});
|
|
358
|
+
throw saveErr;
|
|
359
|
+
}
|
|
95
360
|
}
|
|
96
|
-
|
|
97
|
-
|
|
98
|
-
|
|
99
|
-
this.instrumentation.monitorActiveJobs(this.countActiveJobs);
|
|
100
|
-
return Promise.resolve();
|
|
101
|
-
}
|
|
102
|
-
stop() {
|
|
103
|
-
return this.timeoutPromise.stop();
|
|
104
|
-
}
|
|
105
|
-
async enqueueProvingJob(job) {
|
|
106
|
-
if (this.jobsCache.has(job.id)) {
|
|
107
|
-
const existing = this.jobsCache.get(job.id);
|
|
108
|
-
assert.deepStrictEqual(job, existing, 'Duplicate proving job ID');
|
|
109
|
-
return;
|
|
110
|
-
}
|
|
111
|
-
await this.database.addProvingJob(job);
|
|
112
|
-
this.jobsCache.set(job.id, job);
|
|
113
|
-
this.enqueueJobInternal(job);
|
|
114
|
-
}
|
|
115
|
-
waitForJobToSettle(id) {
|
|
116
|
-
const promiseWithResolvers = this.promises.get(id);
|
|
117
|
-
if (!promiseWithResolvers) {
|
|
118
|
-
return Promise.resolve({ status: 'rejected', reason: `Job ${id} not found` });
|
|
119
|
-
}
|
|
120
|
-
return promiseWithResolvers.promise;
|
|
121
|
-
}
|
|
122
|
-
async removeAndCancelProvingJob(id) {
|
|
123
|
-
this.logger.info(`Cancelling job id=${id}`);
|
|
124
|
-
await this.database.deleteProvingJobAndResult(id);
|
|
125
|
-
// notify listeners of the cancellation
|
|
126
|
-
if (!this.resultsCache.has(id)) {
|
|
127
|
-
this.promises.get(id)?.resolve({ status: 'rejected', reason: 'Aborted' });
|
|
128
|
-
}
|
|
129
|
-
this.jobsCache.delete(id);
|
|
130
|
-
this.promises.delete(id);
|
|
131
|
-
this.resultsCache.delete(id);
|
|
132
|
-
this.inProgress.delete(id);
|
|
133
|
-
this.retries.delete(id);
|
|
134
|
-
}
|
|
135
|
-
getProvingJobStatus(id) {
|
|
136
|
-
const result = this.resultsCache.get(id);
|
|
137
|
-
if (result) {
|
|
138
|
-
return Promise.resolve(result);
|
|
139
|
-
}
|
|
140
|
-
else {
|
|
141
|
-
// no result yet, check if we know the item
|
|
142
|
-
const item = this.jobsCache.get(id);
|
|
143
|
-
if (!item) {
|
|
144
|
-
this.logger.warn(`Proving job id=${id} not found`);
|
|
145
|
-
return Promise.resolve({ status: 'not-found' });
|
|
361
|
+
async cleanupPass() {
|
|
362
|
+
await this.cleanupStaleJobs();
|
|
363
|
+
await this.reEnqueueExpiredJobs();
|
|
146
364
|
}
|
|
147
|
-
|
|
148
|
-
|
|
149
|
-
|
|
150
|
-
|
|
151
|
-
|
|
152
|
-
|
|
153
|
-
|
|
154
|
-
|
|
155
|
-
|
|
156
|
-
|
|
157
|
-
|
|
158
|
-
|
|
159
|
-
|
|
160
|
-
|
|
161
|
-
// this can happen if the broker crashes and restarts
|
|
162
|
-
// it's possible agents will report progress or results for jobs that are in the queue (after the restart)
|
|
163
|
-
while ((job = queue.getImmediate())) {
|
|
164
|
-
if (!this.inProgress.has(job.id) && !this.resultsCache.has(job.id)) {
|
|
165
|
-
const time = this.timeSource();
|
|
166
|
-
this.inProgress.set(job.id, {
|
|
167
|
-
id: job.id,
|
|
168
|
-
startedAt: time,
|
|
169
|
-
lastUpdatedAt: time,
|
|
365
|
+
async cleanupStaleJobs() {
|
|
366
|
+
const jobIds = Array.from(this.jobsCache.keys());
|
|
367
|
+
const jobsToClean = [];
|
|
368
|
+
for (const id of jobIds) {
|
|
369
|
+
const job = this.jobsCache.get(id);
|
|
370
|
+
const isComplete = this.resultsCache.has(id);
|
|
371
|
+
if (isComplete && this.isJobStale(job)) {
|
|
372
|
+
jobsToClean.push(id);
|
|
373
|
+
}
|
|
374
|
+
}
|
|
375
|
+
if (jobsToClean.length > 0) {
|
|
376
|
+
this.logger.info(`Cleaning up jobs=${jobsToClean.length}`);
|
|
377
|
+
await asyncPool(this.maxParallelCleanUps, jobsToClean, async (jobId) => {
|
|
378
|
+
await this.cleanUpProvingJobState(jobId);
|
|
170
379
|
});
|
|
171
|
-
|
|
172
|
-
|
|
173
|
-
|
|
380
|
+
}
|
|
381
|
+
}
|
|
382
|
+
async reEnqueueExpiredJobs() {
|
|
383
|
+
const inProgressEntries = Array.from(this.inProgress.entries());
|
|
384
|
+
for (const [id, metadata] of inProgressEntries) {
|
|
385
|
+
const item = this.jobsCache.get(id);
|
|
386
|
+
if (!item) {
|
|
387
|
+
this.logger.warn(`Proving job id=${id} not found. Removing it from the queue.`, { provingJobId: id });
|
|
388
|
+
this.inProgress.delete(id);
|
|
389
|
+
continue;
|
|
390
|
+
}
|
|
391
|
+
const now = this.msTimeSource();
|
|
392
|
+
const msSinceLastUpdate = now - metadata.lastUpdatedAt;
|
|
393
|
+
if (msSinceLastUpdate >= this.jobTimeoutMs) {
|
|
394
|
+
if (this.isJobStale(item)) {
|
|
395
|
+
// the job has timed out and it's also old, just cancel and move on
|
|
396
|
+
await this.cancelProvingJob(item.id);
|
|
397
|
+
}
|
|
398
|
+
else {
|
|
399
|
+
this.logger.warn(`Proving job id=${id} timed out. Adding it back to the queue.`, { provingJobId: id });
|
|
400
|
+
this.inProgress.delete(id);
|
|
401
|
+
this.enqueueJobInternal(item);
|
|
402
|
+
this.instrumentation.incTimedOutJobs(item.type);
|
|
403
|
+
}
|
|
174
404
|
}
|
|
175
|
-
return { job, time };
|
|
176
405
|
}
|
|
177
406
|
}
|
|
178
|
-
|
|
179
|
-
|
|
180
|
-
|
|
181
|
-
|
|
182
|
-
|
|
183
|
-
|
|
184
|
-
|
|
185
|
-
|
|
186
|
-
|
|
187
|
-
|
|
188
|
-
}
|
|
189
|
-
if (!info) {
|
|
190
|
-
this.logger.warn(`Proving job id=${id} type=${ProvingRequestType[item.type]} not in the in-progress set`);
|
|
191
|
-
}
|
|
192
|
-
else {
|
|
193
|
-
this.inProgress.delete(id);
|
|
194
|
-
}
|
|
195
|
-
if (retry && retries + 1 < this.maxRetries) {
|
|
196
|
-
this.logger.info(`Retrying proving job id=${id} type=${ProvingRequestType[item.type]} retry=${retries + 1}`);
|
|
197
|
-
this.retries.set(id, retries + 1);
|
|
198
|
-
this.enqueueJobInternal(item);
|
|
199
|
-
this.instrumentation.incRetriedJobs(item.type);
|
|
200
|
-
return;
|
|
201
|
-
}
|
|
202
|
-
this.logger.debug(`Marking proving job id=${id} type=${ProvingRequestType[item.type]} totalAttempts=${retries + 1} as failed`);
|
|
203
|
-
await this.database.setProvingJobError(id, err);
|
|
204
|
-
const result = { status: 'rejected', reason: String(err) };
|
|
205
|
-
this.resultsCache.set(id, result);
|
|
206
|
-
this.promises.get(id).resolve(result);
|
|
207
|
-
this.instrumentation.incRejectedJobs(item.type);
|
|
208
|
-
if (info) {
|
|
209
|
-
const duration = this.timeSource() - info.startedAt;
|
|
210
|
-
this.instrumentation.recordJobDuration(item.type, duration * 1000);
|
|
211
|
-
}
|
|
212
|
-
}
|
|
213
|
-
reportProvingJobProgress(id, startedAt, filter) {
|
|
214
|
-
const job = this.jobsCache.get(id);
|
|
215
|
-
if (!job) {
|
|
216
|
-
this.logger.warn(`Proving job id=${id} does not exist`);
|
|
217
|
-
return filter ? this.getProvingJob(filter) : Promise.resolve(undefined);
|
|
218
|
-
}
|
|
219
|
-
const metadata = this.inProgress.get(id);
|
|
220
|
-
const now = this.timeSource();
|
|
221
|
-
if (!metadata) {
|
|
222
|
-
this.logger.warn(`Proving job id=${id} type=${ProvingRequestType[job.type]} not found in the in-progress cache, adding it`);
|
|
223
|
-
// the queue will still contain the item at this point!
|
|
224
|
-
// we need to be careful when popping off the queue to make sure we're not sending
|
|
225
|
-
// a job that's already in progress
|
|
226
|
-
this.inProgress.set(id, {
|
|
227
|
-
id,
|
|
228
|
-
startedAt,
|
|
229
|
-
lastUpdatedAt: this.timeSource(),
|
|
230
|
-
});
|
|
231
|
-
return Promise.resolve(undefined);
|
|
232
|
-
}
|
|
233
|
-
else if (startedAt <= metadata.startedAt) {
|
|
234
|
-
if (startedAt < metadata.startedAt) {
|
|
235
|
-
this.logger.debug(`Proving job id=${id} type=${ProvingRequestType[job.type]} startedAt=${startedAt} older agent has taken job`);
|
|
407
|
+
enqueueJobInternal(job) {
|
|
408
|
+
if (!this.promises.has(job.id)) {
|
|
409
|
+
this.promises.set(job.id, promiseWithResolvers());
|
|
410
|
+
}
|
|
411
|
+
this.queues[job.type].put({
|
|
412
|
+
epochNumber: job.epochNumber,
|
|
413
|
+
id: job.id,
|
|
414
|
+
});
|
|
415
|
+
this.enqueuedAt.set(job.id, new Timer());
|
|
416
|
+
this.epochHeight = Math.max(this.epochHeight, job.epochNumber);
|
|
236
417
|
}
|
|
237
|
-
|
|
238
|
-
|
|
418
|
+
isJobStale(job) {
|
|
419
|
+
return job.epochNumber < this.epochHeight - this.maxEpochsToKeepResultsFor;
|
|
239
420
|
}
|
|
240
|
-
|
|
241
|
-
|
|
242
|
-
|
|
243
|
-
|
|
244
|
-
|
|
245
|
-
|
|
246
|
-
|
|
247
|
-
|
|
248
|
-
|
|
249
|
-
|
|
250
|
-
}
|
|
251
|
-
}
|
|
252
|
-
async reportProvingJobSuccess(id, value) {
|
|
253
|
-
const info = this.inProgress.get(id);
|
|
254
|
-
const item = this.jobsCache.get(id);
|
|
255
|
-
const retries = this.retries.get(id) ?? 0;
|
|
256
|
-
if (!item) {
|
|
257
|
-
this.logger.warn(`Proving job id=${id} not found`);
|
|
258
|
-
return;
|
|
259
|
-
}
|
|
260
|
-
if (!info) {
|
|
261
|
-
this.logger.warn(`Proving job id=${id} type=${ProvingRequestType[item.type]} not in the in-progress set`);
|
|
262
|
-
}
|
|
263
|
-
else {
|
|
264
|
-
this.inProgress.delete(id);
|
|
265
|
-
}
|
|
266
|
-
this.logger.debug(`Proving job complete id=${id} type=${ProvingRequestType[item.type]} totalAttempts=${retries + 1}`);
|
|
267
|
-
await this.database.setProvingJobResult(id, value);
|
|
268
|
-
const result = { status: 'fulfilled', value };
|
|
269
|
-
this.resultsCache.set(id, result);
|
|
270
|
-
this.promises.get(id).resolve(result);
|
|
271
|
-
this.instrumentation.incResolvedJobs(item.type);
|
|
272
|
-
}
|
|
273
|
-
enqueueJobInternal(job) {
|
|
274
|
-
if (!this.promises.has(job.id)) {
|
|
275
|
-
this.promises.set(job.id, promiseWithResolvers());
|
|
276
|
-
}
|
|
277
|
-
this.queues[job.type].put(job);
|
|
278
|
-
this.enqueuedAt.set(job.id, new Timer());
|
|
279
|
-
this.logger.debug(`Enqueued new proving job id=${job.id}`);
|
|
280
|
-
}
|
|
281
|
-
}
|
|
421
|
+
},
|
|
422
|
+
(() => {
|
|
423
|
+
const _metadata = typeof Symbol === "function" && Symbol.metadata ? Object.create(null) : void 0;
|
|
424
|
+
_cleanupPass_decorators = [trackSpan('ProvingBroker.cleanupPass')];
|
|
425
|
+
__esDecorate(_a, null, _cleanupPass_decorators, { kind: "method", name: "cleanupPass", static: false, private: false, access: { has: obj => "cleanupPass" in obj, get: obj => obj.cleanupPass }, metadata: _metadata }, null, _instanceExtraInitializers);
|
|
426
|
+
if (_metadata) Object.defineProperty(_a, Symbol.metadata, { enumerable: true, configurable: true, writable: true, value: _metadata });
|
|
427
|
+
})(),
|
|
428
|
+
_a;
|
|
429
|
+
})();
|
|
430
|
+
export { ProvingBroker };
|
|
282
431
|
/**
|
|
283
432
|
* Compares two proving jobs and selects which one's more important
|
|
284
433
|
* @param a - A proving job
|
|
@@ -286,12 +435,10 @@ export class ProvingBroker {
|
|
|
286
435
|
* @returns A number indicating the relative priority of the two proving jobs
|
|
287
436
|
*/
|
|
288
437
|
function provingJobComparator(a, b) {
|
|
289
|
-
|
|
290
|
-
const bBlockNumber = b.blockNumber ?? 0;
|
|
291
|
-
if (aBlockNumber < bBlockNumber) {
|
|
438
|
+
if (a.epochNumber < b.epochNumber) {
|
|
292
439
|
return -1;
|
|
293
440
|
}
|
|
294
|
-
else if (
|
|
441
|
+
else if (a.epochNumber > b.epochNumber) {
|
|
295
442
|
return 1;
|
|
296
443
|
}
|
|
297
444
|
else {
|
|
@@ -349,4 +496,4 @@ const PROOF_TYPES_IN_PRIORITY_ORDER = [
|
|
|
349
496
|
ProvingRequestType.EMPTY_BLOCK_ROOT_ROLLUP,
|
|
350
497
|
ProvingRequestType.PRIVATE_KERNEL_EMPTY,
|
|
351
498
|
];
|
|
352
|
-
//# sourceMappingURL=data:application/json;base64,
|
|
499
|
+
//# sourceMappingURL=data:application/json;base64,
|