@aztec/prover-client 0.66.0 → 0.67.1-devnet

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (83)
  1. package/dest/block_builder/light.d.ts +4 -3
  2. package/dest/block_builder/light.d.ts.map +1 -1
  3. package/dest/block_builder/light.js +30 -20
  4. package/dest/index.d.ts +0 -1
  5. package/dest/index.d.ts.map +1 -1
  6. package/dest/index.js +1 -2
  7. package/dest/mocks/fixtures.d.ts +3 -3
  8. package/dest/mocks/fixtures.d.ts.map +1 -1
  9. package/dest/mocks/fixtures.js +2 -2
  10. package/dest/mocks/test_context.d.ts +10 -9
  11. package/dest/mocks/test_context.d.ts.map +1 -1
  12. package/dest/mocks/test_context.js +24 -13
  13. package/dest/orchestrator/block-building-helpers.d.ts +10 -6
  14. package/dest/orchestrator/block-building-helpers.d.ts.map +1 -1
  15. package/dest/orchestrator/block-building-helpers.js +27 -16
  16. package/dest/orchestrator/block-proving-state.d.ts +6 -5
  17. package/dest/orchestrator/block-proving-state.d.ts.map +1 -1
  18. package/dest/orchestrator/block-proving-state.js +16 -8
  19. package/dest/orchestrator/epoch-proving-state.d.ts +1 -1
  20. package/dest/orchestrator/epoch-proving-state.d.ts.map +1 -1
  21. package/dest/orchestrator/epoch-proving-state.js +3 -3
  22. package/dest/orchestrator/orchestrator.d.ts +11 -8
  23. package/dest/orchestrator/orchestrator.d.ts.map +1 -1
  24. package/dest/orchestrator/orchestrator.js +94 -58
  25. package/dest/orchestrator/orchestrator_metrics.d.ts.map +1 -1
  26. package/dest/orchestrator/orchestrator_metrics.js +2 -5
  27. package/dest/prover-agent/memory-proving-queue.d.ts +2 -1
  28. package/dest/prover-agent/memory-proving-queue.d.ts.map +1 -1
  29. package/dest/prover-agent/memory-proving-queue.js +241 -224
  30. package/dest/prover-agent/prover-agent.d.ts +11 -2
  31. package/dest/prover-agent/prover-agent.d.ts.map +1 -1
  32. package/dest/prover-agent/prover-agent.js +187 -160
  33. package/dest/prover-client/prover-client.d.ts +2 -3
  34. package/dest/prover-client/prover-client.d.ts.map +1 -1
  35. package/dest/prover-client/prover-client.js +6 -9
  36. package/dest/proving_broker/broker_prover_facade.d.ts +26 -0
  37. package/dest/proving_broker/broker_prover_facade.d.ts.map +1 -0
  38. package/dest/proving_broker/broker_prover_facade.js +107 -0
  39. package/dest/proving_broker/proving_agent.d.ts +4 -3
  40. package/dest/proving_broker/proving_agent.d.ts.map +1 -1
  41. package/dest/proving_broker/proving_agent.js +74 -65
  42. package/dest/proving_broker/proving_broker.d.ts +27 -7
  43. package/dest/proving_broker/proving_broker.d.ts.map +1 -1
  44. package/dest/proving_broker/proving_broker.js +405 -258
  45. package/dest/proving_broker/proving_broker_database/persisted.d.ts.map +1 -1
  46. package/dest/proving_broker/proving_broker_database/persisted.js +4 -8
  47. package/dest/proving_broker/proving_broker_instrumentation.d.ts.map +1 -1
  48. package/dest/proving_broker/proving_broker_instrumentation.js +2 -8
  49. package/dest/proving_broker/proving_job_controller.d.ts +2 -1
  50. package/dest/proving_broker/proving_job_controller.d.ts.map +1 -1
  51. package/dest/proving_broker/proving_job_controller.js +15 -14
  52. package/dest/proving_broker/rpc.js +2 -2
  53. package/dest/test/mock_prover.d.ts +6 -6
  54. package/dest/test/mock_prover.d.ts.map +1 -1
  55. package/dest/test/mock_prover.js +5 -5
  56. package/package.json +18 -13
  57. package/src/block_builder/light.ts +31 -22
  58. package/src/index.ts +0 -1
  59. package/src/mocks/fixtures.ts +4 -4
  60. package/src/mocks/test_context.ts +39 -24
  61. package/src/orchestrator/block-building-helpers.ts +33 -20
  62. package/src/orchestrator/block-proving-state.ts +17 -6
  63. package/src/orchestrator/epoch-proving-state.ts +0 -2
  64. package/src/orchestrator/orchestrator.ts +111 -62
  65. package/src/orchestrator/orchestrator_metrics.ts +1 -11
  66. package/src/prover-agent/memory-proving-queue.ts +12 -7
  67. package/src/prover-agent/prover-agent.ts +67 -48
  68. package/src/prover-client/prover-client.ts +5 -12
  69. package/src/proving_broker/{caching_broker_facade.ts → broker_prover_facade.ts} +62 -85
  70. package/src/proving_broker/proving_agent.ts +74 -78
  71. package/src/proving_broker/proving_broker.ts +240 -73
  72. package/src/proving_broker/proving_broker_database/persisted.ts +2 -8
  73. package/src/proving_broker/proving_broker_instrumentation.ts +0 -7
  74. package/src/proving_broker/proving_job_controller.ts +13 -12
  75. package/src/proving_broker/rpc.ts +1 -1
  76. package/src/test/mock_prover.ts +7 -3
  77. package/dest/proving_broker/caching_broker_facade.d.ts +0 -30
  78. package/dest/proving_broker/caching_broker_facade.d.ts.map +0 -1
  79. package/dest/proving_broker/caching_broker_facade.js +0 -150
  80. package/dest/proving_broker/prover_cache/memory.d.ts +0 -9
  81. package/dest/proving_broker/prover_cache/memory.d.ts.map +0 -1
  82. package/dest/proving_broker/prover_cache/memory.js +0 -16
  83. package/src/proving_broker/prover_cache/memory.ts +0 -20
@@ -1,284 +1,433 @@
1
+ import { __esDecorate, __runInitializers } from "tslib";
1
2
  import { ProvingRequestType, } from '@aztec/circuit-types';
2
- import { createDebugLogger } from '@aztec/foundation/log';
3
+ import { asyncPool } from '@aztec/foundation/async-pool';
4
+ import { createLogger } from '@aztec/foundation/log';
3
5
  import { RunningPromise, promiseWithResolvers } from '@aztec/foundation/promise';
4
6
  import { PriorityMemoryQueue } from '@aztec/foundation/queue';
5
7
  import { Timer } from '@aztec/foundation/timer';
8
+ import { trackSpan } from '@aztec/telemetry-client';
6
9
  import assert from 'assert';
7
10
  import { ProvingBrokerInstrumentation } from './proving_broker_instrumentation.js';
8
11
  /**
9
12
  * A broker that manages proof requests and distributes them to workers based on their priority.
10
13
  * It takes a backend that is responsible for storing and retrieving proof requests and results.
11
14
  */
12
- export class ProvingBroker {
13
- constructor(database, client, { jobTimeoutMs = 30000, timeoutIntervalMs = 10000, maxRetries = 3 } = {}, logger = createDebugLogger('aztec:prover-client:proving-broker')) {
14
- this.database = database;
15
- this.logger = logger;
16
- this.queues = {
17
- [ProvingRequestType.PUBLIC_VM]: new PriorityMemoryQueue(provingJobComparator),
18
- [ProvingRequestType.TUBE_PROOF]: new PriorityMemoryQueue(provingJobComparator),
19
- [ProvingRequestType.PRIVATE_KERNEL_EMPTY]: new PriorityMemoryQueue(provingJobComparator),
20
- [ProvingRequestType.PRIVATE_BASE_ROLLUP]: new PriorityMemoryQueue(provingJobComparator),
21
- [ProvingRequestType.PUBLIC_BASE_ROLLUP]: new PriorityMemoryQueue(provingJobComparator),
22
- [ProvingRequestType.MERGE_ROLLUP]: new PriorityMemoryQueue(provingJobComparator),
23
- [ProvingRequestType.ROOT_ROLLUP]: new PriorityMemoryQueue(provingJobComparator),
24
- [ProvingRequestType.BLOCK_MERGE_ROLLUP]: new PriorityMemoryQueue(provingJobComparator),
25
- [ProvingRequestType.BLOCK_ROOT_ROLLUP]: new PriorityMemoryQueue(provingJobComparator),
26
- [ProvingRequestType.EMPTY_BLOCK_ROOT_ROLLUP]: new PriorityMemoryQueue(provingJobComparator),
27
- [ProvingRequestType.BASE_PARITY]: new PriorityMemoryQueue(provingJobComparator),
28
- [ProvingRequestType.ROOT_PARITY]: new PriorityMemoryQueue(provingJobComparator),
29
- };
30
- // holds a copy of the database in memory in order to quickly fulfill requests
31
- // this is fine because this broker is the only one that can modify the database
32
- this.jobsCache = new Map();
33
- // as above, but for results
34
- this.resultsCache = new Map();
35
- // tracks when each job was enqueued
36
- this.enqueuedAt = new Map();
37
- // keeps track of which jobs are currently being processed
38
- // in the event of a crash this information is lost, but that's ok
39
- // the next time the broker starts it will recreate jobsCache and still
40
- // accept results from the workers
41
- this.inProgress = new Map();
42
- // keep track of which proving job has been retried
43
- this.retries = new Map();
44
- // a map of promises that will be resolved when a job is settled
45
- this.promises = new Map();
46
- this.timeSource = () => Math.floor(Date.now() / 1000);
47
- this.measureQueueDepth = (type) => {
48
- return this.queues[type].length();
49
- };
50
- this.countActiveJobs = (type) => {
51
- let count = 0;
52
- for (const { id } of this.inProgress.values()) {
53
- const job = this.jobsCache.get(id);
54
- if (job?.type === type) {
55
- count++;
15
+ let ProvingBroker = (() => {
16
+ var _a;
17
+ let _instanceExtraInitializers = [];
18
+ let _cleanupPass_decorators;
19
+ return _a = class ProvingBroker {
20
+ constructor(database, client, { jobTimeoutMs = 30000, timeoutIntervalMs = 10000, maxRetries = 3, maxEpochsToKeepResultsFor = 1, maxParallelCleanUps = 20, } = {}, logger = createLogger('prover-client:proving-broker')) {
21
+ this.database = (__runInitializers(this, _instanceExtraInitializers), database);
22
+ this.logger = logger;
23
+ this.queues = {
24
+ [ProvingRequestType.PUBLIC_VM]: new PriorityMemoryQueue(provingJobComparator),
25
+ [ProvingRequestType.TUBE_PROOF]: new PriorityMemoryQueue(provingJobComparator),
26
+ [ProvingRequestType.PRIVATE_KERNEL_EMPTY]: new PriorityMemoryQueue(provingJobComparator),
27
+ [ProvingRequestType.PRIVATE_BASE_ROLLUP]: new PriorityMemoryQueue(provingJobComparator),
28
+ [ProvingRequestType.PUBLIC_BASE_ROLLUP]: new PriorityMemoryQueue(provingJobComparator),
29
+ [ProvingRequestType.MERGE_ROLLUP]: new PriorityMemoryQueue(provingJobComparator),
30
+ [ProvingRequestType.ROOT_ROLLUP]: new PriorityMemoryQueue(provingJobComparator),
31
+ [ProvingRequestType.BLOCK_MERGE_ROLLUP]: new PriorityMemoryQueue(provingJobComparator),
32
+ [ProvingRequestType.BLOCK_ROOT_ROLLUP]: new PriorityMemoryQueue(provingJobComparator),
33
+ [ProvingRequestType.EMPTY_BLOCK_ROOT_ROLLUP]: new PriorityMemoryQueue(provingJobComparator),
34
+ [ProvingRequestType.BASE_PARITY]: new PriorityMemoryQueue(provingJobComparator),
35
+ [ProvingRequestType.ROOT_PARITY]: new PriorityMemoryQueue(provingJobComparator),
36
+ };
37
+ // holds a copy of the database in memory in order to quickly fulfill requests
38
+ // this is fine because this broker is the only one that can modify the database
39
+ this.jobsCache = new Map();
40
+ // as above, but for results
41
+ this.resultsCache = new Map();
42
+ // tracks when each job was enqueued
43
+ this.enqueuedAt = new Map();
44
+ // keeps track of which jobs are currently being processed
45
+ // in the event of a crash this information is lost, but that's ok
46
+ // the next time the broker starts it will recreate jobsCache and still
47
+ // accept results from the workers
48
+ this.inProgress = new Map();
49
+ // keep track of which proving job has been retried
50
+ this.retries = new Map();
51
+ // a map of promises that will be resolved when a job is settled
52
+ this.promises = new Map();
53
+ this.msTimeSource = () => Date.now();
54
+ /**
55
+ * The broker keeps track of the highest epoch it has seen.
56
+ * This information is used for garbage collection: once it reaches the next epoch, it can start pruning the database of old state.
57
+ * This clean up pass is only done against _settled_ jobs. This pass will not cancel jobs that are in-progress or in-queue.
58
+ * It is a client responsibility to cancel jobs if they are no longer necessary.
59
+ * Example:
60
+ * proving epoch 11 - the broker will wipe all settled jobs for epochs 9 and lower
61
+ * finished proving epoch 11 and got first job for epoch 12 -> the broker will wipe all settled jobs for epochs 10 and lower
62
+ * reorged back to end of epoch 10 -> epoch 11 is skipped and epoch 12 starts -> the broker will wipe all settled jobs for epochs 10 and lower
63
+ */
64
+ this.epochHeight = 0;
65
+ this.maxEpochsToKeepResultsFor = 1;
66
+ this.measureQueueDepth = (type) => {
67
+ return this.queues[type].length();
68
+ };
69
+ this.countActiveJobs = (type) => {
70
+ let count = 0;
71
+ for (const { id } of this.inProgress.values()) {
72
+ const job = this.jobsCache.get(id);
73
+ if (job?.type === type) {
74
+ count++;
75
+ }
76
+ }
77
+ return count;
78
+ };
79
+ this.tracer = client.getTracer('ProvingBroker');
80
+ this.instrumentation = new ProvingBrokerInstrumentation(client);
81
+ this.cleanupPromise = new RunningPromise(this.cleanupPass.bind(this), this.logger, timeoutIntervalMs);
82
+ this.jobTimeoutMs = jobTimeoutMs;
83
+ this.maxRetries = maxRetries;
84
+ this.maxEpochsToKeepResultsFor = maxEpochsToKeepResultsFor;
85
+ this.maxParallelCleanUps = maxParallelCleanUps;
86
+ }
87
+ start() {
88
+ for (const [item, result] of this.database.allProvingJobs()) {
89
+ this.logger.info(`Restoring proving job id=${item.id} settled=${!!result}`, {
90
+ provingJobId: item.id,
91
+ status: result ? result.status : 'pending',
92
+ });
93
+ this.jobsCache.set(item.id, item);
94
+ this.promises.set(item.id, promiseWithResolvers());
95
+ if (result) {
96
+ this.promises.get(item.id).resolve(result);
97
+ this.resultsCache.set(item.id, result);
98
+ }
99
+ else {
100
+ this.enqueueJobInternal(item);
101
+ }
56
102
  }
103
+ this.cleanupPromise.start();
104
+ this.instrumentation.monitorQueueDepth(this.measureQueueDepth);
105
+ this.instrumentation.monitorActiveJobs(this.countActiveJobs);
106
+ return Promise.resolve();
57
107
  }
58
- return count;
59
- };
60
- this.timeoutCheck = () => {
61
- const inProgressEntries = Array.from(this.inProgress.entries());
62
- for (const [id, metadata] of inProgressEntries) {
108
+ async stop() {
109
+ await this.cleanupPromise.stop();
110
+ }
111
+ async enqueueProvingJob(job) {
112
+ if (this.jobsCache.has(job.id)) {
113
+ const existing = this.jobsCache.get(job.id);
114
+ assert.deepStrictEqual(job, existing, 'Duplicate proving job ID');
115
+ this.logger.debug(`Duplicate proving job id=${job.id} epochNumber=${job.epochNumber}. Ignoring`, {
116
+ provingJobId: job.id,
117
+ });
118
+ return;
119
+ }
120
+ if (this.isJobStale(job)) {
121
+ this.logger.warn(`Tried enqueueing stale proving job id=${job.id} epochNumber=${job.epochNumber}`, {
122
+ provingJobId: job.id,
123
+ });
124
+ throw new Error(`Epoch too old: job epoch ${job.epochNumber}, current epoch: ${this.epochHeight}`);
125
+ }
126
+ this.logger.info(`New proving job id=${job.id} epochNumber=${job.epochNumber}`, { provingJobId: job.id });
127
+ try {
128
+ // do this first so it acts as a "lock". If this job is enqueued again while we're saving it the if at the top will catch it.
129
+ this.jobsCache.set(job.id, job);
130
+ await this.database.addProvingJob(job);
131
+ this.enqueueJobInternal(job);
132
+ }
133
+ catch (err) {
134
+ this.logger.error(`Failed to save proving job id=${job.id}: ${err}`, err, { provingJobId: job.id });
135
+ this.jobsCache.delete(job.id);
136
+ throw err;
137
+ }
138
+ }
139
+ waitForJobToSettle(id) {
140
+ const promiseWithResolvers = this.promises.get(id);
141
+ if (!promiseWithResolvers) {
142
+ this.logger.warn(`Job id=${id} not found`, { provingJobId: id });
143
+ return Promise.resolve({ status: 'rejected', reason: `Job ${id} not found` });
144
+ }
145
+ return promiseWithResolvers.promise;
146
+ }
147
+ async cancelProvingJob(id) {
148
+ if (!this.jobsCache.has(id)) {
149
+ this.logger.warn(`Can't cancel a job that doesn't exist id=${id}`, { provingJobId: id });
150
+ return;
151
+ }
152
+ // notify listeners of the cancellation
153
+ if (!this.resultsCache.has(id)) {
154
+ this.logger.info(`Cancelling job id=${id}`, { provingJobId: id });
155
+ await this.reportProvingJobError(id, 'Aborted', false);
156
+ }
157
+ }
158
+ async cleanUpProvingJobState(id) {
159
+ if (!this.jobsCache.has(id)) {
160
+ this.logger.warn(`Can't clean up a job that doesn't exist id=${id}`, { provingJobId: id });
161
+ return;
162
+ }
163
+ if (!this.resultsCache.has(id)) {
164
+ this.logger.warn(`Can't cleanup busy proving job: id=${id}`, { provingJobId: id });
165
+ return;
166
+ }
167
+ this.logger.debug(`Cleaning up state for job id=${id}`, { provingJobId: id });
168
+ await this.database.deleteProvingJobAndResult(id);
169
+ this.jobsCache.delete(id);
170
+ this.promises.delete(id);
171
+ this.resultsCache.delete(id);
172
+ this.inProgress.delete(id);
173
+ this.retries.delete(id);
174
+ }
175
+ getProvingJobStatus(id) {
176
+ const result = this.resultsCache.get(id);
177
+ if (result) {
178
+ return Promise.resolve(result);
179
+ }
180
+ else {
181
+ // no result yet, check if we know the item
182
+ const item = this.jobsCache.get(id);
183
+ if (!item) {
184
+ this.logger.warn(`Proving job id=${id} not found`, { provingJobId: id });
185
+ return Promise.resolve({ status: 'not-found' });
186
+ }
187
+ return Promise.resolve({ status: this.inProgress.has(id) ? 'in-progress' : 'in-queue' });
188
+ }
189
+ }
190
+ // eslint-disable-next-line require-await
191
+ async getProvingJob(filter = { allowList: [] }) {
192
+ const allowedProofs = Array.isArray(filter.allowList) && filter.allowList.length > 0
193
+ ? [...filter.allowList]
194
+ : Object.values(ProvingRequestType).filter((x) => typeof x === 'number');
195
+ allowedProofs.sort(proofTypeComparator);
196
+ for (const proofType of allowedProofs) {
197
+ const queue = this.queues[proofType];
198
+ let enqueuedJob;
199
+ // exhaust the queue and make sure we're not sending a job that's already in progress
200
+ // or has already been completed
201
+ // this can happen if the broker crashes and restarts
202
+ // it's possible agents will report progress or results for jobs that are in the queue (after the restart)
203
+ while ((enqueuedJob = queue.getImmediate())) {
204
+ const job = this.jobsCache.get(enqueuedJob.id);
205
+ if (job && !this.inProgress.has(enqueuedJob.id) && !this.resultsCache.has(enqueuedJob.id)) {
206
+ const time = this.msTimeSource();
207
+ this.inProgress.set(job.id, {
208
+ id: job.id,
209
+ startedAt: time,
210
+ lastUpdatedAt: time,
211
+ });
212
+ const enqueuedAt = this.enqueuedAt.get(job.id);
213
+ if (enqueuedAt) {
214
+ this.instrumentation.recordJobWait(job.type, enqueuedAt);
215
+ }
216
+ return { job, time };
217
+ }
218
+ }
219
+ }
220
+ return undefined;
221
+ }
222
+ async reportProvingJobError(id, err, retry = false) {
223
+ const info = this.inProgress.get(id);
63
224
  const item = this.jobsCache.get(id);
225
+ const retries = this.retries.get(id) ?? 0;
64
226
  if (!item) {
65
- this.logger.warn(`Proving job id=${id} not found. Removing it from the queue.`);
66
- this.inProgress.delete(id);
67
- continue;
227
+ this.logger.warn(`Can't set error on unknown proving job id=${id} err=${err}`, { provingJoId: id });
228
+ return;
229
+ }
230
+ if (!info) {
231
+ this.logger.warn(`Proving job id=${id} type=${ProvingRequestType[item.type]} not in the in-progress set`, {
232
+ provingJobId: id,
233
+ });
68
234
  }
69
- const msSinceLastUpdate = (this.timeSource() - metadata.lastUpdatedAt) * 1000;
70
- if (msSinceLastUpdate >= this.jobTimeoutMs) {
71
- this.logger.warn(`Proving job id=${id} timed out. Adding it back to the queue.`);
235
+ else {
72
236
  this.inProgress.delete(id);
237
+ }
238
+ if (this.resultsCache.has(id)) {
239
+ this.logger.warn(`Proving job id=${id} is already settled, ignoring err=${err}`, {
240
+ provingJobId: id,
241
+ });
242
+ return;
243
+ }
244
+ if (retry && retries + 1 < this.maxRetries && !this.isJobStale(item)) {
245
+ this.logger.info(`Retrying proving job id=${id} type=${ProvingRequestType[item.type]} retry=${retries + 1} err=${err}`, {
246
+ provingJobId: id,
247
+ });
248
+ this.retries.set(id, retries + 1);
73
249
  this.enqueueJobInternal(item);
74
- this.instrumentation.incTimedOutJobs(item.type);
250
+ this.instrumentation.incRetriedJobs(item.type);
251
+ return;
252
+ }
253
+ this.logger.info(`Marking proving job as failed id=${id} type=${ProvingRequestType[item.type]} totalAttempts=${retries + 1} err=${err}`, {
254
+ provingJobId: id,
255
+ });
256
+ // save the result to the cache and notify clients of the job status
257
+ // this should work even if our database breaks because the result is cached in memory
258
+ const result = { status: 'rejected', reason: String(err) };
259
+ this.resultsCache.set(id, result);
260
+ this.promises.get(id).resolve(result);
261
+ this.instrumentation.incRejectedJobs(item.type);
262
+ if (info) {
263
+ const duration = this.msTimeSource() - info.startedAt;
264
+ this.instrumentation.recordJobDuration(item.type, duration);
265
+ }
266
+ try {
267
+ await this.database.setProvingJobError(id, err);
268
+ }
269
+ catch (saveErr) {
270
+ this.logger.error(`Failed to save proving job error status id=${id} jobErr=${err}`, saveErr, {
271
+ provingJobId: id,
272
+ });
273
+ throw saveErr;
75
274
  }
76
275
  }
77
- };
78
- this.instrumentation = new ProvingBrokerInstrumentation(client);
79
- this.timeoutPromise = new RunningPromise(this.timeoutCheck, timeoutIntervalMs);
80
- this.jobTimeoutMs = jobTimeoutMs;
81
- this.maxRetries = maxRetries;
82
- }
83
- start() {
84
- for (const [item, result] of this.database.allProvingJobs()) {
85
- this.logger.info(`Restoring proving job id=${item.id} settled=${!!result}`);
86
- this.jobsCache.set(item.id, item);
87
- this.promises.set(item.id, promiseWithResolvers());
88
- if (result) {
89
- this.promises.get(item.id).resolve(result);
90
- this.resultsCache.set(item.id, result);
276
+ reportProvingJobProgress(id, startedAt, filter) {
277
+ const job = this.jobsCache.get(id);
278
+ if (!job) {
279
+ this.logger.warn(`Proving job id=${id} does not exist`, { provingJobId: id });
280
+ return filter ? this.getProvingJob(filter) : Promise.resolve(undefined);
281
+ }
282
+ if (this.resultsCache.has(id)) {
283
+ this.logger.warn(`Proving job id=${id} has already been completed`, { provingJobId: id });
284
+ return filter ? this.getProvingJob(filter) : Promise.resolve(undefined);
285
+ }
286
+ const metadata = this.inProgress.get(id);
287
+ const now = this.msTimeSource();
288
+ if (!metadata) {
289
+ this.logger.warn(`Proving job id=${id} type=${ProvingRequestType[job.type]} not found in the in-progress cache, adding it`, { provingJobId: id });
290
+ // the queue will still contain the item at this point!
291
+ // we need to be careful when popping off the queue to make sure we're not sending
292
+ // a job that's already in progress
293
+ this.inProgress.set(id, {
294
+ id,
295
+ startedAt,
296
+ lastUpdatedAt: this.msTimeSource(),
297
+ });
298
+ return Promise.resolve(undefined);
299
+ }
300
+ else if (startedAt <= metadata.startedAt) {
301
+ if (startedAt < metadata.startedAt) {
302
+ this.logger.info(`Proving job id=${id} type=${ProvingRequestType[job.type]} startedAt=${startedAt} older agent has taken job`, { provingJobId: id });
303
+ }
304
+ else {
305
+ this.logger.debug(`Proving job id=${id} type=${ProvingRequestType[job.type]} heartbeat`, { provingJobId: id });
306
+ }
307
+ metadata.startedAt = startedAt;
308
+ metadata.lastUpdatedAt = now;
309
+ return Promise.resolve(undefined);
310
+ }
311
+ else if (filter) {
312
+ this.logger.warn(`Proving job id=${id} type=${ProvingRequestType[job.type]} already being worked on by another agent. Sending new one`, { provingJobId: id });
313
+ return this.getProvingJob(filter);
314
+ }
315
+ else {
316
+ return Promise.resolve(undefined);
317
+ }
91
318
  }
92
- else {
93
- this.logger.debug(`Re-enqueuing proving job id=${item.id}`);
94
- this.enqueueJobInternal(item);
319
+ async reportProvingJobSuccess(id, value) {
320
+ const info = this.inProgress.get(id);
321
+ const item = this.jobsCache.get(id);
322
+ const retries = this.retries.get(id) ?? 0;
323
+ if (!item) {
324
+ this.logger.warn(`Proving job id=${id} not found`, { provingJobId: id });
325
+ return;
326
+ }
327
+ if (!info) {
328
+ this.logger.warn(`Proving job id=${id} type=${ProvingRequestType[item.type]} not in the in-progress set`, {
329
+ provingJobId: id,
330
+ });
331
+ }
332
+ else {
333
+ this.inProgress.delete(id);
334
+ }
335
+ if (this.resultsCache.has(id)) {
336
+ this.logger.warn(`Proving job id=${id} already settled, ignoring result`, { provingJobId: id });
337
+ return;
338
+ }
339
+ this.logger.info(`Proving job complete id=${id} type=${ProvingRequestType[item.type]} totalAttempts=${retries + 1}`, { provingJobId: id });
340
+ // save result to our local cache and notify clients
341
+ // if save to database fails, that's ok because we have the result in memory
342
+ // if the broker crashes and needs the result again, we're covered because we can just recompute it
343
+ const result = { status: 'fulfilled', value };
344
+ this.resultsCache.set(id, result);
345
+ this.promises.get(id).resolve(result);
346
+ this.instrumentation.incResolvedJobs(item.type);
347
+ if (info) {
348
+ const duration = this.msTimeSource() - info.startedAt;
349
+ this.instrumentation.recordJobDuration(item.type, duration);
350
+ }
351
+ try {
352
+ await this.database.setProvingJobResult(id, value);
353
+ }
354
+ catch (saveErr) {
355
+ this.logger.error(`Failed to save proving job result id=${id}`, saveErr, {
356
+ provingJobId: id,
357
+ });
358
+ throw saveErr;
359
+ }
95
360
  }
96
- }
97
- this.timeoutPromise.start();
98
- this.instrumentation.monitorQueueDepth(this.measureQueueDepth);
99
- this.instrumentation.monitorActiveJobs(this.countActiveJobs);
100
- return Promise.resolve();
101
- }
102
- stop() {
103
- return this.timeoutPromise.stop();
104
- }
105
- async enqueueProvingJob(job) {
106
- if (this.jobsCache.has(job.id)) {
107
- const existing = this.jobsCache.get(job.id);
108
- assert.deepStrictEqual(job, existing, 'Duplicate proving job ID');
109
- return;
110
- }
111
- await this.database.addProvingJob(job);
112
- this.jobsCache.set(job.id, job);
113
- this.enqueueJobInternal(job);
114
- }
115
- waitForJobToSettle(id) {
116
- const promiseWithResolvers = this.promises.get(id);
117
- if (!promiseWithResolvers) {
118
- return Promise.resolve({ status: 'rejected', reason: `Job ${id} not found` });
119
- }
120
- return promiseWithResolvers.promise;
121
- }
122
- async removeAndCancelProvingJob(id) {
123
- this.logger.info(`Cancelling job id=${id}`);
124
- await this.database.deleteProvingJobAndResult(id);
125
- // notify listeners of the cancellation
126
- if (!this.resultsCache.has(id)) {
127
- this.promises.get(id)?.resolve({ status: 'rejected', reason: 'Aborted' });
128
- }
129
- this.jobsCache.delete(id);
130
- this.promises.delete(id);
131
- this.resultsCache.delete(id);
132
- this.inProgress.delete(id);
133
- this.retries.delete(id);
134
- }
135
- getProvingJobStatus(id) {
136
- const result = this.resultsCache.get(id);
137
- if (result) {
138
- return Promise.resolve(result);
139
- }
140
- else {
141
- // no result yet, check if we know the item
142
- const item = this.jobsCache.get(id);
143
- if (!item) {
144
- this.logger.warn(`Proving job id=${id} not found`);
145
- return Promise.resolve({ status: 'not-found' });
361
+ async cleanupPass() {
362
+ await this.cleanupStaleJobs();
363
+ await this.reEnqueueExpiredJobs();
146
364
  }
147
- return Promise.resolve({ status: this.inProgress.has(id) ? 'in-progress' : 'in-queue' });
148
- }
149
- }
150
- // eslint-disable-next-line require-await
151
- async getProvingJob(filter = { allowList: [] }) {
152
- const allowedProofs = Array.isArray(filter.allowList) && filter.allowList.length > 0
153
- ? [...filter.allowList]
154
- : Object.values(ProvingRequestType).filter((x) => typeof x === 'number');
155
- allowedProofs.sort(proofTypeComparator);
156
- for (const proofType of allowedProofs) {
157
- const queue = this.queues[proofType];
158
- let job;
159
- // exhaust the queue and make sure we're not sending a job that's already in progress
160
- // or has already been completed
161
- // this can happen if the broker crashes and restarts
162
- // it's possible agents will report progress or results for jobs that are in the queue (after the restart)
163
- while ((job = queue.getImmediate())) {
164
- if (!this.inProgress.has(job.id) && !this.resultsCache.has(job.id)) {
165
- const time = this.timeSource();
166
- this.inProgress.set(job.id, {
167
- id: job.id,
168
- startedAt: time,
169
- lastUpdatedAt: time,
365
+ async cleanupStaleJobs() {
366
+ const jobIds = Array.from(this.jobsCache.keys());
367
+ const jobsToClean = [];
368
+ for (const id of jobIds) {
369
+ const job = this.jobsCache.get(id);
370
+ const isComplete = this.resultsCache.has(id);
371
+ if (isComplete && this.isJobStale(job)) {
372
+ jobsToClean.push(id);
373
+ }
374
+ }
375
+ if (jobsToClean.length > 0) {
376
+ this.logger.info(`Cleaning up jobs=${jobsToClean.length}`);
377
+ await asyncPool(this.maxParallelCleanUps, jobsToClean, async (jobId) => {
378
+ await this.cleanUpProvingJobState(jobId);
170
379
  });
171
- const enqueuedAt = this.enqueuedAt.get(job.id);
172
- if (enqueuedAt) {
173
- this.instrumentation.recordJobWait(job.type, enqueuedAt);
380
+ }
381
+ }
382
+ async reEnqueueExpiredJobs() {
383
+ const inProgressEntries = Array.from(this.inProgress.entries());
384
+ for (const [id, metadata] of inProgressEntries) {
385
+ const item = this.jobsCache.get(id);
386
+ if (!item) {
387
+ this.logger.warn(`Proving job id=${id} not found. Removing it from the queue.`, { provingJobId: id });
388
+ this.inProgress.delete(id);
389
+ continue;
390
+ }
391
+ const now = this.msTimeSource();
392
+ const msSinceLastUpdate = now - metadata.lastUpdatedAt;
393
+ if (msSinceLastUpdate >= this.jobTimeoutMs) {
394
+ if (this.isJobStale(item)) {
395
+ // the job has timed out and it's also old, just cancel and move on
396
+ await this.cancelProvingJob(item.id);
397
+ }
398
+ else {
399
+ this.logger.warn(`Proving job id=${id} timed out. Adding it back to the queue.`, { provingJobId: id });
400
+ this.inProgress.delete(id);
401
+ this.enqueueJobInternal(item);
402
+ this.instrumentation.incTimedOutJobs(item.type);
403
+ }
174
404
  }
175
- return { job, time };
176
405
  }
177
406
  }
178
- }
179
- return undefined;
180
- }
181
- async reportProvingJobError(id, err, retry = false) {
182
- const info = this.inProgress.get(id);
183
- const item = this.jobsCache.get(id);
184
- const retries = this.retries.get(id) ?? 0;
185
- if (!item) {
186
- this.logger.warn(`Proving job id=${id} not found`);
187
- return;
188
- }
189
- if (!info) {
190
- this.logger.warn(`Proving job id=${id} type=${ProvingRequestType[item.type]} not in the in-progress set`);
191
- }
192
- else {
193
- this.inProgress.delete(id);
194
- }
195
- if (retry && retries + 1 < this.maxRetries) {
196
- this.logger.info(`Retrying proving job id=${id} type=${ProvingRequestType[item.type]} retry=${retries + 1}`);
197
- this.retries.set(id, retries + 1);
198
- this.enqueueJobInternal(item);
199
- this.instrumentation.incRetriedJobs(item.type);
200
- return;
201
- }
202
- this.logger.debug(`Marking proving job id=${id} type=${ProvingRequestType[item.type]} totalAttempts=${retries + 1} as failed`);
203
- await this.database.setProvingJobError(id, err);
204
- const result = { status: 'rejected', reason: String(err) };
205
- this.resultsCache.set(id, result);
206
- this.promises.get(id).resolve(result);
207
- this.instrumentation.incRejectedJobs(item.type);
208
- if (info) {
209
- const duration = this.timeSource() - info.startedAt;
210
- this.instrumentation.recordJobDuration(item.type, duration * 1000);
211
- }
212
- }
213
- reportProvingJobProgress(id, startedAt, filter) {
214
- const job = this.jobsCache.get(id);
215
- if (!job) {
216
- this.logger.warn(`Proving job id=${id} does not exist`);
217
- return filter ? this.getProvingJob(filter) : Promise.resolve(undefined);
218
- }
219
- const metadata = this.inProgress.get(id);
220
- const now = this.timeSource();
221
- if (!metadata) {
222
- this.logger.warn(`Proving job id=${id} type=${ProvingRequestType[job.type]} not found in the in-progress cache, adding it`);
223
- // the queue will still contain the item at this point!
224
- // we need to be careful when popping off the queue to make sure we're not sending
225
- // a job that's already in progress
226
- this.inProgress.set(id, {
227
- id,
228
- startedAt,
229
- lastUpdatedAt: this.timeSource(),
230
- });
231
- return Promise.resolve(undefined);
232
- }
233
- else if (startedAt <= metadata.startedAt) {
234
- if (startedAt < metadata.startedAt) {
235
- this.logger.debug(`Proving job id=${id} type=${ProvingRequestType[job.type]} startedAt=${startedAt} older agent has taken job`);
407
+ enqueueJobInternal(job) {
408
+ if (!this.promises.has(job.id)) {
409
+ this.promises.set(job.id, promiseWithResolvers());
410
+ }
411
+ this.queues[job.type].put({
412
+ epochNumber: job.epochNumber,
413
+ id: job.id,
414
+ });
415
+ this.enqueuedAt.set(job.id, new Timer());
416
+ this.epochHeight = Math.max(this.epochHeight, job.epochNumber);
236
417
  }
237
- else {
238
- this.logger.debug(`Proving job id=${id} type=${ProvingRequestType[job.type]} heartbeat`);
418
+ isJobStale(job) {
419
+ return job.epochNumber < this.epochHeight - this.maxEpochsToKeepResultsFor;
239
420
  }
240
- metadata.startedAt = startedAt;
241
- metadata.lastUpdatedAt = now;
242
- return Promise.resolve(undefined);
243
- }
244
- else if (filter) {
245
- this.logger.warn(`Proving job id=${id} type=${ProvingRequestType[job.type]} already being worked on by another agent. Sending new one`);
246
- return this.getProvingJob(filter);
247
- }
248
- else {
249
- return Promise.resolve(undefined);
250
- }
251
- }
252
- async reportProvingJobSuccess(id, value) {
253
- const info = this.inProgress.get(id);
254
- const item = this.jobsCache.get(id);
255
- const retries = this.retries.get(id) ?? 0;
256
- if (!item) {
257
- this.logger.warn(`Proving job id=${id} not found`);
258
- return;
259
- }
260
- if (!info) {
261
- this.logger.warn(`Proving job id=${id} type=${ProvingRequestType[item.type]} not in the in-progress set`);
262
- }
263
- else {
264
- this.inProgress.delete(id);
265
- }
266
- this.logger.debug(`Proving job complete id=${id} type=${ProvingRequestType[item.type]} totalAttempts=${retries + 1}`);
267
- await this.database.setProvingJobResult(id, value);
268
- const result = { status: 'fulfilled', value };
269
- this.resultsCache.set(id, result);
270
- this.promises.get(id).resolve(result);
271
- this.instrumentation.incResolvedJobs(item.type);
272
- }
273
- enqueueJobInternal(job) {
274
- if (!this.promises.has(job.id)) {
275
- this.promises.set(job.id, promiseWithResolvers());
276
- }
277
- this.queues[job.type].put(job);
278
- this.enqueuedAt.set(job.id, new Timer());
279
- this.logger.debug(`Enqueued new proving job id=${job.id}`);
280
- }
281
- }
421
+ },
422
+ (() => {
423
+ const _metadata = typeof Symbol === "function" && Symbol.metadata ? Object.create(null) : void 0;
424
+ _cleanupPass_decorators = [trackSpan('ProvingBroker.cleanupPass')];
425
+ __esDecorate(_a, null, _cleanupPass_decorators, { kind: "method", name: "cleanupPass", static: false, private: false, access: { has: obj => "cleanupPass" in obj, get: obj => obj.cleanupPass }, metadata: _metadata }, null, _instanceExtraInitializers);
426
+ if (_metadata) Object.defineProperty(_a, Symbol.metadata, { enumerable: true, configurable: true, writable: true, value: _metadata });
427
+ })(),
428
+ _a;
429
+ })();
430
+ export { ProvingBroker };
282
431
  /**
283
432
  * Compares two proving jobs and selects which one's more important
284
433
  * @param a - A proving job
@@ -286,12 +435,10 @@ export class ProvingBroker {
286
435
  * @returns A number indicating the relative priority of the two proving jobs
287
436
  */
288
437
  function provingJobComparator(a, b) {
289
- const aBlockNumber = a.blockNumber ?? 0;
290
- const bBlockNumber = b.blockNumber ?? 0;
291
- if (aBlockNumber < bBlockNumber) {
438
+ if (a.epochNumber < b.epochNumber) {
292
439
  return -1;
293
440
  }
294
- else if (aBlockNumber > bBlockNumber) {
441
+ else if (a.epochNumber > b.epochNumber) {
295
442
  return 1;
296
443
  }
297
444
  else {
@@ -349,4 +496,4 @@ const PROOF_TYPES_IN_PRIORITY_ORDER = [
349
496
  ProvingRequestType.EMPTY_BLOCK_ROOT_ROLLUP,
350
497
  ProvingRequestType.PRIVATE_KERNEL_EMPTY,
351
498
  ];
352
- //# sourceMappingURL=data:application/json;base64,
499
+ //# sourceMappingURL=data:application/json;base64,