@powersync/service-module-mongodb 0.15.4 → 0.17.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (64) hide show
  1. package/CHANGELOG.md +67 -0
  2. package/dist/api/MongoRouteAPIAdapter.js +12 -21
  3. package/dist/api/MongoRouteAPIAdapter.js.map +1 -1
  4. package/dist/replication/ChangeStream.d.ts +23 -42
  5. package/dist/replication/ChangeStream.js +363 -600
  6. package/dist/replication/ChangeStream.js.map +1 -1
  7. package/dist/replication/ChangeStreamReplicationJob.js +2 -2
  8. package/dist/replication/ChangeStreamReplicationJob.js.map +1 -1
  9. package/dist/replication/JsonBufferWriter.d.ts +80 -0
  10. package/dist/replication/JsonBufferWriter.js +342 -0
  11. package/dist/replication/JsonBufferWriter.js.map +1 -0
  12. package/dist/replication/MongoRelation.d.ts +1 -1
  13. package/dist/replication/MongoRelation.js +45 -21
  14. package/dist/replication/MongoRelation.js.map +1 -1
  15. package/dist/replication/MongoSnapshotQuery.d.ts +1 -1
  16. package/dist/replication/MongoSnapshotQuery.js +6 -3
  17. package/dist/replication/MongoSnapshotQuery.js.map +1 -1
  18. package/dist/replication/MongoSnapshotter.d.ts +81 -0
  19. package/dist/replication/MongoSnapshotter.js +594 -0
  20. package/dist/replication/MongoSnapshotter.js.map +1 -0
  21. package/dist/replication/RawChangeStream.d.ts +55 -0
  22. package/dist/replication/RawChangeStream.js +322 -0
  23. package/dist/replication/RawChangeStream.js.map +1 -0
  24. package/dist/replication/SourceRowConverter.d.ts +46 -0
  25. package/dist/replication/SourceRowConverter.js +42 -0
  26. package/dist/replication/SourceRowConverter.js.map +1 -0
  27. package/dist/replication/bufferToSqlite.d.ts +43 -0
  28. package/dist/replication/bufferToSqlite.js +740 -0
  29. package/dist/replication/bufferToSqlite.js.map +1 -0
  30. package/dist/replication/internal-mongodb-utils.d.ts +0 -12
  31. package/dist/replication/internal-mongodb-utils.js +0 -54
  32. package/dist/replication/internal-mongodb-utils.js.map +1 -1
  33. package/dist/replication/replication-index.d.ts +2 -0
  34. package/dist/replication/replication-index.js +2 -0
  35. package/dist/replication/replication-index.js.map +1 -1
  36. package/package.json +11 -11
  37. package/scripts/benchmark-change-document-json.mts +358 -0
  38. package/scripts/benchmark-change-document.mts +370 -0
  39. package/src/api/MongoRouteAPIAdapter.ts +13 -21
  40. package/src/replication/ChangeStream.ts +421 -720
  41. package/src/replication/ChangeStreamReplicationJob.ts +2 -2
  42. package/src/replication/JsonBufferWriter.ts +390 -0
  43. package/src/replication/MongoRelation.ts +54 -25
  44. package/src/replication/MongoSnapshotQuery.ts +8 -5
  45. package/src/replication/MongoSnapshotter.ts +729 -0
  46. package/src/replication/RawChangeStream.ts +460 -0
  47. package/src/replication/SourceRowConverter.ts +65 -0
  48. package/src/replication/bufferToSqlite.ts +944 -0
  49. package/src/replication/internal-mongodb-utils.ts +0 -65
  50. package/src/replication/replication-index.ts +2 -0
  51. package/test/src/buffer_to_sqlite.test.ts +1146 -0
  52. package/test/src/change_stream.test.ts +259 -19
  53. package/test/src/change_stream_utils.ts +28 -27
  54. package/test/src/checkpoint_retry.test.ts +131 -0
  55. package/test/src/mongo_test.test.ts +66 -64
  56. package/test/src/parse_document_id.test.ts +54 -0
  57. package/test/src/raw_change_stream.test.ts +547 -0
  58. package/test/src/resume.test.ts +12 -2
  59. package/test/src/resuming_snapshots.test.ts +10 -6
  60. package/test/src/util.ts +56 -3
  61. package/test/tsconfig.json +0 -1
  62. package/tsconfig.scripts.json +13 -0
  63. package/tsconfig.tsbuildinfo +1 -1
  64. package/test/src/internal_mongodb_utils.test.ts +0 -103
@@ -0,0 +1,370 @@
1
+ import * as bson from 'bson';
2
+ import { performance } from 'node:perf_hooks';
3
+ import { parseChangeDocument } from '../dist/index.js';
4
+
5
+ // This is a synthetic benchmark to test performance of parseChangeDocument
6
+ // versus the normal bson.deserialize().
7
+ // Primarily AI-generated.
8
+
9
+ const BSON_OPTIONS = { useBigInt64: true } as const;
10
+ const OPERATION_TYPES = ['insert', 'update'] as const;
11
+ const SIZE_TARGETS = [
12
+ { label: '1 KB', bytes: 1_024 },
13
+ { label: '10 KB', bytes: 10_240 },
14
+ { label: '100 KB', bytes: 102_400 }
15
+ ] as const;
16
+
17
+ type OperationType = (typeof OPERATION_TYPES)[number];
18
+
19
+ type FullDocument = {
20
+ _id: bson.ObjectId;
21
+ checksum: number;
22
+ operationType: OperationType;
23
+ tenantId: string;
24
+ version: number;
25
+ createdAt: Date;
26
+ updatedAt: Date;
27
+ flags: {
28
+ active: boolean;
29
+ archived: boolean;
30
+ source: string;
31
+ };
32
+ metrics: {
33
+ itemCount: number;
34
+ ratio: number;
35
+ };
36
+ tags: string[];
37
+ nested: {
38
+ owner: {
39
+ id: string;
40
+ region: string;
41
+ };
42
+ counters: number[];
43
+ changedFields: string[];
44
+ };
45
+ payload: string;
46
+ };
47
+
48
+ type UpdateDescription = {
49
+ updatedFields: {
50
+ payload: string;
51
+ metrics: FullDocument['metrics'];
52
+ updatedAt: Date;
53
+ version: number;
54
+ };
55
+ removedFields: string[];
56
+ truncatedArrays: never[];
57
+ };
58
+
59
+ type ChangeDocument = {
60
+ _id: {
61
+ _data: string;
62
+ };
63
+ operationType: OperationType;
64
+ wallTime: Date;
65
+ ns: {
66
+ db: string;
67
+ coll: string;
68
+ };
69
+ lsid: {
70
+ id: bson.Binary;
71
+ };
72
+ txnNumber: bson.Long;
73
+ documentKey: {
74
+ _id: bson.ObjectId;
75
+ };
76
+ fullDocument: FullDocument;
77
+ updateDescription?: UpdateDescription;
78
+ };
79
+
80
+ type Benchmark = {
81
+ label: string;
82
+ run: (buffer: Buffer) => number;
83
+ };
84
+
85
+ type Scenario = {
86
+ label: string;
87
+ operationType: OperationType;
88
+ targetBytes: number;
89
+ fullDocumentBytes: number;
90
+ eventBytes: number;
91
+ buffer: Buffer;
92
+ };
93
+
94
+ type BenchmarkResult = {
95
+ elapsedMs: number;
96
+ opsPerSecond: number;
97
+ mibPerSecond: number;
98
+ };
99
+
100
+ const BENCHMARKS: readonly Benchmark[] = [
101
+ {
102
+ label: 'parseChangeDocument',
103
+ run: (buffer: Buffer) => {
104
+ const change = parseChangeDocument(buffer);
105
+ if (!('fullDocument' in change)) {
106
+ throw new Error('Unsupported change type: ' + change.operationType);
107
+ }
108
+ return change.fullDocument?.byteLength ?? 0;
109
+ }
110
+ },
111
+ {
112
+ label: 'parseChangeDocument + fullDocument',
113
+ run: (buffer: Buffer) => {
114
+ const change = parseChangeDocument(buffer);
115
+ if (!('fullDocument' in change)) {
116
+ throw new Error('Unsupported change type: ' + change.operationType);
117
+ }
118
+ if (change.fullDocument == null) {
119
+ throw new Error('Expected fullDocument to be present');
120
+ }
121
+ const fullDocument = bson.deserialize(change.fullDocument, BSON_OPTIONS) as { checksum?: number };
122
+ return Number(fullDocument.checksum ?? 0);
123
+ }
124
+ },
125
+ {
126
+ label: 'bson.deserialize',
127
+ run: (buffer: Buffer) => {
128
+ const change = bson.deserialize(buffer, BSON_OPTIONS) as { fullDocument?: { checksum?: number } };
129
+ return Number(change.fullDocument?.checksum ?? 0);
130
+ }
131
+ }
132
+ ] as const;
133
+
134
+ function createFullDocument(operationType: OperationType, targetBytes: number): FullDocument {
135
+ const seed = targetBytes + (operationType === 'insert' ? 11 : 29);
136
+ const baseDocument: FullDocument = {
137
+ _id: new bson.ObjectId(),
138
+ checksum: seed,
139
+ operationType,
140
+ tenantId: 'tenant-benchmark',
141
+ version: operationType === 'insert' ? 1 : 2,
142
+ createdAt: new Date('2026-01-01T00:00:00.000Z'),
143
+ updatedAt: new Date('2026-01-02T03:04:05.000Z'),
144
+ flags: {
145
+ active: true,
146
+ archived: false,
147
+ source: 'benchmark'
148
+ },
149
+ metrics: {
150
+ itemCount: seed,
151
+ ratio: Number((targetBytes / 1024).toFixed(3))
152
+ },
153
+ tags: ['alpha', 'beta', 'gamma', operationType],
154
+ nested: {
155
+ owner: {
156
+ id: `owner-${seed}`,
157
+ region: 'af-south-1'
158
+ },
159
+ counters: [1, 2, 3, 5, 8, 13],
160
+ changedFields: operationType === 'update' ? ['payload', 'metrics.itemCount', 'updatedAt'] : []
161
+ },
162
+ payload: ''
163
+ };
164
+
165
+ const payloadLength = findPayloadLength(baseDocument, targetBytes);
166
+ const payload = repeatCharacter('x', payloadLength);
167
+ return {
168
+ ...baseDocument,
169
+ payload
170
+ };
171
+ }
172
+
173
+ function createChangeDocument(fullDocument: FullDocument, operationType: OperationType): ChangeDocument {
174
+ const updateDescription: UpdateDescription | undefined =
175
+ operationType === 'update'
176
+ ? {
177
+ updatedFields: {
178
+ payload: fullDocument.payload,
179
+ metrics: fullDocument.metrics,
180
+ updatedAt: fullDocument.updatedAt,
181
+ version: fullDocument.version
182
+ },
183
+ removedFields: ['legacyField'],
184
+ truncatedArrays: []
185
+ }
186
+ : undefined;
187
+
188
+ return {
189
+ _id: {
190
+ _data: `${operationType}-${fullDocument.checksum}-${new bson.ObjectId().toHexString()}`
191
+ },
192
+ operationType,
193
+ wallTime: new Date('2026-01-03T09:10:11.000Z'),
194
+ ns: {
195
+ db: 'benchmark_db',
196
+ coll: 'benchmark_coll'
197
+ },
198
+ lsid: {
199
+ id: new bson.Binary(Buffer.alloc(16, operationType === 'insert' ? 0x11 : 0x22))
200
+ },
201
+ txnNumber: seedLong(fullDocument.checksum),
202
+ documentKey: {
203
+ _id: fullDocument._id
204
+ },
205
+ ...(updateDescription == null ? {} : { updateDescription }),
206
+ fullDocument
207
+ };
208
+ }
209
+
210
+ function seedLong(value: number): bson.Long {
211
+ return bson.Long.fromNumber(value);
212
+ }
213
+
214
+ function findPayloadLength(baseDocument: FullDocument, targetBytes: number): number {
215
+ const baseSize = bson.calculateObjectSize(baseDocument);
216
+ if (baseSize >= targetBytes) {
217
+ return 0;
218
+ }
219
+
220
+ let low = 0;
221
+ let high = Math.max(16, targetBytes - baseSize);
222
+ while (calculateSizedDocumentBytes(baseDocument, high) < targetBytes) {
223
+ high *= 2;
224
+ }
225
+
226
+ while (low < high) {
227
+ const mid = Math.floor((low + high) / 2);
228
+ if (calculateSizedDocumentBytes(baseDocument, mid) < targetBytes) {
229
+ low = mid + 1;
230
+ } else {
231
+ high = mid;
232
+ }
233
+ }
234
+
235
+ return low;
236
+ }
237
+
238
+ function calculateSizedDocumentBytes(baseDocument: FullDocument, payloadLength: number): number {
239
+ return bson.calculateObjectSize({
240
+ ...baseDocument,
241
+ payload: repeatCharacter('x', payloadLength)
242
+ });
243
+ }
244
+
245
+ function repeatCharacter(character: string, count: number): string {
246
+ return character.repeat(Math.max(0, count));
247
+ }
248
+
249
+ function chooseIterations(eventBytes: number): number {
250
+ const targetBytes = 256 * 1024 * 1024;
251
+ return clamp(Math.floor(targetBytes / eventBytes), 200, 50_000);
252
+ }
253
+
254
+ function clamp(value: number, min: number, max: number): number {
255
+ return Math.max(min, Math.min(max, value));
256
+ }
257
+
258
+ function median(values: number[]): number {
259
+ const sorted = [...values].sort((a, b) => a - b);
260
+ const middle = Math.floor(sorted.length / 2);
261
+ return sorted.length % 2 === 0 ? (sorted[middle - 1] + sorted[middle]) / 2 : sorted[middle];
262
+ }
263
+
264
+ function buildScenario(operationType: OperationType, sizeLabel: string, targetBytes: number): Scenario {
265
+ const fullDocument = createFullDocument(operationType, targetBytes);
266
+ const changeDocument = createChangeDocument(fullDocument, operationType);
267
+ const buffer = Buffer.from(bson.serialize(changeDocument));
268
+ return {
269
+ label: `${operationType} ${sizeLabel}`,
270
+ operationType,
271
+ targetBytes,
272
+ fullDocumentBytes: bson.calculateObjectSize(fullDocument),
273
+ eventBytes: buffer.byteLength,
274
+ buffer
275
+ };
276
+ }
277
+
278
+ function runBenchmark(
279
+ label: string,
280
+ fn: (buffer: Buffer) => number,
281
+ buffer: Buffer,
282
+ iterations: number
283
+ ): BenchmarkResult {
284
+ const warmupIterations = Math.min(2_000, Math.max(50, Math.floor(iterations / 10)));
285
+ let sink = 0;
286
+ for (let i = 0; i < warmupIterations; i += 1) {
287
+ sink += fn(buffer);
288
+ }
289
+
290
+ const samples: number[] = [];
291
+ for (let round = 0; round < 5; round += 1) {
292
+ const start = performance.now();
293
+ for (let i = 0; i < iterations; i += 1) {
294
+ sink += fn(buffer);
295
+ }
296
+ samples.push(performance.now() - start);
297
+ }
298
+
299
+ if (sink === Number.MIN_SAFE_INTEGER) {
300
+ console.error(label);
301
+ }
302
+
303
+ const elapsedMs = median(samples);
304
+ const opsPerSecond = (iterations * 1000) / elapsedMs;
305
+ const mibPerSecond = (buffer.byteLength * iterations) / (1024 * 1024) / (elapsedMs / 1000);
306
+ return {
307
+ elapsedMs,
308
+ opsPerSecond,
309
+ mibPerSecond
310
+ };
311
+ }
312
+
313
+ function printHeader() {
314
+ console.log('Comparing parseChangeDocument against plain bson.deserialize');
315
+ console.log('The key comparison is "parseChangeDocument + fullDocument" vs "bson.deserialize".');
316
+ console.log('');
317
+ }
318
+
319
+ function printRow(values: string[]): void {
320
+ const widths = [16, 12, 12, 34, 16, 16];
321
+ const line = values
322
+ .map((value, index) => value.padEnd(widths[index] ?? value.length))
323
+ .join(' ')
324
+ .trimEnd();
325
+ console.log(line);
326
+ }
327
+
328
+ printHeader();
329
+ printRow(['Scenario', 'Full doc', 'Event', 'Benchmark', 'Ops/s', 'MiB/s']);
330
+ printRow(['--------', '--------', '-----', '---------', '-----', '-----']);
331
+
332
+ for (const operationType of OPERATION_TYPES) {
333
+ for (const size of SIZE_TARGETS) {
334
+ const scenario = buildScenario(operationType, size.label, size.bytes);
335
+ const iterations = chooseIterations(scenario.eventBytes);
336
+ const results = BENCHMARKS.map((benchmark) => ({
337
+ label: benchmark.label,
338
+ ...runBenchmark(benchmark.label, benchmark.run, scenario.buffer, iterations)
339
+ }));
340
+
341
+ let isFirstRow = true;
342
+ for (const result of results) {
343
+ printRow([
344
+ isFirstRow ? scenario.label : '',
345
+ isFirstRow ? formatBytes(scenario.fullDocumentBytes) : '',
346
+ isFirstRow ? formatBytes(scenario.eventBytes) : '',
347
+ result.label,
348
+ formatNumber(result.opsPerSecond),
349
+ formatNumber(result.mibPerSecond)
350
+ ]);
351
+ isFirstRow = false;
352
+ }
353
+ }
354
+ }
355
+
356
+ function formatNumber(value: number): string {
357
+ return new Intl.NumberFormat('en-US', {
358
+ maximumFractionDigits: value >= 100 ? 0 : 1
359
+ }).format(value);
360
+ }
361
+
362
+ function formatBytes(bytes: number): string {
363
+ if (bytes < 1024) {
364
+ return `${bytes} B`;
365
+ }
366
+ if (bytes < 1024 * 1024) {
367
+ return `${(bytes / 1024).toFixed(bytes >= 10 * 1024 ? 0 : 1)} KB`;
368
+ }
369
+ return `${(bytes / (1024 * 1024)).toFixed(1)} MB`;
370
+ }
@@ -1,6 +1,6 @@
1
1
  import * as lib_mongo from '@powersync/lib-service-mongodb';
2
2
  import { mongo } from '@powersync/lib-service-mongodb';
3
- import { api, ParseSyncRulesOptions, ReplicationHeadCallback, SourceTable } from '@powersync/service-core';
3
+ import { api, ParseSyncRulesOptions, ReplicationHeadCallback } from '@powersync/service-core';
4
4
  import * as sync_rules from '@powersync/service-sync-rules';
5
5
  import * as service_types from '@powersync/service-types';
6
6
 
@@ -137,23 +137,19 @@ export class MongoRouteAPIAdapter implements api.RouteAPI {
137
137
  if (tablePattern.isWildcard) {
138
138
  patternResult.tables = [];
139
139
  for (let collection of collections) {
140
- const sourceTable = new SourceTable({
141
- id: '', // not used
140
+ const ref: sync_rules.SourceTableRef = {
142
141
  connectionTag: this.connectionTag,
143
- objectId: collection.name,
144
- schema: schema,
145
- name: collection.name,
146
- replicaIdColumns: [],
147
- snapshotComplete: true
148
- });
142
+ schema,
143
+ name: collection.name
144
+ };
149
145
  let errors: service_types.ReplicationError[] = [];
150
146
  if (collection.type == 'view') {
151
147
  errors.push({ level: 'warning', message: `Collection ${schema}.${tablePattern.name} is a view` });
152
148
  } else {
153
149
  errors.push(...validatePostImages(schema, collection));
154
150
  }
155
- const syncData = sqlSyncRules.tableSyncsData(sourceTable);
156
- const syncParameters = sqlSyncRules.tableSyncsParameters(sourceTable);
151
+ const syncData = sqlSyncRules.tableSyncsData(ref);
152
+ const syncParameters = sqlSyncRules.tableSyncsParameters(ref);
157
153
  patternResult.tables.push({
158
154
  schema,
159
155
  name: collection.name,
@@ -164,18 +160,14 @@ export class MongoRouteAPIAdapter implements api.RouteAPI {
164
160
  });
165
161
  }
166
162
  } else {
167
- const sourceTable = new SourceTable({
168
- id: '', // not used
163
+ const ref: sync_rules.SourceTableRef = {
169
164
  connectionTag: this.connectionTag,
170
- objectId: tablePattern.name,
171
- schema: schema,
172
- name: tablePattern.name,
173
- replicaIdColumns: [],
174
- snapshotComplete: true
175
- });
165
+ schema,
166
+ name: tablePattern.name
167
+ };
176
168
 
177
- const syncData = sqlSyncRules.tableSyncsData(sourceTable);
178
- const syncParameters = sqlSyncRules.tableSyncsParameters(sourceTable);
169
+ const syncData = sqlSyncRules.tableSyncsData(ref);
170
+ const syncParameters = sqlSyncRules.tableSyncsParameters(ref);
179
171
  const collection = collections[0];
180
172
 
181
173
  let errors: service_types.ReplicationError[] = [];