@rudderstack/integrations-lib 0.2.33 → 0.2.34
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/build/utils/batch-processing.bench.d.ts +2 -0
- package/build/utils/batch-processing.bench.d.ts.map +1 -0
- package/build/utils/batch-processing.bench.js +96 -0
- package/build/utils/batch-processing.d.ts +75 -83
- package/build/utils/batch-processing.d.ts.map +1 -1
- package/build/utils/batch-processing.js +240 -161
- package/package.json +1 -1
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"batch-processing.bench.d.ts","sourceRoot":"","sources":["../../src/utils/batch-processing.bench.ts"],"names":[],"mappings":""}
|
|
@@ -0,0 +1,96 @@
|
|
|
1
|
+
"use strict";
|
|
2
|
+
var __importDefault = (this && this.__importDefault) || function (mod) {
|
|
3
|
+
return (mod && mod.__esModule) ? mod : { "default": mod };
|
|
4
|
+
};
|
|
5
|
+
Object.defineProperty(exports, "__esModule", { value: true });
|
|
6
|
+
/* eslint-disable no-console */
|
|
7
|
+
const node_perf_hooks_1 = require("node:perf_hooks");
|
|
8
|
+
const lodash_1 = __importDefault(require("lodash"));
|
|
9
|
+
const batch_processing_1 = require("./batch-processing");
|
|
10
|
+
async function bench(fn, label, iterations = 5) {
|
|
11
|
+
let total = 0;
|
|
12
|
+
for (let i = 0; i < iterations; i += 1) {
|
|
13
|
+
const start = node_perf_hooks_1.performance.now();
|
|
14
|
+
// eslint-disable-next-line no-await-in-loop
|
|
15
|
+
await fn();
|
|
16
|
+
total += node_perf_hooks_1.performance.now() - start;
|
|
17
|
+
}
|
|
18
|
+
const avg = total / iterations;
|
|
19
|
+
console.log(`${label}: avg ${avg.toFixed(2)} ms over ${iterations} runs`);
|
|
20
|
+
return avg;
|
|
21
|
+
}
|
|
22
|
+
async function section(title, fn) {
|
|
23
|
+
console.log(`\n=== ${title} ===`);
|
|
24
|
+
await fn();
|
|
25
|
+
}
|
|
26
|
+
async function runBenchmarks() {
|
|
27
|
+
const arr = Array.from({ length: 10_000 }, (_, i) => i);
|
|
28
|
+
console.log(`Running benchmarks on array of length ${arr.length}`);
|
|
29
|
+
await section('map', async () => {
|
|
30
|
+
await bench(() => (0, batch_processing_1.mapInBatches)(arr, (x) => x + 1, { batchSize: 20, yieldThreshold: 10 }), 'mapInBatches { batchSize: 20, yieldThreshold: 10 }');
|
|
31
|
+
await bench(() => (0, batch_processing_1.mapInBatches)(arr, (x) => x + 1, {
|
|
32
|
+
batchSize: 20,
|
|
33
|
+
yieldThreshold: 10,
|
|
34
|
+
sequentialProcessing: false,
|
|
35
|
+
}), 'mapInBatches { batchSize: 20, yieldThreshold: 10, sequentialProcessing: false }');
|
|
36
|
+
await bench(() => Promise.resolve(lodash_1.default.map(arr, (x) => x + 1)), 'lodash.map');
|
|
37
|
+
await bench(() => Promise.resolve(arr.map((x) => x + 1)), 'Array.prototype.map');
|
|
38
|
+
});
|
|
39
|
+
await section('filter', async () => {
|
|
40
|
+
await bench(() => (0, batch_processing_1.filterInBatches)(arr, (x) => x % 2 === 0, { batchSize: 20, yieldThreshold: 10 }), 'filterInBatches { batchSize: 20, yieldThreshold: 10 }');
|
|
41
|
+
await bench(() => (0, batch_processing_1.filterInBatches)(arr, (x) => x % 2 === 0, {
|
|
42
|
+
batchSize: 20,
|
|
43
|
+
yieldThreshold: 10,
|
|
44
|
+
sequentialProcessing: false,
|
|
45
|
+
}), 'filterInBatches { batchSize: 20, yieldThreshold: 10, sequentialProcessing: false }');
|
|
46
|
+
await bench(() => Promise.resolve(lodash_1.default.filter(arr, (x) => x % 2 === 0)), 'lodash.filter');
|
|
47
|
+
await bench(() => Promise.resolve(arr.filter((x) => x % 2 === 0)), 'Array.prototype.filter');
|
|
48
|
+
});
|
|
49
|
+
await section('groupBy', async () => {
|
|
50
|
+
await bench(() => (0, batch_processing_1.groupByInBatches)(arr, (x) => (x % 2 === 0 ? 'even' : 'odd'), {
|
|
51
|
+
batchSize: 20,
|
|
52
|
+
yieldThreshold: 10,
|
|
53
|
+
}), 'groupByInBatches { batchSize: 20, yieldThreshold: 10 }');
|
|
54
|
+
await bench(() => (0, batch_processing_1.groupByInBatches)(arr, (x) => (x % 2 === 0 ? 'even' : 'odd'), {
|
|
55
|
+
batchSize: 20,
|
|
56
|
+
yieldThreshold: 10,
|
|
57
|
+
sequentialProcessing: false,
|
|
58
|
+
}), 'groupByInBatches { batchSize: 20, yieldThreshold: 10, sequentialProcessing: false }');
|
|
59
|
+
await bench(() => Promise.resolve(lodash_1.default.groupBy(arr, (x) => (x % 2 === 0 ? 'even' : 'odd'))), 'lodash.groupBy');
|
|
60
|
+
});
|
|
61
|
+
await section('reduce', async () => {
|
|
62
|
+
await bench(() => (0, batch_processing_1.reduceInBatches)(arr, (acc, x) => acc + x, 0, { batchSize: 20, yieldThreshold: 10 }), 'reduceInBatches { batchSize: 20, yieldThreshold: 10 }');
|
|
63
|
+
await bench(() => Promise.resolve(lodash_1.default.reduce(arr, (acc, x) => acc + x, 0)), 'lodash.reduce');
|
|
64
|
+
await bench(() => Promise.resolve(arr.reduce((acc, x) => acc + x, 0)), 'Array.prototype.reduce');
|
|
65
|
+
});
|
|
66
|
+
await section('flatMap', async () => {
|
|
67
|
+
await bench(() => (0, batch_processing_1.flatMapInBatches)(arr, (x) => [x, x], { batchSize: 20, yieldThreshold: 10 }), 'flatMapInBatches { batchSize: 20, yieldThreshold: 10 }');
|
|
68
|
+
await bench(() => (0, batch_processing_1.flatMapInBatches)(arr, (x) => [x, x], {
|
|
69
|
+
batchSize: 20,
|
|
70
|
+
yieldThreshold: 10,
|
|
71
|
+
sequentialProcessing: false,
|
|
72
|
+
}), 'flatMapInBatches { batchSize: 20, yieldThreshold: 10, sequentialProcessing: false }');
|
|
73
|
+
await bench(() => Promise.resolve(lodash_1.default.flatMap(arr, (x) => [x, x])), 'lodash.flatMap');
|
|
74
|
+
await bench(() => Promise.resolve(arr.flatMap
|
|
75
|
+
? arr.flatMap((x) => [x, x])
|
|
76
|
+
: [].concat(...arr.map((x) => [x, x]))), 'Array.prototype.flatMap');
|
|
77
|
+
});
|
|
78
|
+
await section('forEach', async () => {
|
|
79
|
+
await bench(() => (0, batch_processing_1.forEachInBatches)(arr, () => { }, { batchSize: 20, yieldThreshold: 10 }), 'forEachInBatches { batchSize: 20, yieldThreshold: 10 }');
|
|
80
|
+
await bench(() => (0, batch_processing_1.forEachInBatches)(arr, () => { }, {
|
|
81
|
+
batchSize: 20,
|
|
82
|
+
yieldThreshold: 10,
|
|
83
|
+
sequentialProcessing: false,
|
|
84
|
+
}), 'forEachInBatches { batchSize: 20, yieldThreshold: 10, sequentialProcessing: false }');
|
|
85
|
+
await bench(() => Promise.resolve(arr.forEach(() => { })), 'Array.prototype.forEach');
|
|
86
|
+
await bench(() => Promise.resolve(lodash_1.default.forEach(arr, () => { })), 'lodash.forEach');
|
|
87
|
+
});
|
|
88
|
+
}
|
|
89
|
+
// to run benchmarks use: npx ts-node src/utils/batch-processing.bench.ts
|
|
90
|
+
if (require.main === module) {
|
|
91
|
+
runBenchmarks().catch((err) => {
|
|
92
|
+
console.error(err);
|
|
93
|
+
process.exit(1);
|
|
94
|
+
});
|
|
95
|
+
}
|
|
96
|
+
//# sourceMappingURL=data:application/json;base64,
|
|
@@ -1,15 +1,23 @@
|
|
|
1
1
|
/**
|
|
2
|
-
*
|
|
2
|
+
* Options for batch processing operations
|
|
3
3
|
*/
|
|
4
|
-
export interface
|
|
4
|
+
export interface BatchProcessingOptions {
|
|
5
5
|
/**
|
|
6
|
-
*
|
|
6
|
+
* Number of items to process in each batch (default: 10)
|
|
7
|
+
* Must be a positive integer.
|
|
7
8
|
*/
|
|
8
9
|
batchSize?: number;
|
|
9
10
|
/**
|
|
10
|
-
*
|
|
11
|
+
* Time threshold in milliseconds (default: 10) before yielding control back to the event loop.
|
|
12
|
+
* Set to 0 to yield after every batch. Must be a non-negative integer.
|
|
11
13
|
*/
|
|
12
14
|
yieldThreshold?: number;
|
|
15
|
+
/**
|
|
16
|
+
* Whether to process items sequentially within each batch. When true (default), each item in a batch
|
|
17
|
+
* will be processed one at a time. When false, all items in a batch will be processed concurrently.
|
|
18
|
+
* Consider the implications of concurrency on your processing logic (e.g. race conditions, rate limits, memory pressure) before setting this to false.
|
|
19
|
+
*/
|
|
20
|
+
sequentialProcessing?: boolean;
|
|
13
21
|
}
|
|
14
22
|
/**
|
|
15
23
|
* Configure global defaults for batch processing operations
|
|
@@ -25,11 +33,14 @@ export interface BatchProcessingDefaults {
|
|
|
25
33
|
* // Set only batch size
|
|
26
34
|
* configureBatchProcessingDefaults({ batchSize: 50 });
|
|
27
35
|
*
|
|
36
|
+
* // Enable concurrent processing within batches
|
|
37
|
+
* configureBatchProcessingDefaults({ sequentialProcessing: false });
|
|
38
|
+
*
|
|
28
39
|
* // Get current configuration
|
|
29
40
|
* const currentConfig = configureBatchProcessingDefaults();
|
|
30
41
|
* ```
|
|
31
42
|
*/
|
|
32
|
-
export declare function configureBatchProcessingDefaults(config?:
|
|
43
|
+
export declare function configureBatchProcessingDefaults(config?: BatchProcessingOptions): BatchProcessingOptions;
|
|
33
44
|
/**
|
|
34
45
|
* Maps over an array in batches to avoid blocking the event loop.
|
|
35
46
|
* Processes items in chunks and yields control back to the event loop between batches
|
|
@@ -39,26 +50,20 @@ export declare function configureBatchProcessingDefaults(config?: BatchProcessin
|
|
|
39
50
|
* @template R - The type of items in the result array
|
|
40
51
|
* @param items - The array to map over
|
|
41
52
|
* @param mapFn - The mapping function to apply to each item. Receives the item and its index.
|
|
42
|
-
* @param
|
|
43
|
-
* @param yieldThreshold - Time threshold in milliseconds before yielding control (default: @see defaultYieldThreshold)
|
|
53
|
+
* @param options - Batch processing options
|
|
44
54
|
* @returns A promise that resolves to the mapped array
|
|
45
55
|
* @throws {Error} When batchSize is not a positive integer or yieldThreshold is not a non-negative integer
|
|
46
56
|
*
|
|
47
57
|
* @example
|
|
48
58
|
* ```typescript
|
|
49
|
-
* // Synchronous mapping
|
|
50
|
-
* const doubled = await mapInBatches([1, 2, 3, 4], (x) => x * 2
|
|
51
|
-
* // Result: [2, 4, 6, 8]
|
|
52
|
-
*
|
|
53
|
-
* // Asynchronous mapping
|
|
54
|
-
* const fetched = await mapInBatches(urls, async (url) => fetch(url), 3);
|
|
59
|
+
* // Synchronous mapping with default options (sequential processing)
|
|
60
|
+
* const doubled = await mapInBatches([1, 2, 3, 4], (x) => x * 2);
|
|
55
61
|
*
|
|
56
|
-
* // With
|
|
57
|
-
* const
|
|
58
|
-
* // Result: ['a-0', 'b-1']
|
|
62
|
+
* // With concurrent processing within batches
|
|
63
|
+
* const doubled = await mapInBatches([1, 2, 3, 4], (x) => x * 2, { sequentialProcessing: false });
|
|
59
64
|
* ```
|
|
60
65
|
*/
|
|
61
|
-
export declare function mapInBatches<T, R>(items: T[], mapFn: (item: T, index: number) => R | Promise<R>,
|
|
66
|
+
export declare function mapInBatches<T, R>(items: T[], mapFn: (item: T, index: number) => R | Promise<R>, options?: BatchProcessingOptions): Promise<R[]>;
|
|
62
67
|
/**
|
|
63
68
|
* Filters an array in batches to avoid blocking the event loop.
|
|
64
69
|
* Processes items in chunks and yields control back to the event loop between batches
|
|
@@ -67,29 +72,21 @@ export declare function mapInBatches<T, R>(items: T[], mapFn: (item: T, index: n
|
|
|
67
72
|
* @template T - The type of items in the array
|
|
68
73
|
* @param items - The array to filter
|
|
69
74
|
* @param predicate - The predicate function to test each item. Receives the item and its index.
|
|
70
|
-
* @param
|
|
71
|
-
* @param yieldThreshold - Time threshold in milliseconds before yielding control (default: @see defaultYieldThreshold)
|
|
75
|
+
* @param options - Batch processing options
|
|
72
76
|
* @returns A promise that resolves to the filtered array
|
|
73
77
|
* @throws {Error} When batchSize is not a positive integer or yieldThreshold is not a non-negative integer
|
|
74
78
|
*
|
|
75
79
|
* @example
|
|
76
80
|
* ```typescript
|
|
77
|
-
* // Synchronous filtering
|
|
78
|
-
* const evens = await filterInBatches([1, 2, 3, 4, 5], (x) => x % 2 === 0
|
|
81
|
+
* // Synchronous filtering with default options
|
|
82
|
+
* const evens = await filterInBatches([1, 2, 3, 4, 5], (x) => x % 2 === 0);
|
|
79
83
|
* // Result: [2, 4]
|
|
80
84
|
*
|
|
81
|
-
* //
|
|
82
|
-
* const
|
|
83
|
-
* const response = await fetch(url);
|
|
84
|
-
* return response.ok;
|
|
85
|
-
* }, 3);
|
|
86
|
-
*
|
|
87
|
-
* // With index
|
|
88
|
-
* const evenIndices = await filterInBatches(['a', 'b', 'c'], (_, index) => index % 2 === 0);
|
|
89
|
-
* // Result: ['a', 'c']
|
|
85
|
+
* // With custom batch size
|
|
86
|
+
* const evens = await filterInBatches([1, 2, 3, 4, 5], (x) => x % 2 === 0, { batchSize: 2 });
|
|
90
87
|
* ```
|
|
91
88
|
*/
|
|
92
|
-
export declare function filterInBatches<T>(items: T[], predicate: (item: T, index: number) => boolean | Promise<boolean>,
|
|
89
|
+
export declare function filterInBatches<T>(items: T[], predicate: (item: T, index: number) => boolean | Promise<boolean>, options?: BatchProcessingOptions): Promise<T[]>;
|
|
93
90
|
/**
|
|
94
91
|
* Groups an array by a key function in batches to avoid blocking the event loop.
|
|
95
92
|
* Processes items in chunks and yields control back to the event loop between batches
|
|
@@ -99,73 +96,54 @@ export declare function filterInBatches<T>(items: T[], predicate: (item: T, inde
|
|
|
99
96
|
* @template K - The type of the grouping key (must extend PropertyKey)
|
|
100
97
|
* @param items - The array to group
|
|
101
98
|
* @param keyFn - The function to extract the grouping key from each item. Receives the item and its index.
|
|
102
|
-
* @param
|
|
103
|
-
* @param yieldThreshold - Time threshold in milliseconds before yielding control (default: @see defaultYieldThreshold)
|
|
99
|
+
* @param options - Batch processing options
|
|
104
100
|
* @returns A promise that resolves to an object with grouped items
|
|
105
101
|
* @throws {Error} When batchSize is not a positive integer
|
|
106
102
|
*
|
|
107
103
|
* @example
|
|
108
104
|
* ```typescript
|
|
109
|
-
* // Group by property
|
|
105
|
+
* // Group by property with default options
|
|
110
106
|
* const byType = await groupByInBatches(
|
|
111
107
|
* [{type: 'A', value: 1}, {type: 'B', value: 2}, {type: 'A', value: 3}],
|
|
112
|
-
* (item) => item.type
|
|
113
|
-
* 2
|
|
108
|
+
* (item) => item.type
|
|
114
109
|
* );
|
|
115
110
|
* // Result: {A: [{type: 'A', value: 1}, {type: 'A', value: 3}], B: [{type: 'B', value: 2}]}
|
|
116
111
|
*
|
|
117
|
-
* //
|
|
118
|
-
* const
|
|
119
|
-
*
|
|
120
|
-
*
|
|
121
|
-
*
|
|
122
|
-
*
|
|
123
|
-
* return await getCategoryForItem(item);
|
|
124
|
-
* });
|
|
112
|
+
* // With custom batch size
|
|
113
|
+
* const byType = await groupByInBatches(
|
|
114
|
+
* [{type: 'A', value: 1}, {type: 'B', value: 2}, {type: 'A', value: 3}],
|
|
115
|
+
* (item) => item.type,
|
|
116
|
+
* { batchSize: 2 }
|
|
117
|
+
* );
|
|
125
118
|
* ```
|
|
126
119
|
*/
|
|
127
|
-
export declare function groupByInBatches<T, K extends PropertyKey>(items: T[], keyFn: (item: T, index: number) => K | Promise<K>,
|
|
120
|
+
export declare function groupByInBatches<T, K extends PropertyKey>(items: T[], keyFn: (item: T, index: number) => K | Promise<K>, options?: BatchProcessingOptions): Promise<Record<K, T[]>>;
|
|
128
121
|
/**
|
|
129
122
|
* Reduces an array in batches to avoid blocking the event loop.
|
|
130
123
|
* Processes items in chunks and yields control back to the event loop between batches
|
|
131
|
-
* when the processing time exceeds the threshold.
|
|
124
|
+
* when the processing time exceeds the threshold. Sequential processing is always used for the reducer function,
|
|
125
|
+
* irrespective of the `sequentialProcessing` option.
|
|
132
126
|
*
|
|
133
127
|
* @template T - The type of items in the array
|
|
134
128
|
* @template R - The type of the accumulator/result
|
|
135
129
|
* @param items - The array to reduce
|
|
136
130
|
* @param reducer - The reducer function. Receives the accumulator, current item, and index.
|
|
137
131
|
* @param initialValue - The initial value for the accumulator
|
|
138
|
-
* @param
|
|
139
|
-
* @param yieldThreshold - Time threshold in milliseconds before yielding control (default: @see defaultYieldThreshold)
|
|
132
|
+
* @param options - Batch processing options
|
|
140
133
|
* @returns A promise that resolves to the reduced value
|
|
141
134
|
* @throws {Error} When batchSize is not a positive integer
|
|
142
135
|
*
|
|
143
136
|
* @example
|
|
144
137
|
* ```typescript
|
|
145
|
-
* // Sum numbers
|
|
146
|
-
* const sum = await reduceInBatches([1, 2, 3, 4], (acc, x) => acc + x, 0
|
|
138
|
+
* // Sum numbers with default options
|
|
139
|
+
* const sum = await reduceInBatches([1, 2, 3, 4], (acc, x) => acc + x, 0);
|
|
147
140
|
* // Result: 10
|
|
148
141
|
*
|
|
149
|
-
* //
|
|
150
|
-
* const
|
|
151
|
-
* // Result: 'abc'
|
|
152
|
-
*
|
|
153
|
-
* // Build object with index
|
|
154
|
-
* const indexed = await reduceInBatches(
|
|
155
|
-
* ['x', 'y'],
|
|
156
|
-
* (acc, item, index) => ({ ...acc, [index]: item }),
|
|
157
|
-
* {}
|
|
158
|
-
* );
|
|
159
|
-
* // Result: {0: 'x', 1: 'y'}
|
|
160
|
-
*
|
|
161
|
-
* // Asynchronous reducer
|
|
162
|
-
* const processed = await reduceInBatches(urls, async (acc, url) => {
|
|
163
|
-
* const data = await fetch(url).then(r => r.json());
|
|
164
|
-
* return [...acc, data];
|
|
165
|
-
* }, []);
|
|
142
|
+
* // With custom batch size
|
|
143
|
+
* const sum = await reduceInBatches([1, 2, 3, 4], (acc, x) => acc + x, 0, { batchSize: 2 });
|
|
166
144
|
* ```
|
|
167
145
|
*/
|
|
168
|
-
export declare function reduceInBatches<T, R>(items: T[], reducer: (acc: R, item: T, index: number) => R | Promise<R>, initialValue: R,
|
|
146
|
+
export declare function reduceInBatches<T, R>(items: T[], reducer: (acc: R, item: T, index: number) => R | Promise<R>, initialValue: R, options?: BatchProcessingOptions): Promise<R>;
|
|
169
147
|
/**
|
|
170
148
|
* FlatMaps an array in batches to avoid blocking the event loop.
|
|
171
149
|
* Processes items in chunks, flattens the results, and yields control back to the event loop between batches
|
|
@@ -175,31 +153,45 @@ export declare function reduceInBatches<T, R>(items: T[], reducer: (acc: R, item
|
|
|
175
153
|
* @template R - The type of items in the flattened result array
|
|
176
154
|
* @param items - The array to flatMap over
|
|
177
155
|
* @param mapFn - The mapping function that returns an array for each item. Receives the item and its index.
|
|
178
|
-
* @param
|
|
179
|
-
* @param yieldThreshold - Time threshold in milliseconds before yielding control (default: @see defaultYieldThreshold)
|
|
156
|
+
* @param options - Batch processing options
|
|
180
157
|
* @returns A promise that resolves to the flattened mapped array
|
|
181
158
|
* @throws {Error} When batchSize is not a positive integer
|
|
182
159
|
*
|
|
183
160
|
* @example
|
|
184
161
|
* ```typescript
|
|
185
|
-
* // Duplicate each item
|
|
186
|
-
* const duplicated = await flatMapInBatches([1, 2, 3], (x) => [x, x]
|
|
162
|
+
* // Duplicate each item with default options
|
|
163
|
+
* const duplicated = await flatMapInBatches([1, 2, 3], (x) => [x, x]);
|
|
187
164
|
* // Result: [1, 1, 2, 2, 3, 3]
|
|
188
165
|
*
|
|
189
|
-
* //
|
|
190
|
-
* const
|
|
191
|
-
*
|
|
166
|
+
* // With custom batch size
|
|
167
|
+
* const duplicated = await flatMapInBatches([1, 2, 3], (x) => [x, x], { batchSize: 2 });
|
|
168
|
+
* ```
|
|
169
|
+
*/
|
|
170
|
+
export declare function flatMapInBatches<T, R>(items: T[], mapFn: (item: T, index: number) => R[] | Promise<R[]>, options?: BatchProcessingOptions): Promise<R[]>;
|
|
171
|
+
/**
|
|
172
|
+
* Iterates over an array in batches to avoid blocking the event loop.
|
|
173
|
+
* Processes items in chunks and yields control back to the event loop between batches
|
|
174
|
+
* when the processing time exceeds the threshold.
|
|
192
175
|
*
|
|
193
|
-
*
|
|
194
|
-
*
|
|
195
|
-
*
|
|
176
|
+
* @template T - The type of items in the input array
|
|
177
|
+
* @param items - The array to iterate over
|
|
178
|
+
* @param fn - The function to apply to each item. Receives the item and its index. Can be async.
|
|
179
|
+
* @param options - Batch processing options
|
|
180
|
+
* @returns A promise that resolves when all items have been processed
|
|
181
|
+
* @throws {Error} When batchSize is not a positive integer
|
|
196
182
|
*
|
|
197
|
-
*
|
|
198
|
-
*
|
|
199
|
-
*
|
|
200
|
-
*
|
|
183
|
+
* @example
|
|
184
|
+
* ```typescript
|
|
185
|
+
* // Process items in batches with default options
|
|
186
|
+
* await forEachInBatches([1, 2, 3, 4], async (x) => {
|
|
187
|
+
* await doSomething(x);
|
|
201
188
|
* });
|
|
189
|
+
*
|
|
190
|
+
* // With custom batch size
|
|
191
|
+
* await forEachInBatches([1, 2, 3, 4], async (x) => {
|
|
192
|
+
* await doSomething(x);
|
|
193
|
+
* }, { batchSize: 2 });
|
|
202
194
|
* ```
|
|
203
195
|
*/
|
|
204
|
-
export declare function
|
|
196
|
+
export declare function forEachInBatches<T>(items: T[], fn: (item: T, index: number) => void | Promise<void>, options?: BatchProcessingOptions): Promise<void>;
|
|
205
197
|
//# sourceMappingURL=batch-processing.d.ts.map
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"batch-processing.d.ts","sourceRoot":"","sources":["../../src/utils/batch-processing.ts"],"names":[],"mappings":"AAAA;;GAEG;AACH,MAAM,WAAW,
|
|
1
|
+
{"version":3,"file":"batch-processing.d.ts","sourceRoot":"","sources":["../../src/utils/batch-processing.ts"],"names":[],"mappings":"AAAA;;GAEG;AACH,MAAM,WAAW,sBAAsB;IACrC;;;OAGG;IACH,SAAS,CAAC,EAAE,MAAM,CAAC;IAEnB;;;OAGG;IACH,cAAc,CAAC,EAAE,MAAM,CAAC;IAExB;;;;OAIG;IACH,oBAAoB,CAAC,EAAE,OAAO,CAAC;CAChC;AAOD;;;;;;;;;;;;;;;;;;;;GAoBG;AACH,wBAAgB,gCAAgC,CAC9C,MAAM,CAAC,EAAE,sBAAsB,GAC9B,sBAAsB,CA0BxB;AAoFD;;;;;;;;;;;;;;;;;;;;;GAqBG;AACH,wBAAgB,YAAY,CAAC,CAAC,EAAE,CAAC,EAC/B,KAAK,EAAE,CAAC,EAAE,EACV,KAAK,EAAE,CAAC,IAAI,EAAE,CAAC,EAAE,KAAK,EAAE,MAAM,KAAK,CAAC,GAAG,OAAO,CAAC,CAAC,CAAC,EACjD,OAAO,CAAC,EAAE,sBAAsB,GAC/B,OAAO,CAAC,CAAC,EAAE,CAAC,CAqBd;AAED;;;;;;;;;;;;;;;;;;;;;GAqBG;AACH,wBAAgB,eAAe,CAAC,CAAC,EAC/B,KAAK,EAAE,CAAC,EAAE,EACV,SAAS,EAAE,CAAC,IAAI,EAAE,CAAC,EAAE,KAAK,EAAE,MAAM,KAAK,OAAO,GAAG,OAAO,CAAC,OAAO,CAAC,EACjE,OAAO,CAAC,EAAE,sBAAsB,GAC/B,OAAO,CAAC,CAAC,EAAE,CAAC,CAuBd;AAED;;;;;;;;;;;;;;;;;;;;;;;;;;;;;GA6BG;AACH,wBAAgB,gBAAgB,CAAC,CAAC,EAAE,CAAC,SAAS,WAAW,EACvD,KAAK,EAAE,CAAC,EAAE,EACV,KAAK,EAAE,CAAC,IAAI,EAAE,CAAC,EAAE,KAAK,EAAE,MAAM,KAAK,CAAC,GAAG,OAAO,CAAC,CAAC,CAAC,EACjD,OAAO,CAAC,EAAE,sBAAsB,GAC/B,OAAO,CAAC,MAAM,CAAC,CAAC,EAAE,CAAC,EAAE,CAAC,CAAC,CA0BzB;AAED;;;;;;;;;;;;;;;;;;;;;;;;GAwBG;AACH,wBAAgB,eAAe,CAAC,CAAC,EAAE,CAAC,EAClC,KAAK,EAAE,CAAC,EAAE,EACV,OAAO,EAAE,CAAC,GAAG,EAAE,CAAC,EAAE,IAAI,EAAE,CAAC,EAAE,KAAK,EAAE,MAAM,KAAK,CAAC,GAAG,OAAO,CAAC,CAAC,CAAC,EAC3D,YAAY,EAAE,CAAC,EACf,OAAO,CAAC,EAAE,sBAAsB,GAC/B,OAAO,CAAC,CAAC,CAAC,CAcZ;AAED;;;;;;;;;;;;;;;;;;;;;;GAsBG;AACH,wBAAgB,gBAAgB,CAAC,CAAC,EAAE,CAAC,EACnC,KAAK,EAAE,CAAC,EAAE,EACV,KAAK,EAAE,CAAC,IAAI,EAAE,CAAC,EAAE,KAAK,EAAE,MAAM,KAAK,CAAC,EAAE,GAAG,OAAO,CAAC,CAAC,EAAE,CAAC,EACrD,OAAO,CAAC,EAAE,sBAAsB,GAC/B,OAAO,CAAC,CAAC,EAAE,CAAC,CAuBd;AAED;;;;;;;;;;;;;;;;;;;;;;;;GAwBG;AACH,wBAAgB,gBAAgB,CAAC,CAAC,EAChC,KAAK,EAAE,CAAC,EAAE,EACV,EAAE,EAAE,CAAC,IAAI,EAAE,CAAC,EAAE,KAAK,EAAE,MAAM,KAAK,IAAI,GAAG,OAAO,CAAC,IAAI,CAAC,EACpD,OAAO,CAAC,EAAE,sBAAsB,GAC/B,OAAO,CAAC,IAAI,CAAC,CAef"}
|
|
@@ -6,9 +6,11 @@ exports.filterInBatches = filterInBatches;
|
|
|
6
6
|
exports.groupByInBatches = groupByInBatches;
|
|
7
7
|
exports.reduceInBatches = reduceInBatches;
|
|
8
8
|
exports.flatMapInBatches = flatMapInBatches;
|
|
9
|
+
exports.forEachInBatches = forEachInBatches;
|
|
9
10
|
// Default configuration values (internal)
|
|
10
11
|
let defaultBatchSize = 10;
|
|
11
12
|
let defaultYieldThreshold = 10;
|
|
13
|
+
let defaultSequentialProcessing = true;
|
|
12
14
|
/**
|
|
13
15
|
* Configure global defaults for batch processing operations
|
|
14
16
|
*
|
|
@@ -23,6 +25,9 @@ let defaultYieldThreshold = 10;
|
|
|
23
25
|
* // Set only batch size
|
|
24
26
|
* configureBatchProcessingDefaults({ batchSize: 50 });
|
|
25
27
|
*
|
|
28
|
+
* // Enable concurrent processing within batches
|
|
29
|
+
* configureBatchProcessingDefaults({ sequentialProcessing: false });
|
|
30
|
+
*
|
|
26
31
|
* // Get current configuration
|
|
27
32
|
* const currentConfig = configureBatchProcessingDefaults();
|
|
28
33
|
* ```
|
|
@@ -41,10 +46,14 @@ function configureBatchProcessingDefaults(config) {
|
|
|
41
46
|
}
|
|
42
47
|
defaultYieldThreshold = config.yieldThreshold;
|
|
43
48
|
}
|
|
49
|
+
if (config.sequentialProcessing !== undefined) {
|
|
50
|
+
defaultSequentialProcessing = Boolean(config.sequentialProcessing);
|
|
51
|
+
}
|
|
44
52
|
}
|
|
45
53
|
return {
|
|
46
54
|
batchSize: defaultBatchSize,
|
|
47
55
|
yieldThreshold: defaultYieldThreshold,
|
|
56
|
+
sequentialProcessing: defaultSequentialProcessing,
|
|
48
57
|
};
|
|
49
58
|
}
|
|
50
59
|
/**
|
|
@@ -68,6 +77,57 @@ function defer(startTime, yieldThreshold) {
|
|
|
68
77
|
// Otherwise continue immediately
|
|
69
78
|
return Promise.resolve(false);
|
|
70
79
|
}
|
|
80
|
+
/**
|
|
81
|
+
* Helper to get batch processing options with defaults applied
|
|
82
|
+
* @param options - User provided options
|
|
83
|
+
* @returns Options with defaults applied
|
|
84
|
+
* @internal
|
|
85
|
+
*/
|
|
86
|
+
function getOptions(options) {
|
|
87
|
+
const batchSize = options?.batchSize ?? defaultBatchSize;
|
|
88
|
+
const yieldThreshold = options?.yieldThreshold ?? defaultYieldThreshold;
|
|
89
|
+
const sequentialProcessing = options?.sequentialProcessing ?? defaultSequentialProcessing;
|
|
90
|
+
if (!Number.isInteger(batchSize) || batchSize <= 0) {
|
|
91
|
+
throw new Error('batchSize must be a positive integer');
|
|
92
|
+
}
|
|
93
|
+
if (!Number.isInteger(yieldThreshold) || yieldThreshold < 0) {
|
|
94
|
+
throw new Error('yieldThreshold must be a non-negative integer');
|
|
95
|
+
}
|
|
96
|
+
return {
|
|
97
|
+
batchSize,
|
|
98
|
+
yieldThreshold,
|
|
99
|
+
sequentialProcessing,
|
|
100
|
+
};
|
|
101
|
+
}
|
|
102
|
+
/**
|
|
103
|
+
* Helper to process an array in batches, yielding as needed.
|
|
104
|
+
* @param items - The array to process
|
|
105
|
+
* @param options - Batch processing options
|
|
106
|
+
* @param batchHandler - Function to handle each batch: (batch, batchStartIndex) => Promise<any>
|
|
107
|
+
* @returns Promise<void>
|
|
108
|
+
*/
|
|
109
|
+
async function processInBatches(items, options, batchHandler) {
|
|
110
|
+
let i = 0;
|
|
111
|
+
let startTime = Date.now();
|
|
112
|
+
const { batchSize } = options;
|
|
113
|
+
const n = items.length;
|
|
114
|
+
// Allocate a single batch array and reuse it for all batches (handlers must not retain a reference to it)
|
|
115
|
+
const batch = Array(batchSize);
|
|
116
|
+
while (i < n) {
|
|
117
|
+
const len = Math.min(batchSize, n - i);
|
|
118
|
+
for (let j = 0; j < len; j += 1) {
|
|
119
|
+
batch[j] = items[i + j];
|
|
120
|
+
}
|
|
121
|
+
batch.length = len;
|
|
122
|
+
// eslint-disable-next-line no-await-in-loop
|
|
123
|
+
await batchHandler(batch, i);
|
|
124
|
+
i += batchSize;
|
|
125
|
+
// eslint-disable-next-line no-await-in-loop
|
|
126
|
+
const didYield = await defer(startTime, options.yieldThreshold);
|
|
127
|
+
if (didYield)
|
|
128
|
+
startTime = Date.now();
|
|
129
|
+
}
|
|
130
|
+
}
|
|
71
131
|
/**
|
|
72
132
|
* Maps over an array in batches to avoid blocking the event loop.
|
|
73
133
|
* Processes items in chunks and yields control back to the event loop between batches
|
|
@@ -77,40 +137,40 @@ function defer(startTime, yieldThreshold) {
|
|
|
77
137
|
* @template R - The type of items in the result array
|
|
78
138
|
* @param items - The array to map over
|
|
79
139
|
* @param mapFn - The mapping function to apply to each item. Receives the item and its index.
|
|
80
|
-
* @param
|
|
81
|
-
* @param yieldThreshold - Time threshold in milliseconds before yielding control (default: @see defaultYieldThreshold)
|
|
140
|
+
* @param options - Batch processing options
|
|
82
141
|
* @returns A promise that resolves to the mapped array
|
|
83
142
|
* @throws {Error} When batchSize is not a positive integer or yieldThreshold is not a non-negative integer
|
|
84
143
|
*
|
|
85
144
|
* @example
|
|
86
145
|
* ```typescript
|
|
87
|
-
* // Synchronous mapping
|
|
88
|
-
* const doubled = await mapInBatches([1, 2, 3, 4], (x) => x * 2
|
|
89
|
-
* // Result: [2, 4, 6, 8]
|
|
90
|
-
*
|
|
91
|
-
* // Asynchronous mapping
|
|
92
|
-
* const fetched = await mapInBatches(urls, async (url) => fetch(url), 3);
|
|
146
|
+
* // Synchronous mapping with default options (sequential processing)
|
|
147
|
+
* const doubled = await mapInBatches([1, 2, 3, 4], (x) => x * 2);
|
|
93
148
|
*
|
|
94
|
-
* // With
|
|
95
|
-
* const
|
|
96
|
-
* // Result: ['a-0', 'b-1']
|
|
149
|
+
* // With concurrent processing within batches
|
|
150
|
+
* const doubled = await mapInBatches([1, 2, 3, 4], (x) => x * 2, { sequentialProcessing: false });
|
|
97
151
|
* ```
|
|
98
152
|
*/
|
|
99
|
-
function mapInBatches(items, mapFn,
|
|
100
|
-
|
|
101
|
-
|
|
102
|
-
|
|
103
|
-
|
|
104
|
-
|
|
105
|
-
|
|
106
|
-
|
|
107
|
-
|
|
108
|
-
|
|
109
|
-
|
|
110
|
-
|
|
111
|
-
|
|
112
|
-
|
|
113
|
-
|
|
153
|
+
function mapInBatches(items, mapFn, options) {
|
|
154
|
+
const opts = getOptions(options);
|
|
155
|
+
return (async () => {
|
|
156
|
+
const result = [];
|
|
157
|
+
await processInBatches(items, opts, async (batch, batchStart) => {
|
|
158
|
+
if (opts.sequentialProcessing) {
|
|
159
|
+
// Process items sequentially
|
|
160
|
+
for (let j = 0; j < batch.length; j += 1) {
|
|
161
|
+
// eslint-disable-next-line no-await-in-loop -- sequential processing is required
|
|
162
|
+
const mapped = await mapFn(batch[j], batchStart + j);
|
|
163
|
+
result.push(mapped);
|
|
164
|
+
}
|
|
165
|
+
}
|
|
166
|
+
else {
|
|
167
|
+
// Process items concurrently
|
|
168
|
+
const mapped = await Promise.all(batch.map((item, j) => mapFn(item, batchStart + j)));
|
|
169
|
+
result.push(...mapped);
|
|
170
|
+
}
|
|
171
|
+
});
|
|
172
|
+
return result;
|
|
173
|
+
})();
|
|
114
174
|
}
|
|
115
175
|
/**
|
|
116
176
|
* Filters an array in batches to avoid blocking the event loop.
|
|
@@ -120,44 +180,45 @@ function mapInBatches(items, mapFn, batchSize = defaultBatchSize, yieldThreshold
|
|
|
120
180
|
* @template T - The type of items in the array
|
|
121
181
|
* @param items - The array to filter
|
|
122
182
|
* @param predicate - The predicate function to test each item. Receives the item and its index.
|
|
123
|
-
* @param
|
|
124
|
-
* @param yieldThreshold - Time threshold in milliseconds before yielding control (default: @see defaultYieldThreshold)
|
|
183
|
+
* @param options - Batch processing options
|
|
125
184
|
* @returns A promise that resolves to the filtered array
|
|
126
185
|
* @throws {Error} When batchSize is not a positive integer or yieldThreshold is not a non-negative integer
|
|
127
186
|
*
|
|
128
187
|
* @example
|
|
129
188
|
* ```typescript
|
|
130
|
-
* // Synchronous filtering
|
|
131
|
-
* const evens = await filterInBatches([1, 2, 3, 4, 5], (x) => x % 2 === 0
|
|
189
|
+
* // Synchronous filtering with default options
|
|
190
|
+
* const evens = await filterInBatches([1, 2, 3, 4, 5], (x) => x % 2 === 0);
|
|
132
191
|
* // Result: [2, 4]
|
|
133
192
|
*
|
|
134
|
-
* //
|
|
135
|
-
* const
|
|
136
|
-
* const response = await fetch(url);
|
|
137
|
-
* return response.ok;
|
|
138
|
-
* }, 3);
|
|
139
|
-
*
|
|
140
|
-
* // With index
|
|
141
|
-
* const evenIndices = await filterInBatches(['a', 'b', 'c'], (_, index) => index % 2 === 0);
|
|
142
|
-
* // Result: ['a', 'c']
|
|
193
|
+
* // With custom batch size
|
|
194
|
+
* const evens = await filterInBatches([1, 2, 3, 4, 5], (x) => x % 2 === 0, { batchSize: 2 });
|
|
143
195
|
* ```
|
|
144
196
|
*/
|
|
145
|
-
function filterInBatches(items, predicate,
|
|
146
|
-
|
|
147
|
-
|
|
148
|
-
|
|
149
|
-
|
|
150
|
-
|
|
151
|
-
|
|
152
|
-
|
|
153
|
-
|
|
154
|
-
|
|
155
|
-
|
|
156
|
-
|
|
157
|
-
|
|
158
|
-
|
|
159
|
-
|
|
160
|
-
|
|
197
|
+
function filterInBatches(items, predicate, options) {
    // getOptions runs synchronously, outside the async body, so anything it
    // throws reaches the caller directly instead of as a rejected promise.
    const settings = getOptions(options);
    const collectMatches = async () => {
        const kept = [];
        const handleBatch = async (batch, batchStart) => {
            if (!settings.sequentialProcessing) {
                // Concurrent mode: start every predicate of the batch at once, then
                // keep the matching items in their original order.
                const verdicts = await Promise.all(batch.map((item, offset) => predicate(item, batchStart + offset)));
                for (let offset = 0; offset < batch.length; offset += 1) {
                    if (verdicts[offset]) {
                        kept.push(batch[offset]);
                    }
                }
                return;
            }
            // Sequential mode: wait for each predicate before calling the next one.
            for (let offset = 0; offset < batch.length; offset += 1) {
                // eslint-disable-next-line no-await-in-loop -- sequential processing is required
                const keep = await predicate(batch[offset], batchStart + offset);
                if (keep) {
                    kept.push(batch[offset]);
                }
            }
        };
        await processInBatches(items, settings, handleBatch);
        return kept;
    };
    return collectMatches();
}
|
|
162
223
|
/**
|
|
163
224
|
* Groups an array by a key function in batches to avoid blocking the event loop.
|
|
@@ -168,112 +229,94 @@ function filterInBatches(items, predicate, batchSize = defaultBatchSize, yieldTh
|
|
|
168
229
|
* @template K - The type of the grouping key (must extend PropertyKey)
|
|
169
230
|
* @param items - The array to group
|
|
170
231
|
* @param keyFn - The function to extract the grouping key from each item. Receives the item and its index.
|
|
171
|
-
* @param
|
|
172
|
-
* @param yieldThreshold - Time threshold in milliseconds before yielding control (default: @see defaultYieldThreshold)
|
|
232
|
+
* @param options - Batch processing options
|
|
173
233
|
* @returns A promise that resolves to an object with grouped items
|
|
174
234
|
* @throws {Error} When batchSize is not a positive integer
|
|
175
235
|
*
|
|
176
236
|
* @example
|
|
177
237
|
* ```typescript
|
|
178
|
-
* // Group by property
|
|
238
|
+
* // Group by property with default options
|
|
179
239
|
* const byType = await groupByInBatches(
|
|
180
240
|
* [{type: 'A', value: 1}, {type: 'B', value: 2}, {type: 'A', value: 3}],
|
|
181
|
-
* (item) => item.type
|
|
182
|
-
* 2
|
|
241
|
+
* (item) => item.type
|
|
183
242
|
* );
|
|
184
243
|
* // Result: {A: [{type: 'A', value: 1}, {type: 'A', value: 3}], B: [{type: 'B', value: 2}]}
|
|
185
244
|
*
|
|
186
|
-
* //
|
|
187
|
-
* const
|
|
188
|
-
*
|
|
189
|
-
*
|
|
190
|
-
*
|
|
191
|
-
*
|
|
192
|
-
* return await getCategoryForItem(item);
|
|
193
|
-
* });
|
|
245
|
+
* // With custom batch size
|
|
246
|
+
* const byType = await groupByInBatches(
|
|
247
|
+
* [{type: 'A', value: 1}, {type: 'B', value: 2}, {type: 'A', value: 3}],
|
|
248
|
+
* (item) => item.type,
|
|
249
|
+
* { batchSize: 2 }
|
|
250
|
+
* );
|
|
194
251
|
* ```
|
|
195
252
|
*/
|
|
196
|
-
function groupByInBatches(items, keyFn,
|
|
197
|
-
|
|
198
|
-
|
|
199
|
-
|
|
200
|
-
|
|
201
|
-
|
|
202
|
-
|
|
203
|
-
|
|
204
|
-
|
|
205
|
-
|
|
206
|
-
|
|
207
|
-
|
|
208
|
-
|
|
209
|
-
|
|
210
|
-
|
|
211
|
-
|
|
212
|
-
|
|
213
|
-
|
|
214
|
-
|
|
215
|
-
|
|
216
|
-
|
|
217
|
-
|
|
253
|
+
function groupByInBatches(items, keyFn, options) {
    // getOptions runs synchronously, outside the async body, so anything it
    // throws reaches the caller directly instead of as a rejected promise.
    const opts = getOptions(options);
    const hasOwn = Object.prototype.hasOwnProperty;
    // Appends `item` to the group stored under `key`, creating the group on first use.
    const addToGroup = (groups, key, item) => {
        // Only own properties count as existing groups. A plain truthiness test
        // (`!groups[key]`) would find inherited members such as `constructor` or
        // `toString` and then fail when calling `.push` on them.
        if (hasOwn.call(groups, key)) {
            groups[key].push(item);
            return;
        }
        // defineProperty (rather than assignment) so that a `__proto__` key becomes
        // a normal own property instead of replacing the result's prototype.
        Object.defineProperty(groups, key, {
            value: [item],
            writable: true,
            enumerable: true,
            configurable: true,
        });
    };
    return (async () => {
        const result = {};
        await processInBatches(items, opts, async (batch, batchStart) => {
            if (opts.sequentialProcessing) {
                // Process items sequentially: each key is resolved before the next keyFn call.
                for (let j = 0; j < batch.length; j += 1) {
                    // eslint-disable-next-line no-await-in-loop -- sequential processing is required
                    const key = await keyFn(batch[j], batchStart + j);
                    addToGroup(result, key, batch[j]);
                }
            }
            else {
                // Process items concurrently: resolve all keys of the batch, then
                // assign items to groups in their original order.
                const keys = await Promise.all(batch.map((item, j) => keyFn(item, batchStart + j)));
                for (let j = 0; j < batch.length; j += 1) {
                    addToGroup(result, keys[j], batch[j]);
                }
            }
        });
        return result;
    })();
}
|
|
219
282
|
/**
|
|
220
283
|
* Reduces an array in batches to avoid blocking the event loop.
|
|
221
284
|
* Processes items in chunks and yields control back to the event loop between batches
|
|
222
|
-
* when the processing time exceeds the threshold.
|
|
285
|
+
* when the processing time exceeds the threshold. Sequential processing is always used for the reducer function,
|
|
286
|
+
* irrespective of the `sequentialProcessing` option.
|
|
223
287
|
*
|
|
224
288
|
* @template T - The type of items in the array
|
|
225
289
|
* @template R - The type of the accumulator/result
|
|
226
290
|
* @param items - The array to reduce
|
|
227
291
|
* @param reducer - The reducer function. Receives the accumulator, current item, and index.
|
|
228
292
|
* @param initialValue - The initial value for the accumulator
|
|
229
|
-
* @param
|
|
230
|
-
* @param yieldThreshold - Time threshold in milliseconds before yielding control (default: @see defaultYieldThreshold)
|
|
293
|
+
* @param options - Batch processing options
|
|
231
294
|
* @returns A promise that resolves to the reduced value
|
|
232
295
|
* @throws {Error} When batchSize is not a positive integer
|
|
233
296
|
*
|
|
234
297
|
* @example
|
|
235
298
|
* ```typescript
|
|
236
|
-
* // Sum numbers
|
|
237
|
-
* const sum = await reduceInBatches([1, 2, 3, 4], (acc, x) => acc + x, 0
|
|
299
|
+
* // Sum numbers with default options
|
|
300
|
+
* const sum = await reduceInBatches([1, 2, 3, 4], (acc, x) => acc + x, 0);
|
|
238
301
|
* // Result: 10
|
|
239
302
|
*
|
|
240
|
-
* //
|
|
241
|
-
* const
|
|
242
|
-
* // Result: 'abc'
|
|
243
|
-
*
|
|
244
|
-
* // Build object with index
|
|
245
|
-
* const indexed = await reduceInBatches(
|
|
246
|
-
* ['x', 'y'],
|
|
247
|
-
* (acc, item, index) => ({ ...acc, [index]: item }),
|
|
248
|
-
* {}
|
|
249
|
-
* );
|
|
250
|
-
* // Result: {0: 'x', 1: 'y'}
|
|
251
|
-
*
|
|
252
|
-
* // Asynchronous reducer
|
|
253
|
-
* const processed = await reduceInBatches(urls, async (acc, url) => {
|
|
254
|
-
* const data = await fetch(url).then(r => r.json());
|
|
255
|
-
* return [...acc, data];
|
|
256
|
-
* }, []);
|
|
303
|
+
* // With custom batch size
|
|
304
|
+
* const sum = await reduceInBatches([1, 2, 3, 4], (acc, x) => acc + x, 0, { batchSize: 2 });
|
|
257
305
|
* ```
|
|
258
306
|
*/
|
|
259
|
-
function reduceInBatches(items, reducer, initialValue,
|
|
260
|
-
|
|
261
|
-
|
|
262
|
-
|
|
263
|
-
|
|
264
|
-
|
|
265
|
-
|
|
266
|
-
|
|
267
|
-
|
|
268
|
-
|
|
269
|
-
|
|
270
|
-
|
|
271
|
-
|
|
272
|
-
return reducer(resolvedAcc, item, i + j);
|
|
273
|
-
}, Promise.resolve(acc));
|
|
274
|
-
return defer(startTime, yieldThreshold).then((didYield) => process(i + batchSize, reduced, didYield ? Date.now() : startTime));
|
|
275
|
-
};
|
|
276
|
-
return process();
|
|
307
|
+
function reduceInBatches(items, reducer, initialValue, options) {
    // getOptions runs synchronously, outside the async body, so anything it
    // throws reaches the caller directly instead of as a rejected promise.
    const settings = getOptions(options);
    const fold = async () => {
        let accumulator = initialValue;
        // Each reducer call needs the previous accumulator, so items are always
        // folded one after another; settings.sequentialProcessing is not consulted.
        const foldBatch = async (batch, batchStart) => {
            let offset = 0;
            while (offset < batch.length) {
                // eslint-disable-next-line no-await-in-loop -- sequential processing is required
                accumulator = await reducer(accumulator, batch[offset], batchStart + offset);
                offset += 1;
            }
        };
        await processInBatches(items, settings, foldBatch);
        return accumulator;
    };
    return fold();
}
|
|
278
321
|
/**
|
|
279
322
|
* FlatMaps an array in batches to avoid blocking the event loop.
|
|
@@ -284,47 +327,83 @@ function reduceInBatches(items, reducer, initialValue, batchSize = defaultBatchS
|
|
|
284
327
|
* @template R - The type of items in the flattened result array
|
|
285
328
|
* @param items - The array to flatMap over
|
|
286
329
|
* @param mapFn - The mapping function that returns an array for each item. Receives the item and its index.
|
|
287
|
-
* @param
|
|
288
|
-
* @param yieldThreshold - Time threshold in milliseconds before yielding control (default: @see defaultYieldThreshold)
|
|
330
|
+
* @param options - Batch processing options
|
|
289
331
|
* @returns A promise that resolves to the flattened mapped array
|
|
290
332
|
* @throws {Error} When batchSize is not a positive integer
|
|
291
333
|
*
|
|
292
334
|
* @example
|
|
293
335
|
* ```typescript
|
|
294
|
-
* // Duplicate each item
|
|
295
|
-
* const duplicated = await flatMapInBatches([1, 2, 3], (x) => [x, x]
|
|
336
|
+
* // Duplicate each item with default options
|
|
337
|
+
* const duplicated = await flatMapInBatches([1, 2, 3], (x) => [x, x]);
|
|
296
338
|
* // Result: [1, 1, 2, 2, 3, 3]
|
|
297
339
|
*
|
|
298
|
-
* //
|
|
299
|
-
* const
|
|
300
|
-
*
|
|
340
|
+
* // With custom batch size
|
|
341
|
+
* const duplicated = await flatMapInBatches([1, 2, 3], (x) => [x, x], { batchSize: 2 });
|
|
342
|
+
* ```
|
|
343
|
+
*/
|
|
344
|
+
function flatMapInBatches(items, mapFn, options) {
    // getOptions runs synchronously, outside the async body, so anything it
    // throws reaches the caller directly instead of as a rejected promise.
    const opts = getOptions(options);
    // Appends every value of `values` to `target`, one element at a time.
    // `target.push(...values)` would pass each element as a separate call
    // argument and throws a RangeError once `values` is large enough to exceed
    // the engine's argument/stack limit.
    const appendAll = (target, values) => {
        for (const value of values) {
            target.push(value);
        }
    };
    return (async () => {
        const result = [];
        await processInBatches(items, opts, async (batch, batchStart) => {
            if (opts.sequentialProcessing) {
                // Process items sequentially: each mapFn call settles before the next starts.
                for (let j = 0; j < batch.length; j += 1) {
                    // eslint-disable-next-line no-await-in-loop -- sequential processing is required
                    const mapped = await mapFn(batch[j], batchStart + j);
                    appendAll(result, mapped);
                }
            }
            else {
                // Process items concurrently: run mapFn for the whole batch, then
                // flatten the per-item arrays in their original order.
                const mapped = await Promise.all(batch.map((item, j) => mapFn(item, batchStart + j)));
                mapped.forEach((arr) => {
                    appendAll(result, arr);
                });
            }
        });
        return result;
    })();
}
|
|
368
|
+
/**
|
|
369
|
+
* forEach over an array in batches to avoid blocking the event loop.
|
|
370
|
+
* Processes items in chunks and yields control back to the event loop between batches
|
|
371
|
+
* when the processing time exceeds the threshold.
|
|
301
372
|
*
|
|
302
|
-
*
|
|
303
|
-
*
|
|
304
|
-
*
|
|
373
|
+
* @template T - The type of items in the input array
|
|
374
|
+
* @param items - The array to iterate over
|
|
375
|
+
* @param fn - The function to apply to each item. Receives the item and its index. Can be async.
|
|
376
|
+
* @param options - Batch processing options
|
|
377
|
+
* @returns A promise that resolves when all items have been processed
|
|
378
|
+
* @throws {Error} When batchSize is not a positive integer
|
|
305
379
|
*
|
|
306
|
-
*
|
|
307
|
-
*
|
|
308
|
-
*
|
|
309
|
-
*
|
|
380
|
+
* @example
|
|
381
|
+
* ```typescript
|
|
382
|
+
* // Process items in batches with default options
|
|
383
|
+
* await forEachInBatches([1, 2, 3, 4], async (x) => {
|
|
384
|
+
* await doSomething(x);
|
|
310
385
|
* });
|
|
386
|
+
*
|
|
387
|
+
* // With custom batch size
|
|
388
|
+
* await forEachInBatches([1, 2, 3, 4], async (x) => {
|
|
389
|
+
* await doSomething(x);
|
|
390
|
+
* }, { batchSize: 2 });
|
|
311
391
|
* ```
|
|
312
392
|
*/
|
|
313
|
-
function
|
|
314
|
-
|
|
315
|
-
|
|
316
|
-
|
|
317
|
-
|
|
318
|
-
|
|
319
|
-
|
|
320
|
-
|
|
321
|
-
|
|
322
|
-
|
|
323
|
-
|
|
324
|
-
|
|
325
|
-
|
|
326
|
-
|
|
327
|
-
};
|
|
328
|
-
return process();
|
|
393
|
+
function forEachInBatches(items, fn, options) {
    // Both helpers are invoked synchronously; the value returned by
    // processInBatches is handed back to the caller untouched.
    const settings = getOptions(options);
    const visitBatch = async (batch, batchStart) => {
        if (!settings.sequentialProcessing) {
            // Concurrent mode: start fn for every item of the batch and wait for all of them.
            await Promise.all(batch.map((item, offset) => fn(item, batchStart + offset)));
            return;
        }
        // Sequential mode: wait for each call to settle before starting the next.
        for (let offset = 0; offset < batch.length; offset += 1) {
            // eslint-disable-next-line no-await-in-loop -- sequential processing is required
            await fn(batch[offset], batchStart + offset);
        }
    };
    return processInBatches(items, settings, visitBatch);
}
|
|
330
|
-
//# sourceMappingURL=data:application/json;base64,
|
|
409
|
+
//# sourceMappingURL=data:application/json;base64,
|