@crawlee/core 4.0.0-beta.4 → 4.0.0-beta.41

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (171)
  1. package/README.md +9 -5
  2. package/autoscaling/autoscaled_pool.d.ts +3 -5
  3. package/autoscaling/autoscaled_pool.d.ts.map +1 -1
  4. package/autoscaling/autoscaled_pool.js +3 -9
  5. package/autoscaling/autoscaled_pool.js.map +1 -1
  6. package/autoscaling/snapshotter.d.ts +3 -13
  7. package/autoscaling/snapshotter.d.ts.map +1 -1
  8. package/autoscaling/snapshotter.js +18 -29
  9. package/autoscaling/snapshotter.js.map +1 -1
  10. package/autoscaling/system_status.d.ts +0 -3
  11. package/autoscaling/system_status.d.ts.map +1 -1
  12. package/autoscaling/system_status.js +2 -3
  13. package/autoscaling/system_status.js.map +1 -1
  14. package/configuration.d.ts +5 -78
  15. package/configuration.d.ts.map +1 -1
  16. package/configuration.js +6 -102
  17. package/configuration.js.map +1 -1
  18. package/cookie_utils.d.ts +1 -1
  19. package/cookie_utils.d.ts.map +1 -1
  20. package/cookie_utils.js +8 -8
  21. package/cookie_utils.js.map +1 -1
  22. package/crawlers/context_pipeline.d.ts +71 -0
  23. package/crawlers/context_pipeline.d.ts.map +1 -0
  24. package/crawlers/context_pipeline.js +123 -0
  25. package/crawlers/context_pipeline.js.map +1 -0
  26. package/crawlers/crawler_commons.d.ts +15 -23
  27. package/crawlers/crawler_commons.d.ts.map +1 -1
  28. package/crawlers/crawler_commons.js +0 -8
  29. package/crawlers/crawler_commons.js.map +1 -1
  30. package/crawlers/error_snapshotter.d.ts +3 -2
  31. package/crawlers/error_snapshotter.d.ts.map +1 -1
  32. package/crawlers/error_snapshotter.js +2 -2
  33. package/crawlers/error_snapshotter.js.map +1 -1
  34. package/crawlers/error_tracker.d.ts +2 -1
  35. package/crawlers/error_tracker.d.ts.map +1 -1
  36. package/crawlers/error_tracker.js.map +1 -1
  37. package/crawlers/index.d.ts +1 -1
  38. package/crawlers/index.d.ts.map +1 -1
  39. package/crawlers/index.js +1 -1
  40. package/crawlers/index.js.map +1 -1
  41. package/crawlers/internals/types.d.ts +8 -0
  42. package/crawlers/internals/types.d.ts.map +1 -0
  43. package/crawlers/internals/types.js +2 -0
  44. package/crawlers/internals/types.js.map +1 -0
  45. package/crawlers/statistics.d.ts +15 -15
  46. package/crawlers/statistics.d.ts.map +1 -1
  47. package/crawlers/statistics.js +21 -18
  48. package/crawlers/statistics.js.map +1 -1
  49. package/enqueue_links/enqueue_links.d.ts +30 -18
  50. package/enqueue_links/enqueue_links.d.ts.map +1 -1
  51. package/enqueue_links/enqueue_links.js +41 -23
  52. package/enqueue_links/enqueue_links.js.map +1 -1
  53. package/enqueue_links/shared.d.ts +24 -7
  54. package/enqueue_links/shared.d.ts.map +1 -1
  55. package/enqueue_links/shared.js +66 -37
  56. package/enqueue_links/shared.js.map +1 -1
  57. package/errors.d.ts +18 -0
  58. package/errors.d.ts.map +1 -1
  59. package/errors.js +35 -0
  60. package/errors.js.map +1 -1
  61. package/events/event_manager.d.ts +8 -5
  62. package/events/event_manager.d.ts.map +1 -1
  63. package/events/event_manager.js +7 -9
  64. package/events/event_manager.js.map +1 -1
  65. package/events/local_event_manager.d.ts +14 -4
  66. package/events/local_event_manager.d.ts.map +1 -1
  67. package/events/local_event_manager.js +33 -39
  68. package/events/local_event_manager.js.map +1 -1
  69. package/index.d.ts +2 -1
  70. package/index.d.ts.map +1 -1
  71. package/index.js +2 -1
  72. package/index.js.map +1 -1
  73. package/log.d.ts +82 -2
  74. package/log.d.ts.map +1 -1
  75. package/log.js +102 -0
  76. package/log.js.map +1 -1
  77. package/package.json +6 -7
  78. package/proxy_configuration.d.ts +17 -94
  79. package/proxy_configuration.d.ts.map +1 -1
  80. package/proxy_configuration.js +18 -54
  81. package/proxy_configuration.js.map +1 -1
  82. package/recoverable_state.d.ts +121 -0
  83. package/recoverable_state.d.ts.map +1 -0
  84. package/recoverable_state.js +137 -0
  85. package/recoverable_state.js.map +1 -0
  86. package/request.d.ts +48 -6
  87. package/request.d.ts.map +1 -1
  88. package/request.js +62 -16
  89. package/request.js.map +1 -1
  90. package/service_locator.d.ts +162 -0
  91. package/service_locator.d.ts.map +1 -0
  92. package/service_locator.js +247 -0
  93. package/service_locator.js.map +1 -0
  94. package/session_pool/session.d.ts +9 -31
  95. package/session_pool/session.d.ts.map +1 -1
  96. package/session_pool/session.js +17 -21
  97. package/session_pool/session.js.map +1 -1
  98. package/session_pool/session_pool.d.ts +27 -54
  99. package/session_pool/session_pool.d.ts.map +1 -1
  100. package/session_pool/session_pool.js +54 -69
  101. package/session_pool/session_pool.js.map +1 -1
  102. package/storages/dataset.d.ts +53 -3
  103. package/storages/dataset.d.ts.map +1 -1
  104. package/storages/dataset.js +78 -6
  105. package/storages/dataset.js.map +1 -1
  106. package/storages/index.d.ts +2 -0
  107. package/storages/index.d.ts.map +1 -1
  108. package/storages/index.js +2 -0
  109. package/storages/index.js.map +1 -1
  110. package/storages/key_value_store.d.ts +71 -1
  111. package/storages/key_value_store.d.ts.map +1 -1
  112. package/storages/key_value_store.js +95 -12
  113. package/storages/key_value_store.js.map +1 -1
  114. package/storages/request_list.d.ts +9 -9
  115. package/storages/request_list.d.ts.map +1 -1
  116. package/storages/request_list.js +11 -8
  117. package/storages/request_list.js.map +1 -1
  118. package/storages/request_list_adapter.d.ts +58 -0
  119. package/storages/request_list_adapter.d.ts.map +1 -0
  120. package/storages/request_list_adapter.js +81 -0
  121. package/storages/request_list_adapter.js.map +1 -0
  122. package/storages/request_manager_tandem.d.ts +68 -0
  123. package/storages/request_manager_tandem.d.ts.map +1 -0
  124. package/storages/request_manager_tandem.js +124 -0
  125. package/storages/request_manager_tandem.js.map +1 -0
  126. package/storages/request_provider.d.ts +76 -9
  127. package/storages/request_provider.d.ts.map +1 -1
  128. package/storages/request_provider.js +92 -54
  129. package/storages/request_provider.js.map +1 -1
  130. package/storages/request_queue.d.ts +1 -3
  131. package/storages/request_queue.d.ts.map +1 -1
  132. package/storages/request_queue.js +2 -4
  133. package/storages/request_queue.js.map +1 -1
  134. package/storages/request_queue_v2.d.ts +3 -3
  135. package/storages/request_queue_v2.d.ts.map +1 -1
  136. package/storages/request_queue_v2.js +4 -5
  137. package/storages/request_queue_v2.js.map +1 -1
  138. package/storages/sitemap_request_list.d.ts +5 -5
  139. package/storages/sitemap_request_list.d.ts.map +1 -1
  140. package/storages/sitemap_request_list.js +10 -7
  141. package/storages/sitemap_request_list.js.map +1 -1
  142. package/storages/storage_manager.d.ts +10 -8
  143. package/storages/storage_manager.d.ts.map +1 -1
  144. package/storages/storage_manager.js +12 -22
  145. package/storages/storage_manager.js.map +1 -1
  146. package/storages/utils.d.ts.map +1 -1
  147. package/storages/utils.js +4 -3
  148. package/storages/utils.js.map +1 -1
  149. package/typedefs.d.ts +1 -1
  150. package/typedefs.d.ts.map +1 -1
  151. package/crawlers/crawler_extension.d.ts +0 -12
  152. package/crawlers/crawler_extension.d.ts.map +0 -1
  153. package/crawlers/crawler_extension.js +0 -14
  154. package/crawlers/crawler_extension.js.map +0 -1
  155. package/http_clients/base-http-client.d.ts +0 -134
  156. package/http_clients/base-http-client.d.ts.map +0 -1
  157. package/http_clients/base-http-client.js +0 -33
  158. package/http_clients/base-http-client.js.map +0 -1
  159. package/http_clients/form-data-like.d.ts +0 -67
  160. package/http_clients/form-data-like.d.ts.map +0 -1
  161. package/http_clients/form-data-like.js +0 -5
  162. package/http_clients/form-data-like.js.map +0 -1
  163. package/http_clients/got-scraping-http-client.d.ts +0 -15
  164. package/http_clients/got-scraping-http-client.d.ts.map +0 -1
  165. package/http_clients/got-scraping-http-client.js +0 -69
  166. package/http_clients/got-scraping-http-client.js.map +0 -1
  167. package/http_clients/index.d.ts +0 -3
  168. package/http_clients/index.d.ts.map +0 -1
  169. package/http_clients/index.js +0 -3
  170. package/http_clients/index.js.map +0 -1
  171. package/tsconfig.build.tsbuildinfo +0 -1
@@ -1,6 +1,5 @@
1
1
  import ow from 'ow';
2
- import log from '@apify/log';
3
- import { cryptoRandomObjectId } from '@apify/utilities';
2
+ import { serviceLocator } from './service_locator.js';
4
3
  /**
5
4
  * Internal class for tracking the proxy tier history for a specific domain.
6
5
  *
@@ -85,7 +84,7 @@ export class ProxyConfiguration {
85
84
  tieredProxyUrls;
86
85
  usedProxyUrls = new Map();
87
86
  newUrlFunction;
88
- log = log.child({ prefix: 'ProxyConfiguration' });
87
+ log = serviceLocator.getLogger().child({ prefix: 'ProxyConfiguration' });
89
88
  domainTiers = new Map();
90
89
  /**
91
90
  * Creates a {@link ProxyConfiguration} instance based on the provided options. Proxy servers are used to prevent target websites from
@@ -110,7 +109,7 @@ export class ProxyConfiguration {
110
109
  constructor(options = {}) {
111
110
  const { validateRequired, ...rest } = options;
112
111
  ow(rest, ow.object.exactShape({
113
- proxyUrls: ow.optional.array.nonEmpty.ofType(ow.string.url),
112
+ proxyUrls: ow.optional.array.nonEmpty.ofType(ow.any(ow.string.url, ow.null)),
114
113
  newUrlFunction: ow.optional.function,
115
114
  tieredProxyUrls: ow.optional.array.nonEmpty.ofType(ow.array.nonEmpty.ofType(ow.any(ow.string.url, ow.null))),
116
115
  }));
@@ -129,35 +128,24 @@ export class ProxyConfiguration {
129
128
  * the currently used proxy via the requestHandler parameter `proxyInfo`.
130
129
  * Use it if you want to work with a rich representation of a proxy URL.
131
130
  * If you need the URL string only, use {@link ProxyConfiguration.newUrl}.
132
- * @param [sessionId]
133
- * Represents the identifier of user {@link Session} that can be managed by the {@link SessionPool} or
134
- * you can use the Apify Proxy [Session](https://docs.apify.com/proxy#sessions) identifier.
135
- * When the provided sessionId is a number, it's converted to a string. Property sessionId of
136
- * {@link ProxyInfo} is always returned as a type string.
137
131
  *
138
- * All the HTTP requests going through the proxy with the same session identifier
139
- * will use the same target proxy server (i.e. the same IP address).
140
- * The identifier must not be longer than 50 characters and include only the following: `0-9`, `a-z`, `A-Z`, `"."`, `"_"` and `"~"`.
141
132
  * @return Represents information about used proxy and its configuration.
142
133
  */
143
- async newProxyInfo(sessionId, options) {
144
- if (typeof sessionId === 'number')
145
- sessionId = `${sessionId}`;
134
+ async newProxyInfo(options) {
146
135
  let url;
147
136
  let tier;
148
137
  if (this.tieredProxyUrls) {
149
- const { proxyUrl, proxyTier } = this._handleTieredUrl(sessionId ?? cryptoRandomObjectId(6), options);
138
+ const { proxyUrl, proxyTier } = this._handleTieredUrl(options);
150
139
  url = proxyUrl ?? undefined;
151
140
  tier = proxyTier;
152
141
  }
153
142
  else {
154
- url = await this.newUrl(sessionId, options);
143
+ url = await this.newUrl(options);
155
144
  }
156
145
  if (!url)
157
146
  return undefined;
158
147
  const { username, password, port, hostname } = new URL(url);
159
148
  return {
160
- sessionId,
161
149
  url,
162
150
  username: decodeURIComponent(username),
163
151
  password: decodeURIComponent(password),
@@ -167,12 +155,11 @@ export class ProxyConfiguration {
167
155
  };
168
156
  }
169
157
  /**
170
- * Given a session identifier and a request / proxy tier, this function returns a new proxy URL based on the provided configuration options.
171
- * @param _sessionId Session identifier
158
+ * Given a request / proxy tier, this function returns a new proxy URL based on the provided configuration options.
172
159
  * @param options Options for the tiered proxy rotation
173
160
  * @returns An object with the proxy URL and the proxy tier used.
174
161
  */
175
- _handleTieredUrl(_sessionId, options) {
162
+ _handleTieredUrl(options) {
176
163
  if (!this.tieredProxyUrls)
177
164
  throw new Error('Tiered proxy URLs are not set');
178
165
  if (!options || (!options?.request && options?.proxyTier === undefined)) {
@@ -211,58 +198,35 @@ export class ProxyConfiguration {
211
198
  const tierPrediction = tracker.predictTier();
212
199
  if (typeof request.userData.__crawlee.lastProxyTier === 'number' &&
213
200
  request.userData.__crawlee.lastProxyTier !== tierPrediction) {
214
- log.debug(`Changing proxy tier for domain "${domain}" from ${request.userData.__crawlee.lastProxyTier} to ${tierPrediction}.`);
201
+ this.log.debug(`Changing proxy tier for domain "${domain}" from ${request.userData.__crawlee.lastProxyTier} to ${tierPrediction}.`);
215
202
  }
216
203
  request.userData.__crawlee.lastProxyTier = tierPrediction;
217
204
  request.userData.__crawlee.forefront = true;
218
205
  return tierPrediction;
219
206
  }
220
207
  /**
221
- * Returns a new proxy URL based on provided configuration options and the `sessionId` parameter.
222
- * @param [sessionId]
223
- * Represents the identifier of user {@link Session} that can be managed by the {@link SessionPool} or
224
- * you can use the Apify Proxy [Session](https://docs.apify.com/proxy#sessions) identifier.
225
- * When the provided sessionId is a number, it's converted to a string.
208
+ * Returns a new proxy URL based on provided configuration options.
226
209
  *
227
- * All the HTTP requests going through the proxy with the same session identifier
228
- * will use the same target proxy server (i.e. the same IP address).
229
- * The identifier must not be longer than 50 characters and include only the following: `0-9`, `a-z`, `A-Z`, `"."`, `"_"` and `"~"`.
230
210
  * @return A string with a proxy URL, including authentication credentials and port number.
231
211
  * For example, `http://bob:password123@proxy.example.com:8000`
232
212
  */
233
- async newUrl(sessionId, options) {
234
- if (typeof sessionId === 'number')
235
- sessionId = `${sessionId}`;
213
+ async newUrl(options) {
236
214
  if (this.newUrlFunction) {
237
- return (await this._callNewUrlFunction(sessionId, { request: options?.request })) ?? undefined;
215
+ return (await this._callNewUrlFunction({ request: options?.request })) ?? undefined;
238
216
  }
239
217
  if (this.tieredProxyUrls) {
240
- return this._handleTieredUrl(sessionId ?? cryptoRandomObjectId(6), options).proxyUrl ?? undefined;
218
+ return this._handleTieredUrl(options).proxyUrl ?? undefined;
241
219
  }
242
- return this._handleCustomUrl(sessionId);
220
+ return this._handleProxyUrlsList() ?? undefined;
243
221
  }
244
- /**
245
- * Handles custom url rotation with session
246
- */
247
- _handleCustomUrl(sessionId) {
248
- let customUrlToUse;
249
- if (!sessionId) {
250
- return this.proxyUrls[this.nextCustomUrlIndex++ % this.proxyUrls.length];
251
- }
252
- if (this.usedProxyUrls.has(sessionId)) {
253
- customUrlToUse = this.usedProxyUrls.get(sessionId);
254
- }
255
- else {
256
- customUrlToUse = this.proxyUrls[this.nextCustomUrlIndex++ % this.proxyUrls.length];
257
- this.usedProxyUrls.set(sessionId, customUrlToUse);
258
- }
259
- return customUrlToUse;
222
+ _handleProxyUrlsList() {
223
+ return this.proxyUrls[this.nextCustomUrlIndex++ % this.proxyUrls.length];
260
224
  }
261
225
  /**
262
226
  * Calls the custom newUrlFunction and checks format of its return value
263
227
  */
264
- async _callNewUrlFunction(sessionId, options) {
265
- const proxyUrl = await this.newUrlFunction(sessionId, options);
228
+ async _callNewUrlFunction(options) {
229
+ const proxyUrl = await this.newUrlFunction(options);
266
230
  try {
267
231
  if (proxyUrl) {
268
232
  new URL(proxyUrl); // eslint-disable-line no-new
@@ -1 +1 @@
1
- {"version":3,"file":"proxy_configuration.js","sourceRoot":"","sources":["../src/proxy_configuration.ts"],"names":[],"mappings":"AACA,OAAO,EAAE,MAAM,IAAI,CAAC;AAEpB,OAAO,GAAG,MAAM,YAAY,CAAC;AAC7B,OAAO,EAAE,oBAAoB,EAAE,MAAM,kBAAkB,CAAC;AAmHxD;;;;GAIG;AACH,MAAM,gBAAgB;IACV,SAAS,CAAW;IACpB,WAAW,CAAS;IAE5B,YAAY,eAAoC;QAC5C,IAAI,CAAC,SAAS,GAAG,eAAe,CAAC,GAAG,CAAC,GAAG,EAAE,CAAC,CAAC,CAAC,CAAC;QAC9C,IAAI,CAAC,WAAW,GAAG,CAAC,CAAC;IACzB,CAAC;IAED;;OAEG;IACK,WAAW;QACf,IAAI,CAAC,SAAS,CAAC,OAAO,CAAC,CAAC,CAAC,EAAE,CAAC,EAAE,EAAE;YAC5B,IAAI,IAAI,CAAC,WAAW,KAAK,CAAC;gBAAE,OAAO;YACnC,IAAI,CAAC,GAAG,CAAC;gBAAE,IAAI,CAAC,SAAS,CAAC,CAAC,CAAC,EAAE,CAAC;QACnC,CAAC,CAAC,CAAC;QAEH,MAAM,IAAI,GAAG,IAAI,CAAC,WAAW,GAAG,CAAC,CAAC,CAAC,CAAC,IAAI,CAAC,SAAS,CAAC,IAAI,CAAC,WAAW,GAAG,CAAC,CAAC,CAAC,CAAC,CAAC,QAAQ,CAAC;QACpF,MAAM,KAAK,GAAG,IAAI,CAAC,WAAW,GAAG,IAAI,CAAC,SAAS,CAAC,MAAM,GAAG,CAAC,CAAC,CAAC,CAAC,IAAI,CAAC,SAAS,CAAC,IAAI,CAAC,WAAW,GAAG,CAAC,CAAC,CAAC,CAAC,CAAC,QAAQ,CAAC;QAE7G,IAAI,IAAI,CAAC,SAAS,CAAC,IAAI,CAAC,WAAW,CAAC,GAAG,IAAI,CAAC,GAAG,CAAC,IAAI,EAAE,KAAK,CAAC,EAAE,CAAC;YAC3D,IAAI,CAAC,WAAW,GAAG,IAAI,IAAI,KAAK,CAAC,CAAC,CAAC,IAAI,CAAC,WAAW,GAAG,CAAC,CAAC,CAAC,CAAC,IAAI,CAAC,WAAW,GAAG,CAAC,CAAC;QACnF,CAAC;aAAM,IAAI,IAAI,CAAC,SAAS,CAAC,IAAI,CAAC,WAAW,CAAC,KAAK,IAAI,EAAE,CAAC;YACnD,IAAI,CAAC,WAAW,EAAE,CAAC;QACvB,CAAC;IACL,CAAC;IAED;;;;;OAKG;IACH,QAAQ,CAAC,IAAY;QACjB,IAAI,CAAC,SAAS,CAAC,IAAI,CAAC,IAAI,EAAE,CAAC;IAC/B,CAAC;IAED;;;OAGG;IACH,WAAW;QACP,IAAI,CAAC,WAAW,EAAE,CAAC;QACnB,OAAO,IAAI,CAAC,WAAW,CAAC;IAC5B,CAAC;CACJ;AAED;;;;;;;;;;;;;;;;;;;;;;;;;;;GA2BG;AACH,MAAM,OAAO,kBAAkB;IAC3B,gBAAgB,GAAG,KAAK,CAAC;IACf,kBAAkB,GAAG,CAAC,CAAC;IACvB,SAAS,CAAY;IACrB,eAAe,CAAuB;IACtC,aAAa,GAAG,IAAI,GAAG,EAAkB,CAAC;IAC1C,cAAc,CAA8B;IAC5C,GAAG,GAAG,GAAG,CAAC,KAAK,CAAC,EAAE,MAAM,EAAE,oBAAoB,EAAE,CAAC,CAAC;IAClD,WAAW,GAAG,IAAI,GAAG,EAA4B,CAAC;IAE5D;;;;;;;;;;;;;;;;;;;OAmBG;IACH,YAAY,UAAqC,EAAE;QAC/C,MAAM,EAAE,gBAAgB,EAAE,GAAG,IAAI,EAAE,GAAG,OAAqB,CAAC;QAC5D,EAAE,CACE,IAAI,EACJ,EAAE,CAAC,MAAM,CAAC,UAAU,CA
AC;YACjB,SAAS,EAAE,EAAE,CAAC,QAAQ,CAAC,KAAK,CAAC,QAAQ,CAAC,MAAM,CAAC,EAAE,CAAC,MAAM,CAAC,GAAG,CAAC;YAC3D,cAAc,EAAE,EAAE,CAAC,QAAQ,CAAC,QAAQ;YACpC,eAAe,EAAE,EAAE,CAAC,QAAQ,CAAC,KAAK,CAAC,QAAQ,CAAC,MAAM,CAC9C,EAAE,CAAC,KAAK,CAAC,QAAQ,CAAC,MAAM,CAAC,EAAE,CAAC,GAAG,CAAC,EAAE,CAAC,MAAM,CAAC,GAAG,EAAE,EAAE,CAAC,IAAI,CAAC,CAAC,CAC3D;SACJ,CAAC,CACL,CAAC;QAEF,MAAM,EAAE,SAAS,EAAE,cAAc,EAAE,eAAe,EAAE,GAAG,OAAO,CAAC;QAE/D,IAAI,CAAC,SAAS,EAAE,cAAc,EAAE,eAAe,CAAC,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC,CAAC,MAAM,GAAG,CAAC;YACxE,IAAI,CAAC,gCAAgC,EAAE,CAAC;QAC5C,IAAI,CAAC,SAAS,IAAI,CAAC,cAAc,IAAI,gBAAgB;YAAE,IAAI,CAAC,uBAAuB,EAAE,CAAC;QAEtF,IAAI,CAAC,SAAS,GAAG,SAAS,CAAC;QAC3B,IAAI,CAAC,cAAc,GAAG,cAAc,CAAC;QACrC,IAAI,CAAC,eAAe,GAAG,eAAe,CAAC;IAC3C,CAAC;IAED;;;;;;;;;;;;;;;;OAgBG;IACH,KAAK,CAAC,YAAY,CAAC,SAA2B,EAAE,OAA4B;QACxE,IAAI,OAAO,SAAS,KAAK,QAAQ;YAAE,SAAS,GAAG,GAAG,SAAS,EAAE,CAAC;QAE9D,IAAI,GAAuB,CAAC;QAC5B,IAAI,IAAwB,CAAC;QAC7B,IAAI,IAAI,CAAC,eAAe,EAAE,CAAC;YACvB,MAAM,EAAE,QAAQ,EAAE,SAAS,EAAE,GAAG,IAAI,CAAC,gBAAgB,CAAC,SAAS,IAAI,oBAAoB,CAAC,CAAC,CAAC,EAAE,OAAO,CAAC,CAAC;YACrG,GAAG,GAAG,QAAQ,IAAI,SAAS,CAAC;YAC5B,IAAI,GAAG,SAAS,CAAC;QACrB,CAAC;aAAM,CAAC;YACJ,GAAG,GAAG,MAAM,IAAI,CAAC,MAAM,CAAC,SAAS,EAAE,OAAO,CAAC,CAAC;QAChD,CAAC;QAED,IAAI,CAAC,GAAG;YAAE,OAAO,SAAS,CAAC;QAE3B,MAAM,EAAE,QAAQ,EAAE,QAAQ,EAAE,IAAI,EAAE,QAAQ,EAAE,GAAG,IAAI,GAAG,CAAC,GAAG,CAAC,CAAC;QAE5D,OAAO;YACH,SAAS;YACT,GAAG;YACH,QAAQ,EAAE,kBAAkB,CAAC,QAAQ,CAAC;YACtC,QAAQ,EAAE,kBAAkB,CAAC,QAAQ,CAAC;YACtC,QAAQ;YACR,IAAI,EAAE,IAAK;YACX,SAAS,EAAE,IAAI;SAClB,CAAC;IACN,CAAC;IAED;;;;;OAKG;IACO,gBAAgB,CAAC,UAAkB,EAAE,OAA4B;QACvE,IAAI,CAAC,IAAI,CAAC,eAAe;YAAE,MAAM,IAAI,KAAK,CAAC,+BAA+B,CAAC,CAAC;QAE5E,IAAI,CAAC,OAAO,IAAI,CAAC,CAAC,OAAO,EAAE,OAAO,IAAI,OAAO,EAAE,SAAS,KAAK,SAAS,CAAC,EAAE,CAAC;YACtE,MAAM,YAAY,GAAG,IAAI,CAAC,eAAe,CAAC,IAAI,EAAE,CAAC;YACjD,OAAO;gBACH,QAAQ,EAAE,YAAY,CAAC,IAAI,CAAC,kBAAkB,EAAE,GAAG,YAAY,CAAC,MAAM,CAAC;aAC1E,CAAC;QACN,CAAC;QAED,IAAI,cAAc,GAAG,OAAO,CAAC,SAAU,CAAC;QAExC,IAAI,OAAO,cAAc,KAAK,QAA
Q,EAAE,CAAC;YACrC,cAAc,GAAG,IAAI,CAAC,gBAAgB,CAAC,OAAO,CAAC,OAAQ,CAAE,CAAC;QAC9D,CAAC;QAED,MAAM,SAAS,GAAG,IAAI,CAAC,eAAgB,CAAC,cAAc,CAAC,CAAC;QAExD,OAAO;YACH,QAAQ,EAAE,SAAS,CAAC,IAAI,CAAC,kBAAkB,EAAE,GAAG,SAAS,CAAC,MAAM,CAAC;YACjE,SAAS,EAAE,cAAc;SAC5B,CAAC;IACN,CAAC;IAED;;;;OAIG;IACO,gBAAgB,CAAC,OAAgB;QACvC,IAAI,CAAC,IAAI,CAAC,eAAe;YAAE,OAAO,IAAI,CAAC;QAEvC,MAAM,MAAM,GAAG,IAAI,GAAG,CAAC,OAAO,CAAC,GAAG,CAAC,CAAC,QAAQ,CAAC;QAC7C,IAAI,CAAC,IAAI,CAAC,WAAW,CAAC,GAAG,CAAC,MAAM,CAAC,EAAE,CAAC;YAChC,IAAI,CAAC,WAAW,CAAC,GAAG,CAAC,MAAM,EAAE,IAAI,gBAAgB,CAAC,IAAI,CAAC,eAAe,CAAC,CAAC,CAAC;QAC7E,CAAC;QAED,OAAO,CAAC,QAAQ,CAAC,SAAS,KAAK,EAAE,CAAC;QAElC,MAAM,OAAO,GAAG,IAAI,CAAC,WAAW,CAAC,GAAG,CAAC,MAAM,CAAE,CAAC;QAE9C,IAAI,OAAO,OAAO,CAAC,QAAQ,CAAC,SAAS,CAAC,aAAa,KAAK,QAAQ,EAAE,CAAC;YAC/D,OAAO,CAAC,QAAQ,CAAC,OAAO,CAAC,QAAQ,CAAC,SAAS,CAAC,aAAa,CAAC,CAAC;QAC/D,CAAC;QAED,MAAM,cAAc,GAAG,OAAO,CAAC,WAAW,EAAE,CAAC;QAE7C,IACI,OAAO,OAAO,CAAC,QAAQ,CAAC,SAAS,CAAC,aAAa,KAAK,QAAQ;YAC5D,OAAO,CAAC,QAAQ,CAAC,SAAS,CAAC,aAAa,KAAK,cAAc,EAC7D,CAAC;YACC,GAAG,CAAC,KAAK,CACL,mCAAmC,MAAM,UAAU,OAAO,CAAC,QAAQ,CAAC,SAAS,CAAC,aAAa,OAAO,cAAc,GAAG,CACtH,CAAC;QACN,CAAC;QAED,OAAO,CAAC,QAAQ,CAAC,SAAS,CAAC,aAAa,GAAG,cAAc,CAAC;QAC1D,OAAO,CAAC,QAAQ,CAAC,SAAS,CAAC,SAAS,GAAG,IAAI,CAAC;QAE5C,OAAO,cAAc,CAAC;IAC1B,CAAC;IAED;;;;;;;;;;;;OAYG;IACH,KAAK,CAAC,MAAM,CAAC,SAA2B,EAAE,OAA4B;QAClE,IAAI,OAAO,SAAS,KAAK,QAAQ;YAAE,SAAS,GAAG,GAAG,SAAS,EAAE,CAAC;QAE9D,IAAI,IAAI,CAAC,cAAc,EAAE,CAAC;YACtB,OAAO,CAAC,MAAM,IAAI,CAAC,mBAAmB,CAAC,SAAS,EAAE,EAAE,OAAO,EAAE,OAAO,EAAE,OAAO,EAAE,CAAC,CAAC,IAAI,SAAS,CAAC;QACnG,CAAC;QAED,IAAI,IAAI,CAAC,eAAe,EAAE,CAAC;YACvB,OAAO,IAAI,CAAC,gBAAgB,CAAC,SAAS,IAAI,oBAAoB,CAAC,CAAC,CAAC,EAAE,OAAO,CAAC,CAAC,QAAQ,IAAI,SAAS,CAAC;QACtG,CAAC;QAED,OAAO,IAAI,CAAC,gBAAgB,CAAC,SAAS,CAAC,CAAC;IAC5C,CAAC;IAED;;OAEG;IACO,gBAAgB,CAAC,SAAkB;QACzC,IAAI,cAAsB,CAAC;QAE3B,IAAI,CAAC,SAAS,EAAE,CAAC;YACb,OAAO,IAAI,CAAC,SAAU,CAAC,IAAI,CAAC,kBAAkB,EAAE,GAAG,IAAI,CAAC,SAAU,CAAC,MAAM,CAAC,CAAC;QAC/E,CAAC;QAED,IAAI,IAAI,CAAC,aAAa,CAAC
,GAAG,CAAC,SAAS,CAAC,EAAE,CAAC;YACpC,cAAc,GAAG,IAAI,CAAC,aAAa,CAAC,GAAG,CAAC,SAAS,CAAE,CAAC;QACxD,CAAC;aAAM,CAAC;YACJ,cAAc,GAAG,IAAI,CAAC,SAAU,CAAC,IAAI,CAAC,kBAAkB,EAAE,GAAG,IAAI,CAAC,SAAU,CAAC,MAAM,CAAC,CAAC;YACrF,IAAI,CAAC,aAAa,CAAC,GAAG,CAAC,SAAS,EAAE,cAAc,CAAC,CAAC;QACtD,CAAC;QAED,OAAO,cAAc,CAAC;IAC1B,CAAC;IAED;;OAEG;IACO,KAAK,CAAC,mBAAmB,CAAC,SAAkB,EAAE,OAA+B;QACnF,MAAM,QAAQ,GAAG,MAAM,IAAI,CAAC,cAAe,CAAC,SAAU,EAAE,OAAO,CAAC,CAAC;QACjE,IAAI,CAAC;YACD,IAAI,QAAQ,EAAE,CAAC;gBACX,IAAI,GAAG,CAAC,QAAQ,CAAC,CAAC,CAAC,6BAA6B;YACpD,CAAC;YACD,OAAO,QAAQ,CAAC;QACpB,CAAC;QAAC,OAAO,GAAG,EAAE,CAAC;YACX,MAAM,IAAI,KAAK,CACX,mEAAoE,GAAa,CAAC,OAAO,EAAE,CAC9F,CAAC;QACN,CAAC;IACL,CAAC;IAES,gCAAgC;QACtC,MAAM,IAAI,KAAK,CACX,6GAA6G,CAChH,CAAC;IACN,CAAC;IAES,uBAAuB;QAC7B,MAAM,IAAI,KAAK,CAAC,8EAA8E,CAAC,CAAC;IACpG,CAAC;CACJ"}
1
+ {"version":3,"file":"proxy_configuration.js","sourceRoot":"","sources":["../src/proxy_configuration.ts"],"names":[],"mappings":"AACA,OAAO,EAAE,MAAM,IAAI,CAAC;AAGpB,OAAO,EAAE,cAAc,EAAE,MAAM,sBAAsB,CAAC;AAgDtD;;;;GAIG;AACH,MAAM,gBAAgB;IACV,SAAS,CAAW;IACpB,WAAW,CAAS;IAE5B,YAAY,eAAoC;QAC5C,IAAI,CAAC,SAAS,GAAG,eAAe,CAAC,GAAG,CAAC,GAAG,EAAE,CAAC,CAAC,CAAC,CAAC;QAC9C,IAAI,CAAC,WAAW,GAAG,CAAC,CAAC;IACzB,CAAC;IAED;;OAEG;IACK,WAAW;QACf,IAAI,CAAC,SAAS,CAAC,OAAO,CAAC,CAAC,CAAC,EAAE,CAAC,EAAE,EAAE;YAC5B,IAAI,IAAI,CAAC,WAAW,KAAK,CAAC;gBAAE,OAAO;YACnC,IAAI,CAAC,GAAG,CAAC;gBAAE,IAAI,CAAC,SAAS,CAAC,CAAC,CAAC,EAAE,CAAC;QACnC,CAAC,CAAC,CAAC;QAEH,MAAM,IAAI,GAAG,IAAI,CAAC,WAAW,GAAG,CAAC,CAAC,CAAC,CAAC,IAAI,CAAC,SAAS,CAAC,IAAI,CAAC,WAAW,GAAG,CAAC,CAAC,CAAC,CAAC,CAAC,QAAQ,CAAC;QACpF,MAAM,KAAK,GAAG,IAAI,CAAC,WAAW,GAAG,IAAI,CAAC,SAAS,CAAC,MAAM,GAAG,CAAC,CAAC,CAAC,CAAC,IAAI,CAAC,SAAS,CAAC,IAAI,CAAC,WAAW,GAAG,CAAC,CAAC,CAAC,CAAC,CAAC,QAAQ,CAAC;QAE7G,IAAI,IAAI,CAAC,SAAS,CAAC,IAAI,CAAC,WAAW,CAAC,GAAG,IAAI,CAAC,GAAG,CAAC,IAAI,EAAE,KAAK,CAAC,EAAE,CAAC;YAC3D,IAAI,CAAC,WAAW,GAAG,IAAI,IAAI,KAAK,CAAC,CAAC,CAAC,IAAI,CAAC,WAAW,GAAG,CAAC,CAAC,CAAC,CAAC,IAAI,CAAC,WAAW,GAAG,CAAC,CAAC;QACnF,CAAC;aAAM,IAAI,IAAI,CAAC,SAAS,CAAC,IAAI,CAAC,WAAW,CAAC,KAAK,IAAI,EAAE,CAAC;YACnD,IAAI,CAAC,WAAW,EAAE,CAAC;QACvB,CAAC;IACL,CAAC;IAED;;;;;OAKG;IACH,QAAQ,CAAC,IAAY;QACjB,IAAI,CAAC,SAAS,CAAC,IAAI,CAAC,IAAI,EAAE,CAAC;IAC/B,CAAC;IAED;;;OAGG;IACH,WAAW;QACP,IAAI,CAAC,WAAW,EAAE,CAAC;QACnB,OAAO,IAAI,CAAC,WAAW,CAAC;IAC5B,CAAC;CACJ;AAED;;;;;;;;;;;;;;;;;;;;;;;;;;;GA2BG;AACH,MAAM,OAAO,kBAAkB;IAC3B,gBAAgB,GAAG,KAAK,CAAC;IACf,kBAAkB,GAAG,CAAC,CAAC;IACvB,SAAS,CAAW;IACpB,eAAe,CAAa;IAC5B,aAAa,GAAG,IAAI,GAAG,EAAyB,CAAC;IACjD,cAAc,CAA8B;IAC5C,GAAG,GAAG,cAAc,CAAC,SAAS,EAAE,CAAC,KAAK,CAAC,EAAE,MAAM,EAAE,oBAAoB,EAAE,CAAC,CAAC;IACzE,WAAW,GAAG,IAAI,GAAG,EAA4B,CAAC;IAE5D;;;;;;;;;;;;;;;;;;;OAmBG;IACH,YAAY,UAAqC,EAAE;QAC/C,MAAM,EAAE,gBAAgB,EAAE,GAAG,IAAI,EAAE,GAAG,OAAqB,CAAC;QAC5D,EAAE,CACE,IAAI,EACJ,EAAE,CAAC,MAAM,CAAC,UAAU,CAAC;YACjB,SAAS,EAAE,
EAAE,CAAC,QAAQ,CAAC,KAAK,CAAC,QAAQ,CAAC,MAAM,CAAC,EAAE,CAAC,GAAG,CAAC,EAAE,CAAC,MAAM,CAAC,GAAG,EAAE,EAAE,CAAC,IAAI,CAAC,CAAC;YAC5E,cAAc,EAAE,EAAE,CAAC,QAAQ,CAAC,QAAQ;YACpC,eAAe,EAAE,EAAE,CAAC,QAAQ,CAAC,KAAK,CAAC,QAAQ,CAAC,MAAM,CAC9C,EAAE,CAAC,KAAK,CAAC,QAAQ,CAAC,MAAM,CAAC,EAAE,CAAC,GAAG,CAAC,EAAE,CAAC,MAAM,CAAC,GAAG,EAAE,EAAE,CAAC,IAAI,CAAC,CAAC,CAC3D;SACJ,CAAC,CACL,CAAC;QAEF,MAAM,EAAE,SAAS,EAAE,cAAc,EAAE,eAAe,EAAE,GAAG,OAAO,CAAC;QAE/D,IAAI,CAAC,SAAS,EAAE,cAAc,EAAE,eAAe,CAAC,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC,CAAC,MAAM,GAAG,CAAC;YACxE,IAAI,CAAC,gCAAgC,EAAE,CAAC;QAC5C,IAAI,CAAC,SAAS,IAAI,CAAC,cAAc,IAAI,gBAAgB;YAAE,IAAI,CAAC,uBAAuB,EAAE,CAAC;QAEtF,IAAI,CAAC,SAAS,GAAG,SAAS,CAAC;QAC3B,IAAI,CAAC,cAAc,GAAG,cAAc,CAAC;QACrC,IAAI,CAAC,eAAe,GAAG,eAAe,CAAC;IAC3C,CAAC;IAED;;;;;;;;OAQG;IACH,KAAK,CAAC,YAAY,CAAC,OAA4B;QAC3C,IAAI,GAAuB,CAAC;QAC5B,IAAI,IAAwB,CAAC;QAC7B,IAAI,IAAI,CAAC,eAAe,EAAE,CAAC;YACvB,MAAM,EAAE,QAAQ,EAAE,SAAS,EAAE,GAAG,IAAI,CAAC,gBAAgB,CAAC,OAAO,CAAC,CAAC;YAC/D,GAAG,GAAG,QAAQ,IAAI,SAAS,CAAC;YAC5B,IAAI,GAAG,SAAS,CAAC;QACrB,CAAC;aAAM,CAAC;YACJ,GAAG,GAAG,MAAM,IAAI,CAAC,MAAM,CAAC,OAAO,CAAC,CAAC;QACrC,CAAC;QAED,IAAI,CAAC,GAAG;YAAE,OAAO,SAAS,CAAC;QAE3B,MAAM,EAAE,QAAQ,EAAE,QAAQ,EAAE,IAAI,EAAE,QAAQ,EAAE,GAAG,IAAI,GAAG,CAAC,GAAG,CAAC,CAAC;QAE5D,OAAO;YACH,GAAG;YACH,QAAQ,EAAE,kBAAkB,CAAC,QAAQ,CAAC;YACtC,QAAQ,EAAE,kBAAkB,CAAC,QAAQ,CAAC;YACtC,QAAQ;YACR,IAAI,EAAE,IAAK;YACX,SAAS,EAAE,IAAI;SAClB,CAAC;IACN,CAAC;IAED;;;;OAIG;IACO,gBAAgB,CAAC,OAA4B;QACnD,IAAI,CAAC,IAAI,CAAC,eAAe;YAAE,MAAM,IAAI,KAAK,CAAC,+BAA+B,CAAC,CAAC;QAE5E,IAAI,CAAC,OAAO,IAAI,CAAC,CAAC,OAAO,EAAE,OAAO,IAAI,OAAO,EAAE,SAAS,KAAK,SAAS,CAAC,EAAE,CAAC;YACtE,MAAM,YAAY,GAAG,IAAI,CAAC,eAAe,CAAC,IAAI,EAAE,CAAC;YACjD,OAAO;gBACH,QAAQ,EAAE,YAAY,CAAC,IAAI,CAAC,kBAAkB,EAAE,GAAG,YAAY,CAAC,MAAM,CAAC;aAC1E,CAAC;QACN,CAAC;QAED,IAAI,cAAc,GAAG,OAAO,CAAC,SAAU,CAAC;QAExC,IAAI,OAAO,cAAc,KAAK,QAAQ,EAAE,CAAC;YACrC,cAAc,GAAG,IAAI,CAAC,gBAAgB,CAAC,OAAO,CAAC,OAAQ,CAAE,CAAC;QAC9D,CAAC;QAED,MAAM,SAAS,GAAG,IAAI,CAAC,eAAgB,CAAC,cA
Ac,CAAC,CAAC;QAExD,OAAO;YACH,QAAQ,EAAE,SAAS,CAAC,IAAI,CAAC,kBAAkB,EAAE,GAAG,SAAS,CAAC,MAAM,CAAC;YACjE,SAAS,EAAE,cAAc;SAC5B,CAAC;IACN,CAAC;IAED;;;;OAIG;IACO,gBAAgB,CAAC,OAAgB;QACvC,IAAI,CAAC,IAAI,CAAC,eAAe;YAAE,OAAO,IAAI,CAAC;QAEvC,MAAM,MAAM,GAAG,IAAI,GAAG,CAAC,OAAO,CAAC,GAAG,CAAC,CAAC,QAAQ,CAAC;QAC7C,IAAI,CAAC,IAAI,CAAC,WAAW,CAAC,GAAG,CAAC,MAAM,CAAC,EAAE,CAAC;YAChC,IAAI,CAAC,WAAW,CAAC,GAAG,CAAC,MAAM,EAAE,IAAI,gBAAgB,CAAC,IAAI,CAAC,eAAe,CAAC,CAAC,CAAC;QAC7E,CAAC;QAED,OAAO,CAAC,QAAQ,CAAC,SAAS,KAAK,EAAE,CAAC;QAElC,MAAM,OAAO,GAAG,IAAI,CAAC,WAAW,CAAC,GAAG,CAAC,MAAM,CAAE,CAAC;QAE9C,IAAI,OAAO,OAAO,CAAC,QAAQ,CAAC,SAAS,CAAC,aAAa,KAAK,QAAQ,EAAE,CAAC;YAC/D,OAAO,CAAC,QAAQ,CAAC,OAAO,CAAC,QAAQ,CAAC,SAAS,CAAC,aAAa,CAAC,CAAC;QAC/D,CAAC;QAED,MAAM,cAAc,GAAG,OAAO,CAAC,WAAW,EAAE,CAAC;QAE7C,IACI,OAAO,OAAO,CAAC,QAAQ,CAAC,SAAS,CAAC,aAAa,KAAK,QAAQ;YAC5D,OAAO,CAAC,QAAQ,CAAC,SAAS,CAAC,aAAa,KAAK,cAAc,EAC7D,CAAC;YACC,IAAI,CAAC,GAAG,CAAC,KAAK,CACV,mCAAmC,MAAM,UAAU,OAAO,CAAC,QAAQ,CAAC,SAAS,CAAC,aAAa,OAAO,cAAc,GAAG,CACtH,CAAC;QACN,CAAC;QAED,OAAO,CAAC,QAAQ,CAAC,SAAS,CAAC,aAAa,GAAG,cAAc,CAAC;QAC1D,OAAO,CAAC,QAAQ,CAAC,SAAS,CAAC,SAAS,GAAG,IAAI,CAAC;QAE5C,OAAO,cAAc,CAAC;IAC1B,CAAC;IAED;;;;;OAKG;IACH,KAAK,CAAC,MAAM,CAAC,OAA4B;QACrC,IAAI,IAAI,CAAC,cAAc,EAAE,CAAC;YACtB,OAAO,CAAC,MAAM,IAAI,CAAC,mBAAmB,CAAC,EAAE,OAAO,EAAE,OAAO,EAAE,OAAO,EAAE,CAAC,CAAC,IAAI,SAAS,CAAC;QACxF,CAAC;QAED,IAAI,IAAI,CAAC,eAAe,EAAE,CAAC;YACvB,OAAO,IAAI,CAAC,gBAAgB,CAAC,OAAO,CAAC,CAAC,QAAQ,IAAI,SAAS,CAAC;QAChE,CAAC;QAED,OAAO,IAAI,CAAC,oBAAoB,EAAE,IAAI,SAAS,CAAC;IACpD,CAAC;IAES,oBAAoB;QAC1B,OAAO,IAAI,CAAC,SAAU,CAAC,IAAI,CAAC,kBAAkB,EAAE,GAAG,IAAI,CAAC,SAAU,CAAC,MAAM,CAAC,CAAC;IAC/E,CAAC;IAED;;OAEG;IACO,KAAK,CAAC,mBAAmB,CAAC,OAA+B;QAC/D,MAAM,QAAQ,GAAG,MAAM,IAAI,CAAC,cAAe,CAAC,OAAO,CAAC,CAAC;QACrD,IAAI,CAAC;YACD,IAAI,QAAQ,EAAE,CAAC;gBACX,IAAI,GAAG,CAAC,QAAQ,CAAC,CAAC,CAAC,6BAA6B;YACpD,CAAC;YACD,OAAO,QAAQ,CAAC;QACpB,CAAC;QAAC,OAAO,GAAG,EAAE,CAAC;YACX,MAAM,IAAI,KAAK,CACX,mEAAoE,GAAa,CAAC,OAAO,EAAE,CAC9F,CAAC;QACN,CAAC;IACL,CAAC;IAES,gCAA
gC;QACtC,MAAM,IAAI,KAAK,CACX,6GAA6G,CAChH,CAAC;IACN,CAAC;IAES,uBAAuB;QAC7B,MAAM,IAAI,KAAK,CAAC,8EAA8E,CAAC,CAAC;IACpG,CAAC;CACJ"}
@@ -0,0 +1,121 @@
1
+ import type { Configuration, CrawleeLogger } from '@crawlee/core';
2
+ export interface RecoverableStatePersistenceOptions {
3
+ /**
4
+ * The key under which the state is stored in the KeyValueStore
5
+ */
6
+ persistStateKey: string;
7
+ /**
8
+ * Flag to enable or disable state persistence
9
+ */
10
+ persistenceEnabled?: boolean;
11
+ /**
12
+ * The name of the KeyValueStore to use for persistence.
13
+ * If neither a name nor an id are supplied, the default store will be used.
14
+ */
15
+ persistStateKvsName?: string;
16
+ /**
17
+ * The identifier of the KeyValueStore to use for persistence.
18
+ * If neither a name nor an id are supplied, the default store will be used.
19
+ */
20
+ persistStateKvsId?: string;
21
+ }
22
+ /**
23
+ * Options for configuring the RecoverableState
24
+ */
25
+ export interface RecoverableStateOptions<TStateModel = Record<string, unknown>> extends RecoverableStatePersistenceOptions {
26
+ /**
27
+ * The default state used if no persisted state is found.
28
+ * A deep copy is made each time the state is used.
29
+ */
30
+ defaultState: TStateModel;
31
+ /**
32
+ * A logger instance for logging operations related to state persistence
33
+ */
34
+ logger?: CrawleeLogger;
35
+ /**
36
+ * Configuration instance to use
37
+ */
38
+ config?: Configuration;
39
+ /**
40
+ * Optional function to transform the state to a JSON string before persistence.
41
+ * If not provided, JSON.stringify will be used.
42
+ */
43
+ serialize?: (state: TStateModel) => string;
44
+ /**
45
+ * Optional function to transform a JSON-serialized object back to the state model.
46
+ * If not provided, JSON.parse is used.
47
+ * It is advisable to perform validation in this function and to throw an exception if it fails.
48
+ */
49
+ deserialize?: (serializedState: string) => TStateModel;
50
+ }
51
+ /**
52
+ * A class for managing persistent recoverable state using a plain JavaScript object.
53
+ *
54
+ * This class facilitates state persistence to a `KeyValueStore`, allowing data to be saved and retrieved
55
+ * across migrations or restarts. It manages the loading, saving, and resetting of state data,
56
+ * with optional persistence capabilities.
57
+ *
58
+ * The state is represented by a plain JavaScript object that can be serialized to and deserialized from JSON.
59
+ * The class automatically hooks into the event system to persist state when needed.
60
+ */
61
+ export declare class RecoverableState<TStateModel = Record<string, unknown>> {
62
+ private readonly defaultState;
63
+ private state;
64
+ private readonly persistenceEnabled;
65
+ private readonly persistStateKey;
66
+ private readonly persistStateKvsName?;
67
+ private readonly persistStateKvsId?;
68
+ private keyValueStore;
69
+ private readonly log;
70
+ private readonly serialize;
71
+ private readonly deserialize;
72
+ /**
73
+ * Initialize a new recoverable state object.
74
+ *
75
+ * @param options Configuration options for the recoverable state
76
+ */
77
+ constructor(options: RecoverableStateOptions<TStateModel>);
78
+ /**
79
+ * Initialize the recoverable state.
80
+ *
81
+ * This method must be called before using the recoverable state. It loads the saved state
82
+ * if persistence is enabled and registers the object to listen for PERSIST_STATE events.
83
+ *
84
+ * @returns The loaded state object
85
+ */
86
+ initialize(): Promise<TStateModel>;
87
+ /**
88
+ * Clean up resources used by the recoverable state.
89
+ *
90
+ * If persistence is enabled, this method deregisters the object from PERSIST_STATE events
91
+ * and persists the current state one last time.
92
+ */
93
+ teardown(): Promise<void>;
94
+ /**
95
+ * Get the current state.
96
+ */
97
+ get currentValue(): TStateModel;
98
+ /**
99
+ * Reset the state to the default values and clear any persisted state.
100
+ *
101
+ * Resets the current state to the default state and, if persistence is enabled,
102
+ * clears the persisted state from the KeyValueStore.
103
+ */
104
+ reset(): Promise<void>;
105
+ /**
106
+ * Persist the current state to the KeyValueStore.
107
+ *
108
+ * This method is typically called in response to a PERSIST_STATE event, but can also be called
109
+ * directly when needed.
110
+ *
111
+ * @param eventData Optional data associated with a PERSIST_STATE event
112
+ */
113
+ persistState(eventData?: {
114
+ isMigrating: boolean;
115
+ }): Promise<void>;
116
+ /**
117
+ * Load the saved state from the KeyValueStore
118
+ */
119
+ private loadSavedState;
120
+ }
121
+ //# sourceMappingURL=recoverable_state.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"recoverable_state.d.ts","sourceRoot":"","sources":["../src/recoverable_state.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,EAAE,aAAa,EAAE,aAAa,EAAE,MAAM,eAAe,CAAC;AAGlE,MAAM,WAAW,kCAAkC;IAC/C;;OAEG;IACH,eAAe,EAAE,MAAM,CAAC;IAExB;;OAEG;IACH,kBAAkB,CAAC,EAAE,OAAO,CAAC;IAE7B;;;OAGG;IACH,mBAAmB,CAAC,EAAE,MAAM,CAAC;IAE7B;;;OAGG;IACH,iBAAiB,CAAC,EAAE,MAAM,CAAC;CAC9B;AAED;;GAEG;AACH,MAAM,WAAW,uBAAuB,CAAC,WAAW,GAAG,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,CAC1E,SAAQ,kCAAkC;IAC1C;;;OAGG;IACH,YAAY,EAAE,WAAW,CAAC;IAE1B;;OAEG;IACH,MAAM,CAAC,EAAE,aAAa,CAAC;IAEvB;;OAEG;IACH,MAAM,CAAC,EAAE,aAAa,CAAC;IAEvB;;;OAGG;IACH,SAAS,CAAC,EAAE,CAAC,KAAK,EAAE,WAAW,KAAK,MAAM,CAAC;IAE3C;;;;OAIG;IACH,WAAW,CAAC,EAAE,CAAC,eAAe,EAAE,MAAM,KAAK,WAAW,CAAC;CAC1D;AAED;;;;;;;;;GASG;AACH,qBAAa,gBAAgB,CAAC,WAAW,GAAG,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC;IAC/D,OAAO,CAAC,QAAQ,CAAC,YAAY,CAAc;IAC3C,OAAO,CAAC,KAAK,CAA4B;IACzC,OAAO,CAAC,QAAQ,CAAC,kBAAkB,CAAU;IAC7C,OAAO,CAAC,QAAQ,CAAC,eAAe,CAAS;IACzC,OAAO,CAAC,QAAQ,CAAC,mBAAmB,CAAC,CAAS;IAC9C,OAAO,CAAC,QAAQ,CAAC,iBAAiB,CAAC,CAAS;IAC5C,OAAO,CAAC,aAAa,CAA8B;IACnD,OAAO,CAAC,QAAQ,CAAC,GAAG,CAAgB;IACpC,OAAO,CAAC,QAAQ,CAAC,SAAS,CAAiC;IAC3D,OAAO,CAAC,QAAQ,CAAC,WAAW,CAA2C;IAEvE;;;;OAIG;gBACS,OAAO,EAAE,uBAAuB,CAAC,WAAW,CAAC;IAazD;;;;;;;OAOG;IACG,UAAU,IAAI,OAAO,CAAC,WAAW,CAAC;IAuBxC;;;;;OAKG;IACG,QAAQ,IAAI,OAAO,CAAC,IAAI,CAAC;IAU/B;;OAEG;IACH,IAAI,YAAY,IAAI,WAAW,CAM9B;IAED;;;;;OAKG;IACG,KAAK,IAAI,OAAO,CAAC,IAAI,CAAC;IAY5B;;;;;;;OAOG;IACG,YAAY,CAAC,SAAS,CAAC,EAAE;QAAE,WAAW,EAAE,OAAO,CAAA;KAAE,GAAG,OAAO,CAAC,IAAI,CAAC;IAcvE;;OAEG;YACW,cAAc;CAY/B"}
@@ -0,0 +1,137 @@
1
+ import { KeyValueStore, serviceLocator } from '@crawlee/core';
2
+ /**
3
+ * A class for managing persistent recoverable state using a plain JavaScript object.
4
+ *
5
+ * This class facilitates state persistence to a `KeyValueStore`, allowing data to be saved and retrieved
6
+ * across migrations or restarts. It manages the loading, saving, and resetting of state data,
7
+ * with optional persistence capabilities.
8
+ *
9
+ * The state is represented by a plain JavaScript object that can be serialized to and deserialized from JSON.
10
+ * The class automatically hooks into the event system to persist state when needed.
11
+ */
12
export class RecoverableState {
    /** Template state; never handed out directly, only cloned via serialize/deserialize. */
    defaultState;
    /** Live state object, or `null` until `initialize()` (or `reset()`) has produced one. */
    state = null;
    persistenceEnabled;
    persistStateKey;
    persistStateKvsName;
    persistStateKvsId;
    /** Store opened by `initialize()`; stays `null` when persistence is disabled. */
    keyValueStore = null;
    log;
    serialize;
    deserialize;

    /**
     * Initialize a new recoverable state object.
     *
     * @param options Configuration options for the recoverable state
     */
    constructor(options) {
        this.defaultState = options.defaultState;
        this.persistStateKey = options.persistStateKey;
        this.persistenceEnabled = options.persistenceEnabled ?? false;
        this.persistStateKvsName = options.persistStateKvsName;
        this.persistStateKvsId = options.persistStateKvsId;
        this.log = options.logger ?? serviceLocator.getLogger().child({ prefix: 'RecoverableState' });
        this.serialize = options.serialize ?? JSON.stringify;
        this.deserialize = options.deserialize ?? JSON.parse;
        // Bound once so the very same function reference can be passed to both `on` and `off`.
        this.persistState = this.persistState.bind(this);
    }

    /**
     * Initialize the recoverable state.
     *
     * This method must be called before using the recoverable state. It loads the saved state
     * if persistence is enabled and registers the object to listen for PERSIST_STATE events.
     * Calling it again once a state is loaded returns the already loaded state.
     *
     * @returns The loaded state object
     */
    async initialize() {
        if (this.state !== null && this.state !== undefined) {
            return this.currentValue;
        }

        if (!this.persistenceEnabled) {
            this.state = this.#cloneDefaultState();
            return this.currentValue;
        }

        this.keyValueStore = await KeyValueStore.open(this.persistStateKvsName ?? this.persistStateKvsId, {
            config: serviceLocator.getConfiguration(),
        });
        await this.loadSavedState();

        // Register for persist state events
        const eventManager = serviceLocator.getEventManager();
        eventManager.on("persistState" /* EventType.PERSIST_STATE */, this.persistState);
        return this.currentValue;
    }

    /**
     * Clean up resources used by the recoverable state.
     *
     * If persistence is enabled, this method deregisters the object from PERSIST_STATE events
     * and persists the current state one last time. It does nothing when persistence is disabled
     * or when `initialize()` never opened the store (no listener registered, nothing to persist).
     */
    async teardown() {
        if (!this.persistenceEnabled || this.keyValueStore === null) {
            return;
        }

        const eventManager = serviceLocator.getEventManager();
        eventManager.off("persistState" /* EventType.PERSIST_STATE */, this.persistState);
        await this.persistState();
    }

    /**
     * Get the current state.
     *
     * @throws {Error} If no state has been loaded yet
     */
    get currentValue() {
        if (this.state === null) {
            throw new Error('Recoverable state has not yet been loaded');
        }
        return this.state;
    }

    /**
     * Reset the state to the default values and clear any persisted state.
     *
     * Resets the current state to the default state and, if persistence is enabled,
     * clears the persisted state from the KeyValueStore.
     *
     * @throws {Error} If persistence is enabled but the store has not been opened yet
     *   (the in-memory state has already been reset at that point)
     */
    async reset() {
        this.state = this.#cloneDefaultState();

        if (!this.persistenceEnabled) {
            return;
        }
        if (this.keyValueStore === null) {
            throw new Error('Recoverable state has not yet been initialized');
        }
        await this.keyValueStore.setValue(this.persistStateKey, null);
    }

    /**
     * Persist the current state to the KeyValueStore.
     *
     * This method is typically called in response to a PERSIST_STATE event, but can also be called
     * directly when needed. When persistence is disabled it is a no-op.
     *
     * @param eventData Optional data associated with a PERSIST_STATE event
     * @throws {Error} If persistence is enabled but the state has not been initialized
     */
    async persistState(eventData) {
        this.log.debug(`Persisting state of the RecoverableState (eventData=${JSON.stringify(eventData)}).`);

        // The store is only opened when persistence is enabled, so this check has to come
        // before the "initialized" check - otherwise the call always throws in that mode.
        if (!this.persistenceEnabled) {
            return;
        }
        if (this.keyValueStore === null || this.state === null) {
            throw new Error('Recoverable state has not yet been initialized');
        }

        await this.keyValueStore.setValue(this.persistStateKey, this.serialize(this.state), {
            contentType: 'text/plain', // HACK - the result is expected to be JSON, but we do this to avoid the implicit JSON.parse in `KeyValueStore.getValue`
        });
    }

    /**
     * Load the saved state from the KeyValueStore, falling back to a copy of the default state
     * when nothing is stored under the persistence key.
     *
     * @throws {Error} If the store has not been opened yet
     */
    async loadSavedState() {
        if (this.keyValueStore === null) {
            throw new Error('Recoverable state has not yet been initialized');
        }

        const storedState = await this.keyValueStore.getValue(this.persistStateKey);
        const hasStoredState = storedState !== null && storedState !== undefined;
        this.state = hasStoredState ? this.deserialize(storedState) : this.#cloneDefaultState();
    }

    /**
     * Produce an independent copy of the default state by round-tripping it through the
     * configured serializer, so mutations of the live state never touch `defaultState`.
     */
    #cloneDefaultState() {
        return this.deserialize(this.serialize(this.defaultState));
    }
}
137
+ //# sourceMappingURL=recoverable_state.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"recoverable_state.js","sourceRoot":"","sources":["../src/recoverable_state.ts"],"names":[],"mappings":"AACA,OAAO,EAAa,aAAa,EAAE,cAAc,EAAE,MAAM,eAAe,CAAC;AA6DzE;;;;;;;;;GASG;AACH,MAAM,OAAO,gBAAgB;IACR,YAAY,CAAc;IACnC,KAAK,GAAuB,IAAI,CAAC;IACxB,kBAAkB,CAAU;IAC5B,eAAe,CAAS;IACxB,mBAAmB,CAAU;IAC7B,iBAAiB,CAAU;IACpC,aAAa,GAAyB,IAAI,CAAC;IAClC,GAAG,CAAgB;IACnB,SAAS,CAAiC;IAC1C,WAAW,CAA2C;IAEvE;;;;OAIG;IACH,YAAY,OAA6C;QACrD,IAAI,CAAC,YAAY,GAAG,OAAO,CAAC,YAAY,CAAC;QACzC,IAAI,CAAC,eAAe,GAAG,OAAO,CAAC,eAAe,CAAC;QAC/C,IAAI,CAAC,kBAAkB,GAAG,OAAO,CAAC,kBAAkB,IAAI,KAAK,CAAC;QAC9D,IAAI,CAAC,mBAAmB,GAAG,OAAO,CAAC,mBAAmB,CAAC;QACvD,IAAI,CAAC,iBAAiB,GAAG,OAAO,CAAC,iBAAiB,CAAC;QACnD,IAAI,CAAC,GAAG,GAAG,OAAO,CAAC,MAAM,IAAI,cAAc,CAAC,SAAS,EAAE,CAAC,KAAK,CAAC,EAAE,MAAM,EAAE,kBAAkB,EAAE,CAAC,CAAC;QAC9F,IAAI,CAAC,SAAS,GAAG,OAAO,CAAC,SAAS,IAAI,IAAI,CAAC,SAAS,CAAC;QACrD,IAAI,CAAC,WAAW,GAAG,OAAO,CAAC,WAAW,IAAI,IAAI,CAAC,KAAK,CAAC;QAErD,IAAI,CAAC,YAAY,GAAG,IAAI,CAAC,YAAY,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;IACrD,CAAC;IAED;;;;;;;OAOG;IACH,KAAK,CAAC,UAAU;QACZ,IAAI,IAAI,CAAC,KAAK,KAAK,IAAI,IAAI,IAAI,CAAC,KAAK,KAAK,SAAS,EAAE,CAAC;YAClD,OAAO,IAAI,CAAC,YAAY,CAAC;QAC7B,CAAC;QAED,IAAI,CAAC,IAAI,CAAC,kBAAkB,EAAE,CAAC;YAC3B,IAAI,CAAC,KAAK,GAAG,IAAI,CAAC,WAAW,CAAC,IAAI,CAAC,SAAS,CAAC,IAAI,CAAC,YAAY,CAAC,CAAC,CAAC;YACjE,OAAO,IAAI,CAAC,YAAY,CAAC;QAC7B,CAAC;QAED,IAAI,CAAC,aAAa,GAAG,MAAM,aAAa,CAAC,IAAI,CAAC,IAAI,CAAC,mBAAmB,IAAI,IAAI,CAAC,iBAAiB,EAAE;YAC9F,MAAM,EAAE,cAAc,CAAC,gBAAgB,EAAE;SAC5C,CAAC,CAAC;QAEH,MAAM,IAAI,CAAC,cAAc,EAAE,CAAC;QAE5B,oCAAoC;QACpC,MAAM,YAAY,GAAG,cAAc,CAAC,eAAe,EAAE,CAAC;QACtD,YAAY,CAAC,EAAE,+CAA0B,IAAI,CAAC,YAAY,CAAC,CAAC;QAE5D,OAAO,IAAI,CAAC,YAAY,CAAC;IAC7B,CAAC;IAED;;;;;OAKG;IACH,KAAK,CAAC,QAAQ;QACV,IAAI,CAAC,IAAI,CAAC,kBAAkB,IAAI,CAAC,IAAI,CAAC,YAAY,EAAE,CAAC;YACjD,OAAO;QACX,CAAC;QAED,MAAM,YAAY,GAAG,cAAc,CAAC,eAAe,EAAE,CAAC;QACtD,YAAY,CAAC,GAAG,+CAA0B,IAAI,CAAC,YAAY,CAAC,CAAC;QAC7D,MAAM,IAAI,CAAC,YAAY,EAAE,CAAC;IAC9B,CAAC;IAED;;OAEG;IACH,IAAI,YAAY;QACZ,IAAI,IAAI,
CAAC,KAAK,KAAK,IAAI,EAAE,CAAC;YACtB,MAAM,IAAI,KAAK,CAAC,2CAA2C,CAAC,CAAC;QACjE,CAAC;QAED,OAAO,IAAI,CAAC,KAAK,CAAC;IACtB,CAAC;IAED;;;;;OAKG;IACH,KAAK,CAAC,KAAK;QACP,IAAI,CAAC,KAAK,GAAG,IAAI,CAAC,WAAW,CAAC,IAAI,CAAC,SAAS,CAAC,IAAI,CAAC,YAAY,CAAC,CAAC,CAAC;QAEjE,IAAI,IAAI,CAAC,kBAAkB,EAAE,CAAC;YAC1B,IAAI,IAAI,CAAC,aAAa,KAAK,IAAI,EAAE,CAAC;gBAC9B,MAAM,IAAI,KAAK,CAAC,gDAAgD,CAAC,CAAC;YACtE,CAAC;YAED,MAAM,IAAI,CAAC,aAAa,CAAC,QAAQ,CAAC,IAAI,CAAC,eAAe,EAAE,IAAI,CAAC,CAAC;QAClE,CAAC;IACL,CAAC;IAED;;;;;;;OAOG;IACH,KAAK,CAAC,YAAY,CAAC,SAAoC;QACnD,IAAI,CAAC,GAAG,CAAC,KAAK,CAAC,uDAAuD,IAAI,CAAC,SAAS,CAAC,SAAS,CAAC,IAAI,CAAC,CAAC;QAErG,IAAI,IAAI,CAAC,aAAa,KAAK,IAAI,IAAI,IAAI,CAAC,KAAK,KAAK,IAAI,EAAE,CAAC;YACrD,MAAM,IAAI,KAAK,CAAC,gDAAgD,CAAC,CAAC;QACtE,CAAC;QAED,IAAI,IAAI,CAAC,kBAAkB,EAAE,CAAC;YAC1B,MAAM,IAAI,CAAC,aAAa,CAAC,QAAQ,CAAC,IAAI,CAAC,eAAe,EAAE,IAAI,CAAC,SAAS,CAAC,IAAI,CAAC,KAAK,CAAC,EAAE;gBAChF,WAAW,EAAE,YAAY,EAAE,wHAAwH;aACtJ,CAAC,CAAC;QACP,CAAC;IACL,CAAC;IAED;;OAEG;IACK,KAAK,CAAC,cAAc;QACxB,IAAI,IAAI,CAAC,aAAa,KAAK,IAAI,EAAE,CAAC;YAC9B,MAAM,IAAI,KAAK,CAAC,gDAAgD,CAAC,CAAC;QACtE,CAAC;QAED,MAAM,WAAW,GAAG,MAAM,IAAI,CAAC,aAAa,CAAC,QAAQ,CAAC,IAAI,CAAC,eAAe,CAAC,CAAC;QAC5E,IAAI,WAAW,KAAK,IAAI,IAAI,WAAW,KAAK,SAAS,EAAE,CAAC;YACpD,IAAI,CAAC,KAAK,GAAG,IAAI,CAAC,WAAW,CAAC,IAAI,CAAC,SAAS,CAAC,IAAI,CAAC,YAAY,CAAC,CAAC,CAAC;QACrE,CAAC;aAAM,CAAC;YACJ,IAAI,CAAC,KAAK,GAAG,IAAI,CAAC,WAAW,CAAC,WAAqB,CAAC,CAAC;QACzD,CAAC;IACL,CAAC;CACJ"}
package/request.d.ts CHANGED
@@ -1,6 +1,7 @@
1
1
  import type { BinaryLike } from 'node:crypto';
2
2
  import type { Dictionary } from '@crawlee/types';
3
3
  import type { EnqueueLinksOptions } from './enqueue_links/enqueue_links.js';
4
+ import type { SkippedRequestReason } from './enqueue_links/shared.js';
4
5
  import type { AllowedHttpMethods } from './typedefs.js';
5
6
  export declare enum RequestState {
6
7
  UNPROCESSED = 0,
@@ -43,7 +44,7 @@ export declare enum RequestState {
43
44
  * ```
44
45
  * @category Sources
45
46
  */
46
- export declare class Request<UserData extends Dictionary = Dictionary> {
47
+ declare class CrawleeRequest<UserData extends Dictionary = Dictionary> {
47
48
  /** Request ID */
48
49
  id?: string;
49
50
  /** URL of the web page to crawl. */
@@ -76,7 +77,12 @@ export declare class Request<UserData extends Dictionary = Dictionary> {
76
77
  headers?: Record<string, string>;
77
78
  /** Private store for the custom user data assigned to the request. */
78
79
  private _userData;
79
- /** Custom user data assigned to the request. */
80
+ /**
81
+ * Custom user data assigned to the request.
82
+ *
83
+ * All data stored in `userData` must be JSON-serializable.
84
+ * Storing non-serializable values (e.g. functions, symbols) may lead to unexpected behavior.
85
+ */
80
86
  userData: UserData;
81
87
  /**
82
88
  * ISO datetime string that indicates the time when the request has been processed.
@@ -87,10 +93,25 @@ export declare class Request<UserData extends Dictionary = Dictionary> {
87
93
  * `Request` parameters including the URL, HTTP method and headers, and others.
88
94
  */
89
95
  constructor(options: RequestOptions<UserData>);
96
+ /**
97
+ * Converts the Crawlee Request object to a `fetch` API Request object.
98
+ * @returns The native `fetch` API Request object.
99
+ */
100
+ intoFetchAPIRequest(): Request;
90
101
  /** Tells the crawler processing this request to skip the navigation and process the request directly. */
91
102
  get skipNavigation(): boolean;
92
103
  /** Tells the crawler processing this request to skip the navigation and process the request directly. */
93
104
  set skipNavigation(value: boolean);
105
+ /**
106
+ * Depth of the request in the current crawl tree.
107
+ * Note that this is dependent on the crawler setup and might produce unexpected results when used with multiple crawlers.
108
+ */
109
+ get crawlDepth(): number;
110
+ /**
111
+ * Depth of the request in the current crawl tree.
112
+ * Note that this is dependent on the crawler setup and might produce unexpected results when used with multiple crawlers.
113
+ */
114
+ set crawlDepth(value: number);
94
115
  /** Indicates the number of times the crawling of the request has rotated the session due to a session or a proxy error. */
95
116
  get sessionRotationCount(): number;
96
117
  /** Indicates the number of times the crawling of the request has rotated the session due to a session or a proxy error. */
@@ -107,6 +128,14 @@ export declare class Request<UserData extends Dictionary = Dictionary> {
107
128
  get state(): RequestState;
108
129
  /** Describes the request's current lifecycle state. */
109
130
  set state(value: RequestState);
131
+ /**
132
+ * Reason for skipping this request.
133
+ */
134
+ get skippedReason(): SkippedRequestReason | undefined;
135
+ /**
136
+ * Reason for skipping this request.
137
+ */
138
+ set skippedReason(value: SkippedRequestReason | undefined);
110
139
  private get enqueueStrategy();
111
140
  private set enqueueStrategy(value);
112
141
  /**
@@ -123,8 +152,6 @@ export declare class Request<UserData extends Dictionary = Dictionary> {
123
152
  * @param [options]
124
153
  */
125
154
  pushErrorMessage(errorOrMessage: unknown, options?: PushErrorMessageOptions): void;
126
- protected _computeUniqueKey(options: ComputeUniqueKeyOptions): string;
127
- protected _hashPayload(payload: BinaryLike): string;
128
155
  /** @internal */
129
156
  static computeUniqueKey({ url, method, payload, keepUrlFragment, useExtendedUniqueKey, }: ComputeUniqueKeyOptions): string;
130
157
  /** @internal */
@@ -171,6 +198,9 @@ export interface RequestOptions<UserData extends Dictionary = Dictionary> {
171
198
  /**
172
199
  * Custom user data assigned to the request. Use this to save any request related data to the
173
200
  * request's scope, keeping them accessible on retries, failures etc.
201
+ *
202
+ * All data stored in `userData` must be JSON-serializable.
203
+ * Storing non-serializable values (e.g. functions, symbols) may lead to unexpected behavior.
174
204
  */
175
205
  userData?: UserData;
176
206
  /**
@@ -203,6 +233,18 @@ export interface RequestOptions<UserData extends Dictionary = Dictionary> {
203
233
  * @default false
204
234
  */
205
235
  skipNavigation?: boolean;
236
+ /**
237
+ * Depth of the request in the current crawl tree.
238
+ * Note that this is dependent on the crawler setup and might produce unexpected results when used with multiple crawlers.
239
+ * @default 0
240
+ */
241
+ crawlDepth?: number;
242
+ /**
243
+ * Reason for skipping this request.
244
+ * This is used to provide more information about why the request was skipped.
245
+ * @internal
246
+ */
247
+ skippedReason?: SkippedRequestReason;
206
248
  /**
207
249
  * Maximum number of retries for this request. Allows to override the global `maxRequestRetries` option of `BasicCrawler`.
208
250
  */
@@ -233,11 +275,11 @@ interface ComputeUniqueKeyOptions {
233
275
  export type Source = (Partial<RequestOptions> & {
234
276
  requestsFromUrl?: string;
235
277
  regex?: RegExp;
236
- }) | Request;
278
+ }) | CrawleeRequest;
237
279
  /** @internal */
238
280
  export interface InternalSource {
239
281
  requestsFromUrl: string;
240
282
  regex?: RegExp;
241
283
  }
242
- export {};
284
+ export { CrawleeRequest as Request };
243
285
  //# sourceMappingURL=request.d.ts.map
package/request.d.ts.map CHANGED
@@ -1 +1 @@
1
- {"version":3,"file":"request.d.ts","sourceRoot":"","sources":["../src/request.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,EAAE,UAAU,EAAE,MAAM,aAAa,CAAC;AAI9C,OAAO,KAAK,EAAE,UAAU,EAAE,MAAM,gBAAgB,CAAC;AAMjD,OAAO,KAAK,EAAE,mBAAmB,EAAE,MAAM,kCAAkC,CAAC;AAE5E,OAAO,KAAK,EAAE,kBAAkB,EAAE,MAAM,eAAe,CAAC;AA2BxD,oBAAY,YAAY;IACpB,WAAW,IAAA;IACX,UAAU,IAAA;IACV,SAAS,IAAA;IACT,eAAe,IAAA;IACf,IAAI,IAAA;IACJ,aAAa,IAAA;IACb,KAAK,IAAA;IACL,OAAO,IAAA;CACV;AAED;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;GA8BG;AACH,qBAAa,OAAO,CAAC,QAAQ,SAAS,UAAU,GAAG,UAAU;IACzD,iBAAiB;IACjB,EAAE,CAAC,EAAE,MAAM,CAAC;IAEZ,oCAAoC;IACpC,GAAG,EAAE,MAAM,CAAC;IAEZ;;;;;;;OAOG;IACH,SAAS,CAAC,EAAE,MAAM,CAAC;IAEnB;;;OAGG;IACH,SAAS,EAAE,MAAM,CAAC;IAElB,yCAAyC;IACzC,MAAM,EAAE,kBAAkB,CAAC;IAE3B,oDAAoD;IACpD,OAAO,CAAC,EAAE,MAAM,CAAC;IAEjB,8FAA8F;IAC9F,OAAO,EAAE,OAAO,CAAC;IAEjB,2FAA2F;IAC3F,UAAU,EAAE,MAAM,CAAC;IAEnB,0DAA0D;IAC1D,aAAa,EAAE,MAAM,EAAE,CAAC;IAExB,wEAAwE;IACxE,OAAO,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,MAAM,CAAC,CAAC;IAEjC,sEAAsE;IACtE,OAAO,CAAC,SAAS,CAA2B;IAE5C,gDAAgD;IAChD,QAAQ,EAAE,QAAQ,CAAkB;IAEpC;;;OAGG;IACH,SAAS,CAAC,EAAE,MAAM,CAAC;IAEnB;;OAEG;gBACS,OAAO,EAAE,cAAc,CAAC,QAAQ,CAAC;IAwH7C,yGAAyG;IACzG,IAAI,cAAc,IAAI,OAAO,CAE5B;IAED,yGAAyG;IACzG,IAAI,cAAc,CAAC,KAAK,EAAE,OAAO,EAMhC;IAED,2HAA2H;IAC3H,IAAI,oBAAoB,IAAI,MAAM,CAEjC;IAED,2HAA2H;IAC3H,IAAI,oBAAoB,CAAC,KAAK,EAAE,MAAM,EAMrC;IAED,oDAAoD;IACpD,IAAI,KAAK,IAAI,MAAM,GAAG,SAAS,CAE9B;IAED,oDAAoD;IACpD,IAAI,KAAK,CAAC,KAAK,EAAE,MAAM,GAAG,SAAS,EAElC;IAED,8HAA8H;IAC9H,IAAI,UAAU,IAAI,MAAM,GAAG,SAAS,CAEnC;IAED,8HAA8H;IAC9H,IAAI,UAAU,CAAC,KAAK,EAAE,MAAM,GAAG,SAAS,EAMvC;IAED,uDAAuD;IACvD,IAAI,KAAK,IAAI,YAAY,CAExB;IAED,uDAAuD;IACvD,IAAI,KAAK,CAAC,KAAK,EAAE,YAAY,EAM5B;IAED,OAAO,KAAK,eAAe,GAE1B;IAED,OAAO,KAAK,eAAe,QAM1B;IAED;;;;;;;;;;;;OAYG;IACH,gBAAgB,CAAC,cAAc,EAAE,OAAO,EAAE,OAAO,GAAE,uBAA4B,GAAG,IAAI;IAiCtF,SAAS,CAAC,iBAAiB,CAAC,OAAO,EAAE,uBAAuB;IAK5D,SAAS,CAAC,YAAY,CAAC,OAAO,EAAE,UAAU,GAAG,MAAM;IAInD,gBAAgB;IAChB,MAAM,CAAC,gBAAgB,CAAC,EACpB,GAAG,EACH,MAAc,EACd,OAAO,EACP,eAAuB,EACvB
,oBAA4B,GAC/B,EAAE,uBAAuB;IAiB1B,gBAAgB;IAChB,MAAM,CAAC,WAAW,CAAC,OAAO,EAAE,UAAU,GAAG,MAAM;CAGlD;AAED;;GAEG;AACH,MAAM,WAAW,cAAc,CAAC,QAAQ,SAAS,UAAU,GAAG,UAAU;IACpE,mEAAmE;IACnE,GAAG,EAAE,MAAM,CAAC;IAEZ;;;;;;;;;;;;;;;;OAgBG;IACH,SAAS,CAAC,EAAE,MAAM,CAAC;IAEnB,qBAAqB;IACrB,MAAM,CAAC,EAAE,kBAAkB,GAAG,SAAS,CAAC,kBAAkB,CAAC,CAAC;IAE5D,oDAAoD;IACpD,OAAO,CAAC,EAAE,MAAM,CAAC;IAEjB;;;;;;;;OAQG;IACH,OAAO,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,MAAM,CAAC,CAAC;IAEjC;;;OAGG;IACH,QAAQ,CAAC,EAAE,QAAQ,CAAC;IAEpB;;OAEG;IACH,KAAK,CAAC,EAAE,MAAM,CAAC;IAEf;;;;;;OAMG;IACH,eAAe,CAAC,EAAE,OAAO,CAAC;IAE1B;;;;;OAKG;IACH,oBAAoB,CAAC,EAAE,OAAO,CAAC;IAE/B;;;OAGG;IACH,OAAO,CAAC,EAAE,OAAO,CAAC;IAElB;;;;OAIG;IACH,cAAc,CAAC,EAAE,OAAO,CAAC;IAEzB;;OAEG;IACH,UAAU,CAAC,EAAE,MAAM,CAAC;IAEpB,gBAAgB;IAChB,EAAE,CAAC,EAAE,MAAM,CAAC;IAEZ,gBAAgB;IAChB,SAAS,CAAC,EAAE,MAAM,CAAC;IAEnB,gBAAgB;IAChB,aAAa,CAAC,EAAE,IAAI,CAAC;IAErB,gBAAgB;IAChB,eAAe,CAAC,EAAE,mBAAmB,CAAC,UAAU,CAAC,CAAC;CACrD;AAED,MAAM,WAAW,uBAAuB;IACpC;;;OAGG;IACH,SAAS,CAAC,EAAE,OAAO,CAAC;CACvB;AAED,UAAU,uBAAuB;IAC7B,GAAG,EAAE,MAAM,CAAC;IACZ,MAAM,EAAE,kBAAkB,CAAC;IAC3B,OAAO,CAAC,EAAE,MAAM,GAAG,MAAM,CAAC;IAC1B,eAAe,CAAC,EAAE,OAAO,CAAC;IAC1B,oBAAoB,CAAC,EAAE,OAAO,CAAC;CAClC;AAED,MAAM,MAAM,MAAM,GAAG,CAAC,OAAO,CAAC,cAAc,CAAC,GAAG;IAAE,eAAe,CAAC,EAAE,MAAM,CAAC;IAAC,KAAK,CAAC,EAAE,MAAM,CAAA;CAAE,CAAC,GAAG,OAAO,CAAC;AAExG,gBAAgB;AAChB,MAAM,WAAW,cAAc;IAC3B,eAAe,EAAE,MAAM,CAAC;IACxB,KAAK,CAAC,EAAE,MAAM,CAAC;CAClB"}
1
+ {"version":3,"file":"request.d.ts","sourceRoot":"","sources":["../src/request.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,EAAE,UAAU,EAAE,MAAM,aAAa,CAAC;AAI9C,OAAO,KAAK,EAAE,UAAU,EAAE,MAAM,gBAAgB,CAAC;AAMjD,OAAO,KAAK,EAAE,mBAAmB,EAAE,MAAM,kCAAkC,CAAC;AAC5E,OAAO,KAAK,EAAE,oBAAoB,EAAE,MAAM,2BAA2B,CAAC;AAEtE,OAAO,KAAK,EAAE,kBAAkB,EAAE,MAAM,eAAe,CAAC;AA0BxD,oBAAY,YAAY;IACpB,WAAW,IAAA;IACX,UAAU,IAAA;IACV,SAAS,IAAA;IACT,eAAe,IAAA;IACf,IAAI,IAAA;IACJ,aAAa,IAAA;IACb,KAAK,IAAA;IACL,OAAO,IAAA;CACV;AAED;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;GA8BG;AACH,cAAM,cAAc,CAAC,QAAQ,SAAS,UAAU,GAAG,UAAU;IACzD,iBAAiB;IACjB,EAAE,CAAC,EAAE,MAAM,CAAC;IAEZ,oCAAoC;IACpC,GAAG,EAAE,MAAM,CAAC;IAEZ;;;;;;;OAOG;IACH,SAAS,CAAC,EAAE,MAAM,CAAC;IAEnB;;;OAGG;IACH,SAAS,EAAE,MAAM,CAAC;IAElB,yCAAyC;IACzC,MAAM,EAAE,kBAAkB,CAAC;IAE3B,oDAAoD;IACpD,OAAO,CAAC,EAAE,MAAM,CAAC;IAEjB,8FAA8F;IAC9F,OAAO,EAAE,OAAO,CAAC;IAEjB,2FAA2F;IAC3F,UAAU,EAAE,MAAM,CAAC;IAEnB,0DAA0D;IAC1D,aAAa,EAAE,MAAM,EAAE,CAAC;IAExB,wEAAwE;IACxE,OAAO,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,MAAM,CAAC,CAAC;IAEjC,sEAAsE;IACtE,OAAO,CAAC,SAAS,CAA2B;IAE5C;;;;;OAKG;IACH,QAAQ,EAAE,QAAQ,CAAkB;IAEpC;;;OAGG;IACH,SAAS,CAAC,EAAE,MAAM,CAAC;IAEnB;;OAEG;gBACS,OAAO,EAAE,cAAc,CAAC,QAAQ,CAAC;IA2H7C;;;OAGG;IACI,mBAAmB,IAAI,OAAO;IAQrC,yGAAyG;IACzG,IAAI,cAAc,IAAI,OAAO,CAE5B;IAED,yGAAyG;IACzG,IAAI,cAAc,CAAC,KAAK,EAAE,OAAO,EAMhC;IAED;;;OAGG;IACH,IAAI,UAAU,IAAI,MAAM,CAEvB;IAED;;;OAGG;IACH,IAAI,UAAU,CAAC,KAAK,EAAE,MAAM,EAG3B;IAED,2HAA2H;IAC3H,IAAI,oBAAoB,IAAI,MAAM,CAEjC;IAED,2HAA2H;IAC3H,IAAI,oBAAoB,CAAC,KAAK,EAAE,MAAM,EAMrC;IAED,oDAAoD;IACpD,IAAI,KAAK,IAAI,MAAM,GAAG,SAAS,CAE9B;IAED,oDAAoD;IACpD,IAAI,KAAK,CAAC,KAAK,EAAE,MAAM,GAAG,SAAS,EAElC;IAED,8HAA8H;IAC9H,IAAI,UAAU,IAAI,MAAM,GAAG,SAAS,CAEnC;IAED,8HAA8H;IAC9H,IAAI,UAAU,CAAC,KAAK,EAAE,MAAM,GAAG,SAAS,EAMvC;IAED,uDAAuD;IACvD,IAAI,KAAK,IAAI,YAAY,CAExB;IAED,uDAAuD;IACvD,IAAI,KAAK,CAAC,KAAK,EAAE,YAAY,EAM5B;IAED;;OAEG;IACH,IAAI,aAAa,IAAI,oBAAoB,GAAG,SAAS,CAEpD;IAED;;OAEG;IACH,IAAI,aAAa,CAAC,KAAK,EAAE,oBAAoB,GAAG,SAAS,EAMxD;IAED,OAAO,KAAK,eAAe,GAE
1B;IAED,OAAO,KAAK,eAAe,QAM1B;IAED;;;;;;;;;;;;OAYG;IACH,gBAAgB,CAAC,cAAc,EAAE,OAAO,EAAE,OAAO,GAAE,uBAA4B,GAAG,IAAI;IAgCtF,gBAAgB;IAChB,MAAM,CAAC,gBAAgB,CAAC,EACpB,GAAG,EACH,MAAc,EACd,OAAO,EACP,eAAuB,EACvB,oBAA4B,GAC/B,EAAE,uBAAuB;IAmB1B,gBAAgB;IAChB,MAAM,CAAC,WAAW,CAAC,OAAO,EAAE,UAAU,GAAG,MAAM;CAGlD;AAED;;GAEG;AACH,MAAM,WAAW,cAAc,CAAC,QAAQ,SAAS,UAAU,GAAG,UAAU;IACpE,mEAAmE;IACnE,GAAG,EAAE,MAAM,CAAC;IAEZ;;;;;;;;;;;;;;;;OAgBG;IACH,SAAS,CAAC,EAAE,MAAM,CAAC;IAEnB,qBAAqB;IACrB,MAAM,CAAC,EAAE,kBAAkB,GAAG,SAAS,CAAC,kBAAkB,CAAC,CAAC;IAE5D,oDAAoD;IACpD,OAAO,CAAC,EAAE,MAAM,CAAC;IAEjB;;;;;;;;OAQG;IACH,OAAO,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,MAAM,CAAC,CAAC;IAEjC;;;;;;OAMG;IACH,QAAQ,CAAC,EAAE,QAAQ,CAAC;IAEpB;;OAEG;IACH,KAAK,CAAC,EAAE,MAAM,CAAC;IAEf;;;;;;OAMG;IACH,eAAe,CAAC,EAAE,OAAO,CAAC;IAE1B;;;;;OAKG;IACH,oBAAoB,CAAC,EAAE,OAAO,CAAC;IAE/B;;;OAGG;IACH,OAAO,CAAC,EAAE,OAAO,CAAC;IAElB;;;;OAIG;IACH,cAAc,CAAC,EAAE,OAAO,CAAC;IAEzB;;;;OAIG;IACH,UAAU,CAAC,EAAE,MAAM,CAAC;IAEpB;;;;OAIG;IACH,aAAa,CAAC,EAAE,oBAAoB,CAAC;IAErC;;OAEG;IACH,UAAU,CAAC,EAAE,MAAM,CAAC;IAEpB,gBAAgB;IAChB,EAAE,CAAC,EAAE,MAAM,CAAC;IAEZ,gBAAgB;IAChB,SAAS,CAAC,EAAE,MAAM,CAAC;IAEnB,gBAAgB;IAChB,aAAa,CAAC,EAAE,IAAI,CAAC;IAErB,gBAAgB;IAChB,eAAe,CAAC,EAAE,mBAAmB,CAAC,UAAU,CAAC,CAAC;CACrD;AAED,MAAM,WAAW,uBAAuB;IACpC;;;OAGG;IACH,SAAS,CAAC,EAAE,OAAO,CAAC;CACvB;AAED,UAAU,uBAAuB;IAC7B,GAAG,EAAE,MAAM,CAAC;IACZ,MAAM,EAAE,kBAAkB,CAAC;IAC3B,OAAO,CAAC,EAAE,MAAM,GAAG,MAAM,CAAC;IAC1B,eAAe,CAAC,EAAE,OAAO,CAAC;IAC1B,oBAAoB,CAAC,EAAE,OAAO,CAAC;CAClC;AAED,MAAM,MAAM,MAAM,GAAG,CAAC,OAAO,CAAC,cAAc,CAAC,GAAG;IAAE,eAAe,CAAC,EAAE,MAAM,CAAC;IAAC,KAAK,CAAC,EAAE,MAAM,CAAA;CAAE,CAAC,GAAG,cAAc,CAAC;AAE/G,gBAAgB;AAChB,MAAM,WAAW,cAAc;IAC3B,eAAe,EAAE,MAAM,CAAC;IACxB,KAAK,CAAC,EAAE,MAAM,CAAC;CAClB;AAED,OAAO,EAAE,cAAc,IAAI,OAAO,EAAE,CAAC"}