@crawlee/core 4.0.0-beta.4 → 4.0.0-beta.40

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (171) hide show
  1. package/README.md +9 -5
  2. package/autoscaling/autoscaled_pool.d.ts +3 -5
  3. package/autoscaling/autoscaled_pool.d.ts.map +1 -1
  4. package/autoscaling/autoscaled_pool.js +3 -9
  5. package/autoscaling/autoscaled_pool.js.map +1 -1
  6. package/autoscaling/snapshotter.d.ts +3 -13
  7. package/autoscaling/snapshotter.d.ts.map +1 -1
  8. package/autoscaling/snapshotter.js +15 -29
  9. package/autoscaling/snapshotter.js.map +1 -1
  10. package/autoscaling/system_status.d.ts +0 -3
  11. package/autoscaling/system_status.d.ts.map +1 -1
  12. package/autoscaling/system_status.js +2 -3
  13. package/autoscaling/system_status.js.map +1 -1
  14. package/configuration.d.ts +5 -78
  15. package/configuration.d.ts.map +1 -1
  16. package/configuration.js +6 -102
  17. package/configuration.js.map +1 -1
  18. package/cookie_utils.d.ts +1 -1
  19. package/cookie_utils.d.ts.map +1 -1
  20. package/cookie_utils.js +8 -8
  21. package/cookie_utils.js.map +1 -1
  22. package/crawlers/context_pipeline.d.ts +71 -0
  23. package/crawlers/context_pipeline.d.ts.map +1 -0
  24. package/crawlers/context_pipeline.js +121 -0
  25. package/crawlers/context_pipeline.js.map +1 -0
  26. package/crawlers/crawler_commons.d.ts +15 -23
  27. package/crawlers/crawler_commons.d.ts.map +1 -1
  28. package/crawlers/crawler_commons.js +0 -8
  29. package/crawlers/crawler_commons.js.map +1 -1
  30. package/crawlers/error_snapshotter.d.ts +3 -2
  31. package/crawlers/error_snapshotter.d.ts.map +1 -1
  32. package/crawlers/error_snapshotter.js +2 -2
  33. package/crawlers/error_snapshotter.js.map +1 -1
  34. package/crawlers/error_tracker.d.ts +2 -1
  35. package/crawlers/error_tracker.d.ts.map +1 -1
  36. package/crawlers/error_tracker.js.map +1 -1
  37. package/crawlers/index.d.ts +1 -1
  38. package/crawlers/index.d.ts.map +1 -1
  39. package/crawlers/index.js +1 -1
  40. package/crawlers/index.js.map +1 -1
  41. package/crawlers/internals/types.d.ts +8 -0
  42. package/crawlers/internals/types.d.ts.map +1 -0
  43. package/crawlers/internals/types.js +2 -0
  44. package/crawlers/internals/types.js.map +1 -0
  45. package/crawlers/statistics.d.ts +15 -15
  46. package/crawlers/statistics.d.ts.map +1 -1
  47. package/crawlers/statistics.js +21 -18
  48. package/crawlers/statistics.js.map +1 -1
  49. package/enqueue_links/enqueue_links.d.ts +30 -18
  50. package/enqueue_links/enqueue_links.d.ts.map +1 -1
  51. package/enqueue_links/enqueue_links.js +41 -23
  52. package/enqueue_links/enqueue_links.js.map +1 -1
  53. package/enqueue_links/shared.d.ts +24 -7
  54. package/enqueue_links/shared.d.ts.map +1 -1
  55. package/enqueue_links/shared.js +66 -37
  56. package/enqueue_links/shared.js.map +1 -1
  57. package/errors.d.ts +18 -0
  58. package/errors.d.ts.map +1 -1
  59. package/errors.js +35 -0
  60. package/errors.js.map +1 -1
  61. package/events/event_manager.d.ts +8 -5
  62. package/events/event_manager.d.ts.map +1 -1
  63. package/events/event_manager.js +7 -9
  64. package/events/event_manager.js.map +1 -1
  65. package/events/local_event_manager.d.ts +14 -4
  66. package/events/local_event_manager.d.ts.map +1 -1
  67. package/events/local_event_manager.js +27 -39
  68. package/events/local_event_manager.js.map +1 -1
  69. package/index.d.ts +2 -1
  70. package/index.d.ts.map +1 -1
  71. package/index.js +2 -1
  72. package/index.js.map +1 -1
  73. package/log.d.ts +146 -2
  74. package/log.d.ts.map +1 -1
  75. package/log.js +102 -0
  76. package/log.js.map +1 -1
  77. package/package.json +6 -7
  78. package/proxy_configuration.d.ts +17 -94
  79. package/proxy_configuration.d.ts.map +1 -1
  80. package/proxy_configuration.js +18 -54
  81. package/proxy_configuration.js.map +1 -1
  82. package/recoverable_state.d.ts +121 -0
  83. package/recoverable_state.d.ts.map +1 -0
  84. package/recoverable_state.js +137 -0
  85. package/recoverable_state.js.map +1 -0
  86. package/request.d.ts +48 -6
  87. package/request.d.ts.map +1 -1
  88. package/request.js +62 -16
  89. package/request.js.map +1 -1
  90. package/service_locator.d.ts +130 -0
  91. package/service_locator.d.ts.map +1 -0
  92. package/service_locator.js +249 -0
  93. package/service_locator.js.map +1 -0
  94. package/session_pool/session.d.ts +9 -31
  95. package/session_pool/session.d.ts.map +1 -1
  96. package/session_pool/session.js +17 -21
  97. package/session_pool/session.js.map +1 -1
  98. package/session_pool/session_pool.d.ts +27 -54
  99. package/session_pool/session_pool.d.ts.map +1 -1
  100. package/session_pool/session_pool.js +54 -69
  101. package/session_pool/session_pool.js.map +1 -1
  102. package/storages/dataset.d.ts +53 -3
  103. package/storages/dataset.d.ts.map +1 -1
  104. package/storages/dataset.js +78 -6
  105. package/storages/dataset.js.map +1 -1
  106. package/storages/index.d.ts +2 -0
  107. package/storages/index.d.ts.map +1 -1
  108. package/storages/index.js +2 -0
  109. package/storages/index.js.map +1 -1
  110. package/storages/key_value_store.d.ts +71 -1
  111. package/storages/key_value_store.d.ts.map +1 -1
  112. package/storages/key_value_store.js +95 -12
  113. package/storages/key_value_store.js.map +1 -1
  114. package/storages/request_list.d.ts +9 -9
  115. package/storages/request_list.d.ts.map +1 -1
  116. package/storages/request_list.js +11 -8
  117. package/storages/request_list.js.map +1 -1
  118. package/storages/request_list_adapter.d.ts +58 -0
  119. package/storages/request_list_adapter.d.ts.map +1 -0
  120. package/storages/request_list_adapter.js +81 -0
  121. package/storages/request_list_adapter.js.map +1 -0
  122. package/storages/request_manager_tandem.d.ts +68 -0
  123. package/storages/request_manager_tandem.d.ts.map +1 -0
  124. package/storages/request_manager_tandem.js +124 -0
  125. package/storages/request_manager_tandem.js.map +1 -0
  126. package/storages/request_provider.d.ts +76 -9
  127. package/storages/request_provider.d.ts.map +1 -1
  128. package/storages/request_provider.js +92 -54
  129. package/storages/request_provider.js.map +1 -1
  130. package/storages/request_queue.d.ts +1 -3
  131. package/storages/request_queue.d.ts.map +1 -1
  132. package/storages/request_queue.js +2 -4
  133. package/storages/request_queue.js.map +1 -1
  134. package/storages/request_queue_v2.d.ts +3 -3
  135. package/storages/request_queue_v2.d.ts.map +1 -1
  136. package/storages/request_queue_v2.js +4 -5
  137. package/storages/request_queue_v2.js.map +1 -1
  138. package/storages/sitemap_request_list.d.ts +5 -5
  139. package/storages/sitemap_request_list.d.ts.map +1 -1
  140. package/storages/sitemap_request_list.js +8 -7
  141. package/storages/sitemap_request_list.js.map +1 -1
  142. package/storages/storage_manager.d.ts +10 -8
  143. package/storages/storage_manager.d.ts.map +1 -1
  144. package/storages/storage_manager.js +12 -22
  145. package/storages/storage_manager.js.map +1 -1
  146. package/storages/utils.d.ts.map +1 -1
  147. package/storages/utils.js +4 -3
  148. package/storages/utils.js.map +1 -1
  149. package/typedefs.d.ts +1 -1
  150. package/typedefs.d.ts.map +1 -1
  151. package/crawlers/crawler_extension.d.ts +0 -12
  152. package/crawlers/crawler_extension.d.ts.map +0 -1
  153. package/crawlers/crawler_extension.js +0 -14
  154. package/crawlers/crawler_extension.js.map +0 -1
  155. package/http_clients/base-http-client.d.ts +0 -134
  156. package/http_clients/base-http-client.d.ts.map +0 -1
  157. package/http_clients/base-http-client.js +0 -33
  158. package/http_clients/base-http-client.js.map +0 -1
  159. package/http_clients/form-data-like.d.ts +0 -67
  160. package/http_clients/form-data-like.d.ts.map +0 -1
  161. package/http_clients/form-data-like.js +0 -5
  162. package/http_clients/form-data-like.js.map +0 -1
  163. package/http_clients/got-scraping-http-client.d.ts +0 -15
  164. package/http_clients/got-scraping-http-client.d.ts.map +0 -1
  165. package/http_clients/got-scraping-http-client.js +0 -69
  166. package/http_clients/got-scraping-http-client.js.map +0 -1
  167. package/http_clients/index.d.ts +0 -3
  168. package/http_clients/index.d.ts.map +0 -1
  169. package/http_clients/index.js +0 -3
  170. package/http_clients/index.js.map +0 -1
  171. package/tsconfig.build.tsbuildinfo +0 -1
@@ -1,12 +1,25 @@
1
- import os from 'node:os';
2
- import { getCurrentCpuTicksV2, getMemoryInfo, getMemoryInfoV2, isContainerized } from '@crawlee/utils';
3
- import log from '@apify/log';
4
1
  import { betterClearInterval, betterSetInterval } from '@apify/utilities';
2
+ import { serviceLocator } from '../service_locator.js';
5
3
  import { EventManager } from './event_manager.js';
6
4
  export class LocalEventManager extends EventManager {
7
- previousTicks = { idle: 0, total: 0 };
5
+ systemInfoIntervalMillis;
6
+ constructor(options) {
7
+ super(options);
8
+ this.systemInfoIntervalMillis = options.systemInfoIntervalMillis;
9
+ }
10
+ /**
11
+ * Creates a new `LocalEventManager` based on the provided `Configuration`.
12
+ * Uses the global configuration from the service locator if none is provided.
13
+ */
14
+ static fromConfig(config) {
15
+ const resolvedConfig = config ?? serviceLocator.getConfiguration();
16
+ return new LocalEventManager({
17
+ persistStateIntervalMillis: resolvedConfig.get('persistStateIntervalMillis'),
18
+ systemInfoIntervalMillis: resolvedConfig.get('systemInfoIntervalMillis'),
19
+ });
20
+ }
8
21
  /**
9
- * Initializes the EventManager and sets up periodic `systemInfo` and `persistState` events.
22
+ * Initializes the EventManager and sets up periodic `systemInfo` events.
10
23
  * This is automatically called at the beginning of `crawler.run()`.
11
24
  */
12
25
  async init() {
@@ -14,9 +27,8 @@ export class LocalEventManager extends EventManager {
14
27
  return;
15
28
  }
16
29
  await super.init();
17
- const systemInfoIntervalMillis = this.config.get('systemInfoIntervalMillis');
18
30
  this.emitSystemInfoEvent = this.emitSystemInfoEvent.bind(this);
19
- this.intervals.systemInfo = betterSetInterval(this.emitSystemInfoEvent.bind(this), systemInfoIntervalMillis);
31
+ this.intervals.systemInfo = betterSetInterval(this.emitSystemInfoEvent.bind(this), this.systemInfoIntervalMillis);
20
32
  }
21
33
  /**
22
34
  * @inheritDoc
@@ -33,7 +45,7 @@ export class LocalEventManager extends EventManager {
33
45
  */
34
46
  async emitSystemInfoEvent(intervalCallback) {
35
47
  const info = await this.createSystemInfo({
36
- maxUsedCpuRatio: this.config.get('maxUsedCpuRatio'),
48
+ maxUsedCpuRatio: serviceLocator.getConfiguration().get('maxUsedCpuRatio'),
37
49
  });
38
50
  this.events.emit("systemInfo" /* EventType.SYSTEM_INFO */, info);
39
51
  intervalCallback();
@@ -42,17 +54,8 @@ export class LocalEventManager extends EventManager {
42
54
  * @internal
43
55
  */
44
56
  async isContainerizedWrapper() {
45
- return this.config.get('containerized', await isContainerized());
46
- }
47
- getCurrentCpuTicks() {
48
- const cpus = os.cpus();
49
- return cpus.reduce((acc, cpu) => {
50
- const cpuTimes = Object.values(cpu.times);
51
- return {
52
- idle: acc.idle + cpu.times.idle,
53
- total: acc.total + cpuTimes.reduce((sum, num) => sum + num),
54
- };
55
- }, { idle: 0, total: 0 });
57
+ const { isContainerized } = await import('@crawlee/utils');
58
+ return serviceLocator.getConfiguration().get('containerized', await isContainerized());
56
59
  }
57
60
  /**
58
61
  * Creates a SystemInfo object based on local metrics.
@@ -65,18 +68,8 @@ export class LocalEventManager extends EventManager {
65
68
  };
66
69
  }
67
70
  async createCpuInfo(options) {
68
- if (this.config.get('systemInfoV2')) {
69
- const usedCpuRatio = await getCurrentCpuTicksV2(await this.isContainerizedWrapper());
70
- return {
71
- cpuCurrentUsage: usedCpuRatio * 100,
72
- isCpuOverloaded: usedCpuRatio > options.maxUsedCpuRatio,
73
- };
74
- }
75
- const ticks = this.getCurrentCpuTicks();
76
- const idleTicksDelta = ticks.idle - this.previousTicks.idle;
77
- const totalTicksDelta = ticks.total - this.previousTicks.total;
78
- const usedCpuRatio = totalTicksDelta ? 1 - idleTicksDelta / totalTicksDelta : 0;
79
- Object.assign(this.previousTicks, ticks);
71
+ const { getCurrentCpuTicksV2 } = await import('@crawlee/utils');
72
+ const usedCpuRatio = await getCurrentCpuTicksV2(await this.isContainerizedWrapper());
80
73
  return {
81
74
  cpuCurrentUsage: usedCpuRatio * 100,
82
75
  isCpuOverloaded: usedCpuRatio > options.maxUsedCpuRatio,
@@ -84,19 +77,14 @@ export class LocalEventManager extends EventManager {
84
77
  }
85
78
  async createMemoryInfo() {
86
79
  try {
87
- if (this.config.get('systemInfoV2')) {
88
- const memInfo = await getMemoryInfoV2(await this.isContainerizedWrapper());
89
- return {
90
- memCurrentBytes: memInfo.mainProcessBytes + memInfo.childProcessesBytes,
91
- };
92
- }
93
- const memInfo = await getMemoryInfo();
80
+ const { getMemoryInfo } = await import('@crawlee/utils');
81
+ const memInfo = await getMemoryInfo(await this.isContainerizedWrapper());
94
82
  return {
95
83
  memCurrentBytes: memInfo.mainProcessBytes + memInfo.childProcessesBytes,
96
84
  };
97
85
  }
98
86
  catch (err) {
99
- log.exception(err, 'Memory snapshot failed.');
87
+ this.log.exception(err, 'Memory snapshot failed.');
100
88
  return {};
101
89
  }
102
90
  }
@@ -1 +1 @@
1
- {"version":3,"file":"local_event_manager.js","sourceRoot":"","sources":["../../src/events/local_event_manager.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,MAAM,SAAS,CAAC;AAEzB,OAAO,EAAE,oBAAoB,EAAE,aAAa,EAAE,eAAe,EAAE,eAAe,EAAE,MAAM,gBAAgB,CAAC;AAEvG,OAAO,GAAG,MAAM,YAAY,CAAC;AAC7B,OAAO,EAAE,mBAAmB,EAAE,iBAAiB,EAAE,MAAM,kBAAkB,CAAC;AAG1E,OAAO,EAAE,YAAY,EAAa,MAAM,oBAAoB,CAAC;AAE7D,MAAM,OAAO,iBAAkB,SAAQ,YAAY;IACvC,aAAa,GAAG,EAAE,IAAI,EAAE,CAAC,EAAE,KAAK,EAAE,CAAC,EAAE,CAAC;IAE9C;;;OAGG;IACM,KAAK,CAAC,IAAI;QACf,IAAI,IAAI,CAAC,WAAW,EAAE,CAAC;YACnB,OAAO;QACX,CAAC;QAED,MAAM,KAAK,CAAC,IAAI,EAAE,CAAC;QAEnB,MAAM,wBAAwB,GAAG,IAAI,CAAC,MAAM,CAAC,GAAG,CAAC,0BAA0B,CAAE,CAAC;QAC9E,IAAI,CAAC,mBAAmB,GAAG,IAAI,CAAC,mBAAmB,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;QAC/D,IAAI,CAAC,SAAS,CAAC,UAAU,GAAG,iBAAiB,CAAC,IAAI,CAAC,mBAAmB,CAAC,IAAI,CAAC,IAAI,CAAC,EAAE,wBAAwB,CAAC,CAAC;IACjH,CAAC;IAED;;OAEG;IACM,KAAK,CAAC,KAAK;QAChB,IAAI,CAAC,IAAI,CAAC,WAAW,EAAE,CAAC;YACpB,OAAO;QACX,CAAC;QAED,MAAM,KAAK,CAAC,KAAK,EAAE,CAAC;QACpB,mBAAmB,CAAC,IAAI,CAAC,SAAS,CAAC,UAAW,CAAC,CAAC;IACpD,CAAC;IAED;;OAEG;IACH,KAAK,CAAC,mBAAmB,CAAC,gBAA+B;QACrD,MAAM,IAAI,GAAG,MAAM,IAAI,CAAC,gBAAgB,CAAC;YACrC,eAAe,EAAE,IAAI,CAAC,MAAM,CAAC,GAAG,CAAC,iBAAiB,CAAC;SACtD,CAAC,CAAC;QACH,IAAI,CAAC,MAAM,CAAC,IAAI,2CAAwB,IAAI,CAAC,CAAC;QAC9C,gBAAgB,EAAE,CAAC;IACvB,CAAC;IAED;;OAEG;IACH,KAAK,CAAC,sBAAsB;QACxB,OAAO,IAAI,CAAC,MAAM,CAAC,GAAG,CAAC,eAAe,EAAE,MAAM,eAAe,EAAE,CAAC,CAAC;IACrE,CAAC;IAEO,kBAAkB;QACtB,MAAM,IAAI,GAAG,EAAE,CAAC,IAAI,EAAE,CAAC;QACvB,OAAO,IAAI,CAAC,MAAM,CACd,CAAC,GAAG,EAAE,GAAG,EAAE,EAAE;YACT,MAAM,QAAQ,GAAG,MAAM,CAAC,MAAM,CAAC,GAAG,CAAC,KAAK,CAAC,CAAC;YAC1C,OAAO;gBACH,IAAI,EAAE,GAAG,CAAC,IAAI,GAAG,GAAG,CAAC,KAAK,CAAC,IAAI;gBAC/B,KAAK,EAAE,GAAG,CAAC,KAAK,GAAG,QAAQ,CAAC,MAAM,CAAC,CAAC,GAAG,EAAE,GAAG,EAAE,EAAE,CAAC,GAAG,GAAG,GAAG,CAAC;aAC9D,CAAC;QACN,CAAC,EACD,EAAE,IAAI,EAAE,CAAC,EAAE,KAAK,EAAE,CAAC,EAAE,CACxB,CAAC;IACN,CAAC;IAED;;OAEG;IACK,KAAK,CAAC,gBAAgB,CAAC,OAAoC;QAC/D,OAAO;YACH,SAAS,EAAE,IAAI,IAAI,EAAE;YACrB,GAAG,CAAC,MAAM,IAAI,CAAC,aAAa,CAAC,OAAO,CAAC,CAAC;YACtC,GAAG,CAAC,MAAM,IAAI,CAAC,gBAAgB,EAAE,CAAC;SACvB,CAAC;IACpB,CAAC;IAEO,KAAK,CAAC,aAAa,CAAC,OAAoC;QAC5D,IAAI,IAAI,CAAC,MAAM,CAAC,GAAG,CAAC,cAAc,CAAC,EAAE,CAAC;YAClC,MAAM,YAAY,GAAG,MAAM,oBAAoB,CAAC,MAAM,IAAI,CAAC,sBAAsB,EAAE,CAAC,CAAC;YACrF,OAAO;gBACH,eAAe,EAAE,YAAY,GAAG,GAAG;gBACnC,eAAe,EAAE,YAAY,GAAG,OAAO,CAAC,eAAe;aAC1D,CAAC;QACN,CAAC;QACD,MAAM,KAAK,GAAG,IAAI,CAAC,kBAAkB,EAAE,CAAC;QACxC,MAAM,cAAc,GAAG,KAAK,CAAC,IAAI,GAAG,IAAI,CAAC,aAAc,CAAC,IAAI,CAAC;QAC7D,MAAM,eAAe,GAAG,KAAK,CAAC,KAAK,GAAG,IAAI,CAAC,aAAc,CAAC,KAAK,CAAC;QAChE,MAAM,YAAY,GAAG,eAAe,CAAC,CAAC,CAAC,CAAC,GAAG,cAAc,GAAG,eAAe,CAAC,CAAC,CAAC,CAAC,CAAC;QAChF,MAAM,CAAC,MAAM,CAAC,IAAI,CAAC,aAAa,EAAE,KAAK,CAAC,CAAC;QAEzC,OAAO;YACH,eAAe,EAAE,YAAY,GAAG,GAAG;YACnC,eAAe,EAAE,YAAY,GAAG,OAAO,CAAC,eAAe;SAC1D,CAAC;IACN,CAAC;IAEO,KAAK,CAAC,gBAAgB;QAC1B,IAAI,CAAC;YACD,IAAI,IAAI,CAAC,MAAM,CAAC,GAAG,CAAC,cAAc,CAAC,EAAE,CAAC;gBAClC,MAAM,OAAO,GAAG,MAAM,eAAe,CAAC,MAAM,IAAI,CAAC,sBAAsB,EAAE,CAAC,CAAC;gBAC3E,OAAO;oBACH,eAAe,EAAE,OAAO,CAAC,gBAAgB,GAAG,OAAO,CAAC,mBAAmB;iBAC1E,CAAC;YACN,CAAC;YACD,MAAM,OAAO,GAAG,MAAM,aAAa,EAAE,CAAC;YACtC,OAAO;gBACH,eAAe,EAAE,OAAO,CAAC,gBAAgB,GAAG,OAAO,CAAC,mBAAmB;aAC1E,CAAC;QACN,CAAC;QAAC,OAAO,GAAG,EAAE,CAAC;YACX,GAAG,CAAC,SAAS,CAAC,GAAY,EAAE,yBAAyB,CAAC,CAAC;YACvD,OAAO,EAAE,CAAC;QACd,CAAC;IACL,CAAC;CACJ"}
1
+ {"version":3,"file":"local_event_manager.js","sourceRoot":"","sources":["../../src/events/local_event_manager.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,mBAAmB,EAAE,iBAAiB,EAAE,MAAM,kBAAkB,CAAC;AAI1E,OAAO,EAAE,cAAc,EAAE,MAAM,uBAAuB,CAAC;AACvD,OAAO,EAAE,YAAY,EAAuC,MAAM,oBAAoB,CAAC;AAOvF,MAAM,OAAO,iBAAkB,SAAQ,YAAY;IACvC,wBAAwB,CAAS;IAEzC,YAAY,OAAiC;QACzC,KAAK,CAAC,OAAO,CAAC,CAAC;QACf,IAAI,CAAC,wBAAwB,GAAG,OAAO,CAAC,wBAAwB,CAAC;IACrE,CAAC;IAED;;;OAGG;IACH,MAAM,CAAC,UAAU,CAAC,MAAsB;QACpC,MAAM,cAAc,GAAG,MAAM,IAAI,cAAc,CAAC,gBAAgB,EAAE,CAAC;QAEnE,OAAO,IAAI,iBAAiB,CAAC;YACzB,0BAA0B,EAAE,cAAc,CAAC,GAAG,CAAC,4BAA4B,CAAC;YAC5E,wBAAwB,EAAE,cAAc,CAAC,GAAG,CAAC,0BAA0B,CAAC;SAC3E,CAAC,CAAC;IACP,CAAC;IAED;;;OAGG;IACM,KAAK,CAAC,IAAI;QACf,IAAI,IAAI,CAAC,WAAW,EAAE,CAAC;YACnB,OAAO;QACX,CAAC;QAED,MAAM,KAAK,CAAC,IAAI,EAAE,CAAC;QAEnB,IAAI,CAAC,mBAAmB,GAAG,IAAI,CAAC,mBAAmB,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;QAC/D,IAAI,CAAC,SAAS,CAAC,UAAU,GAAG,iBAAiB,CACzC,IAAI,CAAC,mBAAmB,CAAC,IAAI,CAAC,IAAI,CAAC,EACnC,IAAI,CAAC,wBAAwB,CAChC,CAAC;IACN,CAAC;IAED;;OAEG;IACM,KAAK,CAAC,KAAK;QAChB,IAAI,CAAC,IAAI,CAAC,WAAW,EAAE,CAAC;YACpB,OAAO;QACX,CAAC;QAED,MAAM,KAAK,CAAC,KAAK,EAAE,CAAC;QACpB,mBAAmB,CAAC,IAAI,CAAC,SAAS,CAAC,UAAW,CAAC,CAAC;IACpD,CAAC;IAED;;OAEG;IACH,KAAK,CAAC,mBAAmB,CAAC,gBAA+B;QACrD,MAAM,IAAI,GAAG,MAAM,IAAI,CAAC,gBAAgB,CAAC;YACrC,eAAe,EAAE,cAAc,CAAC,gBAAgB,EAAE,CAAC,GAAG,CAAC,iBAAiB,CAAC;SAC5E,CAAC,CAAC;QACH,IAAI,CAAC,MAAM,CAAC,IAAI,2CAAwB,IAAI,CAAC,CAAC;QAC9C,gBAAgB,EAAE,CAAC;IACvB,CAAC;IAED;;OAEG;IACH,KAAK,CAAC,sBAAsB;QACxB,MAAM,EAAE,eAAe,EAAE,GAAG,MAAM,MAAM,CAAC,gBAAgB,CAAC,CAAC;QAC3D,OAAO,cAAc,CAAC,gBAAgB,EAAE,CAAC,GAAG,CAAC,eAAe,EAAE,MAAM,eAAe,EAAE,CAAC,CAAC;IAC3F,CAAC;IAED;;OAEG;IACK,KAAK,CAAC,gBAAgB,CAAC,OAAoC;QAC/D,OAAO;YACH,SAAS,EAAE,IAAI,IAAI,EAAE;YACrB,GAAG,CAAC,MAAM,IAAI,CAAC,aAAa,CAAC,OAAO,CAAC,CAAC;YACtC,GAAG,CAAC,MAAM,IAAI,CAAC,gBAAgB,EAAE,CAAC;SACvB,CAAC;IACpB,CAAC;IAEO,KAAK,CAAC,aAAa,CAAC,OAAoC;QAC5D,MAAM,EAAE,oBAAoB,EAAE,GAAG,MAAM,MAAM,CAAC,gBAAgB,CAAC,CAAC;QAChE,MAAM,YAAY,GAAG,MAAM,oBAAoB,CAAC,MAAM,IAAI,CAAC,sBAAsB,EAAE,CAAC,CAAC;QACrF,OAAO;YACH,eAAe,EAAE,YAAY,GAAG,GAAG;YACnC,eAAe,EAAE,YAAY,GAAG,OAAO,CAAC,eAAe;SAC1D,CAAC;IACN,CAAC;IAEO,KAAK,CAAC,gBAAgB;QAC1B,IAAI,CAAC;YACD,MAAM,EAAE,aAAa,EAAE,GAAG,MAAM,MAAM,CAAC,gBAAgB,CAAC,CAAC;YACzD,MAAM,OAAO,GAAG,MAAM,aAAa,CAAC,MAAM,IAAI,CAAC,sBAAsB,EAAE,CAAC,CAAC;YACzE,OAAO;gBACH,eAAe,EAAE,OAAO,CAAC,gBAAgB,GAAG,OAAO,CAAC,mBAAmB;aAC1E,CAAC;QACN,CAAC;QAAC,OAAO,GAAG,EAAE,CAAC;YACX,IAAI,CAAC,GAAG,CAAC,SAAS,CAAC,GAAY,EAAE,yBAAyB,CAAC,CAAC;YAC5D,OAAO,EAAE,CAAC;QACd,CAAC;IACL,CAAC;CACJ"}
package/index.d.ts CHANGED
@@ -1,10 +1,10 @@
1
1
  export * from './errors.js';
2
2
  export * from './autoscaling/index.js';
3
3
  export * from './configuration.js';
4
+ export * from './service_locator.js';
4
5
  export * from './crawlers/index.js';
5
6
  export * from './enqueue_links/index.js';
6
7
  export * from './events/index.js';
7
- export * from './http_clients/index.js';
8
8
  export * from './log.js';
9
9
  export * from './proxy_configuration.js';
10
10
  export * from './request.js';
@@ -14,6 +14,7 @@ export * from './session_pool/index.js';
14
14
  export * from './storages/index.js';
15
15
  export * from './validators.js';
16
16
  export * from './cookie_utils.js';
17
+ export * from './recoverable_state.js';
17
18
  export { PseudoUrl } from '@apify/pseudo_url';
18
19
  export { Dictionary, Awaitable, Constructor, StorageClient, Cookie, QueueOperationInfo } from '@crawlee/types';
19
20
  //# sourceMappingURL=index.d.ts.map
package/index.d.ts.map CHANGED
@@ -1 +1 @@
1
- {"version":3,"file":"index.d.ts","sourceRoot":"","sources":["../src/index.ts"],"names":[],"mappings":"AAAA,cAAc,aAAa,CAAC;AAC5B,cAAc,wBAAwB,CAAC;AACvC,cAAc,oBAAoB,CAAC;AACnC,cAAc,qBAAqB,CAAC;AACpC,cAAc,0BAA0B,CAAC;AACzC,cAAc,mBAAmB,CAAC;AAClC,cAAc,yBAAyB,CAAC;AACxC,cAAc,UAAU,CAAC;AACzB,cAAc,0BAA0B,CAAC;AACzC,cAAc,cAAc,CAAC;AAC7B,cAAc,aAAa,CAAC;AAC5B,cAAc,oBAAoB,CAAC;AACnC,cAAc,yBAAyB,CAAC;AACxC,cAAc,qBAAqB,CAAC;AACpC,cAAc,iBAAiB,CAAC;AAChC,cAAc,mBAAmB,CAAC;AAClC,OAAO,EAAE,SAAS,EAAE,MAAM,mBAAmB,CAAC;AAC9C,OAAO,EAAE,UAAU,EAAE,SAAS,EAAE,WAAW,EAAE,aAAa,EAAE,MAAM,EAAE,kBAAkB,EAAE,MAAM,gBAAgB,CAAC"}
1
+ {"version":3,"file":"index.d.ts","sourceRoot":"","sources":["../src/index.ts"],"names":[],"mappings":"AAAA,cAAc,aAAa,CAAC;AAC5B,cAAc,wBAAwB,CAAC;AACvC,cAAc,oBAAoB,CAAC;AACnC,cAAc,sBAAsB,CAAC;AACrC,cAAc,qBAAqB,CAAC;AACpC,cAAc,0BAA0B,CAAC;AACzC,cAAc,mBAAmB,CAAC;AAClC,cAAc,UAAU,CAAC;AACzB,cAAc,0BAA0B,CAAC;AACzC,cAAc,cAAc,CAAC;AAC7B,cAAc,aAAa,CAAC;AAC5B,cAAc,oBAAoB,CAAC;AACnC,cAAc,yBAAyB,CAAC;AACxC,cAAc,qBAAqB,CAAC;AACpC,cAAc,iBAAiB,CAAC;AAChC,cAAc,mBAAmB,CAAC;AAClC,cAAc,wBAAwB,CAAC;AACvC,OAAO,EAAE,SAAS,EAAE,MAAM,mBAAmB,CAAC;AAC9C,OAAO,EAAE,UAAU,EAAE,SAAS,EAAE,WAAW,EAAE,aAAa,EAAE,MAAM,EAAE,kBAAkB,EAAE,MAAM,gBAAgB,CAAC"}
package/index.js CHANGED
@@ -1,10 +1,10 @@
1
1
  export * from './errors.js';
2
2
  export * from './autoscaling/index.js';
3
3
  export * from './configuration.js';
4
+ export * from './service_locator.js';
4
5
  export * from './crawlers/index.js';
5
6
  export * from './enqueue_links/index.js';
6
7
  export * from './events/index.js';
7
- export * from './http_clients/index.js';
8
8
  export * from './log.js';
9
9
  export * from './proxy_configuration.js';
10
10
  export * from './request.js';
@@ -14,5 +14,6 @@ export * from './session_pool/index.js';
14
14
  export * from './storages/index.js';
15
15
  export * from './validators.js';
16
16
  export * from './cookie_utils.js';
17
+ export * from './recoverable_state.js';
17
18
  export { PseudoUrl } from '@apify/pseudo_url';
18
19
  //# sourceMappingURL=index.js.map
package/index.js.map CHANGED
@@ -1 +1 @@
1
- {"version":3,"file":"index.js","sourceRoot":"","sources":["../src/index.ts"],"names":[],"mappings":"AAAA,cAAc,aAAa,CAAC;AAC5B,cAAc,wBAAwB,CAAC;AACvC,cAAc,oBAAoB,CAAC;AACnC,cAAc,qBAAqB,CAAC;AACpC,cAAc,0BAA0B,CAAC;AACzC,cAAc,mBAAmB,CAAC;AAClC,cAAc,yBAAyB,CAAC;AACxC,cAAc,UAAU,CAAC;AACzB,cAAc,0BAA0B,CAAC;AACzC,cAAc,cAAc,CAAC;AAC7B,cAAc,aAAa,CAAC;AAC5B,cAAc,oBAAoB,CAAC;AACnC,cAAc,yBAAyB,CAAC;AACxC,cAAc,qBAAqB,CAAC;AACpC,cAAc,iBAAiB,CAAC;AAChC,cAAc,mBAAmB,CAAC;AAClC,OAAO,EAAE,SAAS,EAAE,MAAM,mBAAmB,CAAC"}
1
+ {"version":3,"file":"index.js","sourceRoot":"","sources":["../src/index.ts"],"names":[],"mappings":"AAAA,cAAc,aAAa,CAAC;AAC5B,cAAc,wBAAwB,CAAC;AACvC,cAAc,oBAAoB,CAAC;AACnC,cAAc,sBAAsB,CAAC;AACrC,cAAc,qBAAqB,CAAC;AACpC,cAAc,0BAA0B,CAAC;AACzC,cAAc,mBAAmB,CAAC;AAClC,cAAc,UAAU,CAAC;AACzB,cAAc,0BAA0B,CAAC;AACzC,cAAc,cAAc,CAAC;AAC7B,cAAc,aAAa,CAAC;AAC5B,cAAc,oBAAoB,CAAC;AACnC,cAAc,yBAAyB,CAAC;AACxC,cAAc,qBAAqB,CAAC;AACpC,cAAc,iBAAiB,CAAC;AAChC,cAAc,mBAAmB,CAAC;AAClC,cAAc,wBAAwB,CAAC;AACvC,OAAO,EAAE,SAAS,EAAE,MAAM,mBAAmB,CAAC"}
package/log.d.ts CHANGED
@@ -1,3 +1,147 @@
1
- import log, { Log, Logger, LoggerJson, LoggerOptions, LoggerText, LogLevel } from '@apify/log';
2
- export { log, Log, LoggerOptions, LogLevel, Logger, LoggerJson, LoggerText };
1
+ import type { LoggerOptions } from '@apify/log';
2
+ import log, { Log, Logger, LoggerJson, LoggerText, LogLevel } from '@apify/log';
3
+ /**
4
+ * Configuration options for Crawlee logger implementations.
5
+ */
6
+ export interface CrawleeLoggerOptions {
7
+ /** Prefix to be prepended to each logged line. */
8
+ prefix?: string | null;
9
+ }
10
+ /**
11
+ * Interface for Crawlee logger implementations.
12
+ * This allows users to inject custom loggers (e.g., Winston, Pino) while maintaining
13
+ * compatibility with the default `@apify/log` implementation.
14
+ */
15
+ export interface CrawleeLogger {
16
+ /**
17
+ * Returns the logger configuration.
18
+ */
19
+ getOptions(): CrawleeLoggerOptions;
20
+ /**
21
+ * Configures logger options.
22
+ */
23
+ setOptions(options: Partial<CrawleeLoggerOptions>): void;
24
+ /**
25
+ * Creates a new instance of logger that inherits settings from a parent logger.
26
+ */
27
+ child(options: Partial<CrawleeLoggerOptions>): CrawleeLogger;
28
+ /**
29
+ * Logs an `ERROR` message.
30
+ */
31
+ error(message: string, data?: Record<string, unknown>): void;
32
+ /**
33
+ * Logs an `ERROR` level message with a nicely formatted exception.
34
+ */
35
+ exception(exception: Error, message: string, data?: Record<string, unknown>): void;
36
+ /**
37
+ * Logs a `SOFT_FAIL` level message.
38
+ */
39
+ softFail(message: string, data?: Record<string, unknown>): void;
40
+ /**
41
+ * Logs a `WARNING` level message.
42
+ */
43
+ warning(message: string, data?: Record<string, unknown>): void;
44
+ /**
45
+ * Logs a `WARNING` level message only once.
46
+ */
47
+ warningOnce(message: string): void;
48
+ /**
49
+ * Logs an `INFO` message.
50
+ */
51
+ info(message: string, data?: Record<string, unknown>): void;
52
+ /**
53
+ * Logs a `DEBUG` message.
54
+ */
55
+ debug(message: string, data?: Record<string, unknown>): void;
56
+ /**
57
+ * Logs a `PERF` level message for performance tracking.
58
+ */
59
+ perf(message: string, data?: Record<string, unknown>): void;
60
+ /**
61
+ * Logs given message only once as WARNING for deprecated features.
62
+ */
63
+ deprecated(message: string): void;
64
+ /**
65
+ * Logs a message at the given level. Useful when the log level is determined dynamically.
66
+ */
67
+ logWithLevel(level: number, message: string, data?: Record<string, unknown>): void;
68
+ }
69
+ /**
70
+ * Abstract base class for custom Crawlee logger implementations.
71
+ *
72
+ * Subclasses must implement two methods:
73
+ * - {@link BaseCrawleeLogger.logWithLevel} — the core logging dispatch
74
+ * - {@link BaseCrawleeLogger.createChild} — how to create a child logger instance
75
+ *
76
+ * All other `CrawleeLogger` methods (`error`, `warning`, `info`, `debug`, etc.)
77
+ * are derived automatically. Level filtering is entirely the responsibility of the
78
+ * underlying library — `logWithLevel()` is called for every message.
79
+ *
80
+ * **Example — Winston adapter:**
81
+ * ```typescript
82
+ * const CRAWLEE_TO_WINSTON = { 1: 'error', 2: 'warn', 3: 'warn', 4: 'info', 5: 'debug', 6: 'debug' };
83
+ *
84
+ * class WinstonAdapter extends BaseCrawleeLogger {
85
+ * constructor(private logger: winston.Logger, options?: Partial<CrawleeLoggerOptions>) {
86
+ * super(options);
87
+ * }
88
+ *
89
+ * logWithLevel(level: number, message: string, data?: Record<string, unknown>): void {
90
+ * this.logger.log(CRAWLEE_TO_WINSTON[level] ?? 'info', message, data);
91
+ * }
92
+ *
93
+ * protected createChild(options: Partial<CrawleeLoggerOptions>): CrawleeLogger {
94
+ * return new WinstonAdapter(this.logger.child({ prefix: options.prefix }), { ...this.getOptions(), ...options });
95
+ * }
96
+ * }
97
+ * ```
98
+ */
99
+ export declare abstract class BaseCrawleeLogger implements CrawleeLogger {
100
+ private options;
101
+ private readonly warningsLogged;
102
+ constructor(options?: Partial<CrawleeLoggerOptions>);
103
+ /**
104
+ * Core logging method. Subclasses must implement this to dispatch log messages
105
+ * to the underlying logger (Winston, Pino, console, etc.).
106
+ *
107
+ * Level filtering is the responsibility of the underlying library — this method
108
+ * is called for every message regardless of the current level.
109
+ *
110
+ * @param level Crawlee log level (use {@link LogLevel} constants)
111
+ * @param message The log message
112
+ * @param data Optional structured data to attach to the log entry
113
+ */
114
+ abstract logWithLevel(level: number, message: string, data?: Record<string, unknown>): void;
115
+ /**
116
+ * Creates a child logger instance. Subclasses must implement this to define
117
+ * how child loggers are created for the underlying logger.
118
+ */
119
+ protected abstract createChild(options: Partial<CrawleeLoggerOptions>): CrawleeLogger;
120
+ getOptions(): CrawleeLoggerOptions;
121
+ setOptions(options: Partial<CrawleeLoggerOptions>): void;
122
+ child(options: Partial<CrawleeLoggerOptions>): CrawleeLogger;
123
+ error(message: string, data?: Record<string, unknown>): void;
124
+ exception(exception: Error, message: string, data?: Record<string, unknown>): void;
125
+ softFail(message: string, data?: Record<string, unknown>): void;
126
+ warning(message: string, data?: Record<string, unknown>): void;
127
+ warningOnce(message: string): void;
128
+ info(message: string, data?: Record<string, unknown>): void;
129
+ debug(message: string, data?: Record<string, unknown>): void;
130
+ perf(message: string, data?: Record<string, unknown>): void;
131
+ deprecated(message: string): void;
132
+ }
133
+ /**
134
+ * Adapter that wraps `@apify/log`'s {@link Log} instance to implement the {@link CrawleeLogger} interface.
135
+ *
136
+ * This is the default logger used by Crawlee when no custom logger is configured.
137
+ * Users who want to use a different logging library should implement {@link BaseCrawleeLogger} directly.
138
+ */
139
+ export declare class ApifyLogAdapter extends BaseCrawleeLogger {
140
+ private readonly apifyLog;
141
+ constructor(apifyLog: Log, options?: Partial<CrawleeLoggerOptions>);
142
+ logWithLevel(level: number, message: string, data?: Record<string, unknown>): void;
143
+ protected createChild(options: Partial<CrawleeLoggerOptions>): CrawleeLogger;
144
+ }
145
+ export { log, Log, LogLevel, Logger, LoggerJson, LoggerText };
146
+ export type { LoggerOptions };
3
147
  //# sourceMappingURL=log.d.ts.map
package/log.d.ts.map CHANGED
@@ -1 +1 @@
1
- {"version":3,"file":"log.d.ts","sourceRoot":"","sources":["../src/log.ts"],"names":[],"mappings":"AAAA,OAAO,GAAG,EAAE,EAAE,GAAG,EAAE,MAAM,EAAE,UAAU,EAAE,aAAa,EAAE,UAAU,EAAE,QAAQ,EAAE,MAAM,YAAY,CAAC;AAE/F,OAAO,EAAE,GAAG,EAAE,GAAG,EAAE,aAAa,EAAE,QAAQ,EAAE,MAAM,EAAE,UAAU,EAAE,UAAU,EAAE,CAAC"}
1
+ {"version":3,"file":"log.d.ts","sourceRoot":"","sources":["../src/log.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,EAAE,aAAa,EAAE,MAAM,YAAY,CAAC;AAChD,OAAO,GAAG,EAAE,EAAE,GAAG,EAAE,MAAM,EAAE,UAAU,EAAE,UAAU,EAAE,QAAQ,EAAE,MAAM,YAAY,CAAC;AAEhF;;GAEG;AACH,MAAM,WAAW,oBAAoB;IACjC,kDAAkD;IAClD,MAAM,CAAC,EAAE,MAAM,GAAG,IAAI,CAAC;CAC1B;AAED;;;;GAIG;AACH,MAAM,WAAW,aAAa;IAC1B;;OAEG;IACH,UAAU,IAAI,oBAAoB,CAAC;IAEnC;;OAEG;IACH,UAAU,CAAC,OAAO,EAAE,OAAO,CAAC,oBAAoB,CAAC,GAAG,IAAI,CAAC;IAEzD;;OAEG;IACH,KAAK,CAAC,OAAO,EAAE,OAAO,CAAC,oBAAoB,CAAC,GAAG,aAAa,CAAC;IAE7D;;OAEG;IACH,KAAK,CAAC,OAAO,EAAE,MAAM,EAAE,IAAI,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,GAAG,IAAI,CAAC;IAE7D;;OAEG;IACH,SAAS,CAAC,SAAS,EAAE,KAAK,EAAE,OAAO,EAAE,MAAM,EAAE,IAAI,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,GAAG,IAAI,CAAC;IAEnF;;OAEG;IACH,QAAQ,CAAC,OAAO,EAAE,MAAM,EAAE,IAAI,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,GAAG,IAAI,CAAC;IAEhE;;OAEG;IACH,OAAO,CAAC,OAAO,EAAE,MAAM,EAAE,IAAI,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,GAAG,IAAI,CAAC;IAE/D;;OAEG;IACH,WAAW,CAAC,OAAO,EAAE,MAAM,GAAG,IAAI,CAAC;IAEnC;;OAEG;IACH,IAAI,CAAC,OAAO,EAAE,MAAM,EAAE,IAAI,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,GAAG,IAAI,CAAC;IAE5D;;OAEG;IACH,KAAK,CAAC,OAAO,EAAE,MAAM,EAAE,IAAI,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,GAAG,IAAI,CAAC;IAE7D;;OAEG;IACH,IAAI,CAAC,OAAO,EAAE,MAAM,EAAE,IAAI,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,GAAG,IAAI,CAAC;IAE5D;;OAEG;IACH,UAAU,CAAC,OAAO,EAAE,MAAM,GAAG,IAAI,CAAC;IAElC;;OAEG;IACH,YAAY,CAAC,KAAK,EAAE,MAAM,EAAE,OAAO,EAAE,MAAM,EAAE,IAAI,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,GAAG,IAAI,CAAC;CACtF;AAED;;;;;;;;;;;;;;;;;;;;;;;;;;;;;GA6BG;AACH,8BAAsB,iBAAkB,YAAW,aAAa;IAC5D,OAAO,CAAC,OAAO,CAAuB;IACtC,OAAO,CAAC,QAAQ,CAAC,cAAc,CAAqB;gBAExC,OAAO,GAAE,OAAO,CAAC,oBAAoB,CAAM;IAIvD;;;;;;;;;;OAUG;IACH,QAAQ,CAAC,YAAY,CAAC,KAAK,EAAE,MAAM,EAAE,OAAO,EAAE,MAAM,EAAE,IAAI,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,GAAG,IAAI;IAE3F;;;OAGG;IACH,SAAS,CAAC,QAAQ,CAAC,WAAW,CAAC,OAAO,EAAE,OAAO,CAAC,oBAAoB,CAAC,GAAG,aAAa;IAErF,UAAU,IAAI,oBAAoB;IAIlC,UAAU,CAAC,OAAO,EAAE,OAAO,CAAC,oBAAoB,CAAC,GAAG,IAAI;IAIxD,KAAK,CAAC,OAAO,EAAE,OAAO,CAAC,oBAAoB,CAAC,GAAG,aAAa;IAI5D,KAAK,CAAC,OAAO,EAAE,MAAM,EAAE,IAAI,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,GAAG,IAAI;IAI5D,SAAS,CAAC,SAAS,EAAE,KAAK,EAAE,OAAO,EAAE,MAAM,EAAE,IAAI,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,GAAG,IAAI;IAQlF,QAAQ,CAAC,OAAO,EAAE,MAAM,EAAE,IAAI,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,GAAG,IAAI;IAI/D,OAAO,CAAC,OAAO,EAAE,MAAM,EAAE,IAAI,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,GAAG,IAAI;IAI9D,WAAW,CAAC,OAAO,EAAE,MAAM,GAAG,IAAI;IAOlC,IAAI,CAAC,OAAO,EAAE,MAAM,EAAE,IAAI,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,GAAG,IAAI;IAI3D,KAAK,CAAC,OAAO,EAAE,MAAM,EAAE,IAAI,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,GAAG,IAAI;IAI5D,IAAI,CAAC,OAAO,EAAE,MAAM,EAAE,IAAI,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,GAAG,IAAI;IAI3D,UAAU,CAAC,OAAO,EAAE,MAAM,GAAG,IAAI;CAGpC;AAED;;;;;GAKG;AACH,qBAAa,eAAgB,SAAQ,iBAAiB;IAE9C,OAAO,CAAC,QAAQ,CAAC,QAAQ;gBAAR,QAAQ,EAAE,GAAG,EAC9B,OAAO,CAAC,EAAE,OAAO,CAAC,oBAAoB,CAAC;IAK3C,YAAY,CAAC,KAAK,EAAE,MAAM,EAAE,OAAO,EAAE,MAAM,EAAE,IAAI,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,GAAG,IAAI;IAIlF,SAAS,CAAC,WAAW,CAAC,OAAO,EAAE,OAAO,CAAC,oBAAoB,CAAC,GAAG,aAAa;CAM/E;AAED,OAAO,EAAE,GAAG,EAAE,GAAG,EAAE,QAAQ,EAAE,MAAM,EAAE,UAAU,EAAE,UAAU,EAAE,CAAC;AAC9D,YAAY,EAAE,aAAa,EAAE,CAAC"}
package/log.js CHANGED
@@ -1,3 +1,105 @@
1
1
  import log, { Log, Logger, LoggerJson, LoggerText, LogLevel } from '@apify/log';
2
+ /**
3
+ * Abstract base class for custom Crawlee logger implementations.
4
+ *
5
+ * Subclasses must implement two methods:
6
+ * - {@link BaseCrawleeLogger.logWithLevel} — the core logging dispatch
7
+ * - {@link BaseCrawleeLogger.createChild} — how to create a child logger instance
8
+ *
9
+ * All other `CrawleeLogger` methods (`error`, `warning`, `info`, `debug`, etc.)
10
+ * are derived automatically. Level filtering is entirely the responsibility of the
11
+ * underlying library — `logWithLevel()` is called for every message.
12
+ *
13
+ * **Example — Winston adapter:**
14
+ * ```typescript
15
+ * const CRAWLEE_TO_WINSTON = { 1: 'error', 2: 'warn', 3: 'warn', 4: 'info', 5: 'debug', 6: 'debug' };
16
+ *
17
+ * class WinstonAdapter extends BaseCrawleeLogger {
18
+ * constructor(private logger: winston.Logger, options?: Partial<CrawleeLoggerOptions>) {
19
+ * super(options);
20
+ * }
21
+ *
22
+ * logWithLevel(level: number, message: string, data?: Record<string, unknown>): void {
23
+ * this.logger.log(CRAWLEE_TO_WINSTON[level] ?? 'info', message, data);
24
+ * }
25
+ *
26
+ * protected createChild(options: Partial<CrawleeLoggerOptions>): CrawleeLogger {
27
+ * return new WinstonAdapter(this.logger.child({ prefix: options.prefix }), { ...this.getOptions(), ...options });
28
+ * }
29
+ * }
30
+ * ```
31
+ */
32
+ export class BaseCrawleeLogger {
33
+ options;
34
+ warningsLogged = new Set();
35
+ constructor(options = {}) {
36
+ this.options = options;
37
+ }
38
+ getOptions() {
39
+ return this.options;
40
+ }
41
+ setOptions(options) {
42
+ this.options = { ...this.options, ...options };
43
+ }
44
+ child(options) {
45
+ return this.createChild(options);
46
+ }
47
+ error(message, data) {
48
+ this.logWithLevel(LogLevel.ERROR, message, data);
49
+ }
50
+ exception(exception, message, data) {
51
+ this.logWithLevel(LogLevel.ERROR, `${message}: ${exception.message}`, {
52
+ ...data,
53
+ stack: exception.stack,
54
+ exception,
55
+ });
56
+ }
57
+ softFail(message, data) {
58
+ this.logWithLevel(LogLevel.SOFT_FAIL, message, data);
59
+ }
60
+ warning(message, data) {
61
+ this.logWithLevel(LogLevel.WARNING, message, data);
62
+ }
63
+ warningOnce(message) {
64
+ if (!this.warningsLogged.has(message)) {
65
+ this.warningsLogged.add(message);
66
+ this.warning(message);
67
+ }
68
+ }
69
+ info(message, data) {
70
+ this.logWithLevel(LogLevel.INFO, message, data);
71
+ }
72
+ debug(message, data) {
73
+ this.logWithLevel(LogLevel.DEBUG, message, data);
74
+ }
75
+ perf(message, data) {
76
+ this.logWithLevel(LogLevel.PERF, `[PERF] ${message}`, data);
77
+ }
78
+ deprecated(message) {
79
+ this.warningOnce(`[DEPRECATED] ${message}`);
80
+ }
81
+ }
82
+ /**
83
+ * Adapter that wraps `@apify/log`'s {@link Log} instance to implement the {@link CrawleeLogger} interface.
84
+ *
85
+ * This is the default logger used by Crawlee when no custom logger is configured.
86
+ * Users who want to use a different logging library should implement {@link BaseCrawleeLogger} directly.
87
+ */
88
+ export class ApifyLogAdapter extends BaseCrawleeLogger {
89
+ apifyLog;
90
+ constructor(apifyLog, options) {
91
+ super(options ?? {});
92
+ this.apifyLog = apifyLog;
93
+ }
94
+ logWithLevel(level, message, data) {
95
+ this.apifyLog.internal(level, message, data);
96
+ }
97
+ createChild(options) {
98
+ return new ApifyLogAdapter(this.apifyLog.child({ prefix: options.prefix ?? null }), {
99
+ ...this.getOptions(),
100
+ ...options,
101
+ });
102
+ }
103
+ }
2
104
  export { log, Log, LogLevel, Logger, LoggerJson, LoggerText };
3
105
  //# sourceMappingURL=log.js.map
package/log.js.map CHANGED
@@ -1 +1 @@
1
- {"version":3,"file":"log.js","sourceRoot":"","sources":["../src/log.ts"],"names":[],"mappings":"AAAA,OAAO,GAAG,EAAE,EAAE,GAAG,EAAE,MAAM,EAAE,UAAU,EAAiB,UAAU,EAAE,QAAQ,EAAE,MAAM,YAAY,CAAC;AAE/F,OAAO,EAAE,GAAG,EAAE,GAAG,EAAiB,QAAQ,EAAE,MAAM,EAAE,UAAU,EAAE,UAAU,EAAE,CAAC"}
1
+ {"version":3,"file":"log.js","sourceRoot":"","sources":["../src/log.ts"],"names":[],"mappings":"AACA,OAAO,GAAG,EAAE,EAAE,GAAG,EAAE,MAAM,EAAE,UAAU,EAAE,UAAU,EAAE,QAAQ,EAAE,MAAM,YAAY,CAAC;AAkFhF;;;;;;;;;;;;;;;;;;;;;;;;;;;;;GA6BG;AACH,MAAM,OAAgB,iBAAiB;IAC3B,OAAO,CAAuB;IACrB,cAAc,GAAG,IAAI,GAAG,EAAU,CAAC;IAEpD,YAAY,UAAyC,EAAE;QACnD,IAAI,CAAC,OAAO,GAAG,OAAO,CAAC;IAC3B,CAAC;IAqBD,UAAU;QACN,OAAO,IAAI,CAAC,OAAO,CAAC;IACxB,CAAC;IAED,UAAU,CAAC,OAAsC;QAC7C,IAAI,CAAC,OAAO,GAAG,EAAE,GAAG,IAAI,CAAC,OAAO,EAAE,GAAG,OAAO,EAAE,CAAC;IACnD,CAAC;IAED,KAAK,CAAC,OAAsC;QACxC,OAAO,IAAI,CAAC,WAAW,CAAC,OAAO,CAAC,CAAC;IACrC,CAAC;IAED,KAAK,CAAC,OAAe,EAAE,IAA8B;QACjD,IAAI,CAAC,YAAY,CAAC,QAAQ,CAAC,KAAK,EAAE,OAAO,EAAE,IAAI,CAAC,CAAC;IACrD,CAAC;IAED,SAAS,CAAC,SAAgB,EAAE,OAAe,EAAE,IAA8B;QACvE,IAAI,CAAC,YAAY,CAAC,QAAQ,CAAC,KAAK,EAAE,GAAG,OAAO,KAAK,SAAS,CAAC,OAAO,EAAE,EAAE;YAClE,GAAG,IAAI;YACP,KAAK,EAAE,SAAS,CAAC,KAAK;YACtB,SAAS;SACZ,CAAC,CAAC;IACP,CAAC;IAED,QAAQ,CAAC,OAAe,EAAE,IAA8B;QACpD,IAAI,CAAC,YAAY,CAAC,QAAQ,CAAC,SAAS,EAAE,OAAO,EAAE,IAAI,CAAC,CAAC;IACzD,CAAC;IAED,OAAO,CAAC,OAAe,EAAE,IAA8B;QACnD,IAAI,CAAC,YAAY,CAAC,QAAQ,CAAC,OAAO,EAAE,OAAO,EAAE,IAAI,CAAC,CAAC;IACvD,CAAC;IAED,WAAW,CAAC,OAAe;QACvB,IAAI,CAAC,IAAI,CAAC,cAAc,CAAC,GAAG,CAAC,OAAO,CAAC,EAAE,CAAC;YACpC,IAAI,CAAC,cAAc,CAAC,GAAG,CAAC,OAAO,CAAC,CAAC;YACjC,IAAI,CAAC,OAAO,CAAC,OAAO,CAAC,CAAC;QAC1B,CAAC;IACL,CAAC;IAED,IAAI,CAAC,OAAe,EAAE,IAA8B;QAChD,IAAI,CAAC,YAAY,CAAC,QAAQ,CAAC,IAAI,EAAE,OAAO,EAAE,IAAI,CAAC,CAAC;IACpD,CAAC;IAED,KAAK,CAAC,OAAe,EAAE,IAA8B;QACjD,IAAI,CAAC,YAAY,CAAC,QAAQ,CAAC,KAAK,EAAE,OAAO,EAAE,IAAI,CAAC,CAAC;IACrD,CAAC;IAED,IAAI,CAAC,OAAe,EAAE,IAA8B;QAChD,IAAI,CAAC,YAAY,CAAC,QAAQ,CAAC,IAAI,EAAE,UAAU,OAAO,EAAE,EAAE,IAAI,CAAC,CAAC;IAChE,CAAC;IAED,UAAU,CAAC,OAAe;QACtB,IAAI,CAAC,WAAW,CAAC,gBAAgB,OAAO,EAAE,CAAC,CAAC;IAChD,CAAC;CACJ;AAED;;;;;GAKG;AACH,MAAM,OAAO,eAAgB,SAAQ,iBAAiB;IAE7B;IADrB,YACqB,QAAa,EAC9B,OAAuC;QAEvC,KAAK,CAAC,OAAO,IAAI,EAAE,CAAC,CAAC;QAHJ,aAAQ,GAAR,QAAQ,CAAK;IAIlC,CAAC;IAED,YAAY,CAAC,KAAa,EAAE,OAAe,EAAE,IAA8B;QACvE,IAAI,CAAC,QAAQ,CAAC,QAAQ,CAAC,KAAiB,EAAE,OAAO,EAAE,IAAI,CAAC,CAAC;IAC7D,CAAC;IAES,WAAW,CAAC,OAAsC;QACxD,OAAO,IAAI,eAAe,CAAC,IAAI,CAAC,QAAQ,CAAC,KAAK,CAAC,EAAE,MAAM,EAAE,OAAO,CAAC,MAAM,IAAI,IAAI,EAAE,CAAC,EAAE;YAChF,GAAG,IAAI,CAAC,UAAU,EAAE;YACpB,GAAG,OAAO;SACb,CAAC,CAAC;IACP,CAAC;CACJ;AAED,OAAO,EAAE,GAAG,EAAE,GAAG,EAAE,QAAQ,EAAE,MAAM,EAAE,UAAU,EAAE,UAAU,EAAE,CAAC"}
package/package.json CHANGED
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "@crawlee/core",
3
- "version": "4.0.0-beta.4",
3
+ "version": "4.0.0-beta.40",
4
4
  "description": "The scalable web crawling and scraping library for JavaScript/Node.js. Enables development of data extraction and web automation jobs (not only) with headless Chrome and Puppeteer.",
5
5
  "engines": {
6
6
  "node": ">=22.0.0"
@@ -53,20 +53,19 @@
53
53
  "@apify/pseudo_url": "^2.0.59",
54
54
  "@apify/timeout": "^0.3.2",
55
55
  "@apify/utilities": "^2.15.5",
56
- "@crawlee/memory-storage": "4.0.0-beta.4",
57
- "@crawlee/types": "4.0.0-beta.4",
58
- "@crawlee/utils": "4.0.0-beta.4",
56
+ "@crawlee/memory-storage": "4.0.0-beta.40",
57
+ "@crawlee/types": "4.0.0-beta.40",
58
+ "@crawlee/utils": "4.0.0-beta.40",
59
59
  "@sapphire/async-queue": "^1.5.5",
60
60
  "@vladfrangu/async_event_emitter": "^2.4.6",
61
61
  "csv-stringify": "^6.5.2",
62
62
  "fs-extra": "^11.3.0",
63
- "got-scraping": "^4.1.1",
64
63
  "json5": "^2.2.3",
65
64
  "minimatch": "^10.0.1",
66
65
  "ow": "^2.0.0",
67
66
  "stream-json": "^1.9.1",
68
67
  "tldts": "^7.0.6",
69
- "tough-cookie": "^5.1.2",
68
+ "tough-cookie": "^6.0.0",
70
69
  "tslib": "^2.8.1",
71
70
  "type-fest": "^4.41.0"
72
71
  },
@@ -77,5 +76,5 @@
77
76
  }
78
77
  }
79
78
  },
80
- "gitHead": "3880cdebbcddf9e2a242bc89751e36e2ef5ae897"
79
+ "gitHead": "679534db27d04c0acf4737700bb979c040845762"
81
80
  }