crawlee-one 1.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (131) hide show
  1. package/README.md +81 -0
  2. package/dist/cjs/cli/cli.d.ts +1 -0
  3. package/dist/cjs/cli/cli.js +61 -0
  4. package/dist/cjs/cli/cli.js.map +1 -0
  5. package/dist/cjs/cli/index.d.ts +2 -0
  6. package/dist/cjs/cli/index.js +6 -0
  7. package/dist/cjs/cli/index.js.map +1 -0
  8. package/dist/cjs/index.d.ts +24 -0
  9. package/dist/cjs/index.js +43 -0
  10. package/dist/cjs/index.js.map +1 -0
  11. package/dist/cjs/lib/actions/dom.d.ts +102 -0
  12. package/dist/cjs/lib/actions/dom.js +743 -0
  13. package/dist/cjs/lib/actions/dom.js.map +1 -0
  14. package/dist/cjs/lib/actions/domUtils.d.ts +42 -0
  15. package/dist/cjs/lib/actions/domUtils.js +126 -0
  16. package/dist/cjs/lib/actions/domUtils.js.map +1 -0
  17. package/dist/cjs/lib/actions/page.d.ts +69 -0
  18. package/dist/cjs/lib/actions/page.js +205 -0
  19. package/dist/cjs/lib/actions/page.js.map +1 -0
  20. package/dist/cjs/lib/actions/scrapeListing.d.ts +78 -0
  21. package/dist/cjs/lib/actions/scrapeListing.js +242 -0
  22. package/dist/cjs/lib/actions/scrapeListing.js.map +1 -0
  23. package/dist/cjs/lib/actor/actor.d.ts +90 -0
  24. package/dist/cjs/lib/actor/actor.js +306 -0
  25. package/dist/cjs/lib/actor/actor.js.map +1 -0
  26. package/dist/cjs/lib/actor/types.d.ts +162 -0
  27. package/dist/cjs/lib/actor/types.js +3 -0
  28. package/dist/cjs/lib/actor/types.js.map +1 -0
  29. package/dist/cjs/lib/actor.d.ts +189 -0
  30. package/dist/cjs/lib/actor.js +225 -0
  31. package/dist/cjs/lib/actor.js.map +1 -0
  32. package/dist/cjs/lib/actorSpec.d.ts +20 -0
  33. package/dist/cjs/lib/actorSpec.js +3 -0
  34. package/dist/cjs/lib/actorSpec.js.map +1 -0
  35. package/dist/cjs/lib/config.d.ts +561 -0
  36. package/dist/cjs/lib/config.js +707 -0
  37. package/dist/cjs/lib/config.js.map +1 -0
  38. package/dist/cjs/lib/dataset/maxCount.d.ts +30 -0
  39. package/dist/cjs/lib/dataset/maxCount.js +55 -0
  40. package/dist/cjs/lib/dataset/maxCount.js.map +1 -0
  41. package/dist/cjs/lib/dataset/pushData.d.ts +123 -0
  42. package/dist/cjs/lib/dataset/pushData.js +182 -0
  43. package/dist/cjs/lib/dataset/pushData.js.map +1 -0
  44. package/dist/cjs/lib/dataset.d.ts +98 -0
  45. package/dist/cjs/lib/dataset.js +122 -0
  46. package/dist/cjs/lib/dataset.js.map +1 -0
  47. package/dist/cjs/lib/dom.d.ts +78 -0
  48. package/dist/cjs/lib/dom.js +243 -0
  49. package/dist/cjs/lib/dom.js.map +1 -0
  50. package/dist/cjs/lib/error/errorHandler.d.ts +112 -0
  51. package/dist/cjs/lib/error/errorHandler.js +164 -0
  52. package/dist/cjs/lib/error/errorHandler.js.map +1 -0
  53. package/dist/cjs/lib/error/sentry.d.ts +11 -0
  54. package/dist/cjs/lib/error/sentry.js +60 -0
  55. package/dist/cjs/lib/error/sentry.js.map +1 -0
  56. package/dist/cjs/lib/integrations/apify.d.ts +67 -0
  57. package/dist/cjs/lib/integrations/apify.js +106 -0
  58. package/dist/cjs/lib/integrations/apify.js.map +1 -0
  59. package/dist/cjs/lib/integrations/types.d.ts +274 -0
  60. package/dist/cjs/lib/integrations/types.js +3 -0
  61. package/dist/cjs/lib/integrations/types.js.map +1 -0
  62. package/dist/cjs/lib/io/dataset.d.ts +67 -0
  63. package/dist/cjs/lib/io/dataset.js +86 -0
  64. package/dist/cjs/lib/io/dataset.js.map +1 -0
  65. package/dist/cjs/lib/io/maxCount.d.ts +30 -0
  66. package/dist/cjs/lib/io/maxCount.js +55 -0
  67. package/dist/cjs/lib/io/maxCount.js.map +1 -0
  68. package/dist/cjs/lib/io/pushData.d.ts +124 -0
  69. package/dist/cjs/lib/io/pushData.js +193 -0
  70. package/dist/cjs/lib/io/pushData.js.map +1 -0
  71. package/dist/cjs/lib/io/pushRequests.d.ts +38 -0
  72. package/dist/cjs/lib/io/pushRequests.js +63 -0
  73. package/dist/cjs/lib/io/pushRequests.js.map +1 -0
  74. package/dist/cjs/lib/io/requestQueue.d.ts +28 -0
  75. package/dist/cjs/lib/io/requestQueue.js +40 -0
  76. package/dist/cjs/lib/io/requestQueue.js.map +1 -0
  77. package/dist/cjs/lib/log.d.ts +38 -0
  78. package/dist/cjs/lib/log.js +54 -0
  79. package/dist/cjs/lib/log.js.map +1 -0
  80. package/dist/cjs/lib/migrate/localMigrator.d.ts +10 -0
  81. package/dist/cjs/lib/migrate/localMigrator.js +57 -0
  82. package/dist/cjs/lib/migrate/localMigrator.js.map +1 -0
  83. package/dist/cjs/lib/migrate/localState.d.ts +7 -0
  84. package/dist/cjs/lib/migrate/localState.js +43 -0
  85. package/dist/cjs/lib/migrate/localState.js.map +1 -0
  86. package/dist/cjs/lib/migrate/types.d.ts +6 -0
  87. package/dist/cjs/lib/migrate/types.js +3 -0
  88. package/dist/cjs/lib/migrate/types.js.map +1 -0
  89. package/dist/cjs/lib/readme/readme.d.ts +65 -0
  90. package/dist/cjs/lib/readme/readme.js +534 -0
  91. package/dist/cjs/lib/readme/readme.js.map +1 -0
  92. package/dist/cjs/lib/readme/types.d.ts +260 -0
  93. package/dist/cjs/lib/readme/types.js +54 -0
  94. package/dist/cjs/lib/readme/types.js.map +1 -0
  95. package/dist/cjs/lib/router.d.ts +132 -0
  96. package/dist/cjs/lib/router.js +165 -0
  97. package/dist/cjs/lib/router.js.map +1 -0
  98. package/dist/cjs/lib/scraper/scrapeListing.d.ts +78 -0
  99. package/dist/cjs/lib/scraper/scrapeListing.js +242 -0
  100. package/dist/cjs/lib/scraper/scrapeListing.js.map +1 -0
  101. package/dist/cjs/lib/test/actor.d.ts +21 -0
  102. package/dist/cjs/lib/test/actor.js +56 -0
  103. package/dist/cjs/lib/test/actor.js.map +1 -0
  104. package/dist/cjs/lib/test/mockApifyClient.d.ts +32 -0
  105. package/dist/cjs/lib/test/mockApifyClient.js +176 -0
  106. package/dist/cjs/lib/test/mockApifyClient.js.map +1 -0
  107. package/dist/cjs/types.d.ts +31 -0
  108. package/dist/cjs/types.js +3 -0
  109. package/dist/cjs/types.js.map +1 -0
  110. package/dist/cjs/utils/async.d.ts +19 -0
  111. package/dist/cjs/utils/async.js +74 -0
  112. package/dist/cjs/utils/async.js.map +1 -0
  113. package/dist/cjs/utils/error.d.ts +1 -0
  114. package/dist/cjs/utils/error.js +10 -0
  115. package/dist/cjs/utils/error.js.map +1 -0
  116. package/dist/cjs/utils/format.d.ts +9 -0
  117. package/dist/cjs/utils/format.js +19 -0
  118. package/dist/cjs/utils/format.js.map +1 -0
  119. package/dist/cjs/utils/package.d.ts +15 -0
  120. package/dist/cjs/utils/package.js +25 -0
  121. package/dist/cjs/utils/package.js.map +1 -0
  122. package/dist/cjs/utils/types.d.ts +6 -0
  123. package/dist/cjs/utils/types.js +9 -0
  124. package/dist/cjs/utils/types.js.map +1 -0
  125. package/dist/cjs/utils/url.d.ts +9 -0
  126. package/dist/cjs/utils/url.js +32 -0
  127. package/dist/cjs/utils/url.js.map +1 -0
  128. package/dist/cjs/utils/valueMonitor.d.ts +31 -0
  129. package/dist/cjs/utils/valueMonitor.js +91 -0
  130. package/dist/cjs/utils/valueMonitor.js.map +1 -0
  131. package/package.json +85 -0
@@ -0,0 +1,561 @@
1
+ import type { Actor } from 'apify';
2
+ import type { CheerioCrawlerOptions } from 'crawlee';
3
+ import Joi from 'joi';
4
+ import type { CrawlerUrl } from '../types';
5
+ import { LogLevel } from './log';
6
+ export type AllActorInputs = InputActorInput & CrawlerConfigActorInput & PerfActorInput & StartUrlsActorInput & LoggingActorInput & ProxyActorInput & PrivacyActorInput & RequestActorInput & OutputActorInput & MetamorphActorInput;
7
+ /** Crawler config fields that can be overriden from the actor input */
8
+ export type CrawlerConfigActorInput = Pick<CheerioCrawlerOptions, 'navigationTimeoutSecs' | 'ignoreSslErrors' | 'additionalMimeTypes' | 'suggestResponseEncoding' | 'forceResponseEncoding' | 'requestHandlerTimeoutSecs' | 'maxRequestRetries' | 'maxRequestsPerCrawl' | 'maxRequestsPerMinute' | 'minConcurrency' | 'maxConcurrency' | 'keepAlive'>;
9
+ /** Common input fields related to extending Actor input with remote or generated data */
10
+ export interface InputActorInput {
11
+ /**
12
+ * If set, the Actor input is extended with a config from this URL.
13
+ *
14
+ * For example, you can store your actor input in a source control, and import it here.
15
+ *
16
+ * In case of a conflict (if a field is defined both in Actor input and in imported input)
17
+ * the Actor input overwrites the imported fields.
18
+ *
19
+ * The URL must point to a JSON file containing a single object (the config).
20
+ */
21
+ inputExtendUrl?: string;
22
+ /**
23
+ * If set, the Actor input is extended with a config from this custom function.
24
+ *
25
+ * For example, you can store your actor input in a source control, and import it here.
26
+ *
27
+ * In case of a conflict (if a field is defined both in Actor input and in imported input)
28
+ * the Actor input overwrites the imported fields.
29
+ *
30
+ * The URL must point to a JSON file containing a single object (the config).
31
+ */
32
+ inputExtendFromFunction?: string;
33
+ }
34
+ /** Common input fields related to performance which are not part of the CrawlerConfig */
35
+ export interface PerfActorInput {
36
+ /**
37
+ * If set, multiple Requests will be handled by a single Actor instance.
38
+ *
39
+ * See official docs: https://docs.apify.com/platform/actors/development/performance#batch-jobs-win-over-the-single-jobs
40
+ *
41
+ * Example: If set to 20, then up to 20 requests will be handled in a single "go".
42
+ */
43
+ perfBatchSize?: number;
44
+ /**
45
+ * How long to wait between entries within a single batch.
46
+ *
47
+ * Increase this value if you're using batching and you're sending requests to the scraped website too fast.
48
+ *
49
+ * Example: If set to 1, then after each entry in a batch, wait 1 second before continuing.
50
+ */
51
+ perfBatchWaitSecs?: number;
52
+ }
53
+ /** Common input fields for defining URLs to scrape */
54
+ export interface StartUrlsActorInput {
55
+ /** URLs to start with, defined manually as a list of strings or crawler requests */
56
+ startUrls?: CrawlerUrl[];
57
+ /**
58
+ * Import starting URLs from an existing Dataset.
59
+ *
60
+ * String is in the format `datasetID#field` (e.g. `datasetid123#url`).
61
+ */
62
+ startUrlsFromDataset?: string;
63
+ /**
64
+ * Import or generate starting URLs using a custom function.
65
+ *
66
+ * The function has access to Apify's Actor class (under variable `io`), and actor's input
67
+ * and a shared state in the first argument.
68
+ *
69
+ * ```js
70
+ * // Example: Create and load URLs from a Dataset by combining multiple fields
71
+ * async ({ io, input, state, itemCacheKey }) => {
72
+ * const dataset = await io.openDataset(datasetNameOrId);
73
+ * const data = await dataset.getData();
74
+ * const urls = data.items.map((item) => `https://example.com/u/${item.userId}/list/${item.listId}`);
75
+ * return urls;
76
+ * }
77
+ * ```
78
+ */
79
+ startUrlsFromFunction?: string;
80
+ }
81
+ /** Common input fields related to logging setup */
82
+ export interface LoggingActorInput {
83
+ logLevel?: LogLevel;
84
+ /**
85
+ * Whether to send actor error reports to <a href="https://sentry.io/">Sentry</a>.
86
+ *
87
+ * This info is used by the author of this actor to identify broken integrations,
88
+ * and track down and fix issues.
89
+ */
90
+ errorSendToSentry?: boolean;
91
+ /**
92
+ * Dataset ID to which errors should be captured.
93
+ *
94
+ * Default: `'REPORTING'`.
95
+ */
96
+ errorReportingDatasetId?: string;
97
+ }
98
+ /** Common input fields related to proxy setup */
99
+ export interface ProxyActorInput {
100
+ proxy?: Parameters<Actor['createProxyConfiguration']>[0];
101
+ }
102
+ /** Common input fields related to actor requests */
103
+ export interface RequestActorInput {
104
+ /**
105
+ * If set, only at most this many requests will be scraped.
106
+ *
107
+ * The count is determined from the RequestQueue that's used for the Actor run.
108
+ *
109
+ * This means that if `requestMaxEntries` is set to 50, but the
110
+ * associated RequestQueue already handled 40 requests, then only 10 new requests
111
+ * will be handled.
112
+ */
113
+ requestMaxEntries?: number;
114
+ /**
115
+ * Option to freely transform a request using a custom function before pushing it to the RequestQueue.
116
+ *
117
+ * If not set, the request will remain as is.
118
+ *
119
+ * The function has access to Apify's Actor class (under variable `io`), and actor's input
120
+ * and a shared state in the second argument.
121
+ *
122
+ * `async (entry, { io, input, state, itemCacheKey }) => { ... }`
123
+ */
124
+ requestTransform?: string;
125
+ /**
126
+ * Use this if you need to run one-time initialization code before `requestTransform`.
127
+ *
128
+ * The function has access to Apify's Actor class (under variable `io`), and actor's input
129
+ * and a shared state in the first argument.
130
+ *
131
+ * `async ({ io, input, state, itemCacheKey }) => { ... }`
132
+ */
133
+ requestTransformBefore?: string;
134
+ /**
135
+ * Use this if you need to run one-time teardown code after `requestTransform`.
136
+ *
137
+ * The function has access to Apify's Actor class (under variable `io`), and actor's input
138
+ * and a shared state in the first argument.
139
+ *
140
+ * `async ({ io, input, state, itemCacheKey }) => { ... }`
141
+ */
142
+ requestTransformAfter?: string;
143
+ /**
144
+ * Option to filter a request using a custom function before pushing it to the RequestQueue.
145
+ *
146
+ * If not set, all requests will be included.
147
+ *
148
+ * This is done after `requestTransform`.
149
+ *
150
+ * The function has access to Apify's Actor class (under variable `io`), and actor's input
151
+ * and a shared state in the second argument.
152
+ *
153
+ * `async (entry, { io, input, state, itemCacheKey }) => boolean`
154
+ */
155
+ requestFilter?: string;
156
+ /**
157
+ * Use this if you need to run one-time initialization code before `requestFilter`.
158
+ *
159
+ * The function has access to Apify's Actor class (under variable `io`), and actor's input
160
+ * and a shared state in the first argument.
161
+ *
162
+ * `async ({ io, input, state, itemCacheKey }) => boolean`
163
+ */
164
+ requestFilterBefore?: string;
165
+ /**
166
+ * Use this if you need to run one-time initialization code after `requestFilter`.
167
+ *
168
+ * The function has access to Apify's Actor class (under variable `io`), and actor's input
169
+ * and a shared state in the first argument.
170
+ *
171
+ * `async ({ io, input, state, itemCacheKey }) => boolean`
172
+ */
173
+ requestFilterAfter?: string;
174
+ /** ID of the RequestQueue to which the requests should be pushed */
175
+ requestQueueId?: string;
176
+ }
177
+ /** Common input fields related to actor output */
178
+ export interface OutputActorInput {
179
+ /**
180
+ * If set, only at most this many entries will be scraped.
181
+ *
182
+ * The count is determined from the Dataset that's used for the Actor run.
183
+ *
184
+ * This means that if `outputMaxEntries` is set to 50, but the
185
+ * associated Dataset already has 40 items in it, then only 10 new entries
186
+ * will be saved.
187
+ */
188
+ outputMaxEntries?: number;
189
+ /**
190
+ * Option to select a subset of keys/fields of an entry that
191
+ * will be pushed to the dataset.
192
+ *
193
+ * If not set, all fields on an entry will be pushed to the dataset.
194
+ *
195
+ * This is done after `outputRenameFields`.
196
+ *
197
+ * Keys can be nested, e.g. `"someProp.value[0]"`. Nested path is
198
+ * resolved using Lodash.get().
199
+ */
200
+ outputPickFields?: string[];
201
+ /**
202
+ * Option to remap the keys before pushing the entries to the dataset.
203
+ *
204
+ * This is done before `outputRenameFields`.
205
+ *
206
+ * Keys can be nested, e.g. `"someProp.value[0]"`. Nested path is
207
+ * resolved using Lodash.get().
208
+ */
209
+ outputRenameFields?: Record<string, string>;
210
+ /**
211
+ * Option to freely transform the output data object using a custom function before pushing it to the dataset.
212
+ *
213
+ * If not set, the data will remain as is.
214
+ *
215
+ * This is done after `outputPickFields` and `outputRenameFields`.
216
+ *
217
+ * The function has access to Apify's Actor class (under variable `io`), and actor's input
218
+ * and a shared state in the second argument.
219
+ *
220
+ * `async (entry, { io, input, state, itemCacheKey }) => { ... }`
221
+ */
222
+ outputTransform?: string;
223
+ /**
224
+ * Use this if you need to run one-time initialization code before `outputTransform`.
225
+ *
226
+ * The function has access to Apify's Actor class (under variable `io`), and actor's input
227
+ * and a shared state in the first argument.
228
+ *
229
+ * `async ({ io, input, state, itemCacheKey }) => { ... }`
230
+ */
231
+ outputTransformBefore?: string;
232
+ /**
233
+ * Use this if you need to run one-time teardown code after `outputTransform`.
234
+ *
235
+ * The function has access to Apify's Actor class (under variable `io`), and actor's input
236
+ * and a shared state in the first argument.
237
+ *
238
+ * `async ({ io, input, state, itemCacheKey }) => { ... }`
239
+ */
240
+ outputTransformAfter?: string;
241
+ /**
242
+ * Option to filter out the data using a custom function before pushing it to the dataset.
243
+ *
244
+ * If not set, all entries will be included.
245
+ *
246
+ * This is done after `outputPickFields`, `outputRenameFields`, and `outputTransform`.
247
+ *
248
+ * The function has access to Apify's Actor class (under variable `io`), and actor's input
249
+ * and a shared state in the second argument.
250
+ *
251
+ * `async (entry, { io, input, state, itemCacheKey }) => boolean`
252
+ */
253
+ outputFilter?: string;
254
+ /**
255
+ * Use this if you need to run one-time initialization code before `outputFilter`.
256
+ *
257
+ * The function has access to Apify's Actor class (under variable `io`), and actor's input
258
+ * and a shared state in the first argument.
259
+ *
260
+ * `async ({ io, input, state, itemCacheKey }) => boolean`
261
+ */
262
+ outputFilterBefore?: string;
263
+ /**
264
+ * Use this if you need to run one-time initialization code after `outputFilter`.
265
+ *
266
+ * The function has access to Apify's Actor class (under variable `io`), and actor's input
267
+ * and a shared state in the first argument.
268
+ *
269
+ * `async ({ io, input, state, itemCacheKey }) => boolean`
270
+ */
271
+ outputFilterAfter?: string;
272
+ /** ID or name of the dataset to which the data should be pushed */
273
+ outputDatasetId?: string;
274
+ /** ID or name of the key-value store used as cache */
275
+ outputCacheStoreId?: string;
276
+ /** Define fields that will be used for cache key */
277
+ outputCachePrimaryKeys?: string[];
278
+ /** Define whether we want to add, remove, or overwrite cached entries with results from the actor run */
279
+ outputCacheActionOnResult?: 'add' | 'remove' | 'overwrite' | null;
280
+ }
281
+ /** Common input fields related to actor metamorphing */
282
+ export interface MetamorphActorInput {
283
+ /**
284
+ * If you want to run another actor with the same dataset after
285
+ * this actor has finished (AKA metamorph into another actor),
286
+ * then set the ID of the target actor.
287
+ *
288
+ * See https://docs.apify.com/sdk/python/docs/concepts/interacting-with-other-actors#actormetamorph
289
+ */
290
+ metamorphActorId?: string;
291
+ /**
292
+ * Tag or number of the target actor build to metamorph into (e.g. `beta` or `1.2.345`).
293
+ *
294
+ * See https://docs.apify.com/sdk/python/docs/concepts/interacting-with-other-actors#actormetamorph
295
+ */
296
+ metamorphActorBuild?: string;
297
+ /**
298
+ * Input passed to the follow-up (metamorph) actor.
299
+ *
300
+ * See https://docs.apify.com/sdk/python/docs/concepts/interacting-with-other-actors#actormetamorph
301
+ */
302
+ metamorphActorInput?: object;
303
+ }
304
+ /** Common input fields related to privacy setup */
305
+ export interface PrivacyActorInput {
306
+ includePersonalData?: boolean;
307
+ }
308
+ /** Common input fields related to actor input */
309
+ export declare const inputInput: {
310
+ inputExtendUrl: import("apify-actor-config").StringField<string, string>;
311
+ inputExtendFromFunction: import("apify-actor-config").StringField<string, string>;
312
+ };
313
+ /** Common input fields related to crawler setup */
314
+ export declare const crawlerInput: {
315
+ maxRequestRetries: import("apify-actor-config").IntegerField<number, string>;
316
+ maxRequestsPerMinute: import("apify-actor-config").IntegerField<number, string>;
317
+ maxRequestsPerCrawl: import("apify-actor-config").IntegerField<number, string>;
318
+ minConcurrency: import("apify-actor-config").IntegerField<number, string>;
319
+ maxConcurrency: import("apify-actor-config").IntegerField<number, string>;
320
+ navigationTimeoutSecs: import("apify-actor-config").IntegerField<number, string>;
321
+ requestHandlerTimeoutSecs: import("apify-actor-config").IntegerField<number, string>;
322
+ keepAlive: import("apify-actor-config").BooleanField<boolean>;
323
+ ignoreSslErrors: import("apify-actor-config").BooleanField<boolean>;
324
+ additionalMimeTypes: import("apify-actor-config").ArrayField<any[]>;
325
+ suggestResponseEncoding: import("apify-actor-config").StringField<string, string>;
326
+ forceResponseEncoding: import("apify-actor-config").StringField<string, string>;
327
+ };
328
+ /** Common input fields related to performance which are not part of the CrawlerConfig */
329
+ export declare const perfInput: {
330
+ perfBatchSize: import("apify-actor-config").IntegerField<number, string>;
331
+ perfBatchWaitSecs: import("apify-actor-config").IntegerField<number, string>;
332
+ };
333
+ /** Common input fields for defining URLs to scrape */
334
+ export declare const startUrlsInput: {
335
+ startUrls: import("apify-actor-config").ArrayField<any[]>;
336
+ startUrlsFromDataset: import("apify-actor-config").StringField<string, string>;
337
+ startUrlsFromFunction: import("apify-actor-config").StringField<string, string>;
338
+ };
339
+ /** Common input fields related to logging setup */
340
+ export declare const loggingInput: {
341
+ logLevel: import("apify-actor-config").StringField<"error" | "off" | "info" | "debug" | "warn", string>;
342
+ errorReportingDatasetId: import("apify-actor-config").StringField<string, string>;
343
+ errorSendToSentry: import("apify-actor-config").BooleanField<boolean>;
344
+ };
345
+ /** Common input fields related to proxy setup */
346
+ export declare const proxyInput: {
347
+ proxy: import("apify-actor-config").ObjectField<object>;
348
+ };
349
+ /** Common input fields related to proxy setup */
350
+ export declare const privacyInput: {
351
+ includePersonalData: import("apify-actor-config").BooleanField<boolean>;
352
+ };
353
+ /** Common input fields related to actor request */
354
+ export declare const requestInput: {
355
+ requestMaxEntries: import("apify-actor-config").IntegerField<number, string>;
356
+ requestTransform: import("apify-actor-config").StringField<string, string>;
357
+ requestTransformBefore: import("apify-actor-config").StringField<string, string>;
358
+ requestTransformAfter: import("apify-actor-config").StringField<string, string>;
359
+ requestFilter: import("apify-actor-config").StringField<string, string>;
360
+ requestFilterBefore: import("apify-actor-config").StringField<string, string>;
361
+ requestFilterAfter: import("apify-actor-config").StringField<string, string>;
362
+ requestQueueId: import("apify-actor-config").StringField<string, string>;
363
+ };
364
+ /** Common input fields related to actor output */
365
+ export declare const outputInput: {
366
+ outputMaxEntries: import("apify-actor-config").IntegerField<number, string>;
367
+ outputRenameFields: import("apify-actor-config").ObjectField<{
368
+ oldFieldName: string;
369
+ }>;
370
+ outputPickFields: import("apify-actor-config").ArrayField<string[]>;
371
+ outputTransform: import("apify-actor-config").StringField<string, string>;
372
+ outputTransformBefore: import("apify-actor-config").StringField<string, string>;
373
+ outputTransformAfter: import("apify-actor-config").StringField<string, string>;
374
+ outputFilter: import("apify-actor-config").StringField<string, string>;
375
+ outputFilterBefore: import("apify-actor-config").StringField<string, string>;
376
+ outputFilterAfter: import("apify-actor-config").StringField<string, string>;
377
+ outputDatasetId: import("apify-actor-config").StringField<string, string>;
378
+ outputCacheStoreId: import("apify-actor-config").StringField<string, string>;
379
+ outputCachePrimaryKeys: import("apify-actor-config").ArrayField<string[]>;
380
+ outputCacheActionOnResult: import("apify-actor-config").StringField<NonNullable<"add" | "remove" | "overwrite" | null | undefined>, string>;
381
+ };
382
+ /** Common input fields related to actor metamorphing */
383
+ export declare const metamorphInput: {
384
+ metamorphActorId: import("apify-actor-config").StringField<string, string>;
385
+ metamorphActorBuild: import("apify-actor-config").StringField<string, string>;
386
+ metamorphActorInput: import("apify-actor-config").ObjectField<{
387
+ uploadDatasetToGDrive: boolean;
388
+ }>;
389
+ };
390
+ export declare const allActorInputs: {
391
+ metamorphActorId: import("apify-actor-config").StringField<string, string>;
392
+ metamorphActorBuild: import("apify-actor-config").StringField<string, string>;
393
+ metamorphActorInput: import("apify-actor-config").ObjectField<{
394
+ uploadDatasetToGDrive: boolean;
395
+ }>;
396
+ logLevel: import("apify-actor-config").StringField<"error" | "off" | "info" | "debug" | "warn", string>;
397
+ errorReportingDatasetId: import("apify-actor-config").StringField<string, string>;
398
+ errorSendToSentry: import("apify-actor-config").BooleanField<boolean>;
399
+ perfBatchSize: import("apify-actor-config").IntegerField<number, string>;
400
+ perfBatchWaitSecs: import("apify-actor-config").IntegerField<number, string>;
401
+ maxRequestRetries: import("apify-actor-config").IntegerField<number, string>;
402
+ maxRequestsPerMinute: import("apify-actor-config").IntegerField<number, string>;
403
+ maxRequestsPerCrawl: import("apify-actor-config").IntegerField<number, string>;
404
+ minConcurrency: import("apify-actor-config").IntegerField<number, string>;
405
+ maxConcurrency: import("apify-actor-config").IntegerField<number, string>;
406
+ navigationTimeoutSecs: import("apify-actor-config").IntegerField<number, string>;
407
+ requestHandlerTimeoutSecs: import("apify-actor-config").IntegerField<number, string>;
408
+ keepAlive: import("apify-actor-config").BooleanField<boolean>;
409
+ ignoreSslErrors: import("apify-actor-config").BooleanField<boolean>;
410
+ additionalMimeTypes: import("apify-actor-config").ArrayField<any[]>;
411
+ suggestResponseEncoding: import("apify-actor-config").StringField<string, string>;
412
+ forceResponseEncoding: import("apify-actor-config").StringField<string, string>;
413
+ outputMaxEntries: import("apify-actor-config").IntegerField<number, string>;
414
+ outputRenameFields: import("apify-actor-config").ObjectField<{
415
+ oldFieldName: string;
416
+ }>;
417
+ outputPickFields: import("apify-actor-config").ArrayField<string[]>;
418
+ outputTransform: import("apify-actor-config").StringField<string, string>;
419
+ outputTransformBefore: import("apify-actor-config").StringField<string, string>;
420
+ outputTransformAfter: import("apify-actor-config").StringField<string, string>;
421
+ outputFilter: import("apify-actor-config").StringField<string, string>;
422
+ outputFilterBefore: import("apify-actor-config").StringField<string, string>;
423
+ outputFilterAfter: import("apify-actor-config").StringField<string, string>;
424
+ outputDatasetId: import("apify-actor-config").StringField<string, string>;
425
+ outputCacheStoreId: import("apify-actor-config").StringField<string, string>;
426
+ outputCachePrimaryKeys: import("apify-actor-config").ArrayField<string[]>;
427
+ outputCacheActionOnResult: import("apify-actor-config").StringField<NonNullable<"add" | "remove" | "overwrite" | null | undefined>, string>;
428
+ requestMaxEntries: import("apify-actor-config").IntegerField<number, string>;
429
+ requestTransform: import("apify-actor-config").StringField<string, string>;
430
+ requestTransformBefore: import("apify-actor-config").StringField<string, string>;
431
+ requestTransformAfter: import("apify-actor-config").StringField<string, string>;
432
+ requestFilter: import("apify-actor-config").StringField<string, string>;
433
+ requestFilterBefore: import("apify-actor-config").StringField<string, string>;
434
+ requestFilterAfter: import("apify-actor-config").StringField<string, string>;
435
+ requestQueueId: import("apify-actor-config").StringField<string, string>;
436
+ includePersonalData: import("apify-actor-config").BooleanField<boolean>;
437
+ proxy: import("apify-actor-config").ObjectField<object>;
438
+ startUrls: import("apify-actor-config").ArrayField<any[]>;
439
+ startUrlsFromDataset: import("apify-actor-config").StringField<string, string>;
440
+ startUrlsFromFunction: import("apify-actor-config").StringField<string, string>;
441
+ inputExtendUrl: import("apify-actor-config").StringField<string, string>;
442
+ inputExtendFromFunction: import("apify-actor-config").StringField<string, string>;
443
+ };
444
+ export declare const crawlerInputValidationFields: {
445
+ navigationTimeoutSecs: Joi.NumberSchema<number>;
446
+ ignoreSslErrors: Joi.BooleanSchema<boolean>;
447
+ additionalMimeTypes: Joi.ArraySchema<any[]>;
448
+ suggestResponseEncoding: Joi.StringSchema<string>;
449
+ forceResponseEncoding: Joi.StringSchema<string>;
450
+ requestHandlerTimeoutSecs: Joi.NumberSchema<number>;
451
+ maxRequestRetries: Joi.NumberSchema<number>;
452
+ maxRequestsPerCrawl: Joi.NumberSchema<number>;
453
+ maxRequestsPerMinute: Joi.NumberSchema<number>;
454
+ minConcurrency: Joi.NumberSchema<number>;
455
+ maxConcurrency: Joi.NumberSchema<number>;
456
+ keepAlive: Joi.BooleanSchema<boolean>;
457
+ };
458
+ export declare const perfInputValidationFields: {
459
+ perfBatchSize: Joi.NumberSchema<number>;
460
+ perfBatchWaitSecs: Joi.NumberSchema<number>;
461
+ };
462
+ export declare const inputInputValidationFields: {
463
+ inputExtendUrl: Joi.StringSchema<string>;
464
+ inputExtendFromFunction: Joi.StringSchema<string>;
465
+ };
466
+ export declare const startUrlsInputValidationFields: {
467
+ startUrls: Joi.ArraySchema<any[]>;
468
+ startUrlsFromDataset: Joi.StringSchema<string>;
469
+ startUrlsFromFunction: Joi.StringSchema<string>;
470
+ };
471
+ export declare const loggingInputValidationFields: {
472
+ logLevel: Joi.StringSchema<string>;
473
+ errorReportingDatasetId: Joi.StringSchema<string>;
474
+ errorSendToSentry: Joi.BooleanSchema<boolean>;
475
+ };
476
+ export declare const proxyInputValidationFields: {
477
+ proxy: Joi.ObjectSchema<any>;
478
+ };
479
+ export declare const privacyInputValidationFields: {
480
+ includePersonalData: Joi.BooleanSchema<boolean>;
481
+ };
482
+ export declare const requestInputValidationFields: {
483
+ requestMaxEntries: Joi.NumberSchema<number>;
484
+ requestTransform: Joi.StringSchema<string>;
485
+ requestTransformBefore: Joi.StringSchema<string>;
486
+ requestTransformAfter: Joi.StringSchema<string>;
487
+ requestFilter: Joi.StringSchema<string>;
488
+ requestFilterBefore: Joi.StringSchema<string>;
489
+ requestFilterAfter: Joi.StringSchema<string>;
490
+ requestQueueId: Joi.StringSchema<string>;
491
+ };
492
+ export declare const outputInputValidationFields: {
493
+ outputMaxEntries: Joi.NumberSchema<number>;
494
+ outputPickFields: Joi.ArraySchema<any[]>;
495
+ outputRenameFields: Joi.ObjectSchema<any>;
496
+ outputTransform: Joi.StringSchema<string>;
497
+ outputTransformBefore: Joi.StringSchema<string>;
498
+ outputTransformAfter: Joi.StringSchema<string>;
499
+ outputFilter: Joi.StringSchema<string>;
500
+ outputFilterBefore: Joi.StringSchema<string>;
501
+ outputFilterAfter: Joi.StringSchema<string>;
502
+ outputCacheStoreId: Joi.StringSchema<string>;
503
+ outputCachePrimaryKeys: Joi.ArraySchema<any[]>;
504
+ outputCacheActionOnResult: Joi.StringSchema<string>;
505
+ outputDatasetId: Joi.StringSchema<string>;
506
+ };
507
+ export declare const metamorphInputValidationFields: {
508
+ metamorphActorId: Joi.StringSchema<string>;
509
+ metamorphActorBuild: Joi.StringSchema<string>;
510
+ metamorphActorInput: Joi.ObjectSchema<any>;
511
+ };
512
+ export declare const allActorInputValidationFields: {
513
+ metamorphActorId: Joi.StringSchema<string>;
514
+ metamorphActorBuild: Joi.StringSchema<string>;
515
+ metamorphActorInput: Joi.ObjectSchema<any>;
516
+ logLevel: Joi.StringSchema<string>;
517
+ errorReportingDatasetId: Joi.StringSchema<string>;
518
+ errorSendToSentry: Joi.BooleanSchema<boolean>;
519
+ perfBatchSize: Joi.NumberSchema<number>;
520
+ perfBatchWaitSecs: Joi.NumberSchema<number>;
521
+ navigationTimeoutSecs: Joi.NumberSchema<number>;
522
+ ignoreSslErrors: Joi.BooleanSchema<boolean>;
523
+ additionalMimeTypes: Joi.ArraySchema<any[]>;
524
+ suggestResponseEncoding: Joi.StringSchema<string>;
525
+ forceResponseEncoding: Joi.StringSchema<string>;
526
+ requestHandlerTimeoutSecs: Joi.NumberSchema<number>;
527
+ maxRequestRetries: Joi.NumberSchema<number>;
528
+ maxRequestsPerCrawl: Joi.NumberSchema<number>;
529
+ maxRequestsPerMinute: Joi.NumberSchema<number>;
530
+ minConcurrency: Joi.NumberSchema<number>;
531
+ maxConcurrency: Joi.NumberSchema<number>;
532
+ keepAlive: Joi.BooleanSchema<boolean>;
533
+ outputMaxEntries: Joi.NumberSchema<number>;
534
+ outputPickFields: Joi.ArraySchema<any[]>;
535
+ outputRenameFields: Joi.ObjectSchema<any>;
536
+ outputTransform: Joi.StringSchema<string>;
537
+ outputTransformBefore: Joi.StringSchema<string>;
538
+ outputTransformAfter: Joi.StringSchema<string>;
539
+ outputFilter: Joi.StringSchema<string>;
540
+ outputFilterBefore: Joi.StringSchema<string>;
541
+ outputFilterAfter: Joi.StringSchema<string>;
542
+ outputCacheStoreId: Joi.StringSchema<string>;
543
+ outputCachePrimaryKeys: Joi.ArraySchema<any[]>;
544
+ outputCacheActionOnResult: Joi.StringSchema<string>;
545
+ outputDatasetId: Joi.StringSchema<string>;
546
+ requestMaxEntries: Joi.NumberSchema<number>;
547
+ requestTransform: Joi.StringSchema<string>;
548
+ requestTransformBefore: Joi.StringSchema<string>;
549
+ requestTransformAfter: Joi.StringSchema<string>;
550
+ requestFilter: Joi.StringSchema<string>;
551
+ requestFilterBefore: Joi.StringSchema<string>;
552
+ requestFilterAfter: Joi.StringSchema<string>;
553
+ requestQueueId: Joi.StringSchema<string>;
554
+ includePersonalData: Joi.BooleanSchema<boolean>;
555
+ proxy: Joi.ObjectSchema<any>;
556
+ startUrls: Joi.ArraySchema<any[]>;
557
+ startUrlsFromDataset: Joi.StringSchema<string>;
558
+ startUrlsFromFunction: Joi.StringSchema<string>;
559
+ inputExtendUrl: Joi.StringSchema<string>;
560
+ inputExtendFromFunction: Joi.StringSchema<string>;
561
+ };