clean-web-scraper 4.3.0 → 4.3.1

This diff shows the changes between publicly available versions of the package as released to one of the supported registries. It is provided for informational purposes only and reflects the package versions as they appear in their respective public registries.
Files changed (2)
  1. package/example-usage.js +7 -5
  2. package/package.json +2 -2
package/example-usage.js CHANGED
@@ -134,9 +134,11 @@ async function electronicintifada ( enable )
134
134
  "https://electronicintifada.net/review",
135
135
  "https://electronicintifada.net/artmusicculture",
136
136
  "https://electronicintifada.net/blog/editors",
137
- "https://electronicintifada.net/blog"
138
137
  ],
139
138
  exactExcludeList: [
139
+ "https://electronicintifada.net/blog",
140
+ /^https:\/\/electronicintifada\.net\/blog\/.*/,
141
+ /^https:\/\/electronicintifada\.net\/blog\?page=\d+$/,
140
142
  "https://electronicintifada.net",
141
143
  "https://electronicintifada.net/blogs",
142
144
  "https://electronicintifada.net/review",
@@ -149,10 +151,10 @@ async function electronicintifada ( enable )
149
151
  metadataFields: ["author", "articleTitle", "pageTitle", "description", "dataScrapedDate", "url"],
150
152
  maxArticles: 2000,
151
153
  maxDepth: 16,
152
- batchSize: 30,
154
+ batchSize: 40,
153
155
  axiosHeaders: headers,
154
- axiosMaxRetries: 3,
155
- axiosRetryDelay: 10000,
156
+ axiosMaxRetries: 2,
157
+ axiosRetryDelay: 8000,
156
158
  axiosProxy: {
157
159
  host: "localhost",
158
160
  port: 2080,
@@ -230,7 +232,7 @@ async function mondoweiss ( enable )
230
232
  maxDepth: 15,
231
233
  batchSize: 20,
232
234
  axiosHeaders: headers,
233
- axiosMaxRetries: 3,
235
+ axiosMaxRetries: 2,
234
236
  axiosRetryDelay: 10000,
235
237
  axiosProxy: {
236
238
  host: "localhost",
package/package.json CHANGED
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "clean-web-scraper",
3
- "version": "4.3.0",
3
+ "version": "4.3.1",
4
4
  "main": "main.js",
5
5
  "scripts": {
6
6
  "start": "node main.js",
@@ -30,4 +30,4 @@
30
30
  "puppeteer": "^24.1.1",
31
31
  "puppeteer-real-browser": "^1.3.22"
32
32
  }
33
- }
33
+ }