@kreuzberg/kreuzcrawl 0.1.1 → 0.1.2
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/Cargo.toml +5 -1
- package/index.d.ts +1 -31
- package/index.js +52 -53
- package/npm/darwin-arm64/kreuzcrawl-node.darwin-arm64.node +0 -0
- package/npm/darwin-arm64/package.json +1 -1
- package/npm/kreuzberg-kreuzcrawl-darwin-arm64-0.1.2.tgz +0 -0
- package/npm/kreuzberg-kreuzcrawl-linux-arm64-gnu-0.1.2.tgz +0 -0
- package/npm/kreuzberg-kreuzcrawl-linux-x64-gnu-0.1.2.tgz +0 -0
- package/npm/kreuzberg-kreuzcrawl-win32-x64-msvc-0.1.2.tgz +0 -0
- package/npm/linux-arm64-gnu/kreuzcrawl-node.linux-arm64-gnu.node +0 -0
- package/npm/linux-arm64-gnu/package.json +1 -1
- package/npm/linux-x64-gnu/kreuzcrawl-node.linux-x64-gnu.node +0 -0
- package/npm/linux-x64-gnu/package.json +1 -1
- package/npm/win32-x64-msvc/kreuzcrawl-node.win32-x64-msvc.node +0 -0
- package/npm/win32-x64-msvc/package.json +1 -1
- package/package.json +5 -5
- package/src/lib.rs +13 -105
- package/npm/kreuzberg-kreuzcrawl-darwin-arm64-0.1.1.tgz +0 -0
- package/npm/kreuzberg-kreuzcrawl-linux-arm64-gnu-0.1.1.tgz +0 -0
- package/npm/kreuzberg-kreuzcrawl-linux-x64-gnu-0.1.1.tgz +0 -0
- package/npm/kreuzberg-kreuzcrawl-win32-x64-msvc-0.1.1.tgz +0 -0
package/Cargo.toml
CHANGED
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
[package]
|
|
2
2
|
name = "kreuzcrawl-node"
|
|
3
|
-
version = "0.1.1"
|
|
3
|
+
version = "0.1.2"
|
|
4
4
|
edition = "2024"
|
|
5
5
|
license = "Elastic-2.0"
|
|
6
6
|
|
|
@@ -16,3 +16,7 @@ serde_json = "1"
|
|
|
16
16
|
|
|
17
17
|
[build-dependencies]
|
|
18
18
|
napi-build = "2"
|
|
19
|
+
|
|
20
|
+
[lints.clippy]
|
|
21
|
+
duplicated_attributes = "allow"
|
|
22
|
+
unwrap_used = "allow"
|
package/index.d.ts
CHANGED
|
@@ -12,14 +12,6 @@ export declare function crawl(engine: JsCrawlEngineHandle, url: string): Promise
|
|
|
12
12
|
|
|
13
13
|
export declare function createEngine(config?: JsCrawlConfig | undefined | null): JsCrawlEngineHandle
|
|
14
14
|
|
|
15
|
-
export interface JsActionResult {
|
|
16
|
-
actionIndex?: number
|
|
17
|
-
actionType?: string
|
|
18
|
-
success?: boolean
|
|
19
|
-
data?: string
|
|
20
|
-
error?: string
|
|
21
|
-
}
|
|
22
|
-
|
|
23
15
|
export interface JsArticleMetadata {
|
|
24
16
|
publishedTime?: string
|
|
25
17
|
modifiedTime?: string
|
|
@@ -83,16 +75,6 @@ export declare const enum JsBrowserWait {
|
|
|
83
75
|
Fixed = 'fixed'
|
|
84
76
|
}
|
|
85
77
|
|
|
86
|
-
export interface JsCachedPage {
|
|
87
|
-
url?: string
|
|
88
|
-
statusCode?: number
|
|
89
|
-
contentType?: string
|
|
90
|
-
body?: string
|
|
91
|
-
etag?: string
|
|
92
|
-
lastModified?: string
|
|
93
|
-
cachedAt?: number
|
|
94
|
-
}
|
|
95
|
-
|
|
96
78
|
export interface JsCitationReference {
|
|
97
79
|
index?: number
|
|
98
80
|
url?: string
|
|
@@ -123,6 +105,7 @@ export interface JsCrawlConfig {
|
|
|
123
105
|
excludePaths?: Array<string>
|
|
124
106
|
customHeaders?: Record<string, string>
|
|
125
107
|
requestTimeout?: number
|
|
108
|
+
rateLimitMs?: number
|
|
126
109
|
maxRedirects?: number
|
|
127
110
|
retryCount?: number
|
|
128
111
|
retryCodes?: Array<number>
|
|
@@ -148,12 +131,6 @@ export interface JsCrawlConfig {
|
|
|
148
131
|
saveBrowserProfile?: boolean
|
|
149
132
|
}
|
|
150
133
|
|
|
151
|
-
export declare const enum JsCrawlEvent {
|
|
152
|
-
Page = 'Page',
|
|
153
|
-
Error = 'Error',
|
|
154
|
-
Complete = 'Complete'
|
|
155
|
-
}
|
|
156
|
-
|
|
157
134
|
export interface JsCrawlPageResult {
|
|
158
135
|
url?: string
|
|
159
136
|
normalizedUrl?: string
|
|
@@ -258,13 +235,6 @@ export declare const enum JsImageSource {
|
|
|
258
235
|
TwitterImage = 'twitter_image'
|
|
259
236
|
}
|
|
260
237
|
|
|
261
|
-
export interface JsInteractionResult {
|
|
262
|
-
actionResults?: Array<JsActionResult>
|
|
263
|
-
finalHtml?: string
|
|
264
|
-
finalUrl?: string
|
|
265
|
-
screenshot?: Array<number>
|
|
266
|
-
}
|
|
267
|
-
|
|
268
238
|
export interface JsJsonLdEntry {
|
|
269
239
|
schemaType?: string
|
|
270
240
|
name?: string
|
package/index.js
CHANGED
|
@@ -77,8 +77,8 @@ function requireNative() {
|
|
|
77
77
|
try {
|
|
78
78
|
const binding = require('@kreuzberg/kreuzcrawl-android-arm64')
|
|
79
79
|
const bindingPackageVersion = require('@kreuzberg/kreuzcrawl-android-arm64/package.json').version
|
|
80
|
-
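if (bindingPackageVersion !== '0.1.1' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {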
|
|
81
|
-
throw new Error(`Native binding package version mismatch, expected 0.1.1 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
80
|
+
if (bindingPackageVersion !== '0.1.2' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
81
|
+
throw new Error(`Native binding package version mismatch, expected 0.1.2 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
82
82
|
}
|
|
83
83
|
return binding
|
|
84
84
|
} catch (e) {
|
|
@@ -93,8 +93,8 @@ function requireNative() {
|
|
|
93
93
|
try {
|
|
94
94
|
const binding = require('@kreuzberg/kreuzcrawl-android-arm-eabi')
|
|
95
95
|
const bindingPackageVersion = require('@kreuzberg/kreuzcrawl-android-arm-eabi/package.json').version
|
|
96
|
-
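if (bindingPackageVersion !== '0.1.1' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {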
|
|
97
|
-
throw new Error(`Native binding package version mismatch, expected 0.1.1 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
96
|
+
if (bindingPackageVersion !== '0.1.2' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
97
|
+
throw new Error(`Native binding package version mismatch, expected 0.1.2 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
98
98
|
}
|
|
99
99
|
return binding
|
|
100
100
|
} catch (e) {
|
|
@@ -114,8 +114,8 @@ function requireNative() {
|
|
|
114
114
|
try {
|
|
115
115
|
const binding = require('@kreuzberg/kreuzcrawl-win32-x64-gnu')
|
|
116
116
|
const bindingPackageVersion = require('@kreuzberg/kreuzcrawl-win32-x64-gnu/package.json').version
|
|
117
|
-
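if (bindingPackageVersion !== '0.1.1' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {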
|
|
118
|
-
throw new Error(`Native binding package version mismatch, expected 0.1.1 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
117
|
+
if (bindingPackageVersion !== '0.1.2' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
118
|
+
throw new Error(`Native binding package version mismatch, expected 0.1.2 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
119
119
|
}
|
|
120
120
|
return binding
|
|
121
121
|
} catch (e) {
|
|
@@ -130,8 +130,8 @@ function requireNative() {
|
|
|
130
130
|
try {
|
|
131
131
|
const binding = require('@kreuzberg/kreuzcrawl-win32-x64-msvc')
|
|
132
132
|
const bindingPackageVersion = require('@kreuzberg/kreuzcrawl-win32-x64-msvc/package.json').version
|
|
133
|
-
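if (bindingPackageVersion !== '0.1.1' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {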
|
|
134
|
-
throw new Error(`Native binding package version mismatch, expected 0.1.1 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
133
|
+
if (bindingPackageVersion !== '0.1.2' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
134
|
+
throw new Error(`Native binding package version mismatch, expected 0.1.2 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
135
135
|
}
|
|
136
136
|
return binding
|
|
137
137
|
} catch (e) {
|
|
@@ -147,8 +147,8 @@ function requireNative() {
|
|
|
147
147
|
try {
|
|
148
148
|
const binding = require('@kreuzberg/kreuzcrawl-win32-ia32-msvc')
|
|
149
149
|
const bindingPackageVersion = require('@kreuzberg/kreuzcrawl-win32-ia32-msvc/package.json').version
|
|
150
|
-
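if (bindingPackageVersion !== '0.1.1' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {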
|
|
151
|
-
throw new Error(`Native binding package version mismatch, expected 0.1.1 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
150
|
+
if (bindingPackageVersion !== '0.1.2' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
151
|
+
throw new Error(`Native binding package version mismatch, expected 0.1.2 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
152
152
|
}
|
|
153
153
|
return binding
|
|
154
154
|
} catch (e) {
|
|
@@ -163,8 +163,8 @@ function requireNative() {
|
|
|
163
163
|
try {
|
|
164
164
|
const binding = require('@kreuzberg/kreuzcrawl-win32-arm64-msvc')
|
|
165
165
|
const bindingPackageVersion = require('@kreuzberg/kreuzcrawl-win32-arm64-msvc/package.json').version
|
|
166
|
-
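if (bindingPackageVersion !== '0.1.1' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {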
|
|
167
|
-
throw new Error(`Native binding package version mismatch, expected 0.1.1 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
166
|
+
if (bindingPackageVersion !== '0.1.2' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
167
|
+
throw new Error(`Native binding package version mismatch, expected 0.1.2 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
168
168
|
}
|
|
169
169
|
return binding
|
|
170
170
|
} catch (e) {
|
|
@@ -182,8 +182,8 @@ function requireNative() {
|
|
|
182
182
|
try {
|
|
183
183
|
const binding = require('@kreuzberg/kreuzcrawl-darwin-universal')
|
|
184
184
|
const bindingPackageVersion = require('@kreuzberg/kreuzcrawl-darwin-universal/package.json').version
|
|
185
|
-
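if (bindingPackageVersion !== '0.1.1' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {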
|
|
186
|
-
throw new Error(`Native binding package version mismatch, expected 0.1.1 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
185
|
+
if (bindingPackageVersion !== '0.1.2' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
186
|
+
throw new Error(`Native binding package version mismatch, expected 0.1.2 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
187
187
|
}
|
|
188
188
|
return binding
|
|
189
189
|
} catch (e) {
|
|
@@ -198,8 +198,8 @@ function requireNative() {
|
|
|
198
198
|
try {
|
|
199
199
|
const binding = require('@kreuzberg/kreuzcrawl-darwin-x64')
|
|
200
200
|
const bindingPackageVersion = require('@kreuzberg/kreuzcrawl-darwin-x64/package.json').version
|
|
201
|
-
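if (bindingPackageVersion !== '0.1.1' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {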
|
|
202
|
-
throw new Error(`Native binding package version mismatch, expected 0.1.1 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
201
|
+
if (bindingPackageVersion !== '0.1.2' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
202
|
+
throw new Error(`Native binding package version mismatch, expected 0.1.2 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
203
203
|
}
|
|
204
204
|
return binding
|
|
205
205
|
} catch (e) {
|
|
@@ -214,8 +214,8 @@ function requireNative() {
|
|
|
214
214
|
try {
|
|
215
215
|
const binding = require('@kreuzberg/kreuzcrawl-darwin-arm64')
|
|
216
216
|
const bindingPackageVersion = require('@kreuzberg/kreuzcrawl-darwin-arm64/package.json').version
|
|
217
|
-
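if (bindingPackageVersion !== '0.1.1' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {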
|
|
218
|
-
throw new Error(`Native binding package version mismatch, expected 0.1.1 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
217
|
+
if (bindingPackageVersion !== '0.1.2' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
218
|
+
throw new Error(`Native binding package version mismatch, expected 0.1.2 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
219
219
|
}
|
|
220
220
|
return binding
|
|
221
221
|
} catch (e) {
|
|
@@ -234,8 +234,8 @@ function requireNative() {
|
|
|
234
234
|
try {
|
|
235
235
|
const binding = require('@kreuzberg/kreuzcrawl-freebsd-x64')
|
|
236
236
|
const bindingPackageVersion = require('@kreuzberg/kreuzcrawl-freebsd-x64/package.json').version
|
|
237
|
-
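if (bindingPackageVersion !== '0.1.1' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {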
|
|
238
|
-
throw new Error(`Native binding package version mismatch, expected 0.1.1 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
237
|
+
if (bindingPackageVersion !== '0.1.2' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
238
|
+
throw new Error(`Native binding package version mismatch, expected 0.1.2 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
239
239
|
}
|
|
240
240
|
return binding
|
|
241
241
|
} catch (e) {
|
|
@@ -250,8 +250,8 @@ function requireNative() {
|
|
|
250
250
|
try {
|
|
251
251
|
const binding = require('@kreuzberg/kreuzcrawl-freebsd-arm64')
|
|
252
252
|
const bindingPackageVersion = require('@kreuzberg/kreuzcrawl-freebsd-arm64/package.json').version
|
|
253
|
-
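if (bindingPackageVersion !== '0.1.1' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {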
|
|
254
|
-
throw new Error(`Native binding package version mismatch, expected 0.1.1 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
253
|
+
if (bindingPackageVersion !== '0.1.2' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
254
|
+
throw new Error(`Native binding package version mismatch, expected 0.1.2 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
255
255
|
}
|
|
256
256
|
return binding
|
|
257
257
|
} catch (e) {
|
|
@@ -271,8 +271,8 @@ function requireNative() {
|
|
|
271
271
|
try {
|
|
272
272
|
const binding = require('@kreuzberg/kreuzcrawl-linux-x64-musl')
|
|
273
273
|
const bindingPackageVersion = require('@kreuzberg/kreuzcrawl-linux-x64-musl/package.json').version
|
|
274
|
-
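if (bindingPackageVersion !== '0.1.1' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {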
|
|
275
|
-
throw new Error(`Native binding package version mismatch, expected 0.1.1 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
274
|
+
if (bindingPackageVersion !== '0.1.2' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
275
|
+
throw new Error(`Native binding package version mismatch, expected 0.1.2 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
276
276
|
}
|
|
277
277
|
return binding
|
|
278
278
|
} catch (e) {
|
|
@@ -287,8 +287,8 @@ function requireNative() {
|
|
|
287
287
|
try {
|
|
288
288
|
const binding = require('@kreuzberg/kreuzcrawl-linux-x64-gnu')
|
|
289
289
|
const bindingPackageVersion = require('@kreuzberg/kreuzcrawl-linux-x64-gnu/package.json').version
|
|
290
|
-
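if (bindingPackageVersion !== '0.1.1' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {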
|
|
291
|
-
throw new Error(`Native binding package version mismatch, expected 0.1.1 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
290
|
+
if (bindingPackageVersion !== '0.1.2' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
291
|
+
throw new Error(`Native binding package version mismatch, expected 0.1.2 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
292
292
|
}
|
|
293
293
|
return binding
|
|
294
294
|
} catch (e) {
|
|
@@ -305,8 +305,8 @@ function requireNative() {
|
|
|
305
305
|
try {
|
|
306
306
|
const binding = require('@kreuzberg/kreuzcrawl-linux-arm64-musl')
|
|
307
307
|
const bindingPackageVersion = require('@kreuzberg/kreuzcrawl-linux-arm64-musl/package.json').version
|
|
308
|
-
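if (bindingPackageVersion !== '0.1.1' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {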
|
|
309
|
-
throw new Error(`Native binding package version mismatch, expected 0.1.1 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
308
|
+
if (bindingPackageVersion !== '0.1.2' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
309
|
+
throw new Error(`Native binding package version mismatch, expected 0.1.2 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
310
310
|
}
|
|
311
311
|
return binding
|
|
312
312
|
} catch (e) {
|
|
@@ -321,8 +321,8 @@ function requireNative() {
|
|
|
321
321
|
try {
|
|
322
322
|
const binding = require('@kreuzberg/kreuzcrawl-linux-arm64-gnu')
|
|
323
323
|
const bindingPackageVersion = require('@kreuzberg/kreuzcrawl-linux-arm64-gnu/package.json').version
|
|
324
|
-
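if (bindingPackageVersion !== '0.1.1' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {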
|
|
325
|
-
throw new Error(`Native binding package version mismatch, expected 0.1.1 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
324
|
+
if (bindingPackageVersion !== '0.1.2' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
325
|
+
throw new Error(`Native binding package version mismatch, expected 0.1.2 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
326
326
|
}
|
|
327
327
|
return binding
|
|
328
328
|
} catch (e) {
|
|
@@ -339,8 +339,8 @@ function requireNative() {
|
|
|
339
339
|
try {
|
|
340
340
|
const binding = require('@kreuzberg/kreuzcrawl-linux-arm-musleabihf')
|
|
341
341
|
const bindingPackageVersion = require('@kreuzberg/kreuzcrawl-linux-arm-musleabihf/package.json').version
|
|
342
|
-
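if (bindingPackageVersion !== '0.1.1' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {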
|
|
343
|
-
throw new Error(`Native binding package version mismatch, expected 0.1.1 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
342
|
+
if (bindingPackageVersion !== '0.1.2' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
343
|
+
throw new Error(`Native binding package version mismatch, expected 0.1.2 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
344
344
|
}
|
|
345
345
|
return binding
|
|
346
346
|
} catch (e) {
|
|
@@ -355,8 +355,8 @@ function requireNative() {
|
|
|
355
355
|
try {
|
|
356
356
|
const binding = require('@kreuzberg/kreuzcrawl-linux-arm-gnueabihf')
|
|
357
357
|
const bindingPackageVersion = require('@kreuzberg/kreuzcrawl-linux-arm-gnueabihf/package.json').version
|
|
358
|
-
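if (bindingPackageVersion !== '0.1.1' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {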
|
|
359
|
-
throw new Error(`Native binding package version mismatch, expected 0.1.1 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
358
|
+
if (bindingPackageVersion !== '0.1.2' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
359
|
+
throw new Error(`Native binding package version mismatch, expected 0.1.2 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
360
360
|
}
|
|
361
361
|
return binding
|
|
362
362
|
} catch (e) {
|
|
@@ -373,8 +373,8 @@ function requireNative() {
|
|
|
373
373
|
try {
|
|
374
374
|
const binding = require('@kreuzberg/kreuzcrawl-linux-loong64-musl')
|
|
375
375
|
const bindingPackageVersion = require('@kreuzberg/kreuzcrawl-linux-loong64-musl/package.json').version
|
|
376
|
-
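if (bindingPackageVersion !== '0.1.1' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {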
|
|
377
|
-
throw new Error(`Native binding package version mismatch, expected 0.1.1 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
376
|
+
if (bindingPackageVersion !== '0.1.2' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
377
|
+
throw new Error(`Native binding package version mismatch, expected 0.1.2 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
378
378
|
}
|
|
379
379
|
return binding
|
|
380
380
|
} catch (e) {
|
|
@@ -389,8 +389,8 @@ function requireNative() {
|
|
|
389
389
|
try {
|
|
390
390
|
const binding = require('@kreuzberg/kreuzcrawl-linux-loong64-gnu')
|
|
391
391
|
const bindingPackageVersion = require('@kreuzberg/kreuzcrawl-linux-loong64-gnu/package.json').version
|
|
392
|
-
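if (bindingPackageVersion !== '0.1.1' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {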
|
|
393
|
-
throw new Error(`Native binding package version mismatch, expected 0.1.1 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
392
|
+
if (bindingPackageVersion !== '0.1.2' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
393
|
+
throw new Error(`Native binding package version mismatch, expected 0.1.2 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
394
394
|
}
|
|
395
395
|
return binding
|
|
396
396
|
} catch (e) {
|
|
@@ -407,8 +407,8 @@ function requireNative() {
|
|
|
407
407
|
try {
|
|
408
408
|
const binding = require('@kreuzberg/kreuzcrawl-linux-riscv64-musl')
|
|
409
409
|
const bindingPackageVersion = require('@kreuzberg/kreuzcrawl-linux-riscv64-musl/package.json').version
|
|
410
|
-
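if (bindingPackageVersion !== '0.1.1' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {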
|
|
411
|
-
throw new Error(`Native binding package version mismatch, expected 0.1.1 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
410
|
+
if (bindingPackageVersion !== '0.1.2' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
411
|
+
throw new Error(`Native binding package version mismatch, expected 0.1.2 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
412
412
|
}
|
|
413
413
|
return binding
|
|
414
414
|
} catch (e) {
|
|
@@ -423,8 +423,8 @@ function requireNative() {
|
|
|
423
423
|
try {
|
|
424
424
|
const binding = require('@kreuzberg/kreuzcrawl-linux-riscv64-gnu')
|
|
425
425
|
const bindingPackageVersion = require('@kreuzberg/kreuzcrawl-linux-riscv64-gnu/package.json').version
|
|
426
|
-
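if (bindingPackageVersion !== '0.1.1' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {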
|
|
427
|
-
throw new Error(`Native binding package version mismatch, expected 0.1.1 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
426
|
+
if (bindingPackageVersion !== '0.1.2' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
427
|
+
throw new Error(`Native binding package version mismatch, expected 0.1.2 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
428
428
|
}
|
|
429
429
|
return binding
|
|
430
430
|
} catch (e) {
|
|
@@ -440,8 +440,8 @@ function requireNative() {
|
|
|
440
440
|
try {
|
|
441
441
|
const binding = require('@kreuzberg/kreuzcrawl-linux-ppc64-gnu')
|
|
442
442
|
const bindingPackageVersion = require('@kreuzberg/kreuzcrawl-linux-ppc64-gnu/package.json').version
|
|
443
|
-
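if (bindingPackageVersion !== '0.1.1' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {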
|
|
444
|
-
throw new Error(`Native binding package version mismatch, expected 0.1.1 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
443
|
+
if (bindingPackageVersion !== '0.1.2' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
444
|
+
throw new Error(`Native binding package version mismatch, expected 0.1.2 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
445
445
|
}
|
|
446
446
|
return binding
|
|
447
447
|
} catch (e) {
|
|
@@ -456,8 +456,8 @@ function requireNative() {
|
|
|
456
456
|
try {
|
|
457
457
|
const binding = require('@kreuzberg/kreuzcrawl-linux-s390x-gnu')
|
|
458
458
|
const bindingPackageVersion = require('@kreuzberg/kreuzcrawl-linux-s390x-gnu/package.json').version
|
|
459
|
-
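if (bindingPackageVersion !== '0.1.1' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {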
|
|
460
|
-
throw new Error(`Native binding package version mismatch, expected 0.1.1 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
459
|
+
if (bindingPackageVersion !== '0.1.2' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
460
|
+
throw new Error(`Native binding package version mismatch, expected 0.1.2 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
461
461
|
}
|
|
462
462
|
return binding
|
|
463
463
|
} catch (e) {
|
|
@@ -476,8 +476,8 @@ function requireNative() {
|
|
|
476
476
|
try {
|
|
477
477
|
const binding = require('@kreuzberg/kreuzcrawl-openharmony-arm64')
|
|
478
478
|
const bindingPackageVersion = require('@kreuzberg/kreuzcrawl-openharmony-arm64/package.json').version
|
|
479
|
-
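if (bindingPackageVersion !== '0.1.1' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {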
|
|
480
|
-
throw new Error(`Native binding package version mismatch, expected 0.1.1 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
479
|
+
if (bindingPackageVersion !== '0.1.2' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
480
|
+
throw new Error(`Native binding package version mismatch, expected 0.1.2 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
481
481
|
}
|
|
482
482
|
return binding
|
|
483
483
|
} catch (e) {
|
|
@@ -492,8 +492,8 @@ function requireNative() {
|
|
|
492
492
|
try {
|
|
493
493
|
const binding = require('@kreuzberg/kreuzcrawl-openharmony-x64')
|
|
494
494
|
const bindingPackageVersion = require('@kreuzberg/kreuzcrawl-openharmony-x64/package.json').version
|
|
495
|
-
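if (bindingPackageVersion !== '0.1.1' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {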
|
|
496
|
-
throw new Error(`Native binding package version mismatch, expected 0.1.1 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
495
|
+
if (bindingPackageVersion !== '0.1.2' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
496
|
+
throw new Error(`Native binding package version mismatch, expected 0.1.2 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
497
497
|
}
|
|
498
498
|
return binding
|
|
499
499
|
} catch (e) {
|
|
@@ -508,8 +508,8 @@ function requireNative() {
|
|
|
508
508
|
try {
|
|
509
509
|
const binding = require('@kreuzberg/kreuzcrawl-openharmony-arm')
|
|
510
510
|
const bindingPackageVersion = require('@kreuzberg/kreuzcrawl-openharmony-arm/package.json').version
|
|
511
|
-
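if (bindingPackageVersion !== '0.1.1' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {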
|
|
512
|
-
throw new Error(`Native binding package version mismatch, expected 0.1.1 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
511
|
+
if (bindingPackageVersion !== '0.1.2' && process.env.NAPI_RS_ENFORCE_VERSION_CHECK && process.env.NAPI_RS_ENFORCE_VERSION_CHECK !== '0') {
|
|
512
|
+
throw new Error(`Native binding package version mismatch, expected 0.1.2 but got ${bindingPackageVersion}. You can reinstall dependencies to fix this issue.`)
|
|
513
513
|
}
|
|
514
514
|
return binding
|
|
515
515
|
} catch (e) {
|
|
@@ -584,7 +584,6 @@ module.exports.createEngine = nativeBinding.createEngine
|
|
|
584
584
|
module.exports.JsAssetCategory = nativeBinding.JsAssetCategory
|
|
585
585
|
module.exports.JsBrowserMode = nativeBinding.JsBrowserMode
|
|
586
586
|
module.exports.JsBrowserWait = nativeBinding.JsBrowserWait
|
|
587
|
-
module.exports.JsCrawlEvent = nativeBinding.JsCrawlEvent
|
|
588
587
|
module.exports.JsFeedType = nativeBinding.JsFeedType
|
|
589
588
|
module.exports.JsImageSource = nativeBinding.JsImageSource
|
|
590
589
|
module.exports.JsLinkType = nativeBinding.JsLinkType
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
package/package.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
{
|
|
2
2
|
"name": "@kreuzberg/kreuzcrawl",
|
|
3
|
-
"version": "0.1.1",
|
|
3
|
+
"version": "0.1.2",
|
|
4
4
|
"main": "index.js",
|
|
5
5
|
"types": "index.d.ts",
|
|
6
6
|
"repository": {
|
|
@@ -35,9 +35,9 @@
|
|
|
35
35
|
"@napi-rs/cli": "^3.6.2"
|
|
36
36
|
},
|
|
37
37
|
"optionalDependencies": {
|
|
38
|
-
"@kreuzberg/kreuzcrawl-darwin-arm64": "0.1.1",
|
|
39
|
-
"@kreuzberg/kreuzcrawl-linux-arm64-gnu": "0.1.1",
|
|
40
|
-
"@kreuzberg/kreuzcrawl-linux-x64-gnu": "0.1.1",
|
|
41
|
-
"@kreuzberg/kreuzcrawl-win32-x64-msvc": "0.1.1"
|
|
38
|
+
"@kreuzberg/kreuzcrawl-darwin-arm64": "0.1.2",
|
|
39
|
+
"@kreuzberg/kreuzcrawl-linux-arm64-gnu": "0.1.2",
|
|
40
|
+
"@kreuzberg/kreuzcrawl-linux-x64-gnu": "0.1.2",
|
|
41
|
+
"@kreuzberg/kreuzcrawl-win32-x64-msvc": "0.1.2"
|
|
42
42
|
}
|
|
43
43
|
}
|
package/src/lib.rs
CHANGED
|
@@ -6,7 +6,13 @@
|
|
|
6
6
|
clippy::let_unit_value,
|
|
7
7
|
clippy::needless_borrow,
|
|
8
8
|
clippy::map_identity,
|
|
9
|
-
clippy::just_underscores_and_digits
|
|
9
|
+
clippy::just_underscores_and_digits,
|
|
10
|
+
clippy::unnecessary_cast,
|
|
11
|
+
clippy::unused_unit,
|
|
12
|
+
clippy::unwrap_or_default,
|
|
13
|
+
clippy::derivable_impls,
|
|
14
|
+
clippy::needless_borrows_for_generic_args,
|
|
15
|
+
clippy::unnecessary_fallible_conversions
|
|
10
16
|
)]
|
|
11
17
|
|
|
12
18
|
use napi::*;
|
|
@@ -80,6 +86,8 @@ pub struct JsCrawlConfig {
|
|
|
80
86
|
pub custom_headers: Option<HashMap<String, String>>,
|
|
81
87
|
#[napi(js_name = "requestTimeout")]
|
|
82
88
|
pub request_timeout: Option<i64>,
|
|
89
|
+
#[napi(js_name = "rateLimitMs")]
|
|
90
|
+
pub rate_limit_ms: Option<i64>,
|
|
83
91
|
#[napi(js_name = "maxRedirects")]
|
|
84
92
|
pub max_redirects: Option<i64>,
|
|
85
93
|
#[napi(js_name = "retryCount")]
|
|
@@ -139,30 +147,6 @@ pub struct JsDownloadedDocument {
|
|
|
139
147
|
pub headers: Option<HashMap<String, String>>,
|
|
140
148
|
}
|
|
141
149
|
|
|
142
|
-
#[derive(Clone, Default, serde::Serialize, serde::Deserialize)]
|
|
143
|
-
#[napi(object)]
|
|
144
|
-
pub struct JsInteractionResult {
|
|
145
|
-
#[napi(js_name = "actionResults")]
|
|
146
|
-
pub action_results: Option<Vec<JsActionResult>>,
|
|
147
|
-
#[napi(js_name = "finalHtml")]
|
|
148
|
-
pub final_html: Option<String>,
|
|
149
|
-
#[napi(js_name = "finalUrl")]
|
|
150
|
-
pub final_url: Option<String>,
|
|
151
|
-
pub screenshot: Option<Vec<u8>>,
|
|
152
|
-
}
|
|
153
|
-
|
|
154
|
-
#[derive(Clone, Default, serde::Serialize, serde::Deserialize)]
|
|
155
|
-
#[napi(object)]
|
|
156
|
-
pub struct JsActionResult {
|
|
157
|
-
#[napi(js_name = "actionIndex")]
|
|
158
|
-
pub action_index: Option<i64>,
|
|
159
|
-
#[napi(js_name = "actionType")]
|
|
160
|
-
pub action_type: Option<String>,
|
|
161
|
-
pub success: Option<bool>,
|
|
162
|
-
pub data: Option<String>,
|
|
163
|
-
pub error: Option<String>,
|
|
164
|
-
}
|
|
165
|
-
|
|
166
150
|
#[derive(Clone, Default, serde::Serialize, serde::Deserialize)]
|
|
167
151
|
#[napi(object)]
|
|
168
152
|
pub struct JsScrapeResult {
|
|
@@ -297,22 +281,6 @@ pub struct JsMarkdownResult {
|
|
|
297
281
|
pub fit_content: Option<String>,
|
|
298
282
|
}
|
|
299
283
|
|
|
300
|
-
#[derive(Clone, Default, serde::Serialize, serde::Deserialize)]
|
|
301
|
-
#[napi(object)]
|
|
302
|
-
pub struct JsCachedPage {
|
|
303
|
-
pub url: Option<String>,
|
|
304
|
-
#[napi(js_name = "statusCode")]
|
|
305
|
-
pub status_code: Option<u16>,
|
|
306
|
-
#[napi(js_name = "contentType")]
|
|
307
|
-
pub content_type: Option<String>,
|
|
308
|
-
pub body: Option<String>,
|
|
309
|
-
pub etag: Option<String>,
|
|
310
|
-
#[napi(js_name = "lastModified")]
|
|
311
|
-
pub last_modified: Option<String>,
|
|
312
|
-
#[napi(js_name = "cachedAt")]
|
|
313
|
-
pub cached_at: Option<i64>,
|
|
314
|
-
}
|
|
315
|
-
|
|
316
284
|
#[derive(Clone, Default, serde::Serialize, serde::Deserialize)]
|
|
317
285
|
#[napi(object)]
|
|
318
286
|
pub struct JsLinkInfo {
|
|
@@ -674,21 +642,6 @@ impl Default for JsAssetCategory {
|
|
|
674
642
|
}
|
|
675
643
|
}
|
|
676
644
|
|
|
677
|
-
#[napi(string_enum)]
|
|
678
|
-
#[derive(Clone, serde::Serialize, serde::Deserialize)]
|
|
679
|
-
pub enum JsCrawlEvent {
|
|
680
|
-
Page,
|
|
681
|
-
Error,
|
|
682
|
-
Complete,
|
|
683
|
-
}
|
|
684
|
-
|
|
685
|
-
#[allow(clippy::derivable_impls)]
|
|
686
|
-
impl Default for JsCrawlEvent {
|
|
687
|
-
fn default() -> Self {
|
|
688
|
-
Self::Page
|
|
689
|
-
}
|
|
690
|
-
}
|
|
691
|
-
|
|
692
645
|
#[allow(clippy::missing_errors_doc)]
|
|
693
646
|
#[napi(js_name = "createEngine")]
|
|
694
647
|
pub fn create_engine(config: Option<JsCrawlConfig>) -> Result<JsCrawlEngineHandle> {
|
|
@@ -828,6 +781,7 @@ impl From<JsCrawlConfig> for kreuzcrawl::CrawlConfig {
|
|
|
828
781
|
if let Some(__v) = val.request_timeout {
|
|
829
782
|
__result.request_timeout = std::time::Duration::from_millis(__v as u64);
|
|
830
783
|
}
|
|
784
|
+
__result.rate_limit_ms = val.rate_limit_ms.map(|v| v as u64);
|
|
831
785
|
__result.max_redirects = val.max_redirects.map(|v| v as usize).unwrap_or_default();
|
|
832
786
|
__result.retry_count = val.retry_count.map(|v| v as usize).unwrap_or_default();
|
|
833
787
|
__result.retry_codes = val.retry_codes.unwrap_or_default();
|
|
@@ -872,6 +826,7 @@ impl From<kreuzcrawl::CrawlConfig> for JsCrawlConfig {
|
|
|
872
826
|
exclude_paths: Some(val.exclude_paths),
|
|
873
827
|
custom_headers: Some(val.custom_headers.into_iter().collect()),
|
|
874
828
|
request_timeout: Some(val.request_timeout.as_millis() as u64 as i64),
|
|
829
|
+
rate_limit_ms: val.rate_limit_ms.map(|v| v as i64),
|
|
875
830
|
max_redirects: Some(val.max_redirects as i64),
|
|
876
831
|
retry_count: Some(val.retry_count as i64),
|
|
877
832
|
retry_codes: Some(val.retry_codes),
|
|
@@ -920,41 +875,18 @@ impl From<kreuzcrawl::DownloadedDocument> for JsDownloadedDocument {
|
|
|
920
875
|
mime_type: Some(format!("{:?}", val.mime_type)),
|
|
921
876
|
content: Some(val.content.to_vec()),
|
|
922
877
|
size: Some(val.size as i64),
|
|
923
|
-
filename: val.filename.as_ref().map(|v| format!("{:?}", v)),
|
|
878
|
+
filename: val.filename.as_ref().map(|v| format!("{v:?}")),
|
|
924
879
|
content_hash: Some(format!("{:?}", val.content_hash)),
|
|
925
880
|
headers: Some(
|
|
926
881
|
val.headers
|
|
927
882
|
.into_iter()
|
|
928
|
-
.map(|(k, v)| (
|
|
883
|
+
.map(|(k, v)| (k.to_string(), v.to_string()))
|
|
929
884
|
.collect(),
|
|
930
885
|
),
|
|
931
886
|
}
|
|
932
887
|
}
|
|
933
888
|
}
|
|
934
889
|
|
|
935
|
-
impl From<kreuzcrawl::InteractionResult> for JsInteractionResult {
|
|
936
|
-
fn from(val: kreuzcrawl::InteractionResult) -> Self {
|
|
937
|
-
Self {
|
|
938
|
-
action_results: Some(val.action_results.into_iter().map(Into::into).collect()),
|
|
939
|
-
final_html: Some(val.final_html),
|
|
940
|
-
final_url: Some(val.final_url),
|
|
941
|
-
screenshot: val.screenshot.map(|v| v.to_vec()),
|
|
942
|
-
}
|
|
943
|
-
}
|
|
944
|
-
}
|
|
945
|
-
|
|
946
|
-
impl From<kreuzcrawl::ActionResult> for JsActionResult {
|
|
947
|
-
fn from(val: kreuzcrawl::ActionResult) -> Self {
|
|
948
|
-
Self {
|
|
949
|
-
action_index: Some(val.action_index as i64),
|
|
950
|
-
action_type: Some(format!("{:?}", val.action_type)),
|
|
951
|
-
success: Some(val.success),
|
|
952
|
-
data: val.data.as_ref().map(ToString::to_string),
|
|
953
|
-
error: val.error,
|
|
954
|
-
}
|
|
955
|
-
}
|
|
956
|
-
}
|
|
957
|
-
|
|
958
890
|
impl From<JsScrapeResult> for kreuzcrawl::ScrapeResult {
|
|
959
891
|
fn from(val: JsScrapeResult) -> Self {
|
|
960
892
|
Self {
|
|
@@ -1213,20 +1145,6 @@ impl From<kreuzcrawl::MarkdownResult> for JsMarkdownResult {
|
|
|
1213
1145
|
}
|
|
1214
1146
|
}
|
|
1215
1147
|
|
|
1216
|
-
impl From<kreuzcrawl::CachedPage> for JsCachedPage {
|
|
1217
|
-
fn from(val: kreuzcrawl::CachedPage) -> Self {
|
|
1218
|
-
Self {
|
|
1219
|
-
url: Some(val.url),
|
|
1220
|
-
status_code: Some(val.status_code),
|
|
1221
|
-
content_type: Some(val.content_type),
|
|
1222
|
-
body: Some(val.body),
|
|
1223
|
-
etag: val.etag,
|
|
1224
|
-
last_modified: val.last_modified,
|
|
1225
|
-
cached_at: Some(val.cached_at as i64),
|
|
1226
|
-
}
|
|
1227
|
-
}
|
|
1228
|
-
}
|
|
1229
|
-
|
|
1230
1148
|
impl From<JsLinkInfo> for kreuzcrawl::LinkInfo {
|
|
1231
1149
|
fn from(val: JsLinkInfo) -> Self {
|
|
1232
1150
|
Self {
|
|
@@ -1845,16 +1763,6 @@ impl From<kreuzcrawl::AssetCategory> for JsAssetCategory {
|
|
|
1845
1763
|
}
|
|
1846
1764
|
}
|
|
1847
1765
|
|
|
1848
|
-
impl From<kreuzcrawl::CrawlEvent> for JsCrawlEvent {
|
|
1849
|
-
fn from(val: kreuzcrawl::CrawlEvent) -> Self {
|
|
1850
|
-
match val {
|
|
1851
|
-
kreuzcrawl::CrawlEvent::Page(..) => Self::Page,
|
|
1852
|
-
kreuzcrawl::CrawlEvent::Error { .. } => Self::Error,
|
|
1853
|
-
kreuzcrawl::CrawlEvent::Complete { .. } => Self::Complete,
|
|
1854
|
-
}
|
|
1855
|
-
}
|
|
1856
|
-
}
|
|
1857
|
-
|
|
1858
1766
|
// Error variant name constants
|
|
1859
1767
|
pub const CRAWL_ERROR_ERROR_NOT_FOUND: &str = "NotFound";
|
|
1860
1768
|
pub const CRAWL_ERROR_ERROR_UNAUTHORIZED: &str = "Unauthorized";
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|