@crawlee/jsdom 3.17.1-beta.21 → 3.17.1-beta.23
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
|
@@ -1,5 +1,5 @@
|
|
|
1
1
|
import type { IncomingMessage } from 'node:http';
|
|
2
|
-
import type { BasicCrawlingContext, Configuration, EnqueueLinksOptions, ErrorHandler, GetUserDataFromRequest, HttpCrawlerOptions, InternalHttpCrawlingContext, InternalHttpHook, RequestHandler, RequestProvider, RouterRoutes, SkippedRequestCallback } from '@crawlee/http';
|
|
2
|
+
import type { BasicCrawlingContext, Configuration, EnqueueLinksOptions, ErrorHandler, GetUserDataFromRequest, HttpCrawlerOptions, InternalHttpCrawlingContext, InternalHttpHook, RequestHandler, RequestProvider, RouterHandler, RouterRoutes, SkippedRequestCallback } from '@crawlee/http';
|
|
3
3
|
import { HttpCrawler } from '@crawlee/http';
|
|
4
4
|
import type { Dictionary } from '@crawlee/types';
|
|
5
5
|
import { type CheerioRoot, type RobotsTxtFile } from '@crawlee/utils';
|
|
@@ -218,6 +218,6 @@ export declare function domCrawlerEnqueueLinks(options: EnqueueLinksInternalOpti
|
|
|
218
218
|
* await crawler.run();
|
|
219
219
|
* ```
|
|
220
220
|
*/
|
|
221
|
-
|
|
222
|
-
export declare function createJSDOMRouter<Context extends JSDOMCrawlingContext = JSDOMCrawlingContext, UserData extends Dictionary = GetUserDataFromRequest<Context['request']>>(routes?: RouterRoutes<Context, UserData
|
|
221
|
+
export declare function createJSDOMRouter<Context extends JSDOMCrawlingContext = JSDOMCrawlingContext, Routes extends Record<keyof Routes, Dictionary> = Record<string, GetUserDataFromRequest<Context['request']>>>(routes?: RouterRoutes<Context, Routes>): RouterHandler<Context, Routes>;
|
|
222
|
+
export declare function createJSDOMRouter<Context extends JSDOMCrawlingContext = JSDOMCrawlingContext, UserData extends Dictionary = GetUserDataFromRequest<Context['request']>>(routes?: RouterRoutes<Context, Record<string, UserData>>): RouterHandler<Context, Record<string, UserData>>;
|
|
223
223
|
export {};
|
|
@@ -296,30 +296,6 @@ function extractUrlsFromWindow(window, selector, baseUrl) {
|
|
|
296
296
|
})
|
|
297
297
|
.filter((href) => href !== undefined && href !== '');
|
|
298
298
|
}
|
|
299
|
-
/**
|
|
300
|
-
* Creates new {@link Router} instance that works based on request labels.
|
|
301
|
-
* This instance can then serve as a `requestHandler` of your {@link JSDOMCrawler}.
|
|
302
|
-
* Defaults to the {@link JSDOMCrawlingContext}.
|
|
303
|
-
*
|
|
304
|
-
* > Serves as a shortcut for using `Router.create<JSDOMCrawlingContext>()`.
|
|
305
|
-
*
|
|
306
|
-
* ```ts
|
|
307
|
-
* import { JSDOMCrawler, createJSDOMRouter } from 'crawlee';
|
|
308
|
-
*
|
|
309
|
-
* const router = createJSDOMRouter();
|
|
310
|
-
* router.addHandler('label-a', async (ctx) => {
|
|
311
|
-
* ctx.log.info('...');
|
|
312
|
-
* });
|
|
313
|
-
* router.addDefaultHandler(async (ctx) => {
|
|
314
|
-
* ctx.log.info('...');
|
|
315
|
-
* });
|
|
316
|
-
*
|
|
317
|
-
* const crawler = new JSDOMCrawler({
|
|
318
|
-
* requestHandler: router,
|
|
319
|
-
* });
|
|
320
|
-
* await crawler.run();
|
|
321
|
-
* ```
|
|
322
|
-
*/
|
|
323
299
|
function createJSDOMRouter(routes) {
|
|
324
300
|
return http_1.Router.create(routes);
|
|
325
301
|
}
|
package/package.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
{
|
|
2
2
|
"name": "@crawlee/jsdom",
|
|
3
|
-
"version": "3.17.1-beta.21",
|
|
3
|
+
"version": "3.17.1-beta.23",
|
|
4
4
|
"description": "The scalable web crawling and scraping library for JavaScript/Node.js. Enables development of data extraction and web automation jobs (not only) with headless Chrome and Puppeteer.",
|
|
5
5
|
"engines": {
|
|
6
6
|
"node": ">=16.0.0"
|
|
@@ -55,9 +55,9 @@
|
|
|
55
55
|
"dependencies": {
|
|
56
56
|
"@apify/timeout": "^0.3.0",
|
|
57
57
|
"@apify/utilities": "^2.7.10",
|
|
58
|
-
"@crawlee/http": "3.17.1-beta.21",
|
|
59
|
-
"@crawlee/types": "3.17.1-beta.21",
|
|
60
|
-
"@crawlee/utils": "3.17.1-beta.21",
|
|
58
|
+
"@crawlee/http": "3.17.1-beta.23",
|
|
59
|
+
"@crawlee/types": "3.17.1-beta.23",
|
|
60
|
+
"@crawlee/utils": "3.17.1-beta.23",
|
|
61
61
|
"@types/jsdom": "^21.0.0",
|
|
62
62
|
"cheerio": "1.0.0-rc.12",
|
|
63
63
|
"jsdom": "^26.0.0",
|
|
@@ -71,5 +71,5 @@
|
|
|
71
71
|
}
|
|
72
72
|
}
|
|
73
73
|
},
|
|
74
|
-
"gitHead": "
|
|
74
|
+
"gitHead": "704d91af7d46c2efaf8bff883025e4a7d8ffd6d7"
|
|
75
75
|
}
|