xcrawl-mcp 1.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (51) hide show
  1. package/.editorconfig +12 -0
  2. package/.env.example +3 -0
  3. package/.prettierrc +6 -0
  4. package/README.md +244 -0
  5. package/claude.md +295 -0
  6. package/dist/core/crawl.d.ts +246 -0
  7. package/dist/core/crawl.d.ts.map +1 -0
  8. package/dist/core/crawl.js +141 -0
  9. package/dist/core/crawl.js.map +1 -0
  10. package/dist/core/map.d.ts +34 -0
  11. package/dist/core/map.d.ts.map +1 -0
  12. package/dist/core/map.js +50 -0
  13. package/dist/core/map.js.map +1 -0
  14. package/dist/core/scrape.d.ts +201 -0
  15. package/dist/core/scrape.d.ts.map +1 -0
  16. package/dist/core/scrape.js +148 -0
  17. package/dist/core/scrape.js.map +1 -0
  18. package/dist/core/search.d.ts +144 -0
  19. package/dist/core/search.d.ts.map +1 -0
  20. package/dist/core/search.js +75 -0
  21. package/dist/core/search.js.map +1 -0
  22. package/dist/index.d.ts +8 -0
  23. package/dist/index.d.ts.map +1 -0
  24. package/dist/index.js +516 -0
  25. package/dist/index.js.map +1 -0
  26. package/dist/stdio.d.ts +3 -0
  27. package/dist/stdio.d.ts.map +1 -0
  28. package/dist/stdio.js +551 -0
  29. package/dist/stdio.js.map +1 -0
  30. package/dist/tools.d.ts +540 -0
  31. package/dist/tools.d.ts.map +1 -0
  32. package/dist/tools.js +528 -0
  33. package/dist/tools.js.map +1 -0
  34. package/dist/types.d.ts +214 -0
  35. package/dist/types.d.ts.map +1 -0
  36. package/dist/types.js +5 -0
  37. package/dist/types.js.map +1 -0
  38. package/package.json +33 -0
  39. package/src/core/crawl.ts +149 -0
  40. package/src/core/map.ts +56 -0
  41. package/src/core/scrape.ts +156 -0
  42. package/src/core/search.ts +81 -0
  43. package/src/index.ts +565 -0
  44. package/src/stdio.ts +584 -0
  45. package/src/tools.ts +539 -0
  46. package/src/types.ts +221 -0
  47. package/tsconfig.build.json +14 -0
  48. package/tsconfig.json +45 -0
  49. package/vitest.config.mts +11 -0
  50. package/worker-configuration.d.ts +10848 -0
  51. package/wrangler.jsonc +26 -0
@@ -0,0 +1,540 @@
1
+ /**
2
+ * Shared tool definitions for both stdio and HTTP modes
3
+ */
4
+ export declare const XCRAWL_SCRAPE_TOOL: {
5
+ name: string;
6
+ description: string;
7
+ inputSchema: {
8
+ type: string;
9
+ properties: {
10
+ url: {
11
+ type: string;
12
+ format: string;
13
+ description: string;
14
+ };
15
+ mode: {
16
+ type: string;
17
+ enum: string[];
18
+ default: string;
19
+ description: string;
20
+ };
21
+ proxy: {
22
+ type: string;
23
+ properties: {
24
+ location: {
25
+ type: string;
26
+ description: string;
27
+ };
28
+ sticky_session: {
29
+ type: string;
30
+ description: string;
31
+ };
32
+ };
33
+ description: string;
34
+ };
35
+ request: {
36
+ type: string;
37
+ properties: {
38
+ locale: {
39
+ type: string;
40
+ description: string;
41
+ };
42
+ device: {
43
+ type: string;
44
+ enum: string[];
45
+ description: string;
46
+ };
47
+ cookies: {
48
+ type: string;
49
+ additionalProperties: {
50
+ type: string;
51
+ };
52
+ description: string;
53
+ };
54
+ headers: {
55
+ type: string;
56
+ additionalProperties: {
57
+ type: string;
58
+ };
59
+ description: string;
60
+ };
61
+ only_main_content: {
62
+ type: string;
63
+ description: string;
64
+ };
65
+ block_ads: {
66
+ type: string;
67
+ description: string;
68
+ };
69
+ skip_tls_verification: {
70
+ type: string;
71
+ description: string;
72
+ };
73
+ };
74
+ description: string;
75
+ };
76
+ js_render: {
77
+ type: string;
78
+ properties: {
79
+ enabled: {
80
+ type: string;
81
+ default: boolean;
82
+ description: string;
83
+ };
84
+ wait_until: {
85
+ type: string;
86
+ enum: string[];
87
+ description: string;
88
+ };
89
+ viewport: {
90
+ type: string;
91
+ properties: {
92
+ width: {
93
+ type: string;
94
+ description: string;
95
+ };
96
+ height: {
97
+ type: string;
98
+ description: string;
99
+ };
100
+ };
101
+ description: string;
102
+ };
103
+ };
104
+ description: string;
105
+ };
106
+ output: {
107
+ type: string;
108
+ description: string;
109
+ properties: {
110
+ formats: {
111
+ type: string;
112
+ items: {
113
+ type: string;
114
+ enum: string[];
115
+ };
116
+ default: string[];
117
+ description: string;
118
+ };
119
+ screenshot: {
120
+ type: string;
121
+ enum: string[];
122
+ description: string;
123
+ };
124
+ json: {
125
+ type: string;
126
+ properties: {
127
+ prompt: {
128
+ type: string;
129
+ description: string;
130
+ };
131
+ json_schema: {
132
+ type: string;
133
+ description: string;
134
+ additionalProperties: boolean;
135
+ };
136
+ };
137
+ description: string;
138
+ };
139
+ };
140
+ };
141
+ webhook: {
142
+ type: string;
143
+ properties: {
144
+ url: {
145
+ type: string;
146
+ description: string;
147
+ };
148
+ headers: {
149
+ type: string;
150
+ additionalProperties: {
151
+ type: string;
152
+ };
153
+ description: string;
154
+ };
155
+ events: {
156
+ type: string;
157
+ items: {
158
+ type: string;
159
+ enum: string[];
160
+ };
161
+ description: string;
162
+ };
163
+ };
164
+ description: string;
165
+ };
166
+ };
167
+ required: string[];
168
+ };
169
+ };
170
+ export declare const XCRAWL_CHECK_STATUS_TOOL: {
171
+ name: string;
172
+ description: string;
173
+ inputSchema: {
174
+ type: string;
175
+ properties: {
176
+ scrape_id: {
177
+ type: string;
178
+ description: string;
179
+ };
180
+ };
181
+ required: string[];
182
+ };
183
+ };
184
+ export declare const XCRAWL_SEARCH_TOOL: {
185
+ name: string;
186
+ description: string;
187
+ inputSchema: {
188
+ type: string;
189
+ properties: {
190
+ query: {
191
+ type: string;
192
+ description: string;
193
+ };
194
+ location: {
195
+ type: string;
196
+ description: string;
197
+ };
198
+ language: {
199
+ type: string;
200
+ description: string;
201
+ };
202
+ limit: {
203
+ type: string;
204
+ description: string;
205
+ minimum: number;
206
+ maximum: number;
207
+ };
208
+ serp_options: {
209
+ type: string;
210
+ description: string;
211
+ properties: {
212
+ q: {
213
+ type: string;
214
+ description: string;
215
+ };
216
+ location: {
217
+ type: string;
218
+ description: string;
219
+ };
220
+ uule: {
221
+ type: string;
222
+ description: string;
223
+ };
224
+ google_domain: {
225
+ type: string;
226
+ description: string;
227
+ };
228
+ gl: {
229
+ type: string;
230
+ description: string;
231
+ };
232
+ hl: {
233
+ type: string;
234
+ description: string;
235
+ };
236
+ cr: {
237
+ type: string;
238
+ description: string;
239
+ };
240
+ lr: {
241
+ type: string;
242
+ description: string;
243
+ };
244
+ safe: {
245
+ type: string;
246
+ description: string;
247
+ };
248
+ nfpr: {
249
+ type: string;
250
+ description: string;
251
+ };
252
+ filter: {
253
+ type: string;
254
+ description: string;
255
+ };
256
+ tbs: {
257
+ type: string;
258
+ description: string;
259
+ };
260
+ start: {
261
+ type: string;
262
+ description: string;
263
+ };
264
+ num: {
265
+ type: string;
266
+ description: string;
267
+ };
268
+ ludocid: {
269
+ type: string;
270
+ description: string;
271
+ };
272
+ lsig: {
273
+ type: string;
274
+ description: string;
275
+ };
276
+ kgmid: {
277
+ type: string;
278
+ description: string;
279
+ };
280
+ si: {
281
+ type: string;
282
+ description: string;
283
+ };
284
+ ibp: {
285
+ type: string;
286
+ description: string;
287
+ };
288
+ uds: {
289
+ type: string;
290
+ description: string;
291
+ };
292
+ no_cache: {
293
+ type: string;
294
+ description: string;
295
+ };
296
+ };
297
+ };
298
+ };
299
+ required: string[];
300
+ };
301
+ };
302
+ export declare const XCRAWL_MAP_TOOL: {
303
+ name: string;
304
+ description: string;
305
+ inputSchema: {
306
+ type: string;
307
+ properties: {
308
+ url: {
309
+ type: string;
310
+ format: string;
311
+ description: string;
312
+ };
313
+ filter: {
314
+ type: string;
315
+ description: string;
316
+ };
317
+ limit: {
318
+ type: string;
319
+ description: string;
320
+ minimum: number;
321
+ maximum: number;
322
+ };
323
+ include_subdomains: {
324
+ type: string;
325
+ description: string;
326
+ };
327
+ ignore_query_parameters: {
328
+ type: string;
329
+ description: string;
330
+ };
331
+ };
332
+ required: string[];
333
+ };
334
+ };
335
+ export declare const XCRAWL_CRAWL_TOOL: {
336
+ name: string;
337
+ description: string;
338
+ inputSchema: {
339
+ type: string;
340
+ properties: {
341
+ url: {
342
+ type: string;
343
+ format: string;
344
+ description: string;
345
+ };
346
+ crawler: {
347
+ type: string;
348
+ properties: {
349
+ limit: {
350
+ type: string;
351
+ description: string;
352
+ };
353
+ include: {
354
+ type: string;
355
+ items: {
356
+ type: string;
357
+ };
358
+ description: string;
359
+ };
360
+ exclude: {
361
+ type: string;
362
+ items: {
363
+ type: string;
364
+ };
365
+ description: string;
366
+ };
367
+ max_depth: {
368
+ type: string;
369
+ description: string;
370
+ };
371
+ include_entire_domain: {
372
+ type: string;
373
+ description: string;
374
+ };
375
+ include_subdomains: {
376
+ type: string;
377
+ description: string;
378
+ };
379
+ include_external_links: {
380
+ type: string;
381
+ description: string;
382
+ };
383
+ sitemaps: {
384
+ type: string;
385
+ description: string;
386
+ };
387
+ };
388
+ description: string;
389
+ };
390
+ proxy: {
391
+ type: string;
392
+ properties: {
393
+ location: {
394
+ type: string;
395
+ description: string;
396
+ };
397
+ sticky_session: {
398
+ type: string;
399
+ description: string;
400
+ };
401
+ };
402
+ description: string;
403
+ };
404
+ request: {
405
+ type: string;
406
+ properties: {
407
+ locale: {
408
+ type: string;
409
+ description: string;
410
+ };
411
+ device: {
412
+ type: string;
413
+ enum: string[];
414
+ description: string;
415
+ };
416
+ cookies: {
417
+ type: string;
418
+ description: string;
419
+ };
420
+ headers: {
421
+ type: string;
422
+ description: string;
423
+ };
424
+ only_main_content: {
425
+ type: string;
426
+ description: string;
427
+ };
428
+ block_ads: {
429
+ type: string;
430
+ description: string;
431
+ };
432
+ skip_tls_verification: {
433
+ type: string;
434
+ description: string;
435
+ };
436
+ };
437
+ description: string;
438
+ };
439
+ js_render: {
440
+ type: string;
441
+ properties: {
442
+ enabled: {
443
+ type: string;
444
+ description: string;
445
+ };
446
+ wait_until: {
447
+ type: string;
448
+ enum: string[];
449
+ description: string;
450
+ };
451
+ viewport: {
452
+ type: string;
453
+ properties: {
454
+ width: {
455
+ type: string;
456
+ description: string;
457
+ };
458
+ height: {
459
+ type: string;
460
+ description: string;
461
+ };
462
+ };
463
+ };
464
+ };
465
+ description: string;
466
+ };
467
+ output: {
468
+ type: string;
469
+ properties: {
470
+ formats: {
471
+ type: string;
472
+ items: {
473
+ type: string;
474
+ enum: string[];
475
+ };
476
+ default: string[];
477
+ description: string;
478
+ };
479
+ screenshot: {
480
+ type: string;
481
+ enum: string[];
482
+ description: string;
483
+ };
484
+ json: {
485
+ type: string;
486
+ properties: {
487
+ prompt: {
488
+ type: string;
489
+ description: string;
490
+ };
491
+ json_schema: {
492
+ type: string;
493
+ description: string;
494
+ };
495
+ };
496
+ };
497
+ };
498
+ description: string;
499
+ };
500
+ webhook: {
501
+ type: string;
502
+ properties: {
503
+ url: {
504
+ type: string;
505
+ description: string;
506
+ };
507
+ headers: {
508
+ type: string;
509
+ description: string;
510
+ };
511
+ events: {
512
+ type: string;
513
+ items: {
514
+ type: string;
515
+ enum: string[];
516
+ };
517
+ description: string;
518
+ };
519
+ };
520
+ description: string;
521
+ };
522
+ };
523
+ required: string[];
524
+ };
525
+ };
526
+ export declare const XCRAWL_CHECK_CRAWL_STATUS_TOOL: {
527
+ name: string;
528
+ description: string;
529
+ inputSchema: {
530
+ type: string;
531
+ properties: {
532
+ crawl_id: {
533
+ type: string;
534
+ description: string;
535
+ };
536
+ };
537
+ required: string[];
538
+ };
539
+ };
540
+ //# sourceMappingURL=tools.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"tools.d.ts","sourceRoot":"","sources":["../src/tools.ts"],"names":[],"mappings":"AAAA;;GAEG;AAEH,eAAO,MAAM,kBAAkB;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;CA4K9B,CAAC;AAEF,eAAO,MAAM,wBAAwB;;;;;;;;;;;;;CA8BpC,CAAC;AAEF,eAAO,MAAM,kBAAkB;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;CAuE9B,CAAC;AAEF,eAAO,MAAM,eAAe;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;CAkD3B,CAAC;AAEF,eAAO,MAAM,iBAAiB;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;CAiL7B,CAAC;AAEF,eAAO,MAAM,8BAA8B;;;;;;;;;;;;;CAwB1C,CAAC"}