cloudflare-bot-directory 1.0.7 → 1.0.16
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/LICENSE.md +1 -1
- package/README.md +4 -4
- package/package.json +4 -4
- package/src/index.json +370 -59
package/LICENSE.md
CHANGED
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
The MIT License (MIT)
|
|
2
2
|
|
|
3
|
-
Copyright ©
|
|
3
|
+
Copyright © 2019 Microlink <hello@microlink.io> (microlink.io)
|
|
4
4
|
|
|
5
5
|
Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
6
6
|
of this software and associated documentation files (the "Software"), to deal
|
package/README.md
CHANGED
|
@@ -6,7 +6,7 @@
|
|
|
6
6
|
<br>
|
|
7
7
|
</p>
|
|
8
8
|
|
|
9
|
-

|
|
10
10
|
[](https://www.npmjs.org/package/cloudflare-bot-directory)
|
|
11
11
|
|
|
12
12
|
> A comprehensive list of **500+ verified bots** and web crawlers from [CloudFlare Radar](https://radar.cloudflare.com/traffic/verified-bots), available as a JSON dataset for bot detection, user agent analysis, and web scraping identification.
|
|
@@ -69,7 +69,7 @@ const isKnownBot = (userAgent) =>
|
|
|
69
69
|
|
|
70
70
|
## License
|
|
71
71
|
|
|
72
|
-
**cloudflare-bot-directory** © [
|
|
73
|
-
Authored and maintained by [Kiko Beats](https://kikobeats.com) with help from [contributors](https://microlinkhq/cloudflare-bot-directory/
|
|
72
|
+
**cloudflare-bot-directory** © [Microlink](https://microlink.io), released under the [MIT](https://github.com/microlinkhq/cloudflare-bot-directory/blob/master/LICENSE.md) License.<br>
|
|
73
|
+
Authored and maintained by [Kiko Beats](https://kikobeats.com) with help from [contributors](https://github.com/microlinkhq/cloudflare-bot-directory/contributors).
|
|
74
74
|
|
|
75
|
-
> [
|
|
75
|
+
> [microlink.io](https://microlink.io) · GitHub [microlinkhq](https://github.com/microlinkhq) · X [@microlinkhq](https://x.com/microlinkhq)
|
package/package.json
CHANGED
|
@@ -1,8 +1,8 @@
|
|
|
1
1
|
{
|
|
2
2
|
"name": "cloudflare-bot-directory",
|
|
3
3
|
"description": "CloudFlare Radar verified bots directory - 500+ web crawlers, search engine bots, and user agents as JSON for bot detection and traffic filtering",
|
|
4
|
-
"homepage": "https://microlinkhq/cloudflare-bot-directory
|
|
5
|
-
"version": "1.0.
|
|
4
|
+
"homepage": "https://github.com/microlinkhq/cloudflare-bot-directory",
|
|
5
|
+
"version": "1.0.16",
|
|
6
6
|
"types": "./src/index.d.ts",
|
|
7
7
|
"main": "./src/index.js",
|
|
8
8
|
"exports": {
|
|
@@ -16,10 +16,10 @@
|
|
|
16
16
|
"contributors": [],
|
|
17
17
|
"repository": {
|
|
18
18
|
"type": "git",
|
|
19
|
-
"url": "git+https://microlinkhq/cloudflare-bot-directory
|
|
19
|
+
"url": "git+https://github.com/microlinkhq/cloudflare-bot-directory.git"
|
|
20
20
|
},
|
|
21
21
|
"bugs": {
|
|
22
|
-
"url": "https://microlinkhq/cloudflare-bot-directory/
|
|
22
|
+
"url": "https://github.com/microlinkhq/cloudflare-bot-directory/issues"
|
|
23
23
|
},
|
|
24
24
|
"keywords": [
|
|
25
25
|
"bingbot",
|
package/src/index.json
CHANGED
|
@@ -557,6 +557,22 @@
|
|
|
557
557
|
"Anchor Browser"
|
|
558
558
|
]
|
|
559
559
|
},
|
|
560
|
+
{
|
|
561
|
+
"slug": "apify-website-content-crawler",
|
|
562
|
+
"name": "Apify Website Content Crawler",
|
|
563
|
+
"kind": "AGENT",
|
|
564
|
+
"operator": null,
|
|
565
|
+
"operatorUrl": "https://apify.com/apify/website-content-crawler",
|
|
566
|
+
"category": "AI_ASSISTANT",
|
|
567
|
+
"description": "Crawl websites and extract content to feed AI apps. Convert web data to Markdown or HTML, download files, and more.",
|
|
568
|
+
"followsRobotsTxt": false,
|
|
569
|
+
"userAgentPatterns": [
|
|
570
|
+
"ApifyWebsiteContentCrawler"
|
|
571
|
+
],
|
|
572
|
+
"userAgents": [
|
|
573
|
+
"ApifyWebsiteContentCrawler/1.0 (+https://apify.com/apify/website-content-crawler)"
|
|
574
|
+
]
|
|
575
|
+
},
|
|
560
576
|
{
|
|
561
577
|
"slug": "apple",
|
|
562
578
|
"name": "Applebot",
|
|
@@ -736,22 +752,6 @@
|
|
|
736
752
|
"Tumblr/14.0.835.186"
|
|
737
753
|
]
|
|
738
754
|
},
|
|
739
|
-
{
|
|
740
|
-
"slug": "autorag",
|
|
741
|
-
"name": "AutoRAG",
|
|
742
|
-
"kind": "BOT",
|
|
743
|
-
"operator": "Cloudflare",
|
|
744
|
-
"operatorUrl": "https://developers.cloudflare.com/autorag",
|
|
745
|
-
"category": "AI_SEARCH",
|
|
746
|
-
"description": "AutoRAG is an all-in-one AI search solution",
|
|
747
|
-
"followsRobotsTxt": true,
|
|
748
|
-
"userAgentPatterns": [
|
|
749
|
-
"Cloudflare-AutoRAG"
|
|
750
|
-
],
|
|
751
|
-
"userAgents": [
|
|
752
|
-
"Cloudflare-AutoRAG (https://developers.cloudflare.com/autorag; autorag@cloudflare.com)"
|
|
753
|
-
]
|
|
754
|
-
},
|
|
755
755
|
{
|
|
756
756
|
"slug": "awario",
|
|
757
757
|
"name": "AwarioSmartBot",
|
|
@@ -808,7 +808,7 @@
|
|
|
808
808
|
"operator": "Baidu",
|
|
809
809
|
"operatorUrl": null,
|
|
810
810
|
"category": "SEARCH_ENGINE_CRAWLER",
|
|
811
|
-
"description": "Baidu's
|
|
811
|
+
"description": "Baidu's scrubbing proxy.",
|
|
812
812
|
"followsRobotsTxt": false,
|
|
813
813
|
"userAgentPatterns": [
|
|
814
814
|
"Baidu-ADS"
|
|
@@ -897,6 +897,22 @@
|
|
|
897
897
|
"bigsur.ai (+https://www.bigsur.ai)"
|
|
898
898
|
]
|
|
899
899
|
},
|
|
900
|
+
{
|
|
901
|
+
"slug": "bigscootsmonitor",
|
|
902
|
+
"name": "BigScootsMonitor",
|
|
903
|
+
"kind": "BOT",
|
|
904
|
+
"operator": null,
|
|
905
|
+
"operatorUrl": "https://monitor.bigscoots.dev",
|
|
906
|
+
"category": "MONITORING_AND_ANALYTICS",
|
|
907
|
+
"description": "BigScoots Managed Services Monitor - Uptime",
|
|
908
|
+
"followsRobotsTxt": false,
|
|
909
|
+
"userAgentPatterns": [
|
|
910
|
+
"BigScootsMonitor"
|
|
911
|
+
],
|
|
912
|
+
"userAgents": [
|
|
913
|
+
"BigScootsMonitor Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/74.0.3729.169 Safari/537.36"
|
|
914
|
+
]
|
|
915
|
+
},
|
|
900
916
|
{
|
|
901
917
|
"slug": "bigupdatabot",
|
|
902
918
|
"name": "BigUpData Bot",
|
|
@@ -1469,6 +1485,22 @@
|
|
|
1469
1485
|
"Mozilla/5.0 (Linux; Android 6.0.1; Nexus 5 Build/MRA58N) AppleWebKit/537.36(KHTML, like Gecko) Chrome/69.0.3464.0 Mobile Safari/537.36 Chrome-Lighthouse"
|
|
1470
1486
|
]
|
|
1471
1487
|
},
|
|
1488
|
+
{
|
|
1489
|
+
"slug": "citibotsitecrawler",
|
|
1490
|
+
"name": "CitibotSiteCrawler",
|
|
1491
|
+
"kind": "BOT",
|
|
1492
|
+
"operator": null,
|
|
1493
|
+
"operatorUrl": "https://www.citibot.io/",
|
|
1494
|
+
"category": "AI_CRAWLER",
|
|
1495
|
+
"description": "CitibotSiteCrawler collects public data from government websites to power Citibot’s AI civic engagement tools.",
|
|
1496
|
+
"followsRobotsTxt": false,
|
|
1497
|
+
"userAgentPatterns": [
|
|
1498
|
+
"CitibotSiteCrawler"
|
|
1499
|
+
],
|
|
1500
|
+
"userAgents": [
|
|
1501
|
+
"CitibotSiteCrawler/1.0"
|
|
1502
|
+
]
|
|
1503
|
+
},
|
|
1472
1504
|
{
|
|
1473
1505
|
"slug": "clickagy",
|
|
1474
1506
|
"name": "Clickagy",
|
|
@@ -1485,18 +1517,50 @@
|
|
|
1485
1517
|
"Clickagy Intelligence Bot v2"
|
|
1486
1518
|
]
|
|
1487
1519
|
},
|
|
1520
|
+
{
|
|
1521
|
+
"slug": "cloudflare-ai-search",
|
|
1522
|
+
"name": "AI Search",
|
|
1523
|
+
"kind": "BOT",
|
|
1524
|
+
"operator": "Cloudflare",
|
|
1525
|
+
"operatorUrl": "https://developers.cloudflare.com/ai-search",
|
|
1526
|
+
"category": "AI_SEARCH",
|
|
1527
|
+
"description": "Cloudflare AI Search is a managed service that lets you connect your data and easily build AI-powered search.",
|
|
1528
|
+
"followsRobotsTxt": true,
|
|
1529
|
+
"userAgentPatterns": [
|
|
1530
|
+
"Cloudflare-AI-Search"
|
|
1531
|
+
],
|
|
1532
|
+
"userAgents": [
|
|
1533
|
+
"Cloudflare-AI-Search (https://developers.cloudflare.com/ai-search; ai-search@cloudflare.com)"
|
|
1534
|
+
]
|
|
1535
|
+
},
|
|
1488
1536
|
{
|
|
1489
1537
|
"slug": "cloudflare-browser-rendering",
|
|
1490
1538
|
"name": "Cloudflare Browser Rendering",
|
|
1491
1539
|
"kind": "AGENT",
|
|
1492
1540
|
"operator": "Cloudflare",
|
|
1493
1541
|
"operatorUrl": "https://cloudflare.com",
|
|
1494
|
-
"category": "
|
|
1495
|
-
"description": "Cloudflare
|
|
1542
|
+
"category": "AI_ASSISTANT",
|
|
1543
|
+
"description": "Renders web pages in headless browsers for Cloudflare customers. Used for browser automation (screenshots, PDF generation, content extraction, etc.) and for AI agents to interact with the web. Used by Cloudflare customers via Workers bindings and REST API. Does not include the /crawl endpoint, which has a separate bot identity (Cloudflare Crawler - Signed Agent).",
|
|
1496
1544
|
"followsRobotsTxt": false,
|
|
1497
1545
|
"userAgentPatterns": [],
|
|
1498
1546
|
"userAgents": []
|
|
1499
1547
|
},
|
|
1548
|
+
{
|
|
1549
|
+
"slug": "cloudflare-browser-rendering-crawler",
|
|
1550
|
+
"name": "Cloudflare Crawler",
|
|
1551
|
+
"kind": "AGENT",
|
|
1552
|
+
"operator": "Cloudflare",
|
|
1553
|
+
"operatorUrl": "https://cloudflare.com",
|
|
1554
|
+
"category": "AI_CRAWLER",
|
|
1555
|
+
"description": "The Cloudflare Crawler is a well-behaved crawler that retrieves web content. By default, it self-identifies as a bot, honors robots.txt directives, and cannot bypass CAPTCHAs or bot protection. Used by Cloudflare customers via the Browser Rendering /crawl endpoint.",
|
|
1556
|
+
"followsRobotsTxt": false,
|
|
1557
|
+
"userAgentPatterns": [
|
|
1558
|
+
"CloudflareBrowserRenderingCrawler/1.0"
|
|
1559
|
+
],
|
|
1560
|
+
"userAgents": [
|
|
1561
|
+
"CloudflareBrowserRenderingCrawler/1.0"
|
|
1562
|
+
]
|
|
1563
|
+
},
|
|
1500
1564
|
{
|
|
1501
1565
|
"slug": "cloudflare-chv",
|
|
1502
1566
|
"name": "Cloudflare Custom Hostname Verification",
|
|
@@ -1536,7 +1600,7 @@
|
|
|
1536
1600
|
"operator": "Cloudflare",
|
|
1537
1601
|
"operatorUrl": null,
|
|
1538
1602
|
"category": "MONITORING_AND_ANALYTICS",
|
|
1539
|
-
"description": "Cloudflare
|
|
1603
|
+
"description": "Cloudflare system bot that performs health checks and diagnostic tests",
|
|
1540
1604
|
"followsRobotsTxt": false,
|
|
1541
1605
|
"userAgentPatterns": [
|
|
1542
1606
|
"CloudflareDiagnostics"
|
|
@@ -1561,6 +1625,22 @@
|
|
|
1561
1625
|
"Cloudflare-Healthchecks"
|
|
1562
1626
|
]
|
|
1563
1627
|
},
|
|
1628
|
+
{
|
|
1629
|
+
"slug": "cloudflare-observatory-curly",
|
|
1630
|
+
"name": "Cloudflare Observatory Curly",
|
|
1631
|
+
"kind": "BOT",
|
|
1632
|
+
"operator": "Cloudflare",
|
|
1633
|
+
"operatorUrl": "https://developers.cloudflare.com/speed/observatory/",
|
|
1634
|
+
"category": "MONITORING_AND_ANALYTICS",
|
|
1635
|
+
"description": "Synthetic network probes for HTTP timing measurements (TCP, TLS, TTFB). Measures connection timing for customer-owned URLs.",
|
|
1636
|
+
"followsRobotsTxt": false,
|
|
1637
|
+
"userAgentPatterns": [
|
|
1638
|
+
"curly-"
|
|
1639
|
+
],
|
|
1640
|
+
"userAgents": [
|
|
1641
|
+
"curly-*"
|
|
1642
|
+
]
|
|
1643
|
+
},
|
|
1564
1644
|
{
|
|
1565
1645
|
"slug": "cloudflare-prefetch",
|
|
1566
1646
|
"name": "Cloudflare Prefetch",
|
|
@@ -2059,6 +2139,42 @@
|
|
|
2059
2139
|
"Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/140.0.0.0 Safari/537.36 CybaaBot"
|
|
2060
2140
|
]
|
|
2061
2141
|
},
|
|
2142
|
+
{
|
|
2143
|
+
"slug": "daric2",
|
|
2144
|
+
"name": "Daric2",
|
|
2145
|
+
"kind": "BOT",
|
|
2146
|
+
"operator": null,
|
|
2147
|
+
"operatorUrl": "https://developers.cloudflare.com/ai-crawl-control/",
|
|
2148
|
+
"category": "AI_CRAWLER",
|
|
2149
|
+
"description": "Cloudflare AI Crawl Control bot 2",
|
|
2150
|
+
"followsRobotsTxt": false,
|
|
2151
|
+
"userAgentPatterns": [],
|
|
2152
|
+
"userAgents": []
|
|
2153
|
+
},
|
|
2154
|
+
{
|
|
2155
|
+
"slug": "daric3",
|
|
2156
|
+
"name": "Daric3",
|
|
2157
|
+
"kind": "BOT",
|
|
2158
|
+
"operator": null,
|
|
2159
|
+
"operatorUrl": "https://developers.cloudflare.com/ai-crawl-control/",
|
|
2160
|
+
"category": "AI_CRAWLER",
|
|
2161
|
+
"description": "Cloudflare AI Crawl Control bot 3",
|
|
2162
|
+
"followsRobotsTxt": false,
|
|
2163
|
+
"userAgentPatterns": [],
|
|
2164
|
+
"userAgents": []
|
|
2165
|
+
},
|
|
2166
|
+
{
|
|
2167
|
+
"slug": "daric4",
|
|
2168
|
+
"name": "Daric4",
|
|
2169
|
+
"kind": "BOT",
|
|
2170
|
+
"operator": null,
|
|
2171
|
+
"operatorUrl": "https://developers.cloudflare.com/ai-crawl-control/",
|
|
2172
|
+
"category": "AI_CRAWLER",
|
|
2173
|
+
"description": "Cloudflare AI Crawl Control bot 4",
|
|
2174
|
+
"followsRobotsTxt": false,
|
|
2175
|
+
"userAgentPatterns": [],
|
|
2176
|
+
"userAgents": []
|
|
2177
|
+
},
|
|
2062
2178
|
{
|
|
2063
2179
|
"slug": "datadog-synthetic-bot",
|
|
2064
2180
|
"name": "Synthetic Bot",
|
|
@@ -2146,7 +2262,7 @@
|
|
|
2146
2262
|
"operator": "Daum",
|
|
2147
2263
|
"operatorUrl": "https://cs.daum.net/faq/15/4118.html?faqId=28966",
|
|
2148
2264
|
"category": "SEARCH_ENGINE_CRAWLER",
|
|
2149
|
-
"description": "Korean search engine crawler
|
|
2265
|
+
"description": "Korean search engine crawler",
|
|
2150
2266
|
"followsRobotsTxt": false,
|
|
2151
2267
|
"userAgentPatterns": [
|
|
2152
2268
|
"Daum/4.1"
|
|
@@ -2181,10 +2297,10 @@
|
|
|
2181
2297
|
"description": "The DeepCrawl bot crawls the websites of its customers to collect performance analytics and suggest SEO optimizations.",
|
|
2182
2298
|
"followsRobotsTxt": false,
|
|
2183
2299
|
"userAgentPatterns": [
|
|
2184
|
-
"
|
|
2300
|
+
"lumar"
|
|
2185
2301
|
],
|
|
2186
2302
|
"userAgents": [
|
|
2187
|
-
"
|
|
2303
|
+
"lumar"
|
|
2188
2304
|
]
|
|
2189
2305
|
},
|
|
2190
2306
|
{
|
|
@@ -2464,6 +2580,22 @@
|
|
|
2464
2580
|
"easyDNS Monitoring ( http://easyurl.net/monitoring )"
|
|
2465
2581
|
]
|
|
2466
2582
|
},
|
|
2583
|
+
{
|
|
2584
|
+
"slug": "easyscan",
|
|
2585
|
+
"name": "EasyScan",
|
|
2586
|
+
"kind": "AGENT",
|
|
2587
|
+
"operator": "codire GmbH",
|
|
2588
|
+
"operatorUrl": "https://www.it-recht-kanzlei.de/website-scanner-fuer-mandanten.php",
|
|
2589
|
+
"category": "AI_ASSISTANT",
|
|
2590
|
+
"description": "Automated scanning service that reviews online content on behalf of end users to identify potential legal issues.",
|
|
2591
|
+
"followsRobotsTxt": false,
|
|
2592
|
+
"userAgentPatterns": [
|
|
2593
|
+
"EasyScan"
|
|
2594
|
+
],
|
|
2595
|
+
"userAgents": [
|
|
2596
|
+
"EasyScan/1.0"
|
|
2597
|
+
]
|
|
2598
|
+
},
|
|
2467
2599
|
{
|
|
2468
2600
|
"slug": "echoboxbot",
|
|
2469
2601
|
"name": "Echobot Bot",
|
|
@@ -3494,6 +3626,18 @@
|
|
|
3494
3626
|
"Notabot"
|
|
3495
3627
|
]
|
|
3496
3628
|
},
|
|
3629
|
+
{
|
|
3630
|
+
"slug": "henry-shopping-agent",
|
|
3631
|
+
"name": "Henry Shopping Agent",
|
|
3632
|
+
"kind": "AGENT",
|
|
3633
|
+
"operator": null,
|
|
3634
|
+
"operatorUrl": "https://docs.henrylabs.ai/",
|
|
3635
|
+
"category": "AI_ASSISTANT",
|
|
3636
|
+
"description": "Executes checkout via browser automation using a user's card and signed mandate",
|
|
3637
|
+
"followsRobotsTxt": false,
|
|
3638
|
+
"userAgentPatterns": [],
|
|
3639
|
+
"userAgents": []
|
|
3640
|
+
},
|
|
3497
3641
|
{
|
|
3498
3642
|
"slug": "hetrixtools",
|
|
3499
3643
|
"name": "HetrixTools",
|
|
@@ -3510,6 +3654,22 @@
|
|
|
3510
3654
|
"HetrixTools Uptime Monitoring Bot. https://hetrix.tools/uptime-monitoring-bot.html"
|
|
3511
3655
|
]
|
|
3512
3656
|
},
|
|
3657
|
+
{
|
|
3658
|
+
"slug": "hey-email-privacy-proxy-2",
|
|
3659
|
+
"name": "HEY Email Privacy Proxy",
|
|
3660
|
+
"kind": "BOT",
|
|
3661
|
+
"operator": null,
|
|
3662
|
+
"operatorUrl": "https://www.hey.com/spy-trackers/",
|
|
3663
|
+
"category": "PAGE_PREVIEW",
|
|
3664
|
+
"description": "HEY email stops spy pixels and prevents user IP tracking by proxying all HTML email images, fonts, and external assets",
|
|
3665
|
+
"followsRobotsTxt": false,
|
|
3666
|
+
"userAgentPatterns": [
|
|
3667
|
+
"hey.com/imageproxy"
|
|
3668
|
+
],
|
|
3669
|
+
"userAgents": [
|
|
3670
|
+
"hey.com/imageproxy Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/134.0.0.0 Safari/537.36"
|
|
3671
|
+
]
|
|
3672
|
+
},
|
|
3513
3673
|
{
|
|
3514
3674
|
"slug": "hifibot",
|
|
3515
3675
|
"name": "HIFIBot",
|
|
@@ -3995,6 +4155,18 @@
|
|
|
3995
4155
|
"Mozilla/5.0 (compatible; heritrix/3.4.0 +https://www.kb.dk/netarkivindsamling/) Firefox/57"
|
|
3996
4156
|
]
|
|
3997
4157
|
},
|
|
4158
|
+
{
|
|
4159
|
+
"slug": "kernel",
|
|
4160
|
+
"name": "Kernel",
|
|
4161
|
+
"kind": "AGENT",
|
|
4162
|
+
"operator": null,
|
|
4163
|
+
"operatorUrl": "https://www.kernel.sh/docs",
|
|
4164
|
+
"category": "AI_ASSISTANT",
|
|
4165
|
+
"description": "Kernel is a browsers as a service platform that enables AI agents to browse the internet.",
|
|
4166
|
+
"followsRobotsTxt": false,
|
|
4167
|
+
"userAgentPatterns": [],
|
|
4168
|
+
"userAgents": []
|
|
4169
|
+
},
|
|
3998
4170
|
{
|
|
3999
4171
|
"slug": "kinsta-bot",
|
|
4000
4172
|
"name": "Kinsta",
|
|
@@ -4453,6 +4625,22 @@
|
|
|
4453
4625
|
"MediaMonitoringBot/1.1 (+https://mediamonitoringbot.com/crawler; crawler@mediamonitoringbot.com)"
|
|
4454
4626
|
]
|
|
4455
4627
|
},
|
|
4628
|
+
{
|
|
4629
|
+
"slug": "mediaboardbot",
|
|
4630
|
+
"name": "mediaboardbot",
|
|
4631
|
+
"kind": "BOT",
|
|
4632
|
+
"operator": "Mediaboard",
|
|
4633
|
+
"operatorUrl": "https://media.mediaboard.com/docs/mediaboardbot",
|
|
4634
|
+
"category": "MONITORING_AND_ANALYTICS",
|
|
4635
|
+
"description": "Mediaboard's web crawler (media monitoring) detects client mentions in online news and public content.",
|
|
4636
|
+
"followsRobotsTxt": false,
|
|
4637
|
+
"userAgentPatterns": [
|
|
4638
|
+
"mediaboardbot"
|
|
4639
|
+
],
|
|
4640
|
+
"userAgents": [
|
|
4641
|
+
"Mozilla/5.0 (compatible; mediaboardbot/1.0; +https://www.mediaboard.com/)"
|
|
4642
|
+
]
|
|
4643
|
+
},
|
|
4456
4644
|
{
|
|
4457
4645
|
"slug": "medialogiabot",
|
|
4458
4646
|
"name": "Medialogia Bot",
|
|
@@ -4892,6 +5080,22 @@
|
|
|
4892
5080
|
"Mozilla/5.0 (compatible; Clearscopebot/1.0)"
|
|
4893
5081
|
]
|
|
4894
5082
|
},
|
|
5083
|
+
{
|
|
5084
|
+
"slug": "nava-labs-asp-dev",
|
|
5085
|
+
"name": "Nava Labs ASP (Dev)",
|
|
5086
|
+
"kind": "AGENT",
|
|
5087
|
+
"operator": null,
|
|
5088
|
+
"operatorUrl": "https://dev.labs-asp.navateam.com/bot-disclosure",
|
|
5089
|
+
"category": "AI_ASSISTANT",
|
|
5090
|
+
"description": "Bot to assist social workers in navigating safety net benefit websites.",
|
|
5091
|
+
"followsRobotsTxt": false,
|
|
5092
|
+
"userAgentPatterns": [
|
|
5093
|
+
"Nava/"
|
|
5094
|
+
],
|
|
5095
|
+
"userAgents": [
|
|
5096
|
+
"Nava/"
|
|
5097
|
+
]
|
|
5098
|
+
},
|
|
4895
5099
|
{
|
|
4896
5100
|
"slug": "naver",
|
|
4897
5101
|
"name": "Yeti",
|
|
@@ -5164,6 +5368,18 @@
|
|
|
5164
5368
|
"Mozilla/5.0 (compatible; NostoCrawlerBot/1.0; +http://my.nosto.com/tagging)"
|
|
5165
5369
|
]
|
|
5166
5370
|
},
|
|
5371
|
+
{
|
|
5372
|
+
"slug": "nostra",
|
|
5373
|
+
"name": "Nostra",
|
|
5374
|
+
"kind": "BOT",
|
|
5375
|
+
"operator": null,
|
|
5376
|
+
"operatorUrl": "https://www.nostra.ai/edge-optimization",
|
|
5377
|
+
"category": "SEARCH_ENGINE_OPTIMIZATION",
|
|
5378
|
+
"description": "Nostra accelerates site speed for managed web platforms",
|
|
5379
|
+
"followsRobotsTxt": false,
|
|
5380
|
+
"userAgentPatterns": [],
|
|
5381
|
+
"userAgents": []
|
|
5382
|
+
},
|
|
5167
5383
|
{
|
|
5168
5384
|
"slug": "novellum-ai-crawl",
|
|
5169
5385
|
"name": "Novellum AI Crawl",
|
|
@@ -5470,6 +5686,30 @@
|
|
|
5470
5686
|
"Mozilla/5.0 (compatible; parse.ly scraper/0.16; +http://parsely.com)"
|
|
5471
5687
|
]
|
|
5472
5688
|
},
|
|
5689
|
+
{
|
|
5690
|
+
"slug": "particlenewsbot",
|
|
5691
|
+
"name": "ParticleNewsBot",
|
|
5692
|
+
"kind": "BOT",
|
|
5693
|
+
"operator": null,
|
|
5694
|
+
"operatorUrl": "https://particle.news/bot",
|
|
5695
|
+
"category": "AGGREGATOR",
|
|
5696
|
+
"description": "Particle is an AI powered aggregator that collects news from many sources",
|
|
5697
|
+
"followsRobotsTxt": false,
|
|
5698
|
+
"userAgentPatterns": [],
|
|
5699
|
+
"userAgents": []
|
|
5700
|
+
},
|
|
5701
|
+
{
|
|
5702
|
+
"slug": "payhawk-invoice-fetching-bot",
|
|
5703
|
+
"name": "Payhawk Invoice Fetching Agent",
|
|
5704
|
+
"kind": "AGENT",
|
|
5705
|
+
"operator": "Payhawk",
|
|
5706
|
+
"operatorUrl": "https://payhawk.com/help/overview-of-the-financial-controller-agent",
|
|
5707
|
+
"category": "AI_ASSISTANT",
|
|
5708
|
+
"description": "Automated browser bot that fetches invoices for users from supplier websites and attaches them to their expense records.",
|
|
5709
|
+
"followsRobotsTxt": false,
|
|
5710
|
+
"userAgentPatterns": [],
|
|
5711
|
+
"userAgents": []
|
|
5712
|
+
},
|
|
5473
5713
|
{
|
|
5474
5714
|
"slug": "paypal",
|
|
5475
5715
|
"name": "PayPal",
|
|
@@ -6133,6 +6373,18 @@
|
|
|
6133
6373
|
"RSSAPI/2.0 (+https://rssapi.net/)"
|
|
6134
6374
|
]
|
|
6135
6375
|
},
|
|
6376
|
+
{
|
|
6377
|
+
"slug": "ryebot",
|
|
6378
|
+
"name": "RyeBot",
|
|
6379
|
+
"kind": "AGENT",
|
|
6380
|
+
"operator": null,
|
|
6381
|
+
"operatorUrl": "https://docs.rye.com/api-v2-experimental/ryebot",
|
|
6382
|
+
"category": "AI_ASSISTANT",
|
|
6383
|
+
"description": "Agentic checkout assistant that purchases products on behalf of end users with their explicit consent.",
|
|
6384
|
+
"followsRobotsTxt": false,
|
|
6385
|
+
"userAgentPatterns": [],
|
|
6386
|
+
"userAgents": []
|
|
6387
|
+
},
|
|
6136
6388
|
{
|
|
6137
6389
|
"slug": "salesforce",
|
|
6138
6390
|
"name": "Salesforce",
|
|
@@ -6508,7 +6760,7 @@
|
|
|
6508
6760
|
"slug": "serankingbacklinksbot",
|
|
6509
6761
|
"name": "SERankingBacklinksBot",
|
|
6510
6762
|
"kind": "BOT",
|
|
6511
|
-
"operator":
|
|
6763
|
+
"operator": "SE Ranking",
|
|
6512
6764
|
"operatorUrl": "https://seranking.com/backlinks-crawler",
|
|
6513
6765
|
"category": "SEARCH_ENGINE_OPTIMIZATION",
|
|
6514
6766
|
"description": "Crawls the Internet to assist in getting information on the link structure of sites on the web to assist SEO specialists",
|
|
@@ -6910,23 +7162,6 @@
|
|
|
6910
7162
|
"Snipcart/1.0"
|
|
6911
7163
|
]
|
|
6912
7164
|
},
|
|
6913
|
-
{
|
|
6914
|
-
"slug": "sogou",
|
|
6915
|
-
"name": "Sogou",
|
|
6916
|
-
"kind": "BOT",
|
|
6917
|
-
"operator": "Sogou",
|
|
6918
|
-
"operatorUrl": "http://www.sogou.com/docs/help/webmasters.htm#07",
|
|
6919
|
-
"category": "SEARCH_ENGINE_CRAWLER",
|
|
6920
|
-
"description": "The Sogou spider is the search engine crawler for Sogou. ",
|
|
6921
|
-
"followsRobotsTxt": false,
|
|
6922
|
-
"userAgentPatterns": [
|
|
6923
|
-
"www.sogou.com"
|
|
6924
|
-
],
|
|
6925
|
-
"userAgents": [
|
|
6926
|
-
"Sogou web spider/4.0(+http://www.sogou.com/docs/help/webmasters.htm#07)",
|
|
6927
|
-
"Sogou Pic Spider/3.0( http://www.sogou.com/docs/help/webmasters.htm#07)"
|
|
6928
|
-
]
|
|
6929
|
-
},
|
|
6930
7165
|
{
|
|
6931
7166
|
"slug": "solarwinds-observability",
|
|
6932
7167
|
"name": "SolarWinds Observability",
|
|
@@ -7300,6 +7535,23 @@
|
|
|
7300
7535
|
"Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/W.X.Y.Z Safari/537.36 (compatible; TermlyBot/W.X; +http://www.termly.io/bot.html)"
|
|
7301
7536
|
]
|
|
7302
7537
|
},
|
|
7538
|
+
{
|
|
7539
|
+
"slug": "terracotta",
|
|
7540
|
+
"name": "Terracotta",
|
|
7541
|
+
"kind": "BOT",
|
|
7542
|
+
"operator": null,
|
|
7543
|
+
"operatorUrl": "https://github.com/CeramicTeam/CeramicTerracotta",
|
|
7544
|
+
"category": "SEARCH_ENGINE_CRAWLER",
|
|
7545
|
+
"description": "The Terracotta bot scrapes websites for use in generating indices for serving searches using Ceramic's search product.",
|
|
7546
|
+
"followsRobotsTxt": false,
|
|
7547
|
+
"userAgentPatterns": [
|
|
7548
|
+
"Terracotta"
|
|
7549
|
+
],
|
|
7550
|
+
"userAgents": [
|
|
7551
|
+
"Terracotta",
|
|
7552
|
+
"Terracotta-News"
|
|
7553
|
+
]
|
|
7554
|
+
},
|
|
7303
7555
|
{
|
|
7304
7556
|
"slug": "thousand-eyes",
|
|
7305
7557
|
"name": "Thousand Eyes Cloud Agent",
|
|
@@ -7493,6 +7745,22 @@
|
|
|
7493
7745
|
"Mozilla/5.0 (compatible; Uptime/1.0; http://uptime.com)"
|
|
7494
7746
|
]
|
|
7495
7747
|
},
|
|
7748
|
+
{
|
|
7749
|
+
"slug": "uptime-monitoring",
|
|
7750
|
+
"name": "Uptime Monitoring",
|
|
7751
|
+
"kind": "BOT",
|
|
7752
|
+
"operator": "GoDaddy",
|
|
7753
|
+
"operatorUrl": "https://docs.sucuri.net/website-monitoring/understanding-alerts/uptime-monitor-alerts/",
|
|
7754
|
+
"category": "MONITORING_AND_ANALYTICS",
|
|
7755
|
+
"description": "Uptime monitoring is a service that checks if a website is online. It will send you an alert if your website is “down”.",
|
|
7756
|
+
"followsRobotsTxt": false,
|
|
7757
|
+
"userAgentPatterns": [
|
|
7758
|
+
"UptimeMonitoring"
|
|
7759
|
+
],
|
|
7760
|
+
"userAgents": [
|
|
7761
|
+
"UptimeMonitoring"
|
|
7762
|
+
]
|
|
7763
|
+
},
|
|
7496
7764
|
{
|
|
7497
7765
|
"slug": "uptimebot",
|
|
7498
7766
|
"name": "UptimeBot",
|
|
@@ -7525,23 +7793,6 @@
|
|
|
7525
7793
|
"Mozilla/5.0+(compatible; UptimeRobot/2.0; http://www.uptimerobot.com/)"
|
|
7526
7794
|
]
|
|
7527
7795
|
},
|
|
7528
|
-
{
|
|
7529
|
-
"slug": "uptimestatistics",
|
|
7530
|
-
"name": "uptimedoctor",
|
|
7531
|
-
"kind": "BOT",
|
|
7532
|
-
"operator": "uptimedoctor",
|
|
7533
|
-
"operatorUrl": "http://uptimestatistics.com",
|
|
7534
|
-
"category": "MONITORING_AND_ANALYTICS",
|
|
7535
|
-
"description": "UptimeDoctor is a website uptime monitoring service. ",
|
|
7536
|
-
"followsRobotsTxt": false,
|
|
7537
|
-
"userAgentPatterns": [
|
|
7538
|
-
"www.uptimedoctor.com"
|
|
7539
|
-
],
|
|
7540
|
-
"userAgents": [
|
|
7541
|
-
"Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/64.0.3282.140 Safari/537.36 Edge/17.17134 www.uptimedoctor.com (username slowmail)",
|
|
7542
|
-
"Mozilla/4.0 (compatible; MSIE 6.0; www.hyperspin.com username mis.admin)"
|
|
7543
|
-
]
|
|
7544
|
-
},
|
|
7545
7796
|
{
|
|
7546
7797
|
"slug": "uptimia",
|
|
7547
7798
|
"name": "Uptimia",
|
|
@@ -7606,6 +7857,18 @@
|
|
|
7606
7857
|
"Mozilla/5.0 (compatible; videootvBot; +https://www.videoo.tv)"
|
|
7607
7858
|
]
|
|
7608
7859
|
},
|
|
7860
|
+
{
|
|
7861
|
+
"slug": "visually-io-shopify-editor",
|
|
7862
|
+
"name": "Visually.io Shopify Editor",
|
|
7863
|
+
"kind": "AGENT",
|
|
7864
|
+
"operator": null,
|
|
7865
|
+
"operatorUrl": "https://help.visually.io/visually.io-editor-cloudflare-signed-agent",
|
|
7866
|
+
"category": "AI_ASSISTANT",
|
|
7867
|
+
"description": "Shopify theme editor alternative for live, real-time store editing via a secure iframe and controlled proxy.",
|
|
7868
|
+
"followsRobotsTxt": false,
|
|
7869
|
+
"userAgentPatterns": [],
|
|
7870
|
+
"userAgents": []
|
|
7871
|
+
},
|
|
7609
7872
|
{
|
|
7610
7873
|
"slug": "w3-validator-services",
|
|
7611
7874
|
"name": "W3 Validator Services",
|
|
@@ -7719,6 +7982,22 @@
|
|
|
7719
7982
|
"websitepulse checker/3.0 (compatible; MSIE 5.5; Netscape 4.75; Linux)"
|
|
7720
7983
|
]
|
|
7721
7984
|
},
|
|
7985
|
+
{
|
|
7986
|
+
"slug": "webstatus247",
|
|
7987
|
+
"name": "Webstatus247",
|
|
7988
|
+
"kind": "BOT",
|
|
7989
|
+
"operator": null,
|
|
7990
|
+
"operatorUrl": "https://www.webstatus247.com/bot-information",
|
|
7991
|
+
"category": "MONITORING_AND_ANALYTICS",
|
|
7992
|
+
"description": "WebStatus247 is an intelligent website monitoring bot that continuously checks the availability and uptime",
|
|
7993
|
+
"followsRobotsTxt": false,
|
|
7994
|
+
"userAgentPatterns": [
|
|
7995
|
+
"Webstatus247"
|
|
7996
|
+
],
|
|
7997
|
+
"userAgents": [
|
|
7998
|
+
"Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/127.0.0.0 Safari/537.36 Webstatus247/1.0"
|
|
7999
|
+
]
|
|
8000
|
+
},
|
|
7722
8001
|
{
|
|
7723
8002
|
"slug": "webtotem",
|
|
7724
8003
|
"name": "WebTotemBot",
|
|
@@ -8016,7 +8295,7 @@
|
|
|
8016
8295
|
"operator": "Yahoo",
|
|
8017
8296
|
"operatorUrl": "https://www.yahoo-help.jp",
|
|
8018
8297
|
"category": "SEARCH_ENGINE_OPTIMIZATION",
|
|
8019
|
-
"description": "
|
|
8298
|
+
"description": "Yahoo Japan search engine crawler for SEO analysis",
|
|
8020
8299
|
"followsRobotsTxt": false,
|
|
8021
8300
|
"userAgentPatterns": [
|
|
8022
8301
|
"J-BRW",
|
|
@@ -8170,6 +8449,22 @@
|
|
|
8170
8449
|
"Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) HeadlessChrome/87.0.4280.88 YextBot/Java Safari/537.36"
|
|
8171
8450
|
]
|
|
8172
8451
|
},
|
|
8452
|
+
{
|
|
8453
|
+
"slug": "ygs-group-falconer-scraper",
|
|
8454
|
+
"name": "YGS Group Falconer Scraper",
|
|
8455
|
+
"kind": "BOT",
|
|
8456
|
+
"operator": null,
|
|
8457
|
+
"operatorUrl": "https://ygscontentlicensing.com/falconer/",
|
|
8458
|
+
"category": "AI_CRAWLER",
|
|
8459
|
+
"description": "A content based scraper only for partners we collaborate with who have given permission to have their website scraped.",
|
|
8460
|
+
"followsRobotsTxt": false,
|
|
8461
|
+
"userAgentPatterns": [
|
|
8462
|
+
"ygs-scraper-bot"
|
|
8463
|
+
],
|
|
8464
|
+
"userAgents": [
|
|
8465
|
+
"ygs-scraper-bot/1.0"
|
|
8466
|
+
]
|
|
8467
|
+
},
|
|
8173
8468
|
{
|
|
8174
8469
|
"slug": "yokoy-group",
|
|
8175
8470
|
"name": "Yokoy Group Webhooks",
|
|
@@ -8186,6 +8481,22 @@
|
|
|
8186
8481
|
"YokoyGroupAG/1.0"
|
|
8187
8482
|
]
|
|
8188
8483
|
},
|
|
8484
|
+
{
|
|
8485
|
+
"slug": "youbot",
|
|
8486
|
+
"name": "YouBot",
|
|
8487
|
+
"kind": "BOT",
|
|
8488
|
+
"operator": null,
|
|
8489
|
+
"operatorUrl": "https://docs.you.com/youbot",
|
|
8490
|
+
"category": "SEARCH_ENGINE_CRAWLER",
|
|
8491
|
+
"description": "You.com Search Engine Crawler",
|
|
8492
|
+
"followsRobotsTxt": false,
|
|
8493
|
+
"userAgentPatterns": [
|
|
8494
|
+
"YouBot"
|
|
8495
|
+
],
|
|
8496
|
+
"userAgents": [
|
|
8497
|
+
"Mozilla/5.0 AppleWebKit/537.36 (KHTML, like Gecko; compatible; YouBot/1.0; +https://docs.you.com/youbot; env:prod) Chrome/X.X.X.X Safari/537.36"
|
|
8498
|
+
]
|
|
8499
|
+
},
|
|
8189
8500
|
{
|
|
8190
8501
|
"slug": "zapier",
|
|
8191
8502
|
"name": "Zapier",
|