cloudflare-bot-directory 1.0.6 → 1.0.15

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/LICENSE.md CHANGED
@@ -1,6 +1,6 @@
1
1
  The MIT License (MIT)
2
2
 
3
- Copyright © 2026 Kiko Beats <josefrancisco.verdu@gmail.com> (kikobeats.com)
3
+ Copyright © 2019 Microlink <hello@microlink.io> (microlink.io)
4
4
 
5
5
  Permission is hereby granted, free of charge, to any person obtaining a copy
6
6
  of this software and associated documentation files (the "Software"), to deal
package/README.md CHANGED
@@ -6,7 +6,7 @@
6
6
  <br>
7
7
  </p>
8
8
 
9
- ![Last version](https://img.shields.io/github/tag/kikobeats/cloudflare-bot-directory.svg?style=flat-square)
9
+ ![Last version](https://img.shields.io/github/tag/microlinkhq/cloudflare-bot-directory.svg?style=flat-square)
10
10
  [![NPM Status](https://img.shields.io/npm/dm/cloudflare-bot-directory.svg?style=flat-square)](https://www.npmjs.org/package/cloudflare-bot-directory)
11
11
 
12
12
  > A comprehensive list of **500+ verified bots** and web crawlers from [CloudFlare Radar](https://radar.cloudflare.com/traffic/verified-bots), available as a JSON dataset for bot detection, user agent analysis, and web scraping identification.
@@ -69,7 +69,7 @@ const isKnownBot = (userAgent) =>
69
69
 
70
70
  ## License
71
71
 
72
- **cloudflare-bot-directory** © [Kiko Beats](https://kikobeats.com), released under the [MIT](https://microlinkhq/cloudflare-bot-directory/cloudflare-bot-directory/blob/master/LICENSE.md) License.<br>
73
- Authored and maintained by [Kiko Beats](https://kikobeats.com) with help from [contributors](https://microlinkhq/cloudflare-bot-directory/cloudflare-bot-directory/contributors).
72
+ **cloudflare-bot-directory** © [Microlink](https://microlink.io), released under the [MIT](https://github.com/microlinkhq/cloudflare-bot-directory/blob/master/LICENSE.md) License.<br>
73
+ Authored and maintained by [Kiko Beats](https://kikobeats.com) with help from [contributors](https://github.com/microlinkhq/cloudflare-bot-directory/contributors).
74
74
 
75
- > [kikobeats.com](https://kikobeats.com) · GitHub [Kiko Beats](https://microlinkhq/cloudflare-bot-directory) · X [@kikobeats](https://x.com/kikobeats)
75
+ > [microlink.io](https://microlink.io) · GitHub [microlinkhq](https://github.com/microlinkhq) · X [@microlinkhq](https://x.com/microlinkhq)
package/package.json CHANGED
@@ -1,8 +1,8 @@
1
1
  {
2
2
  "name": "cloudflare-bot-directory",
3
3
  "description": "CloudFlare Radar verified bots directory - 500+ web crawlers, search engine bots, and user agents as JSON for bot detection and traffic filtering",
4
- "homepage": "https://microlinkhq/cloudflare-bot-directory/cloudflare-bot-directory",
5
- "version": "1.0.6",
4
+ "homepage": "https://github.com/microlinkhq/cloudflare-bot-directory",
5
+ "version": "1.0.15",
6
6
  "types": "./src/index.d.ts",
7
7
  "main": "./src/index.js",
8
8
  "exports": {
@@ -16,10 +16,10 @@
16
16
  "contributors": [],
17
17
  "repository": {
18
18
  "type": "git",
19
- "url": "git+https://microlinkhq/cloudflare-bot-directory/cloudflare-bot-directory.git"
19
+ "url": "git+https://github.com/microlinkhq/cloudflare-bot-directory.git"
20
20
  },
21
21
  "bugs": {
22
- "url": "https://microlinkhq/cloudflare-bot-directory/cloudflare-bot-directory/issues"
22
+ "url": "https://github.com/microlinkhq/cloudflare-bot-directory/issues"
23
23
  },
24
24
  "keywords": [
25
25
  "bingbot",
package/src/index.json CHANGED
@@ -557,6 +557,22 @@
557
557
  "Anchor Browser"
558
558
  ]
559
559
  },
560
+ {
561
+ "slug": "apify-website-content-crawler",
562
+ "name": "Apify Website Content Crawler",
563
+ "kind": "AGENT",
564
+ "operator": null,
565
+ "operatorUrl": "https://apify.com/apify/website-content-crawler",
566
+ "category": "AI_ASSISTANT",
567
+ "description": "Crawl websites and extract content to feed AI apps. Convert web data to Markdown or HTML, download files, and more.",
568
+ "followsRobotsTxt": false,
569
+ "userAgentPatterns": [
570
+ "ApifyWebsiteContentCrawler"
571
+ ],
572
+ "userAgents": [
573
+ "ApifyWebsiteContentCrawler/1.0 (+https://apify.com/apify/website-content-crawler)"
574
+ ]
575
+ },
560
576
  {
561
577
  "slug": "apple",
562
578
  "name": "Applebot",
@@ -736,22 +752,6 @@
736
752
  "Tumblr/14.0.835.186"
737
753
  ]
738
754
  },
739
- {
740
- "slug": "autorag",
741
- "name": "AutoRAG",
742
- "kind": "BOT",
743
- "operator": "Cloudflare",
744
- "operatorUrl": "https://developers.cloudflare.com/autorag",
745
- "category": "AI_SEARCH",
746
- "description": "AutoRAG is an all-in-one AI search solution",
747
- "followsRobotsTxt": true,
748
- "userAgentPatterns": [
749
- "Cloudflare-AutoRAG"
750
- ],
751
- "userAgents": [
752
- "Cloudflare-AutoRAG (https://developers.cloudflare.com/autorag; autorag@cloudflare.com)"
753
- ]
754
- },
755
755
  {
756
756
  "slug": "awario",
757
757
  "name": "AwarioSmartBot",
@@ -808,7 +808,7 @@
808
808
  "operator": "Baidu",
809
809
  "operatorUrl": null,
810
810
  "category": "SEARCH_ENGINE_CRAWLER",
811
- "description": "Baidu's DDoS scrubbing proxy.",
811
+ "description": "Baidu's scrubbing proxy.",
812
812
  "followsRobotsTxt": false,
813
813
  "userAgentPatterns": [
814
814
  "Baidu-ADS"
@@ -1469,6 +1469,22 @@
1469
1469
  "Mozilla/5.0 (Linux; Android 6.0.1; Nexus 5 Build/MRA58N) AppleWebKit/537.36(KHTML, like Gecko) Chrome/69.0.3464.0 Mobile Safari/537.36 Chrome-Lighthouse"
1470
1470
  ]
1471
1471
  },
1472
+ {
1473
+ "slug": "citibotsitecrawler",
1474
+ "name": "CitibotSiteCrawler",
1475
+ "kind": "BOT",
1476
+ "operator": null,
1477
+ "operatorUrl": "https://www.citibot.io/",
1478
+ "category": "AI_CRAWLER",
1479
+ "description": "CitibotSiteCrawler collects public data from government websites to power Citibot’s AI civic engagement tools.",
1480
+ "followsRobotsTxt": false,
1481
+ "userAgentPatterns": [
1482
+ "CitibotSiteCrawler"
1483
+ ],
1484
+ "userAgents": [
1485
+ "CitibotSiteCrawler/1.0"
1486
+ ]
1487
+ },
1472
1488
  {
1473
1489
  "slug": "clickagy",
1474
1490
  "name": "Clickagy",
@@ -1485,17 +1501,37 @@
1485
1501
  "Clickagy Intelligence Bot v2"
1486
1502
  ]
1487
1503
  },
1504
+ {
1505
+ "slug": "cloudflare-ai-search",
1506
+ "name": "AI Search",
1507
+ "kind": "BOT",
1508
+ "operator": "Cloudflare",
1509
+ "operatorUrl": "https://developers.cloudflare.com/ai-search",
1510
+ "category": "AI_SEARCH",
1511
+ "description": "Cloudflare AI Search is a managed service that lets you connect your data and easily build AI-powered search.",
1512
+ "followsRobotsTxt": true,
1513
+ "userAgentPatterns": [
1514
+ "Cloudflare-AI-Search"
1515
+ ],
1516
+ "userAgents": [
1517
+ "Cloudflare-AI-Search (https://developers.cloudflare.com/ai-search; ai-search@cloudflare.com)"
1518
+ ]
1519
+ },
1488
1520
  {
1489
1521
  "slug": "cloudflare-browser-rendering",
1490
1522
  "name": "Cloudflare Browser Rendering",
1491
1523
  "kind": "AGENT",
1492
1524
  "operator": "Cloudflare",
1493
1525
  "operatorUrl": "https://cloudflare.com",
1494
- "category": "PAGE_PREVIEW",
1526
+ "category": "AI_CRAWLER",
1495
1527
  "description": "Cloudflare Browser Rendering",
1496
1528
  "followsRobotsTxt": false,
1497
- "userAgentPatterns": [],
1498
- "userAgents": []
1529
+ "userAgentPatterns": [
1530
+ "CloudflareBrowserRenderingCraw"
1531
+ ],
1532
+ "userAgents": [
1533
+ "CloudflareBrowserRenderingCrawler/1.0"
1534
+ ]
1499
1535
  },
1500
1536
  {
1501
1537
  "slug": "cloudflare-chv",
@@ -1536,7 +1572,7 @@
1536
1572
  "operator": "Cloudflare",
1537
1573
  "operatorUrl": null,
1538
1574
  "category": "MONITORING_AND_ANALYTICS",
1539
- "description": "Cloudflare diagnostic and testing services.",
1575
+ "description": "Cloudflare system bot that performs health checks and diagnostic tests",
1540
1576
  "followsRobotsTxt": false,
1541
1577
  "userAgentPatterns": [
1542
1578
  "CloudflareDiagnostics"
@@ -2059,6 +2095,42 @@
2059
2095
  "Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/140.0.0.0 Safari/537.36 CybaaBot"
2060
2096
  ]
2061
2097
  },
2098
+ {
2099
+ "slug": "daric2",
2100
+ "name": "Daric2",
2101
+ "kind": "BOT",
2102
+ "operator": null,
2103
+ "operatorUrl": "https://developers.cloudflare.com/ai-crawl-control/",
2104
+ "category": "AI_CRAWLER",
2105
+ "description": "Cloudflare AI Crawl Control bot 2",
2106
+ "followsRobotsTxt": false,
2107
+ "userAgentPatterns": [],
2108
+ "userAgents": []
2109
+ },
2110
+ {
2111
+ "slug": "daric3",
2112
+ "name": "Daric3",
2113
+ "kind": "BOT",
2114
+ "operator": null,
2115
+ "operatorUrl": "https://developers.cloudflare.com/ai-crawl-control/",
2116
+ "category": "AI_CRAWLER",
2117
+ "description": "Cloudflare AI Crawl Control bot 3",
2118
+ "followsRobotsTxt": false,
2119
+ "userAgentPatterns": [],
2120
+ "userAgents": []
2121
+ },
2122
+ {
2123
+ "slug": "daric4",
2124
+ "name": "Daric4",
2125
+ "kind": "BOT",
2126
+ "operator": null,
2127
+ "operatorUrl": "https://developers.cloudflare.com/ai-crawl-control/",
2128
+ "category": "AI_CRAWLER",
2129
+ "description": "Cloudflare AI Crawl Control bot 4",
2130
+ "followsRobotsTxt": false,
2131
+ "userAgentPatterns": [],
2132
+ "userAgents": []
2133
+ },
2062
2134
  {
2063
2135
  "slug": "datadog-synthetic-bot",
2064
2136
  "name": "Synthetic Bot",
@@ -2146,7 +2218,7 @@
2146
2218
  "operator": "Daum",
2147
2219
  "operatorUrl": "https://cs.daum.net/faq/15/4118.html?faqId=28966",
2148
2220
  "category": "SEARCH_ENGINE_CRAWLER",
2149
- "description": "Korean search engine crawler. Added from https://jira.cfops.it/browse/BOTS-1558.",
2221
+ "description": "Korean search engine crawler",
2150
2222
  "followsRobotsTxt": false,
2151
2223
  "userAgentPatterns": [
2152
2224
  "Daum/4.1"
@@ -2181,10 +2253,10 @@
2181
2253
  "description": "The DeepCrawl bot crawls the websites of its customers to collect performance analytics and suggest SEO optimizations.",
2182
2254
  "followsRobotsTxt": false,
2183
2255
  "userAgentPatterns": [
2184
- "deepcrawl.com/bot"
2256
+ "lumar"
2185
2257
  ],
2186
2258
  "userAgents": [
2187
- "https://deepcrawl.com/bot"
2259
+ "lumar"
2188
2260
  ]
2189
2261
  },
2190
2262
  {
@@ -3494,6 +3566,18 @@
3494
3566
  "Notabot"
3495
3567
  ]
3496
3568
  },
3569
+ {
3570
+ "slug": "henry-shopping-agent",
3571
+ "name": "Henry Shopping Agent",
3572
+ "kind": "AGENT",
3573
+ "operator": null,
3574
+ "operatorUrl": "https://docs.henrylabs.ai/",
3575
+ "category": "AI_ASSISTANT",
3576
+ "description": "Executes checkout via browser automation using a user's card and signed mandate",
3577
+ "followsRobotsTxt": false,
3578
+ "userAgentPatterns": [],
3579
+ "userAgents": []
3580
+ },
3497
3581
  {
3498
3582
  "slug": "hetrixtools",
3499
3583
  "name": "HetrixTools",
@@ -4453,6 +4537,22 @@
4453
4537
  "MediaMonitoringBot/1.1 (+https://mediamonitoringbot.com/crawler; crawler@mediamonitoringbot.com)"
4454
4538
  ]
4455
4539
  },
4540
+ {
4541
+ "slug": "mediaboardbot",
4542
+ "name": "mediaboardbot",
4543
+ "kind": "BOT",
4544
+ "operator": "Mediaboard",
4545
+ "operatorUrl": "https://media.mediaboard.com/docs/mediaboardbot",
4546
+ "category": "MONITORING_AND_ANALYTICS",
4547
+ "description": "Mediaboard's web crawler (media monitoring) detects client mentions in online news and public content.",
4548
+ "followsRobotsTxt": false,
4549
+ "userAgentPatterns": [
4550
+ "mediaboardbot"
4551
+ ],
4552
+ "userAgents": [
4553
+ "Mozilla/5.0 (compatible; mediaboardbot/1.0; +https://www.mediaboard.com/)"
4554
+ ]
4555
+ },
4456
4556
  {
4457
4557
  "slug": "medialogiabot",
4458
4558
  "name": "Medialogia Bot",
@@ -4892,6 +4992,22 @@
4892
4992
  "Mozilla/5.0 (compatible; Clearscopebot/1.0)"
4893
4993
  ]
4894
4994
  },
4995
+ {
4996
+ "slug": "nava-labs-asp-dev",
4997
+ "name": "Nava Labs ASP (Dev)",
4998
+ "kind": "AGENT",
4999
+ "operator": null,
5000
+ "operatorUrl": "https://dev.labs-asp.navateam.com/bot-disclosure",
5001
+ "category": "AI_ASSISTANT",
5002
+ "description": "Bot to assist social workers in navigating safety net benefit websites.",
5003
+ "followsRobotsTxt": false,
5004
+ "userAgentPatterns": [
5005
+ "Nava/"
5006
+ ],
5007
+ "userAgents": [
5008
+ "Nava/"
5009
+ ]
5010
+ },
4895
5011
  {
4896
5012
  "slug": "naver",
4897
5013
  "name": "Yeti",
@@ -5164,6 +5280,18 @@
5164
5280
  "Mozilla/5.0 (compatible; NostoCrawlerBot/1.0; +http://my.nosto.com/tagging)"
5165
5281
  ]
5166
5282
  },
5283
+ {
5284
+ "slug": "nostra",
5285
+ "name": "Nostra",
5286
+ "kind": "BOT",
5287
+ "operator": null,
5288
+ "operatorUrl": "https://www.nostra.ai/edge-optimization",
5289
+ "category": "SEARCH_ENGINE_OPTIMIZATION",
5290
+ "description": "Nostra accelerates site speed for managed web platforms",
5291
+ "followsRobotsTxt": false,
5292
+ "userAgentPatterns": [],
5293
+ "userAgents": []
5294
+ },
5167
5295
  {
5168
5296
  "slug": "novellum-ai-crawl",
5169
5297
  "name": "Novellum AI Crawl",
@@ -5470,6 +5598,30 @@
5470
5598
  "Mozilla/5.0 (compatible; parse.ly scraper/0.16; +http://parsely.com)"
5471
5599
  ]
5472
5600
  },
5601
+ {
5602
+ "slug": "particlenewsbot",
5603
+ "name": "ParticleNewsBot",
5604
+ "kind": "BOT",
5605
+ "operator": null,
5606
+ "operatorUrl": "https://particle.news/bot",
5607
+ "category": "AGGREGATOR",
5608
+ "description": "Particle is an AI powered aggregator that collects news from many sources",
5609
+ "followsRobotsTxt": false,
5610
+ "userAgentPatterns": [],
5611
+ "userAgents": []
5612
+ },
5613
+ {
5614
+ "slug": "payhawk-invoice-fetching-bot",
5615
+ "name": "Payhawk Invoice Fetching Agent",
5616
+ "kind": "AGENT",
5617
+ "operator": "Payhawk",
5618
+ "operatorUrl": "https://payhawk.com/help/overview-of-the-financial-controller-agent",
5619
+ "category": "AI_ASSISTANT",
5620
+ "description": "Automated browser bot that fetches invoices for users from supplier websites and attaches them to their expense records.",
5621
+ "followsRobotsTxt": false,
5622
+ "userAgentPatterns": [],
5623
+ "userAgents": []
5624
+ },
5473
5625
  {
5474
5626
  "slug": "paypal",
5475
5627
  "name": "PayPal",
@@ -6133,6 +6285,18 @@
6133
6285
  "RSSAPI/2.0 (+https://rssapi.net/)"
6134
6286
  ]
6135
6287
  },
6288
+ {
6289
+ "slug": "ryebot",
6290
+ "name": "RyeBot",
6291
+ "kind": "AGENT",
6292
+ "operator": null,
6293
+ "operatorUrl": "https://docs.rye.com/api-v2-experimental/ryebot",
6294
+ "category": "AI_ASSISTANT",
6295
+ "description": "Agentic checkout assistant that purchases products on behalf of end users with their explicit consent.",
6296
+ "followsRobotsTxt": false,
6297
+ "userAgentPatterns": [],
6298
+ "userAgents": []
6299
+ },
6136
6300
  {
6137
6301
  "slug": "salesforce",
6138
6302
  "name": "Salesforce",
@@ -6508,7 +6672,7 @@
6508
6672
  "slug": "serankingbacklinksbot",
6509
6673
  "name": "SERankingBacklinksBot",
6510
6674
  "kind": "BOT",
6511
- "operator": null,
6675
+ "operator": "SE Ranking",
6512
6676
  "operatorUrl": "https://seranking.com/backlinks-crawler",
6513
6677
  "category": "SEARCH_ENGINE_OPTIMIZATION",
6514
6678
  "description": "Crawls the Internet to assist in getting information on the link structure of sites on the web to assist SEO specialists",
@@ -6910,23 +7074,6 @@
6910
7074
  "Snipcart/1.0"
6911
7075
  ]
6912
7076
  },
6913
- {
6914
- "slug": "sogou",
6915
- "name": "Sogou",
6916
- "kind": "BOT",
6917
- "operator": "Sogou",
6918
- "operatorUrl": "http://www.sogou.com/docs/help/webmasters.htm#07",
6919
- "category": "SEARCH_ENGINE_CRAWLER",
6920
- "description": "The Sogou spider is the search engine crawler for Sogou. ",
6921
- "followsRobotsTxt": false,
6922
- "userAgentPatterns": [
6923
- "www.sogou.com"
6924
- ],
6925
- "userAgents": [
6926
- "Sogou web spider/4.0(+http://www.sogou.com/docs/help/webmasters.htm#07)",
6927
- "Sogou Pic Spider/3.0( http://www.sogou.com/docs/help/webmasters.htm#07)"
6928
- ]
6929
- },
6930
7077
  {
6931
7078
  "slug": "solarwinds-observability",
6932
7079
  "name": "SolarWinds Observability",
@@ -7300,6 +7447,23 @@
7300
7447
  "Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/W.X.Y.Z Safari/537.36 (compatible; TermlyBot/W.X; +http://www.termly.io/bot.html)"
7301
7448
  ]
7302
7449
  },
7450
+ {
7451
+ "slug": "terracotta",
7452
+ "name": "Terracotta",
7453
+ "kind": "BOT",
7454
+ "operator": null,
7455
+ "operatorUrl": "https://github.com/CeramicTeam/CeramicTerracotta",
7456
+ "category": "SEARCH_ENGINE_CRAWLER",
7457
+ "description": "The Terracotta bot scrapes websites for use in generating indices for serving searches using Ceramic's search product.",
7458
+ "followsRobotsTxt": false,
7459
+ "userAgentPatterns": [
7460
+ "Terracotta"
7461
+ ],
7462
+ "userAgents": [
7463
+ "Terracotta",
7464
+ "Terracotta-News"
7465
+ ]
7466
+ },
7303
7467
  {
7304
7468
  "slug": "thousand-eyes",
7305
7469
  "name": "Thousand Eyes Cloud Agent",
@@ -7493,6 +7657,22 @@
7493
7657
  "Mozilla/5.0 (compatible; Uptime/1.0; http://uptime.com)"
7494
7658
  ]
7495
7659
  },
7660
+ {
7661
+ "slug": "uptime-monitoring",
7662
+ "name": "Uptime Monitoring",
7663
+ "kind": "BOT",
7664
+ "operator": "GoDaddy",
7665
+ "operatorUrl": "https://docs.sucuri.net/website-monitoring/understanding-alerts/uptime-monitor-alerts/",
7666
+ "category": "MONITORING_AND_ANALYTICS",
7667
+ "description": "Uptime monitoring is a service that checks if a website is online. It will send you an alert if your website is “down”.",
7668
+ "followsRobotsTxt": false,
7669
+ "userAgentPatterns": [
7670
+ "UptimeMonitoring"
7671
+ ],
7672
+ "userAgents": [
7673
+ "UptimeMonitoring"
7674
+ ]
7675
+ },
7496
7676
  {
7497
7677
  "slug": "uptimebot",
7498
7678
  "name": "UptimeBot",
@@ -7525,23 +7705,6 @@
7525
7705
  "Mozilla/5.0+(compatible; UptimeRobot/2.0; http://www.uptimerobot.com/)"
7526
7706
  ]
7527
7707
  },
7528
- {
7529
- "slug": "uptimestatistics",
7530
- "name": "uptimedoctor",
7531
- "kind": "BOT",
7532
- "operator": "uptimedoctor",
7533
- "operatorUrl": "http://uptimestatistics.com",
7534
- "category": "MONITORING_AND_ANALYTICS",
7535
- "description": "UptimeDoctor is a website uptime monitoring service. ",
7536
- "followsRobotsTxt": false,
7537
- "userAgentPatterns": [
7538
- "www.uptimedoctor.com"
7539
- ],
7540
- "userAgents": [
7541
- "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/64.0.3282.140 Safari/537.36 Edge/17.17134 www.uptimedoctor.com (username slowmail)",
7542
- "Mozilla/4.0 (compatible; MSIE 6.0; www.hyperspin.com username mis.admin)"
7543
- ]
7544
- },
7545
7708
  {
7546
7709
  "slug": "uptimia",
7547
7710
  "name": "Uptimia",
@@ -7606,6 +7769,18 @@
7606
7769
  "Mozilla/5.0 (compatible; videootvBot; +https://www.videoo.tv)"
7607
7770
  ]
7608
7771
  },
7772
+ {
7773
+ "slug": "visually-io-shopify-editor",
7774
+ "name": "Visually.io Shopify Editor",
7775
+ "kind": "AGENT",
7776
+ "operator": null,
7777
+ "operatorUrl": "https://help.visually.io/visually.io-editor-cloudflare-signed-agent",
7778
+ "category": "AI_ASSISTANT",
7779
+ "description": "Shopify theme editor alternative for live, real-time store editing via a secure iframe and controlled proxy.",
7780
+ "followsRobotsTxt": false,
7781
+ "userAgentPatterns": [],
7782
+ "userAgents": []
7783
+ },
7609
7784
  {
7610
7785
  "slug": "w3-validator-services",
7611
7786
  "name": "W3 Validator Services",
@@ -7719,6 +7894,22 @@
7719
7894
  "websitepulse checker/3.0 (compatible; MSIE 5.5; Netscape 4.75; Linux)"
7720
7895
  ]
7721
7896
  },
7897
+ {
7898
+ "slug": "webstatus247",
7899
+ "name": "Webstatus247",
7900
+ "kind": "BOT",
7901
+ "operator": null,
7902
+ "operatorUrl": "https://www.webstatus247.com/bot-information",
7903
+ "category": "MONITORING_AND_ANALYTICS",
7904
+ "description": "WebStatus247 is an intelligent website monitoring bot that continuously checks the availability and uptime",
7905
+ "followsRobotsTxt": false,
7906
+ "userAgentPatterns": [
7907
+ "Webstatus247"
7908
+ ],
7909
+ "userAgents": [
7910
+ "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/127.0.0.0 Safari/537.36 Webstatus247/1.0"
7911
+ ]
7912
+ },
7722
7913
  {
7723
7914
  "slug": "webtotem",
7724
7915
  "name": "WebTotemBot",
@@ -8016,7 +8207,7 @@
8016
8207
  "operator": "Yahoo",
8017
8208
  "operatorUrl": "https://www.yahoo-help.jp",
8018
8209
  "category": "SEARCH_ENGINE_OPTIMIZATION",
8019
- "description": "SEO crawler for Yahoo Japan.",
8210
+ "description": "Yahoo Japan search engine crawler for SEO analysis",
8020
8211
  "followsRobotsTxt": false,
8021
8212
  "userAgentPatterns": [
8022
8213
  "J-BRW",
@@ -8170,6 +8361,22 @@
8170
8361
  "Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) HeadlessChrome/87.0.4280.88 YextBot/Java Safari/537.36"
8171
8362
  ]
8172
8363
  },
8364
+ {
8365
+ "slug": "ygs-group-falconer-scraper",
8366
+ "name": "YGS Group Falconer Scraper",
8367
+ "kind": "BOT",
8368
+ "operator": null,
8369
+ "operatorUrl": "https://ygscontentlicensing.com/falconer/",
8370
+ "category": "AI_CRAWLER",
8371
+ "description": "A content based scraper only for partners we collaborate with who have given permission to have their website scraped.",
8372
+ "followsRobotsTxt": false,
8373
+ "userAgentPatterns": [
8374
+ "ygs-scraper-bot"
8375
+ ],
8376
+ "userAgents": [
8377
+ "ygs-scraper-bot/1.0"
8378
+ ]
8379
+ },
8173
8380
  {
8174
8381
  "slug": "yokoy-group",
8175
8382
  "name": "Yokoy Group Webhooks",