crawler-user-agents 1.0.113 → 1.0.115
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/crawler-user-agents.json +297 -0
- package/package.json +1 -1
package/crawler-user-agents.json
CHANGED
|
@@ -4925,5 +4925,302 @@
|
|
|
4925
4925
|
"Mozilla/5.0 AppleWebKit/537.36 (KHTML, like Gecko; compatible; Nicecrawler/1.1; +http://www.nicecrawler.com/) Chrome/90.0.4430.97 Safari/537.36"
|
|
4926
4926
|
],
|
|
4927
4927
|
"url": "http://www.nicecrawler.com/"
|
|
4928
|
+
},
|
|
4929
|
+
{
|
|
4930
|
+
"pattern": "Neevabot",
|
|
4931
|
+
"addition_date": "2023/09/08",
|
|
4932
|
+
"instances": [
|
|
4933
|
+
"Mozilla/5.0 (compatible; Neevabot/1.0; +https://neeva.com/neevabot)"
|
|
4934
|
+
],
|
|
4935
|
+
"url": "https://neeva.com/neevabot"
|
|
4936
|
+
},
|
|
4937
|
+
{
|
|
4938
|
+
"pattern": "BrightEdge Crawler",
|
|
4939
|
+
"addition_date": "2023/09/08",
|
|
4940
|
+
"instances": [
|
|
4941
|
+
"BrightEdge Crawler/1.0 (crawler@brightedge.com)"
|
|
4942
|
+
],
|
|
4943
|
+
"url": "https://www.brightedge.com/"
|
|
4944
|
+
},
|
|
4945
|
+
{
|
|
4946
|
+
"pattern": "SiteCheckerBotCrawler",
|
|
4947
|
+
"addition_date": "2023/09/08",
|
|
4948
|
+
"instances": [
|
|
4949
|
+
"SiteCheckerBotCrawler/1.0 (+http://sitechecker.pro)"
|
|
4950
|
+
],
|
|
4951
|
+
"url": "http://sitechecker.pro"
|
|
4952
|
+
},
|
|
4953
|
+
{
|
|
4954
|
+
"pattern": "TombaPublicWebCrawler",
|
|
4955
|
+
"addition_date": "2023/09/08",
|
|
4956
|
+
"instances": [
|
|
4957
|
+
"Mozilla/5.0 (compatible; TombaPublicWebCrawler/1.0; +https://tombascraper.com)"
|
|
4958
|
+
],
|
|
4959
|
+
"url": "https://tombascraper.com"
|
|
4960
|
+
},
|
|
4961
|
+
{
|
|
4962
|
+
"pattern": "CrawlyProjectCrawler",
|
|
4963
|
+
"addition_date": "2023/09/08",
|
|
4964
|
+
"instances": [
|
|
4965
|
+
"Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/115.0.0.0 Safari/537.36 (compatible; CrawlyProjectCrawler/0.1.3; crawlyproject@digitaldragon.dev +https://crawlyproject.digitaldragon.dev/)"
|
|
4966
|
+
],
|
|
4967
|
+
"url": "https://crawlyproject.digitaldragon.dev/"
|
|
4968
|
+
},
|
|
4969
|
+
{
|
|
4970
|
+
"pattern": "KomodiaBot",
|
|
4971
|
+
"addition_date": "2023/09/08",
|
|
4972
|
+
"instances": [
|
|
4973
|
+
"Mozilla/5.0 (Windows NT 6.1; Win64; x64; +http://www.komodia.com/newwiki/index.php/URL_server_crawler) KomodiaBot/1.0"
|
|
4974
|
+
],
|
|
4975
|
+
"url": "http://www.komodia.com/newwiki/index.php/URL_server_crawler"
|
|
4976
|
+
},
|
|
4977
|
+
{
|
|
4978
|
+
"pattern": "KStandBot",
|
|
4979
|
+
"addition_date": "2023/09/08",
|
|
4980
|
+
"instances": [
|
|
4981
|
+
"Mozilla/5.0 (Windows NT 6.1; Win64; x64; +http://url-classification.io/wiki/index.php?title=URL_server_crawler) KStandBot/1.0"
|
|
4982
|
+
],
|
|
4983
|
+
"url": "http://url-classification.io"
|
|
4984
|
+
},
|
|
4985
|
+
{
|
|
4986
|
+
"pattern": "CISPA Webcrawler",
|
|
4987
|
+
"addition_date": "2023/09/08",
|
|
4988
|
+
"instances": [
|
|
4989
|
+
"CISPA Webcrawler (https://vuln-notify-checker.cispa.saarland)"
|
|
4990
|
+
],
|
|
4991
|
+
"url": "https://vuln-notify-checker.cispa.saarland"
|
|
4992
|
+
},
|
|
4993
|
+
{
|
|
4994
|
+
"pattern": "MTRobot",
|
|
4995
|
+
"addition_date": "2023/09/08",
|
|
4996
|
+
"instances": [
|
|
4997
|
+
"MTRobot/0.2 (Metrics Tools Analytics Crawler; https://metrics-tools.de/robot.html; crawler@metrics-tools.de)"
|
|
4998
|
+
],
|
|
4999
|
+
"url": "https://metrics-tools.de/robot.html"
|
|
5000
|
+
},
|
|
5001
|
+
{
|
|
5002
|
+
"pattern": "hyscore.io",
|
|
5003
|
+
"addition_date": "2023/09/08",
|
|
5004
|
+
"instances": [
|
|
5005
|
+
"Mozilla/5.0 (iPhone; CPU iPhone OS 8_3 like Mac OS X) AppleWebKit/600.1.4 (KHTML, like Gecko) Version/8.0 Mobile/12F70 Safari/600.1. 4 (compatible; HyScore/1.0; +https://hyscore.io/crawler/)"
|
|
5006
|
+
],
|
|
5007
|
+
"url": "https://hyscore.io/crawler/"
|
|
5008
|
+
},
|
|
5009
|
+
{
|
|
5010
|
+
"pattern": "AlexandriaOrgBot",
|
|
5011
|
+
"addition_date": "2023/09/08",
|
|
5012
|
+
"instances": [
|
|
5013
|
+
"Mozilla/5.0 (Linux) (compatible; AlexandriaOrgBot/1.0; +https://www.alexandria.org/bot.html)"
|
|
5014
|
+
],
|
|
5015
|
+
"url": "https://www.alexandria.org/bot.html"
|
|
5016
|
+
},
|
|
5017
|
+
{
|
|
5018
|
+
"pattern": "2ip bot",
|
|
5019
|
+
"addition_date": "2023/09/08",
|
|
5020
|
+
"instances": [
|
|
5021
|
+
"2ip bot/1.1 (+http://2ip.io)"
|
|
5022
|
+
],
|
|
5023
|
+
"url": "http://2ip.io"
|
|
5024
|
+
},
|
|
5025
|
+
{
|
|
5026
|
+
"pattern": "Yellowbrandprotectionbot",
|
|
5027
|
+
"addition_date": "2023/09/08",
|
|
5028
|
+
"instances": [
|
|
5029
|
+
"Mozilla/5.0 (compatible; Yellowbrandprotectionbot/1.0; +https://www.yellowbp.com/bot.html)"
|
|
5030
|
+
],
|
|
5031
|
+
"url": "https://www.yellowbp.com/bot.html"
|
|
5032
|
+
},
|
|
5033
|
+
{
|
|
5034
|
+
"pattern": "SEOlizer",
|
|
5035
|
+
"addition_date": "2023/09/08",
|
|
5036
|
+
"instances": [
|
|
5037
|
+
"SEOlizer/1.1 (Windows; U; Windows NT 5.1; en-US; rv:1.8.1.13) Gecko/20080311 Firefox/2.0.0.13 (+https://www.seolizer.de/bot.html)"
|
|
5038
|
+
],
|
|
5039
|
+
"url": "https://www.seolizer.de/bot.html"
|
|
5040
|
+
},
|
|
5041
|
+
{
|
|
5042
|
+
"pattern": "vuhuvBot",
|
|
5043
|
+
"addition_date": "2023/09/08",
|
|
5044
|
+
"instances": [
|
|
5045
|
+
"Mozilla/5.0 (compatible; vuhuvBot/1.0; +http://vuhuv.com/bot.html)"
|
|
5046
|
+
],
|
|
5047
|
+
"url": "http://vuhuv.com/bot.html"
|
|
5048
|
+
},
|
|
5049
|
+
{
|
|
5050
|
+
"pattern": "INETDEX-BOT",
|
|
5051
|
+
"addition_date": "2023/09/08",
|
|
5052
|
+
"instances": [
|
|
5053
|
+
"INETDEX-BOT/1.5 (Mozilla/5.0; https://inetdex.com/bot.html)"
|
|
5054
|
+
],
|
|
5055
|
+
"url": "https://inetdex.com/bot.html"
|
|
5056
|
+
},
|
|
5057
|
+
{
|
|
5058
|
+
"pattern": "Synapse",
|
|
5059
|
+
"addition_date": "2023/09/08",
|
|
5060
|
+
"instances": [
|
|
5061
|
+
"Synapse (bot; +https://github.com/matrix-org/synapse)"
|
|
5062
|
+
],
|
|
5063
|
+
"url": "https://github.com/matrix-org/synapse"
|
|
5064
|
+
},
|
|
5065
|
+
{
|
|
5066
|
+
"pattern": "t3versionsBot",
|
|
5067
|
+
"addition_date": "2023/09/08",
|
|
5068
|
+
"instances": [
|
|
5069
|
+
"Mozilla/5.0 (compatible; t3versionsBot/1.0; +https://www.t3versions.com/bot)"
|
|
5070
|
+
],
|
|
5071
|
+
"url": "https://www.t3versions.com/bot"
|
|
5072
|
+
},
|
|
5073
|
+
{
|
|
5074
|
+
"pattern": "deepnoc",
|
|
5075
|
+
"addition_date": "2023/09/08",
|
|
5076
|
+
"instances": [
|
|
5077
|
+
"deepnoc - https://deepnoc.com/bot"
|
|
5078
|
+
],
|
|
5079
|
+
"url": "https://deepnoc.com/bot"
|
|
5080
|
+
},
|
|
5081
|
+
{
|
|
5082
|
+
"pattern": "Cocolyzebot",
|
|
5083
|
+
"addition_date": "2023/09/08",
|
|
5084
|
+
"instances": [
|
|
5085
|
+
"Mozilla/5.0 (compatible; Cocolyzebot/1.0; https://cocolyze.com/bot)"
|
|
5086
|
+
],
|
|
5087
|
+
"url": "https://cocolyze.com/bot"
|
|
5088
|
+
},
|
|
5089
|
+
{
|
|
5090
|
+
"pattern": "hypestat",
|
|
5091
|
+
"addition_date": "2023/09/08",
|
|
5092
|
+
"instances": [
|
|
5093
|
+
"Mozilla/5.0 (compatible; hypestat/1.0; +https://hypestat.com/bot)"
|
|
5094
|
+
],
|
|
5095
|
+
"url": "https://hypestat.com/bot"
|
|
5096
|
+
},
|
|
5097
|
+
{
|
|
5098
|
+
"pattern": "ReverseEngineeringBot",
|
|
5099
|
+
"addition_date": "2023/09/08",
|
|
5100
|
+
"instances": [
|
|
5101
|
+
"Mozilla/5.0 (compatible; ReverseEngineeringBot/0.1; +https://torus.company/bot.html)"
|
|
5102
|
+
],
|
|
5103
|
+
"url": "https://torus.company/bot.html"
|
|
5104
|
+
},
|
|
5105
|
+
{
|
|
5106
|
+
"pattern": "sempi.tech",
|
|
5107
|
+
"addition_date": "2023/09/08",
|
|
5108
|
+
"instances": [
|
|
5109
|
+
"Mozilla/5.0 (compatible; Semanticbot/1.0; +http://sempi.tech/bot.html)"
|
|
5110
|
+
],
|
|
5111
|
+
"url": "http://sempi.tech/bot.html"
|
|
5112
|
+
},
|
|
5113
|
+
{
|
|
5114
|
+
"pattern": "Iframely",
|
|
5115
|
+
"addition_date": "2023/09/08",
|
|
5116
|
+
"instances": [
|
|
5117
|
+
"Iframely/1.3.1 (+https://iframely.com/docs/about) Atlassian"
|
|
5118
|
+
],
|
|
5119
|
+
"url": "https://iframely.com/docs/about"
|
|
5120
|
+
},
|
|
5121
|
+
{
|
|
5122
|
+
"pattern": "MetaInspector",
|
|
5123
|
+
"addition_date": "2023/09/08",
|
|
5124
|
+
"instances": [
|
|
5125
|
+
"MetaInspector/5.6.0 (+https://github.com/jaimeiniesta/metainspector)"
|
|
5126
|
+
],
|
|
5127
|
+
"url": "https://github.com/jaimeiniesta/metainspector"
|
|
5128
|
+
},
|
|
5129
|
+
{
|
|
5130
|
+
"pattern": "node-fetch",
|
|
5131
|
+
"addition_date": "2023/09/08",
|
|
5132
|
+
"instances": [
|
|
5133
|
+
"node-fetch/1.0 (+https://github.com/bitinn/node-fetch)"
|
|
5134
|
+
],
|
|
5135
|
+
"url": "https://github.com/bitinn/node-fetch"
|
|
5136
|
+
},
|
|
5137
|
+
{
|
|
5138
|
+
"pattern": "lkxscan",
|
|
5139
|
+
"addition_date": "2023/09/08",
|
|
5140
|
+
"instances": [
|
|
5141
|
+
"lkxscan/v0.1.0 (+https://leakix.net) l9explore/v1.0.0 (+https://github.com/LeakIX/l9explore)"
|
|
5142
|
+
],
|
|
5143
|
+
"url": "https://github.com/LeakIX/l9explore"
|
|
5144
|
+
},
|
|
5145
|
+
{
|
|
5146
|
+
"pattern": "python-opengraph",
|
|
5147
|
+
"addition_date": "2023/09/08",
|
|
5148
|
+
"instances": [
|
|
5149
|
+
"python-opengraph-jaywink/0.2.0 (+https://github.com/jaywink/python-opengraph)"
|
|
5150
|
+
],
|
|
5151
|
+
"url": "https://github.com/jaywink/python-opengraph"
|
|
5152
|
+
},
|
|
5153
|
+
{
|
|
5154
|
+
"pattern": "OpenGraphCheck",
|
|
5155
|
+
"addition_date": "2023/09/08",
|
|
5156
|
+
"instances": [
|
|
5157
|
+
"OpenGraphCheck/2.1 (+https://opengraphcheck.com)"
|
|
5158
|
+
],
|
|
5159
|
+
"url": "https://opengraphcheck.com"
|
|
5160
|
+
},
|
|
5161
|
+
{
|
|
5162
|
+
"pattern": "developers.google.com\\/\\+\\/web\\/snippet",
|
|
5163
|
+
"addition_date": "2023/09/08",
|
|
5164
|
+
"instances": [
|
|
5165
|
+
"Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/56.0.2924.87 Safari/537.36 Google-PageRenderer Google (+https://developers.google.com/+/web/snippet/)",
|
|
5166
|
+
"Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/56.0.2924.87 Safari/537.36 Google (+https://developers.google.com/+/web/snippet/"
|
|
5167
|
+
],
|
|
5168
|
+
"url": "https://developers.google.com/+/web/snippet"
|
|
5169
|
+
},
|
|
5170
|
+
{
|
|
5171
|
+
"pattern": "SenutoBot",
|
|
5172
|
+
"addition_date": "2023/09/08",
|
|
5173
|
+
"instances": [
|
|
5174
|
+
"SenutoBot/1.0 (compatible; SenutoBot/1.0; +https://www.senuto.com/)"
|
|
5175
|
+
],
|
|
5176
|
+
"url": "https://www.senuto.com"
|
|
5177
|
+
},
|
|
5178
|
+
{
|
|
5179
|
+
"pattern": "MaCoCu",
|
|
5180
|
+
"addition_date": "2023/09/08",
|
|
5181
|
+
"instances": [
|
|
5182
|
+
"Mozilla/5.0 (compatible; MaCoCu; +https://www.clarin.si/info/macocu-massive-collection-and-curation-of-monolingual-and-bilingual-data/)"
|
|
5183
|
+
],
|
|
5184
|
+
"url": "https://www.clarin.si/info/macocu-massive-collection-and-curation-of-monolingual-and-bilingual-data"
|
|
5185
|
+
},
|
|
5186
|
+
{
|
|
5187
|
+
"pattern": "NewsBlur",
|
|
5188
|
+
"addition_date": "2023/09/08",
|
|
5189
|
+
"instances": [
|
|
5190
|
+
"NewsBlur Feed Fetcher - 1 subscriber - http://www.newsblur.com/site/0000000/webpage (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/605.1.15 (KHTML, like Gecko) Version/14.0.1 Safari/605.1.15)"
|
|
5191
|
+
],
|
|
5192
|
+
"url": "http://www.newsblur.com"
|
|
5193
|
+
},
|
|
5194
|
+
{
|
|
5195
|
+
"pattern": "inoreader",
|
|
5196
|
+
"addition_date": "2023/09/08",
|
|
5197
|
+
"instances": [
|
|
5198
|
+
"Mozilla/5.0 (compatible; inoreader.com; 1 subscribers)"
|
|
5199
|
+
],
|
|
5200
|
+
"url": "http://inoreader.com"
|
|
5201
|
+
},
|
|
5202
|
+
{
|
|
5203
|
+
"pattern": "NetSystemsResearch",
|
|
5204
|
+
"addition_date": "2023/09/08",
|
|
5205
|
+
"instances": [
|
|
5206
|
+
"NetSystemsResearch studies the availability of various services across the internet. Our website is netsystemsresearch.com"
|
|
5207
|
+
],
|
|
5208
|
+
"url": "http://netsystemsresearch.com"
|
|
5209
|
+
},
|
|
5210
|
+
{
|
|
5211
|
+
"pattern": "PageThing",
|
|
5212
|
+
"addition_date": "2023/09/08",
|
|
5213
|
+
"instances": [
|
|
5214
|
+
"PageThing http://pagething.com curl www"
|
|
5215
|
+
],
|
|
5216
|
+
"url": "http://pagething.com"
|
|
5217
|
+
},
|
|
5218
|
+
{
|
|
5219
|
+
"pattern": "WordPress\\/",
|
|
5220
|
+
"addition_date": "2023/10/24",
|
|
5221
|
+
"instances": [
|
|
5222
|
+
"WordPress/X.X.X; https://example.com"
|
|
5223
|
+
],
|
|
5224
|
+
"url": "https://wordpress.org"
|
|
4928
5225
|
}
|
|
4929
5226
|
]
|