crawler-user-agents 1.0.145 → 1.0.147

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -22,37 +22,32 @@
22
22
  "Nokia6820/2.0 (4.83) Profile/MIDP-1.0 Configuration/CLDC-1.0 (compatible; Googlebot-Mobile/2.1; +http://www.google.com/bot.html)",
23
23
  "SAMSUNG-SGH-E250/1.0 Profile/MIDP-2.0 Configuration/CLDC-1.1 UP.Browser/6.2.3.3.c.1.101 (GUI) MMP/2.0 (compatible; Googlebot-Mobile/2.1; +http://www.google.com/bot.html)"
24
24
  ]
25
- }
26
- ,
25
+ },
27
26
  {
28
27
  "pattern": "Googlebot-Image",
29
28
  "instances": [
30
29
  "Googlebot-Image/1.0"
31
30
  ]
32
- }
33
- ,
31
+ },
34
32
  {
35
33
  "pattern": "Googlebot-News",
36
34
  "instances": [
37
35
  "Googlebot-News"
38
36
  ]
39
- }
40
- ,
37
+ },
41
38
  {
42
39
  "pattern": "Googlebot-Video",
43
40
  "instances": [
44
41
  "Googlebot-Video/1.0"
45
42
  ]
46
- }
47
- ,
43
+ },
48
44
  {
49
45
  "pattern": "AdsBot-Google([^-]|$)",
50
46
  "url": "https://support.google.com/webmasters/answer/1061943?hl=en",
51
47
  "instances": [
52
48
  "AdsBot-Google (+http://www.google.com/adsbot.html)"
53
49
  ]
54
- }
55
- ,
50
+ },
56
51
  {
57
52
  "pattern": "AdsBot-Google-Mobile",
58
53
  "addition_date": "2017/08/21",
@@ -62,8 +57,7 @@
62
57
  "Mozilla/5.0 (Linux; Android 5.0; SM-G920A) AppleWebKit (KHTML, like Gecko) Chrome Mobile Safari (compatible; AdsBot-Google-Mobile; +http://www.google.com/mobile/adsbot.html)",
63
58
  "Mozilla/5.0 (iPhone; CPU iPhone OS 9_1 like Mac OS X) AppleWebKit/601.1.46 (KHTML, like Gecko) Version/9.0 Mobile/13B143 Safari/601.1 (compatible; AdsBot-Google-Mobile; +http://www.google.com/mobile/adsbot.html)"
64
59
  ]
65
- }
66
- ,
60
+ },
67
61
  {
68
62
  "pattern": "Feedfetcher-Google",
69
63
  "addition_date": "2018/06/27",
@@ -71,8 +65,7 @@
71
65
  "instances": [
72
66
  "Feedfetcher-Google; (+http://www.google.com/feedfetcher.html; 1 subscribers; feed-id=728742641706423)"
73
67
  ]
74
- }
75
- ,
68
+ },
76
69
  {
77
70
  "pattern": "Mediapartners-Google",
78
71
  "url": "https://support.google.com/webmasters/answer/1061943?hl=en",
@@ -82,15 +75,13 @@
82
75
  "Mozilla/5.0 (iPhone; U; CPU iPhone OS 10_0 like Mac OS X; en-us) AppleWebKit/602.1.38 (KHTML, like Gecko) Version/10.0 Mobile/14A5297c Safari/602.1 (compatible; Mediapartners-Google/2.1; +http://www.google.com/bot.html)",
83
76
  "Mozilla/5.0 (iPhone; U; CPU iPhone OS 4_1 like Mac OS X; en-us) AppleWebKit/532.9 (KHTML, like Gecko) Version/4.0.5 Mobile/8B117 Safari/6531.22.7 (compatible; Mediapartners-Google/2.1; +http://www.google.com/bot.html)"
84
77
  ]
85
- }
86
- ,
78
+ },
87
79
  {
88
80
  "pattern": "Mediapartners \\(Googlebot\\)",
89
81
  "addition_date": "2017/08/08",
90
82
  "url": "https://support.google.com/webmasters/answer/1061943?hl=en",
91
83
  "instances": []
92
- }
93
- ,
84
+ },
94
85
  {
95
86
  "pattern": "APIs-Google",
96
87
  "addition_date": "2017/08/08",
@@ -98,8 +89,7 @@
98
89
  "instances": [
99
90
  "APIs-Google (+https://developers.google.com/webmasters/APIs-Google.html)"
100
91
  ]
101
- }
102
- ,
92
+ },
103
93
  {
104
94
  "pattern": "Google-InspectionTool",
105
95
  "url": "https://developers.google.com/search/docs/crawling-indexing/overview-google-crawlers",
@@ -107,8 +97,7 @@
107
97
  "Mozilla/5.0 (Linux; Android 6.0.1; Nexus 5X Build/MMB29P) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/W.X.Y.Z Mobile Safari/537.36 (compatible; Google-InspectionTool/1.0)",
108
98
  "Mozilla/5.0 (compatible; Google-InspectionTool/1.0)"
109
99
  ]
110
- }
111
- ,
100
+ },
112
101
  {
113
102
  "pattern": "Storebot-Google",
114
103
  "url": "https://developers.google.com/search/docs/crawling-indexing/overview-google-crawlers",
@@ -116,16 +105,14 @@
116
105
  "Mozilla/5.0 (X11; Linux x86_64; Storebot-Google/1.0) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/79.0.3945.88 Safari/537.36",
117
106
  "Mozilla/5.0 (Linux; Android 8.0; Pixel 2 Build/OPD3.170816.012; Storebot-Google/1.0) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/81.0.4044.138 Mobile Safari/537.36"
118
107
  ]
119
- }
120
- ,
108
+ },
121
109
  {
122
110
  "pattern": "GoogleOther",
123
111
  "url": "https://developers.google.com/search/docs/crawling-indexing/overview-google-crawlers",
124
112
  "instances": [
125
113
  "GoogleOther"
126
114
  ]
127
- }
128
- ,
115
+ },
129
116
  {
130
117
  "pattern": "bingbot",
131
118
  "url": "http://www.bing.com/bingbot.htm",
@@ -145,8 +132,7 @@
145
132
  "Mozilla/5.0 AppleWebKit/537.36 (KHTML, like Gecko; compatible; bingbot/2.0; +http://www.bing.com/bingbot.htm) Safari/537.36",
146
133
  "Mozilla/5.0 AppleWebKit/537.36 (KHTML, like Gecko; compatible; bingbot/2.0; +http://www.bing.com/bingbot.htm) Chrome/103.0.5060.134 Safari/537.36"
147
134
  ]
148
- }
149
- ,
135
+ },
150
136
  {
151
137
  "pattern": "Slurp",
152
138
  "url": "http://help.yahoo.com/help/us/ysearch/slurp",
@@ -155,8 +141,7 @@
155
141
  "Mozilla/5.0 (compatible; Yahoo! Slurp; http://help.yahoo.com/help/us/ysearch/slurp)",
156
142
  "Mozilla/5.0 (compatible; Yahoo! Slurp China; http://misc.yahoo.com.cn/help.html)"
157
143
  ]
158
- }
159
- ,
144
+ },
160
145
  {
161
146
  "pattern": "[wW]get",
162
147
  "instances": [
@@ -164,8 +149,7 @@
164
149
  "Wget/1.14 (linux-gnu)",
165
150
  "Wget/1.20.3 (linux-gnu)"
166
151
  ]
167
- }
168
- ,
152
+ },
169
153
  {
170
154
  "pattern": "LinkedInBot",
171
155
  "instances": [
@@ -173,8 +157,7 @@
173
157
  "LinkedInBot/1.0 (compatible; Mozilla/5.0; Jakarta Commons-HttpClient/4.3 +http://www.linkedin.com)",
174
158
  "LinkedInBot/1.0 (compatible; Mozilla/5.0; Apache-HttpClient +http://www.linkedin.com)"
175
159
  ]
176
- }
177
- ,
160
+ },
178
161
  {
179
162
  "pattern": "Python-urllib",
180
163
  "instances": [
@@ -189,9 +172,8 @@
189
172
  "Python-urllib/3.5",
190
173
  "Python-urllib/3.6",
191
174
  "Python-urllib/3.7"
192
- ]
193
- }
194
- ,
175
+ ]
176
+ },
195
177
  {
196
178
  "pattern": "python-requests",
197
179
  "addition_date": "2018/05/27",
@@ -204,8 +186,7 @@
204
186
  "python-requests/2.21.0",
205
187
  "python-requests/2.22.0"
206
188
  ]
207
- }
208
- ,
189
+ },
209
190
  {
210
191
  "pattern": "aiohttp",
211
192
  "addition_date": "2019/12/23",
@@ -215,19 +196,16 @@
215
196
  "Python/3.7 aiohttp/3.6.2a2"
216
197
  ],
217
198
  "url": "https://docs.aiohttp.org/en/stable/"
218
- }
219
- ,
199
+ },
220
200
  {
221
201
  "pattern": "httpx",
222
202
  "addition_date": "2019/12/23",
223
203
  "instances": [
224
204
  "python-httpx/0.16.1",
225
205
  "python-httpx/0.13.0.dev1"
226
-
227
206
  ],
228
207
  "url": "https://www.python-httpx.org"
229
- }
230
- ,
208
+ },
231
209
  {
232
210
  "pattern": "libwww-perl",
233
211
  "instances": [
@@ -235,15 +213,13 @@
235
213
  "2Bone_LinkChkr/1.0 libwww-perl/6.03",
236
214
  "amibot - http://www.amidalla.de - tech@amidalla.com libwww-perl/5.831"
237
215
  ]
238
- }
239
- ,
216
+ },
240
217
  {
241
218
  "pattern": "httpunit",
242
219
  "instances": [
243
220
  "httpunit/1.x"
244
221
  ]
245
- }
246
- ,
222
+ },
247
223
  {
248
224
  "pattern": "Nutch",
249
225
  "instances": [
@@ -251,8 +227,7 @@
251
227
  "NutchCVS/0.7.1 (Nutch; http://lucene.apache.org/nutch/bot.html; nutch-agent@lucene.apache.org)",
252
228
  "istellabot-nutch/Nutch-1.10"
253
229
  ]
254
- }
255
- ,
230
+ },
256
231
  {
257
232
  "pattern": "Go-http-client",
258
233
  "addition_date": "2016/03/26",
@@ -261,8 +236,7 @@
261
236
  "Go-http-client/1.1",
262
237
  "Go-http-client/2.0"
263
238
  ]
264
- }
265
- ,
239
+ },
266
240
  {
267
241
  "pattern": "phpcrawl",
268
242
  "addition_date": "2012/09/17",
@@ -270,8 +244,7 @@
270
244
  "instances": [
271
245
  "phpcrawl"
272
246
  ]
273
- }
274
- ,
247
+ },
275
248
  {
276
249
  "pattern": "msnbot",
277
250
  "url": "http://search.msn.com/msnbot.htm",
@@ -291,13 +264,11 @@
291
264
  "msnbot/2.0b (+http://search.msn.com/msnbot.htm).",
292
265
  "msnbot/2.0b (+http://search.msn.com/msnbot.htm)._"
293
266
  ]
294
- }
295
- ,
267
+ },
296
268
  {
297
269
  "pattern": "jyxobot",
298
270
  "instances": []
299
- }
300
- ,
271
+ },
301
272
  {
302
273
  "pattern": "FAST-WebCrawler",
303
274
  "instances": [
@@ -306,23 +277,20 @@
306
277
  "FAST-WebCrawler/3.7/FirstPage (atw-crawler at fast dot no;http://fast.no/support/crawler.asp)",
307
278
  "FAST-WebCrawler/3.8"
308
279
  ]
309
- }
310
- ,
280
+ },
311
281
  {
312
282
  "pattern": "FAST Enterprise Crawler",
313
283
  "instances": [
314
284
  "FAST Enterprise Crawler 6 / Scirus scirus-crawler@fast.no; http://www.scirus.com/srsapp/contactus/",
315
285
  "FAST Enterprise Crawler 6 used by Schibsted (webcrawl@schibstedsok.no)"
316
286
  ]
317
- }
318
- ,
287
+ },
319
288
  {
320
289
  "pattern": "BIGLOTRON",
321
290
  "instances": [
322
291
  "BIGLOTRON (Beta 2;GNU/Linux)"
323
292
  ]
324
- }
325
- ,
293
+ },
326
294
  {
327
295
  "pattern": "Teoma",
328
296
  "instances": [
@@ -330,24 +298,21 @@
330
298
  "Mozilla/2.0 (compatible; Ask Jeeves/Teoma; +http://about.ask.com/en/docs/about/webmasters.shtml)"
331
299
  ],
332
300
  "url": "http://about.ask.com/en/docs/about/webmasters.shtml"
333
- }
334
- ,
301
+ },
335
302
  {
336
303
  "pattern": "convera",
337
304
  "instances": [
338
305
  "ConveraCrawler/0.9e (+http://ews.converasearch.com/crawl.htm)"
339
306
  ],
340
307
  "url": "http://ews.converasearch.com/crawl.htm"
341
- }
342
- ,
308
+ },
343
309
  {
344
310
  "pattern": "seekbot",
345
311
  "instances": [
346
312
  "Seekbot/1.0 (http://www.seekbot.net/bot.html) RobotsTxtFetcher/1.2"
347
313
  ],
348
314
  "url": "http://www.seekbot.net/bot.html"
349
- }
350
- ,
315
+ },
351
316
  {
352
317
  "pattern": "Gigabot",
353
318
  "instances": [
@@ -355,16 +320,14 @@
355
320
  "Gigabot/2.0 (http://www.gigablast.com/spider.html)"
356
321
  ],
357
322
  "url": "http://www.gigablast.com/spider.html"
358
- }
359
- ,
323
+ },
360
324
  {
361
325
  "pattern": "Gigablast",
362
326
  "instances": [
363
327
  "GigablastOpenSource/1.0"
364
328
  ],
365
329
  "url": "https://github.com/gigablast/open-source-search-engine"
366
- }
367
- ,
330
+ },
368
331
  {
369
332
  "pattern": "exabot",
370
333
  "instances": [
@@ -375,35 +338,30 @@
375
338
  "Mozilla/5.0 (compatible; Exabot/3.0; +http://www.exabot.com/go/robot)",
376
339
  "Mozilla/5.0 (compatible; Exabot/3.0; http://www.exabot.com/go/robot)"
377
340
  ]
378
- }
379
- ,
341
+ },
380
342
  {
381
343
  "pattern": "ia_archiver",
382
344
  "instances": [
383
345
  "ia_archiver (+http://www.alexa.com/site/help/webmasters; crawler@alexa.com)",
384
346
  "ia_archiver-web.archive.org"
385
347
  ]
386
- }
387
- ,
348
+ },
388
349
  {
389
350
  "pattern": "GingerCrawler",
390
351
  "instances": [
391
352
  "GingerCrawler/1.0 (Language Assistant for Dyslexics; www.gingersoftware.com/crawler_agent.htm; support at ginger software dot com)"
392
353
  ]
393
- }
394
- ,
354
+ },
395
355
  {
396
356
  "pattern": "webmon ",
397
357
  "instances": []
398
- }
399
- ,
358
+ },
400
359
  {
401
360
  "pattern": "HTTrack",
402
361
  "instances": [
403
362
  "Mozilla/4.5 (compatible; HTTrack 3.0x; Windows 98)"
404
363
  ]
405
- }
406
- ,
364
+ },
407
365
  {
408
366
  "pattern": "grub\\.org",
409
367
  "instances": [
@@ -419,23 +377,19 @@
419
377
  "Mozilla/4.0 (compatible; grub-client-1.4.3; Crawl your own stuff with http://grub.org)",
420
378
  "Mozilla/4.0 (compatible; grub-client-1.5.3; Crawl your own stuff with http://grub.org)"
421
379
  ]
422
- }
423
- ,
380
+ },
424
381
  {
425
382
  "pattern": "UsineNouvelleCrawler",
426
383
  "instances": []
427
- }
428
- ,
384
+ },
429
385
  {
430
386
  "pattern": "antibot",
431
387
  "instances": []
432
- }
433
- ,
388
+ },
434
389
  {
435
390
  "pattern": "netresearchserver",
436
391
  "instances": []
437
- }
438
- ,
392
+ },
439
393
  {
440
394
  "pattern": "speedy",
441
395
  "instances": [
@@ -445,13 +399,11 @@
445
399
  "Speedy Spider (Entireweb; Beta/1.2; http://www.entireweb.com/about/search_tech/speedyspider/)",
446
400
  "Speedy Spider (http://www.entireweb.com/about/search_tech/speedy_spider/)"
447
401
  ]
448
- }
449
- ,
402
+ },
450
403
  {
451
404
  "pattern": "fluffy",
452
405
  "instances": []
453
- }
454
- ,
406
+ },
455
407
  {
456
408
  "pattern": "findlink",
457
409
  "instances": [
@@ -479,20 +431,17 @@
479
431
  "findlinks/2.5 (+http://wortschatz.uni-leipzig.de/findlinks/)",
480
432
  "findlinks/2.6 (+http://wortschatz.uni-leipzig.de/findlinks/)"
481
433
  ]
482
- }
483
- ,
434
+ },
484
435
  {
485
436
  "pattern": "msrbot",
486
437
  "instances": []
487
- }
488
- ,
438
+ },
489
439
  {
490
440
  "pattern": "panscient",
491
441
  "instances": [
492
442
  "panscient.com"
493
443
  ]
494
- }
495
- ,
444
+ },
496
445
  {
497
446
  "pattern": "yacybot",
498
447
  "instances": [
@@ -544,13 +493,11 @@
544
493
  "yacybot (-global; amd64 Linux 5.2.9-Jinsol; java 12.0.2; Europe/en) http://yacy.net/bot.html",
545
494
  "yacybot (-global; amd64 Linux 5.2.11-Jinsol; java 12.0.2; Europe/en) http://yacy.net/bot.html"
546
495
  ]
547
- }
548
- ,
496
+ },
549
497
  {
550
498
  "pattern": "AISearchBot",
551
499
  "instances": []
552
- }
553
- ,
500
+ },
554
501
  {
555
502
  "pattern": "ips-agent",
556
503
  "instances": [
@@ -560,13 +507,11 @@
560
507
  "Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.9.2.24; ips-agent) Gecko/20111107 Ubuntu/10.04 (lucid) Firefox/3.6.24",
561
508
  "Mozilla/5.0 (X11; Ubuntu; Linux i686; rv:14.0; ips-agent) Gecko/20100101 Firefox/14.0.1"
562
509
  ]
563
- }
564
- ,
510
+ },
565
511
  {
566
512
  "pattern": "tagoobot",
567
513
  "instances": []
568
- }
569
- ,
514
+ },
570
515
  {
571
516
  "pattern": "MJ12bot",
572
517
  "instances": [
@@ -591,37 +536,32 @@
591
536
  "Mozilla/5.0 (compatible; MJ12bot/v1.4.7; http://www.majestic12.co.uk/bot.php?+)",
592
537
  "Mozilla/5.0 (compatible; MJ12bot/v1.4.8; http://mj12bot.com/)"
593
538
  ]
594
- }
595
- ,
539
+ },
596
540
  {
597
541
  "pattern": "woriobot",
598
542
  "instances": [
599
543
  "Mozilla/5.0 (compatible; woriobot +http://worio.com)",
600
544
  "Mozilla/5.0 (compatible; woriobot support [at] zite [dot] com +http://zite.com)"
601
545
  ]
602
- }
603
- ,
546
+ },
604
547
  {
605
548
  "pattern": "yanga",
606
549
  "instances": [
607
550
  "Yanga WorldSearch Bot v1.1/beta (http://www.yanga.co.uk/)"
608
551
  ]
609
- }
610
- ,
552
+ },
611
553
  {
612
554
  "pattern": "buzzbot",
613
555
  "instances": [
614
556
  "Buzzbot/1.0 (Buzzbot; http://www.buzzstream.com; buzzbot@buzzstream.com)"
615
557
  ]
616
- }
617
- ,
558
+ },
618
559
  {
619
560
  "pattern": "mlbot",
620
561
  "instances": [
621
562
  "MLBot (www.metadatalabs.com/mlbot)"
622
563
  ]
623
- }
624
- ,
564
+ },
625
565
  {
626
566
  "pattern": "yandex\\.com\\/bots",
627
567
  "url": "https://yandex.ru/support/webmaster/robot-workings/check-yandex-robots.html#robot-in-logs",
@@ -669,14 +609,12 @@
669
609
  "Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/41.0.2228.0 Safari/537.36 (compatible; YandexScreenshotBot/3.0; +http://yandex.com/bots)"
670
610
  ],
671
611
  "addition_date": "2015/04/14"
672
- }
673
- ,
612
+ },
674
613
  {
675
614
  "pattern": "purebot",
676
615
  "addition_date": "2010/01/19",
677
616
  "instances": []
678
- }
679
- ,
617
+ },
680
618
  {
681
619
  "pattern": "Linguee Bot",
682
620
  "addition_date": "2010/01/26",
@@ -685,8 +623,7 @@
685
623
  "Linguee Bot (http://www.linguee.com/bot)",
686
624
  "Linguee Bot (http://www.linguee.com/bot; bot@linguee.com)"
687
625
  ]
688
- }
689
- ,
626
+ },
690
627
  {
691
628
  "pattern": "CyberPatrol",
692
629
  "addition_date": "2010/02/11",
@@ -694,8 +631,7 @@
694
631
  "instances": [
695
632
  "CyberPatrol SiteCat Webbot (http://www.cyberpatrol.com/cyberpatrolcrawler.asp)"
696
633
  ]
697
- }
698
- ,
634
+ },
699
635
  {
700
636
  "pattern": "voilabot",
701
637
  "addition_date": "2010/05/18",
@@ -703,8 +639,7 @@
703
639
  "Mozilla/5.0 (Windows NT 5.1; U; Win64; fr; rv:1.8.1) VoilaBot BETA 1.2 (support.voilabot@orange-ftgroup.com)",
704
640
  "Mozilla/5.0 (Windows; U; Windows NT 5.1; fr; rv:1.8.1) VoilaBot BETA 1.2 (support.voilabot@orange-ftgroup.com)"
705
641
  ]
706
- }
707
- ,
642
+ },
708
643
  {
709
644
  "pattern": "Baiduspider",
710
645
  "addition_date": "2010/07/15",
@@ -713,14 +648,12 @@
713
648
  "Mozilla/5.0 (compatible; Baiduspider/2.0; +http://www.baidu.com/search/spider.html)",
714
649
  "Mozilla/5.0 (compatible; Baiduspider-render/2.0; +http://www.baidu.com/search/spider.html)"
715
650
  ]
716
- }
717
- ,
651
+ },
718
652
  {
719
653
  "pattern": "citeseerxbot",
720
654
  "addition_date": "2010/07/17",
721
655
  "instances": []
722
- }
723
- ,
656
+ },
724
657
  {
725
658
  "pattern": "spbot",
726
659
  "addition_date": "2010/07/31",
@@ -761,15 +694,13 @@
761
694
  "Mozilla/5.0 (compatible; spbot/5.0.3; +http://OpenLinkProfiler.org/bot )",
762
695
  "Mozilla/5.0 (compatible; spbot/5.0; +http://OpenLinkProfiler.org/bot )"
763
696
  ]
764
- }
765
- ,
697
+ },
766
698
  {
767
699
  "pattern": "twengabot",
768
700
  "addition_date": "2010/08/03",
769
701
  "url": "http://www.twenga.com/bot.html",
770
702
  "instances": []
771
- }
772
- ,
703
+ },
773
704
  {
774
705
  "pattern": "postrank",
775
706
  "addition_date": "2010/08/03",
@@ -778,8 +709,7 @@
778
709
  "PostRank/2.0 (postrank.com)",
779
710
  "PostRank/2.0 (postrank.com; 1 subscribers)"
780
711
  ]
781
- }
782
- ,
712
+ },
783
713
  {
784
714
  "pattern": "Turnitin",
785
715
  "addition_date": "2010/09/26",
@@ -788,15 +718,13 @@
788
718
  "TurnitinBot (https://turnitin.com/robot/crawlerinfo.html)",
789
719
  "Turnitin (https://bit.ly/2UvnfoQ)"
790
720
  ]
791
- }
792
- ,
721
+ },
793
722
  {
794
723
  "pattern": "scribdbot",
795
724
  "addition_date": "2010/09/28",
796
725
  "url": "http://www.scribd.com",
797
726
  "instances": []
798
- }
799
- ,
727
+ },
800
728
  {
801
729
  "pattern": "page2rss",
802
730
  "addition_date": "2010/10/07",
@@ -804,8 +732,7 @@
804
732
  "instances": [
805
733
  "Mozilla/5.0 (compatible; Page2RSS/0.7; +http://page2rss.com/)"
806
734
  ]
807
- }
808
- ,
735
+ },
809
736
  {
810
737
  "pattern": "sitebot",
811
738
  "addition_date": "2010/12/15",
@@ -813,8 +740,7 @@
813
740
  "instances": [
814
741
  "Mozilla/5.0 (compatible; Whoiswebsitebot/0.1; +http://www.whoiswebsite.net)"
815
742
  ]
816
- }
817
- ,
743
+ },
818
744
  {
819
745
  "pattern": "linkdex",
820
746
  "addition_date": "2011/01/06",
@@ -828,14 +754,12 @@
828
754
  "linkdex.com/v2.0",
829
755
  "linkdexbot/Nutch-1.0-dev (http://www.linkdex.com/; crawl at linkdex dot com)"
830
756
  ]
831
- }
832
- ,
757
+ },
833
758
  {
834
759
  "pattern": "Adidxbot",
835
- "url": "http://onlinehelp.microsoft.com/en-us/bing/hh204496.aspx",
760
+ "url": "https://www.bing.com/webmasters/help/which-crawlers-does-bing-use-8c184ec0",
836
761
  "instances": []
837
- }
838
- ,
762
+ },
839
763
  {
840
764
  "pattern": "ezooms",
841
765
  "addition_date": "2011/04/27",
@@ -843,8 +767,7 @@
843
767
  "instances": [
844
768
  "Mozilla/5.0 (compatible; Ezooms/1.0; ezooms.bot@gmail.com)"
845
769
  ]
846
- }
847
- ,
770
+ },
848
771
  {
849
772
  "pattern": "dotbot",
850
773
  "addition_date": "2011/04/27",
@@ -852,8 +775,7 @@
852
775
  "Mozilla/5.0 (compatible; DotBot/1.1; http://www.opensiteexplorer.org/dotbot, help@moz.com)",
853
776
  "dotbot"
854
777
  ]
855
- }
856
- ,
778
+ },
857
779
  {
858
780
  "pattern": "Mail\\.RU_Bot",
859
781
  "addition_date": "2011/04/27",
@@ -863,8 +785,7 @@
863
785
  "Mozilla/5.0 (compatible; Mail.RU_Bot/2.0; +http://go.mail.ru/",
864
786
  "Mozilla/5.0 (compatible; Linux x86_64; Mail.RU_Bot/Robots/2.0; +http://go.mail.ru/help/robots)"
865
787
  ]
866
- }
867
- ,
788
+ },
868
789
  {
869
790
  "pattern": "discobot",
870
791
  "addition_date": "2011/05/03",
@@ -874,8 +795,7 @@
874
795
  "Mozilla/5.0 (compatible; discobot/2.0; +http://discoveryengine.com/discobot.html)",
875
796
  "mozilla/5.0 (compatible; discobot/1.1; +http://discoveryengine.com/discobot.html)"
876
797
  ]
877
- }
878
- ,
798
+ },
879
799
  {
880
800
  "pattern": "heritrix",
881
801
  "addition_date": "2011/06/21",
@@ -904,15 +824,13 @@
904
824
  "Mozilla/5.0 (compatible; heritrix/3.3.0-SNAPSHOT-20160309-0050; UniLeipzigASV +http://corpora.informatik.uni-leipzig.de/crawler_faq.html)",
905
825
  "Mozilla/5.0 (compatible; sukibot_heritrix/3.1.1 +http://suki.ling.helsinki.fi/eng/webmasters.html)"
906
826
  ]
907
- }
908
- ,
827
+ },
909
828
  {
910
829
  "pattern": "findthatfile",
911
830
  "addition_date": "2011/06/21",
912
831
  "url": "http://www.findthatfile.com/",
913
832
  "instances": []
914
- }
915
- ,
833
+ },
916
834
  {
917
835
  "pattern": "europarchive\\.org",
918
836
  "addition_date": "2011/06/21",
@@ -920,8 +838,7 @@
920
838
  "instances": [
921
839
  "Mozilla/5.0 (compatible; MSIE 7.0 +http://www.europarchive.org)"
922
840
  ]
923
- }
924
- ,
841
+ },
925
842
  {
926
843
  "pattern": "NerdByNature\\.Bot",
927
844
  "addition_date": "2011/07/12",
@@ -929,14 +846,15 @@
929
846
  "instances": [
930
847
  "Mozilla/5.0 (compatible; NerdByNature.Bot; http://www.nerdbynature.net/bot)"
931
848
  ]
932
- }
933
- ,
849
+ },
934
850
  {
935
- "pattern": "sistrix crawler",
851
+ "pattern": "(sistrix|SISTRIX) [cC]rawler",
936
852
  "addition_date": "2011/08/02",
937
- "instances": []
938
- }
939
- ,
853
+ "url": "https://www.sistrix.com/tutorials/crawling-errors-in-the-optimizer/",
854
+ "instances": [
855
+ "Mozilla/5.0 (compatible; SISTRIX Crawler; http://crawler.sistrix.net/)"
856
+ ]
857
+ },
940
858
  {
941
859
  "pattern": "Ahrefs(Bot|SiteAudit)",
942
860
  "addition_date": "2011/08/28",
@@ -949,104 +867,91 @@
949
867
  "Mozilla/5.0 (compatible; AhrefsBot/6.1; News; +http://ahrefs.com/robot/)",
950
868
  "Mozilla/5.0 (compatible; AhrefsBot/7.0; +http://ahrefs.com/robot/)"
951
869
  ]
952
- }
953
- ,
870
+ },
954
871
  {
955
872
  "pattern": "fuelbot",
956
873
  "addition_date": "2018/06/28",
957
874
  "instances": [
958
875
  "fuelbot"
959
876
  ]
960
- }
961
- ,
877
+ },
962
878
  {
963
879
  "pattern": "CrunchBot",
964
880
  "addition_date": "2018/06/28",
965
881
  "instances": [
966
882
  "CrunchBot/1.0 (+http://www.leadcrunch.com/crunchbot)"
967
883
  ]
968
- }
969
- ,
884
+ },
970
885
  {
971
886
  "pattern": "IndeedBot",
972
887
  "addition_date": "2018/06/28",
973
888
  "instances": [
974
889
  "Mozilla/5.0 (Windows NT 6.1; rv:38.0) Gecko/20100101 Firefox/38.0 (IndeedBot 1.1)"
975
890
  ]
976
- }
977
- ,
891
+ },
978
892
  {
979
893
  "pattern": "mappydata",
980
894
  "addition_date": "2018/06/28",
981
895
  "instances": [
982
896
  "Mozilla/5.0 (compatible; Mappy/1.0; +http://mappydata.net/bot/)"
983
897
  ]
984
- }
985
- ,
898
+ },
986
899
  {
987
900
  "pattern": "woobot",
988
901
  "addition_date": "2018/06/28",
989
902
  "instances": [
990
903
  "woobot"
991
904
  ]
992
- }
993
- ,
905
+ },
994
906
  {
995
907
  "pattern": "ZoominfoBot",
996
908
  "addition_date": "2018/06/28",
997
909
  "instances": [
998
910
  "ZoominfoBot (zoominfobot at zoominfo dot com)"
999
911
  ]
1000
- }
1001
- ,
912
+ },
1002
913
  {
1003
914
  "pattern": "PrivacyAwareBot",
1004
915
  "addition_date": "2018/06/28",
1005
916
  "instances": [
1006
917
  "Mozilla/5.0 (compatible; PrivacyAwareBot/1.1; +http://www.privacyaware.org)"
1007
918
  ]
1008
- }
1009
- ,
919
+ },
1010
920
  {
1011
921
  "pattern": "Multiviewbot",
1012
922
  "addition_date": "2018/06/28",
1013
923
  "instances": [
1014
924
  "Mozilla/5.0 (compatible; MSIE 9.0; Windows NT 6.1; Multiviewbot"
1015
925
  ]
1016
- }
1017
- ,
926
+ },
1018
927
  {
1019
928
  "pattern": "SWIMGBot",
1020
929
  "addition_date": "2018/06/28",
1021
930
  "instances": [
1022
931
  "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_10_5) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/45.0.2454.101 Safari/537.36 SWIMGBot"
1023
932
  ]
1024
- }
1025
- ,
933
+ },
1026
934
  {
1027
935
  "pattern": "Grobbot",
1028
936
  "addition_date": "2018/06/28",
1029
937
  "instances": [
1030
938
  "Mozilla/5.0 (compatible; Grobbot/2.2; +https://grob.it)"
1031
939
  ]
1032
- }
1033
- ,
940
+ },
1034
941
  {
1035
942
  "pattern": "eright",
1036
943
  "addition_date": "2018/06/28",
1037
944
  "instances": [
1038
945
  "Mozilla/5.0 (compatible; eright/1.0; +bot@eright.com)"
1039
946
  ]
1040
- }
1041
- ,
947
+ },
1042
948
  {
1043
949
  "pattern": "Apercite",
1044
950
  "addition_date": "2018/06/28",
1045
951
  "instances": [
1046
952
  "Mozilla/5.0 (compatible; Apercite; +http://www.apercite.fr/robot/index.html)"
1047
953
  ]
1048
- }
1049
- ,
954
+ },
1050
955
  {
1051
956
  "pattern": "semanticbot",
1052
957
  "addition_date": "2018/06/28",
@@ -1054,8 +959,7 @@
1054
959
  "semanticbot",
1055
960
  "semanticbot (info@semanticaudience.com)"
1056
961
  ]
1057
- }
1058
- ,
962
+ },
1059
963
  {
1060
964
  "pattern": "Aboundex",
1061
965
  "addition_date": "2011/09/28",
@@ -1064,23 +968,20 @@
1064
968
  "Aboundex/0.2 (http://www.aboundex.com/crawler/)",
1065
969
  "Aboundex/0.3 (http://www.aboundex.com/crawler/)"
1066
970
  ]
1067
- }
1068
- ,
971
+ },
1069
972
  {
1070
973
  "pattern": "domaincrawler",
1071
974
  "addition_date": "2011/10/21",
1072
975
  "instances": [
1073
976
  "CipaCrawler/3.0 (info@domaincrawler.com; http://www.domaincrawler.com/www.example.com)"
1074
977
  ]
1075
- }
1076
- ,
978
+ },
1077
979
  {
1078
980
  "pattern": "wbsearchbot",
1079
981
  "addition_date": "2011/12/21",
1080
982
  "url": "http://www.warebay.com/bot.html",
1081
983
  "instances": []
1082
- }
1083
- ,
984
+ },
1084
985
  {
1085
986
  "pattern": "summify",
1086
987
  "addition_date": "2012/01/04",
@@ -1088,8 +989,7 @@
1088
989
  "instances": [
1089
990
  "Summify (Summify/1.0.1; +http://summify.com)"
1090
991
  ]
1091
- }
1092
- ,
992
+ },
1093
993
  {
1094
994
  "pattern": "CCBot",
1095
995
  "addition_date": "2012/02/05",
@@ -1098,14 +998,12 @@
1098
998
  "CCBot/2.0 (http://commoncrawl.org/faq/)",
1099
999
  "CCBot/2.0 (https://commoncrawl.org/faq/)"
1100
1000
  ]
1101
- }
1102
- ,
1001
+ },
1103
1002
  {
1104
1003
  "pattern": "edisterbot",
1105
1004
  "addition_date": "2012/02/25",
1106
1005
  "instances": []
1107
- }
1108
- ,
1006
+ },
1109
1007
  {
1110
1008
  "pattern": "SeznamBot",
1111
1009
  "addition_date": "2012/03/14",
@@ -1117,36 +1015,31 @@
1117
1015
  "Mozilla/5.0 (compatible; SeznamBot/3.2; +http://napoveda.seznam.cz/en/seznambot-intro/)",
1118
1016
  "Mozilla/5.0 (compatible; SeznamBot/4.0; +http://napoveda.seznam.cz/seznambot-intro/)"
1119
1017
  ]
1120
- }
1121
- ,
1018
+ },
1122
1019
  {
1123
1020
  "pattern": "ec2linkfinder",
1124
1021
  "addition_date": "2012/03/22",
1125
1022
  "instances": [
1126
1023
  "ec2linkfinder"
1127
1024
  ]
1128
- }
1129
- ,
1025
+ },
1130
1026
  {
1131
1027
  "pattern": "gslfbot",
1132
1028
  "addition_date": "2012/04/03",
1133
1029
  "instances": []
1134
- }
1135
- ,
1030
+ },
1136
1031
  {
1137
1032
  "pattern": "aiHitBot",
1138
1033
  "addition_date": "2012/04/16",
1139
1034
  "instances": [
1140
1035
  "Mozilla/5.0 (compatible; aiHitBot/2.9; +https://www.aihitdata.com/about)"
1141
1036
  ]
1142
- }
1143
- ,
1037
+ },
1144
1038
  {
1145
1039
  "pattern": "intelium_bot",
1146
1040
  "addition_date": "2012/05/07",
1147
1041
  "instances": []
1148
- }
1149
- ,
1042
+ },
1150
1043
  {
1151
1044
  "pattern": "facebookexternalhit",
1152
1045
  "addition_date": "2012/05/07",
@@ -1156,8 +1049,7 @@
1156
1049
  "facebookexternalhit/1.1 (+http://www.facebook.com/externalhit_uatext.php)"
1157
1050
  ],
1158
1051
  "url": "https://developers.facebook.com/docs/sharing/webmasters/crawler/"
1159
- }
1160
- ,
1052
+ },
1161
1053
  {
1162
1054
  "pattern": "Yeti",
1163
1055
  "addition_date": "2012/05/07",
@@ -1165,22 +1057,19 @@
1165
1057
  "instances": [
1166
1058
  "Mozilla/5.0 (compatible; Yeti/1.1; +http://naver.me/bot)"
1167
1059
  ]
1168
- }
1169
- ,
1060
+ },
1170
1061
  {
1171
1062
  "pattern": "RetrevoPageAnalyzer",
1172
1063
  "addition_date": "2012/05/07",
1173
1064
  "instances": [
1174
1065
  "Mozilla/4.0 (compatible; MSIE 7.0; Windows NT 5.1; RetrevoPageAnalyzer; +http://www.retrevo.com/content/about-us)"
1175
1066
  ]
1176
- }
1177
- ,
1067
+ },
1178
1068
  {
1179
1069
  "pattern": "lb-spider",
1180
1070
  "addition_date": "2012/05/07",
1181
1071
  "instances": []
1182
- }
1183
- ,
1072
+ },
1184
1073
  {
1185
1074
  "pattern": "Sogou",
1186
1075
  "addition_date": "2012/05/13",
@@ -1190,21 +1079,19 @@
1190
1079
  "Sogou Pic Spider/3.0(+http://www.sogou.com/docs/help/webmasters.htm#07)",
1191
1080
  "Sogou web spider/4.0(+http://www.sogou.com/docs/help/webmasters.htm#07)"
1192
1081
  ]
1193
- }
1194
- ,
1082
+ },
1195
1083
  {
1196
1084
  "pattern": "lssbot",
1197
1085
  "addition_date": "2012/05/15",
1086
+ "url": "https://www.lssbot.com/",
1198
1087
  "instances": []
1199
- }
1200
- ,
1088
+ },
1201
1089
  {
1202
1090
  "pattern": "careerbot",
1203
1091
  "addition_date": "2012/05/23",
1204
1092
  "url": "http://www.career-x.de/bot.html",
1205
1093
  "instances": []
1206
- }
1207
- ,
1094
+ },
1208
1095
  {
1209
1096
  "pattern": "wotbox",
1210
1097
  "addition_date": "2012/06/12",
@@ -1213,15 +1100,13 @@
1213
1100
  "Wotbox/2.0 (bot@wotbox.com; http://www.wotbox.com)",
1214
1101
  "Wotbox/2.01 (+http://www.wotbox.com/bot/)"
1215
1102
  ]
1216
- }
1217
- ,
1103
+ },
1218
1104
  {
1219
1105
  "pattern": "wocbot",
1220
1106
  "addition_date": "2012/07/25",
1221
1107
  "url": "http://www.wocodi.com/crawler",
1222
1108
  "instances": []
1223
- }
1224
- ,
1109
+ },
1225
1110
  {
1226
1111
  "pattern": "ichiro",
1227
1112
  "addition_date": "2012/08/28",
@@ -1243,8 +1128,7 @@
1243
1128
  "ichiro/4.0 (http://help.goo.ne.jp/door/crawler.html)",
1244
1129
  "ichiro/5.0 (http://help.goo.ne.jp/door/crawler.html)"
1245
1130
  ]
1246
- }
1247
- ,
1131
+ },
1248
1132
  {
1249
1133
  "pattern": "DuckDuckBot",
1250
1134
  "addition_date": "2012/09/19",
@@ -1255,14 +1139,12 @@
1255
1139
  "Mozilla/5.0 (compatible; DuckDuckBot-Https/1.1; https://duckduckgo.com/duckduckbot)",
1256
1140
  "'Mozilla/5.0 (compatible; DuckDuckBot-Https/1.1; https://duckduckgo.com/duckduckbot)'"
1257
1141
  ]
1258
- }
1259
- ,
1142
+ },
1260
1143
  {
1261
1144
  "pattern": "lssrocketcrawler",
1262
1145
  "addition_date": "2012/09/24",
1263
1146
  "instances": []
1264
- }
1265
- ,
1147
+ },
1266
1148
  {
1267
1149
  "pattern": "drupact",
1268
1150
  "addition_date": "2012/09/27",
@@ -1270,45 +1152,39 @@
1270
1152
  "instances": [
1271
1153
  "drupact/0.7; http://www.arocom.de/drupact"
1272
1154
  ]
1273
- }
1274
- ,
1155
+ },
1275
1156
  {
1276
1157
  "pattern": "webcompanycrawler",
1277
1158
  "addition_date": "2012/10/03",
1278
1159
  "instances": []
1279
- }
1280
- ,
1160
+ },
1281
1161
  {
1282
1162
  "pattern": "acoonbot",
1283
1163
  "addition_date": "2012/10/07",
1284
1164
  "url": "http://www.acoon.de/robot.asp",
1285
1165
  "instances": []
1286
- }
1287
- ,
1166
+ },
1288
1167
  {
1289
1168
  "pattern": "openindexspider",
1290
1169
  "addition_date": "2012/10/26",
1291
1170
  "url": "http://www.openindex.io/en/webmasters/spider.html",
1292
1171
  "instances": []
1293
- }
1294
- ,
1172
+ },
1295
1173
  {
1296
1174
  "pattern": "gnam gnam spider",
1297
1175
  "addition_date": "2012/10/31",
1298
1176
  "instances": []
1299
- }
1300
- ,
1177
+ },
1301
1178
  {
1302
1179
  "pattern": "web-archive-net\\.com\\.bot",
1303
1180
  "instances": []
1304
- }
1305
- ,
1181
+ },
1306
1182
  {
1307
1183
  "pattern": "backlinkcrawler",
1308
1184
  "addition_date": "2013/01/04",
1185
+ "url": "http://www.backlinktest.com/crawler.html",
1309
1186
  "instances": []
1310
- }
1311
- ,
1187
+ },
1312
1188
  {
1313
1189
  "pattern": "coccoc",
1314
1190
  "addition_date": "2013/01/04",
@@ -1326,8 +1202,7 @@
1326
1202
  "coccoc/1.0 (http://help.coccoc.com/)",
1327
1203
  "coccoc/1.0 (http://help.coccoc.vn/)"
1328
1204
  ]
1329
- }
1330
- ,
1205
+ },
1331
1206
  {
1332
1207
  "pattern": "integromedb",
1333
1208
  "addition_date": "2013/01/10",
@@ -1335,20 +1210,17 @@
1335
1210
  "instances": [
1336
1211
  "www.integromedb.org/Crawler"
1337
1212
  ]
1338
- }
1339
- ,
1213
+ },
1340
1214
  {
1341
1215
  "pattern": "content crawler spider",
1342
1216
  "addition_date": "2013/01/11",
1343
1217
  "instances": []
1344
- }
1345
- ,
1218
+ },
1346
1219
  {
1347
1220
  "pattern": "toplistbot",
1348
1221
  "addition_date": "2013/02/05",
1349
1222
  "instances": []
1350
- }
1351
- ,
1223
+ },
1352
1224
  {
1353
1225
  "pattern": "it2media-domain-crawler",
1354
1226
  "addition_date": "2013/03/12",
@@ -1356,14 +1228,12 @@
1356
1228
  "it2media-domain-crawler/1.0 on crawler-prod.it2media.de",
1357
1229
  "it2media-domain-crawler/2.0"
1358
1230
  ]
1359
- }
1360
- ,
1231
+ },
1361
1232
  {
1362
1233
  "pattern": "ip-web-crawler\\.com",
1363
1234
  "addition_date": "2013/03/22",
1364
1235
  "instances": []
1365
- }
1366
- ,
1236
+ },
1367
1237
  {
1368
1238
  "pattern": "siteexplorer\\.info",
1369
1239
  "addition_date": "2013/05/01",
@@ -1371,14 +1241,12 @@
1371
1241
  "Mozilla/5.0 (compatible; SiteExplorer/1.0b; +http://siteexplorer.info/)",
1372
1242
  "Mozilla/5.0 (compatible; SiteExplorer/1.1b; +http://siteexplorer.info/Backlink-Checker-Spider/)"
1373
1243
  ]
1374
- }
1375
- ,
1244
+ },
1376
1245
  {
1377
1246
  "pattern": "elisabot",
1378
1247
  "addition_date": "2013/06/27",
1379
1248
  "instances": []
1380
- }
1381
- ,
1249
+ },
1382
1250
  {
1383
1251
  "pattern": "proximic",
1384
1252
  "addition_date": "2013/09/12",
@@ -1387,8 +1255,7 @@
1387
1255
  "Mozilla/5.0 (compatible; proximic; +http://www.proximic.com)",
1388
1256
  "Mozilla/5.0 (compatible; proximic; +http://www.proximic.com/info/spider.php)"
1389
1257
  ]
1390
- }
1391
- ,
1258
+ },
1392
1259
  {
1393
1260
  "pattern": "changedetection",
1394
1261
  "addition_date": "2013/09/13",
@@ -1396,14 +1263,12 @@
1396
1263
  "instances": [
1397
1264
  "Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; SV1; http://www.changedetection.com/bot.html )"
1398
1265
  ]
1399
- }
1400
- ,
1266
+ },
1401
1267
  {
1402
1268
  "pattern": "arabot",
1403
1269
  "addition_date": "2013/10/09",
1404
1270
  "instances": []
1405
- }
1406
- ,
1271
+ },
1407
1272
  {
1408
1273
  "pattern": "WeSEE:Search",
1409
1274
  "addition_date": "2013/11/18",
@@ -1411,21 +1276,18 @@
1411
1276
  "WeSEE:Search",
1412
1277
  "WeSEE:Search/0.1 (Alpha, http://www.wesee.com/en/support/bot/)"
1413
1278
  ]
1414
- }
1415
- ,
1279
+ },
1416
1280
  {
1417
1281
  "pattern": "niki-bot",
1418
1282
  "addition_date": "2014/01/01",
1419
1283
  "instances": []
1420
- }
1421
- ,
1284
+ },
1422
1285
  {
1423
1286
  "pattern": "CrystalSemanticsBot",
1424
1287
  "addition_date": "2014/02/17",
1425
1288
  "url": "http://www.crystalsemantics.com/user-agent/",
1426
1289
  "instances": []
1427
- }
1428
- ,
1290
+ },
1429
1291
  {
1430
1292
  "pattern": "rogerbot",
1431
1293
  "addition_date": "2014/02/28",
@@ -1445,8 +1307,7 @@
1445
1307
  "rogerbot/1.1 (http://moz.com/help/guides/search-overview/crawl-diagnostics#more-help, rogerbot-crawler+pr4-crawler-15@moz.com)",
1446
1308
  "rogerbot/1.2 (http://moz.com/help/pro/what-is-rogerbot-, rogerbot-crawler+phaser-testing-crawler-01@moz.com)"
1447
1309
  ]
1448
- }
1449
- ,
1310
+ },
1450
1311
  {
1451
1312
  "pattern": "360Spider",
1452
1313
  "addition_date": "2014/03/14",
@@ -1463,8 +1324,7 @@
1463
1324
  "Mozilla/5.0 (compatible; MSIE 9.0; Windows NT 6.1; Trident/5.0); 360Spider(compatible; HaosouSpider; http://www.haosou.com/help/help_3_2.html)",
1464
1325
  "Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/50.0.2661.102 Safari/537.36; 360Spider"
1465
1326
  ]
1466
- }
1467
- ,
1327
+ },
1468
1328
  {
1469
1329
  "pattern": "psbot",
1470
1330
  "addition_date": "2014/03/31",
@@ -1474,15 +1334,13 @@
1474
1334
  "psbot-page (+http://www.picsearch.com/bot.html)",
1475
1335
  "psbot/0.1 (+http://www.picsearch.com/bot.html)"
1476
1336
  ]
1477
- }
1478
- ,
1337
+ },
1479
1338
  {
1480
1339
  "pattern": "InterfaxScanBot",
1481
1340
  "addition_date": "2014/03/31",
1482
1341
  "url": "http://scan-interfax.ru",
1483
1342
  "instances": []
1484
- }
1485
- ,
1343
+ },
1486
1344
  {
1487
1345
  "pattern": "CC Metadata Scaper",
1488
1346
  "addition_date": "2014/04/01",
@@ -1490,15 +1348,13 @@
1490
1348
  "instances": [
1491
1349
  "CC Metadata Scaper http://wiki.creativecommons.org/Metadata_Scraper"
1492
1350
  ]
1493
- }
1494
- ,
1351
+ },
1495
1352
  {
1496
1353
  "pattern": "g00g1e\\.net",
1497
1354
  "addition_date": "2014/04/01",
1498
1355
  "url": "http://www.g00g1e.net/",
1499
1356
  "instances": []
1500
- }
1501
- ,
1357
+ },
1502
1358
  {
1503
1359
  "pattern": "GrapeshotCrawler",
1504
1360
  "addition_date": "2014/04/01",
@@ -1506,8 +1362,7 @@
1506
1362
  "instances": [
1507
1363
  "Mozilla/5.0 (compatible; GrapeshotCrawler/2.0; +http://www.grapeshot.co.uk/crawler.php)"
1508
1364
  ]
1509
- }
1510
- ,
1365
+ },
1511
1366
  {
1512
1367
  "pattern": "urlappendbot",
1513
1368
  "addition_date": "2014/05/10",
@@ -1515,22 +1370,19 @@
1515
1370
  "instances": [
1516
1371
  "Mozilla/5.0 (compatible; URLAppendBot/1.0; +http://www.profound.net/urlappendbot.html)"
1517
1372
  ]
1518
- }
1519
- ,
1373
+ },
1520
1374
  {
1521
1375
  "pattern": "brainobot",
1522
1376
  "addition_date": "2014/06/24",
1523
1377
  "instances": []
1524
- }
1525
- ,
1378
+ },
1526
1379
  {
1527
1380
  "pattern": "fr-crawler",
1528
1381
  "addition_date": "2014/07/31",
1529
1382
  "instances": [
1530
1383
  "Mozilla/5.0 (compatible; fr-crawler/1.1)"
1531
1384
  ]
1532
- }
1533
- ,
1385
+ },
1534
1386
  {
1535
1387
  "pattern": "binlar",
1536
1388
  "addition_date": "2014/09/12",
@@ -1541,16 +1393,14 @@
1541
1393
  "binlar_2.6.3 phanendra_kalapala@McAfee.com",
1542
1394
  "binlar_2.6.3 test@mgmt.mic"
1543
1395
  ]
1544
- }
1545
- ,
1396
+ },
1546
1397
  {
1547
1398
  "pattern": "SimpleCrawler",
1548
1399
  "addition_date": "2014/09/12",
1549
1400
  "instances": [
1550
1401
  "SimpleCrawler/0.1"
1551
1402
  ]
1552
- }
1553
- ,
1403
+ },
1554
1404
  {
1555
1405
  "pattern": "Twitterbot",
1556
1406
  "addition_date": "2014/09/12",
@@ -1559,8 +1409,7 @@
1559
1409
  "Twitterbot/0.1",
1560
1410
  "Twitterbot/1.0"
1561
1411
  ]
1562
- }
1563
- ,
1412
+ },
1564
1413
  {
1565
1414
  "pattern": "cXensebot",
1566
1415
  "addition_date": "2014/10/05",
@@ -1568,8 +1417,7 @@
1568
1417
  "cXensebot/1.1a"
1569
1418
  ],
1570
1419
  "url": "http://www.cxense.com/bot.html"
1571
- }
1572
- ,
1420
+ },
1573
1421
  {
1574
1422
  "pattern": "smtbot",
1575
1423
  "addition_date": "2014/10/04",
@@ -1581,8 +1429,7 @@
1581
1429
  "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/68.0.3440.75 Safari/537.36 (compatible; SMTBot/1.0; http://www.similartech.com/smtbot)"
1582
1430
  ],
1583
1431
  "url": "http://www.similartech.com/smtbot"
1584
- }
1585
- ,
1432
+ },
1586
1433
  {
1587
1434
  "pattern": "bnf\\.fr_bot",
1588
1435
  "addition_date": "2014/11/18",
@@ -1591,8 +1438,7 @@
1591
1438
  "Mozilla/5.0 (compatible; bnf.fr_bot; +http://bibnum.bnf.fr/robot/bnf.html)",
1592
1439
  "Mozilla/5.0 (compatible; bnf.fr_bot; +http://www.bnf.fr/fr/outils/a.dl_web_capture_robot.html)"
1593
1440
  ]
1594
- }
1595
- ,
1441
+ },
1596
1442
  {
1597
1443
  "pattern": "A6-Indexer",
1598
1444
  "addition_date": "2014/12/05",
@@ -1600,8 +1446,7 @@
1600
1446
  "instances": [
1601
1447
  "A6-Indexer"
1602
1448
  ]
1603
- }
1604
- ,
1449
+ },
1605
1450
  {
1606
1451
  "pattern": "ADmantX",
1607
1452
  "addition_date": "2014/12/05",
@@ -1609,8 +1454,7 @@
1609
1454
  "instances": [
1610
1455
  "ADmantX Platform Semantic Analyzer - ADmantX Inc. - www.admantx.com - support@admantx.com"
1611
1456
  ]
1612
- }
1613
- ,
1457
+ },
1614
1458
  {
1615
1459
  "pattern": "Facebot",
1616
1460
  "url": "https://developers.facebook.com/docs/sharing/best-practices#crawl",
@@ -1618,16 +1462,14 @@
1618
1462
  "instances": [
1619
1463
  "Facebot/1.0"
1620
1464
  ]
1621
- }
1622
- ,
1465
+ },
1623
1466
  {
1624
1467
  "pattern": "OrangeBot\\/",
1625
1468
  "instances": [
1626
1469
  "Mozilla/5.0 (compatible; OrangeBot/2.0; support.orangebot@orange.com"
1627
1470
  ],
1628
1471
  "addition_date": "2015/01/12"
1629
- }
1630
- ,
1472
+ },
1631
1473
  {
1632
1474
  "pattern": "memorybot",
1633
1475
  "url": "http://mignify.com/bot.htm",
@@ -1635,8 +1477,7 @@
1635
1477
  "Mozilla/5.0 (compatible; memorybot/1.21.14 +http://mignify.com/bot.html)"
1636
1478
  ],
1637
1479
  "addition_date": "2015/02/01"
1638
- }
1639
- ,
1480
+ },
1640
1481
  {
1641
1482
  "pattern": "AdvBot",
1642
1483
  "url": "http://advbot.net/bot.html",
@@ -1644,8 +1485,7 @@
1644
1485
  "Mozilla/5.0 (compatible; AdvBot/2.0; +http://advbot.net/bot.html)"
1645
1486
  ],
1646
1487
  "addition_date": "2015/02/01"
1647
- }
1648
- ,
1488
+ },
1649
1489
  {
1650
1490
  "pattern": "MegaIndex",
1651
1491
  "url": "https://www.megaindex.ru/?tab=linkAnalyze",
@@ -1654,8 +1494,7 @@
1654
1494
  "Mozilla/5.0 (compatible; MegaIndex.ru/2.0; +http://megaindex.com/crawler)"
1655
1495
  ],
1656
1496
  "addition_date": "2015/03/28"
1657
- }
1658
- ,
1497
+ },
1659
1498
  {
1660
1499
  "pattern": "SemanticScholarBot",
1661
1500
  "url": "https://www.semanticscholar.org/crawler",
@@ -1664,8 +1503,7 @@
1664
1503
  "Mozilla/5.0 (compatible) SemanticScholarBot (+https://www.semanticscholar.org/crawler)"
1665
1504
  ],
1666
1505
  "addition_date": "2015/03/28"
1667
- }
1668
- ,
1506
+ },
1669
1507
  {
1670
1508
  "pattern": "ltx71",
1671
1509
  "url": "http://ltx71.com/",
@@ -1673,8 +1511,7 @@
1673
1511
  "ltx71 - (http://ltx71.com/)"
1674
1512
  ],
1675
1513
  "addition_date": "2015/04/04"
1676
- }
1677
- ,
1514
+ },
1678
1515
  {
1679
1516
  "pattern": "nerdybot",
1680
1517
  "url": "http://nerdybot.com/",
@@ -1682,8 +1519,7 @@
1682
1519
  "nerdybot"
1683
1520
  ],
1684
1521
  "addition_date": "2015/04/05"
1685
- }
1686
- ,
1522
+ },
1687
1523
  {
1688
1524
  "pattern": "xovibot",
1689
1525
  "url": "http://www.xovibot.net/",
@@ -1691,8 +1527,7 @@
1691
1527
  "Mozilla/5.0 (compatible; XoviBot/2.0; +http://www.xovibot.net/)"
1692
1528
  ],
1693
1529
  "addition_date": "2015/04/05"
1694
- }
1695
- ,
1530
+ },
1696
1531
  {
1697
1532
  "pattern": "BUbiNG",
1698
1533
  "url": "http://law.di.unimi.it/BUbiNG.html",
@@ -1700,8 +1535,7 @@
1700
1535
  "BUbiNG (+http://law.di.unimi.it/BUbiNG.html)"
1701
1536
  ],
1702
1537
  "addition_date": "2015/04/06"
1703
- }
1704
- ,
1538
+ },
1705
1539
  {
1706
1540
  "pattern": "Qwantify",
1707
1541
  "url": "https://www.qwant.com/",
@@ -1712,12 +1546,13 @@
1712
1546
  "Mozilla/5.0 (compatible; Qwantify/Bleriot/1.2.1; +https://help.qwant.com/bot)"
1713
1547
  ],
1714
1548
  "addition_date": "2015/04/06"
1715
- }
1716
- ,
1549
+ },
1717
1550
  {
1718
1551
  "pattern": "archive\\.org_bot",
1719
1552
  "url": "http://www.archive.org/details/archive.org_bot",
1720
- "depends_on": ["heritrix"],
1553
+ "depends_on": [
1554
+ "heritrix"
1555
+ ],
1721
1556
  "instances": [
1722
1557
  "Mozilla/5.0 (compatible; heritrix/3.1.1-SNAPSHOT-20120116.200628 +http://www.archive.org/details/archive.org_bot)",
1723
1558
  "Mozilla/5.0 (compatible; archive.org_bot/heritrix-1.15.4 +http://www.archive.org)",
@@ -1727,8 +1562,7 @@
1727
1562
  "Mozilla/5.0 (compatible; special_archiver/3.1.1 +http://www.archive.org/details/archive.org_bot)"
1728
1563
  ],
1729
1564
  "addition_date": "2015/04/14"
1730
- }
1731
- ,
1565
+ },
1732
1566
  {
1733
1567
  "pattern": "Applebot",
1734
1568
  "url": "http://www.apple.com/go/applebot",
@@ -1740,8 +1574,7 @@
1740
1574
  "Mozilla/5.0 (iPhone; CPU iPhone OS 6_0 like Mac OS X) AppleWebKit/536.26 (KHTML, like Gecko) Version/6.0 Mobile/10A5376e Safari/8536.25 (compatible; Applebot/0.3; +http://www.apple.com/go/applebot)",
1741
1575
  "Mozilla/5.0 (iPhone; CPU iPhone OS 8_1 like Mac OS X) AppleWebKit/600.1.4 (KHTML, like Gecko) Version/8.0 Mobile/12B410 Safari/600.1.4 (Applebot/0.1; +http://www.apple.com/go/applebot)"
1742
1576
  ]
1743
- }
1744
- ,
1577
+ },
1745
1578
  {
1746
1579
  "pattern": "TweetmemeBot",
1747
1580
  "url": "http://datasift.com/bot.html",
@@ -1749,8 +1582,7 @@
1749
1582
  "Mozilla/5.0 (TweetmemeBot/4.0; +http://datasift.com/bot.html) Gecko/20100101 Firefox/31.0"
1750
1583
  ],
1751
1584
  "addition_date": "2015/04/15"
1752
- }
1753
- ,
1585
+ },
1754
1586
  {
1755
1587
  "pattern": "crawler4j",
1756
1588
  "url": "https://github.com/yasserg/crawler4j",
@@ -1759,8 +1591,7 @@
1759
1591
  "crawler4j (https://github.com/yasserg/crawler4j/)"
1760
1592
  ],
1761
1593
  "addition_date": "2015/05/07"
1762
- }
1763
- ,
1594
+ },
1764
1595
  {
1765
1596
  "pattern": "findxbot",
1766
1597
  "url": "http://www.findxbot.com",
@@ -1768,8 +1599,7 @@
1768
1599
  "Mozilla/5.0 (compatible; Findxbot/1.0; +http://www.findxbot.com)"
1769
1600
  ],
1770
1601
  "addition_date": "2015/05/07"
1771
- }
1772
- ,
1602
+ },
1773
1603
  {
1774
1604
  "pattern": "S[eE][mM]rushBot",
1775
1605
  "url": "http://www.semrush.com/bot.html",
@@ -1784,8 +1614,7 @@
1784
1614
  "SEMrushBot"
1785
1615
  ],
1786
1616
  "addition_date": "2015/05/26"
1787
- }
1788
- ,
1617
+ },
1789
1618
  {
1790
1619
  "pattern": "yoozBot",
1791
1620
  "url": "http://yooz.ir",
@@ -1793,8 +1622,7 @@
1793
1622
  "Mozilla/5.0 (compatible; yoozBot-2.2; http://yooz.ir; info@yooz.ir)"
1794
1623
  ],
1795
1624
  "addition_date": "2015/05/26"
1796
- }
1797
- ,
1625
+ },
1798
1626
  {
1799
1627
  "pattern": "lipperhey",
1800
1628
  "url": "http://www.lipperhey.com/",
@@ -1805,8 +1633,7 @@
1805
1633
  "Mozilla/5.0 (compatible; Lipperhey-Kaus-Australis/5.0; +https://www.lipperhey.com/en/about/)"
1806
1634
  ],
1807
1635
  "addition_date": "2015/08/26"
1808
- }
1809
- ,
1636
+ },
1810
1637
  {
1811
1638
  "pattern": "Y!J",
1812
1639
  "url": "https://www.yahoo-help.jp/app/answers/detail/p/595/a_id/42716/~/%E3%82%A6%E3%82%A7%E3%83%96%E3%83%9A%E3%83%BC%E3%82%B8%E3%81%AB%E3%82%A2%E3%82%AF%E3%82%BB%E3%82%B9%E3%81%99%E3%82%8B%E3%82%B7%E3%82%B9%E3%83%86%E3%83%A0%E3%81%AE%E3%83%A6%E3%83%BC%E3%82%B6%E3%83%BC%E3%82%A8%E3%83%BC%E3%82%B8%E3%82%A7%E3%83%B3%E3%83%88%E3%81%AB%E3%81%A4%E3%81%84%E3%81%A6",
@@ -1819,8 +1646,7 @@
1819
1646
  "Mozilla/5.0 (compatible; Y!J SearchMonkey/1.0 (Y!J-AGENT; http://help.yahoo.co.jp/help/jp/search/indexing/indexing-15.html))"
1820
1647
  ],
1821
1648
  "addition_date": "2015/05/26"
1822
- }
1823
- ,
1649
+ },
1824
1650
  {
1825
1651
  "pattern": "Domain Re-Animator Bot",
1826
1652
  "url": "http://domainreanimator.com",
@@ -1828,8 +1654,7 @@
1828
1654
  "Domain Re-Animator Bot (http://domainreanimator.com) - support@domainreanimator.com"
1829
1655
  ],
1830
1656
  "addition_date": "2015/04/14"
1831
- }
1832
- ,
1657
+ },
1833
1658
  {
1834
1659
  "pattern": "AddThis",
1835
1660
  "url": "https://www.addthis.com",
@@ -1837,8 +1662,7 @@
1837
1662
  "AddThis.com robot tech.support@clearspring.com"
1838
1663
  ],
1839
1664
  "addition_date": "2015/06/02"
1840
- }
1841
- ,
1665
+ },
1842
1666
  {
1843
1667
  "pattern": "Screaming Frog SEO Spider",
1844
1668
  "url": "http://www.screamingfrog.co.uk/seo-spider",
@@ -1846,8 +1670,7 @@
1846
1670
  "Screaming Frog SEO Spider/5.1"
1847
1671
  ],
1848
1672
  "addition_date": "2016/01/08"
1849
- }
1850
- ,
1673
+ },
1851
1674
  {
1852
1675
  "pattern": "MetaURI",
1853
1676
  "url": "http://www.useragentstring.com/MetaURI_id_17683.php",
@@ -1855,8 +1678,7 @@
1855
1678
  "MetaURI API/2.0 +metauri.com"
1856
1679
  ],
1857
1680
  "addition_date": "2016/01/02"
1858
- }
1859
- ,
1681
+ },
1860
1682
  {
1861
1683
  "pattern": "Scrapy",
1862
1684
  "url": "http://scrapy.org/",
@@ -1864,8 +1686,7 @@
1864
1686
  "Scrapy/1.0.3 (+http://scrapy.org)"
1865
1687
  ],
1866
1688
  "addition_date": "2016/01/02"
1867
- }
1868
- ,
1689
+ },
1869
1690
  {
1870
1691
  "pattern": "Livelap[bB]ot",
1871
1692
  "url": "http://site.livelap.com/crawler",
@@ -1874,8 +1695,7 @@
1874
1695
  "Livelapbot/0.1"
1875
1696
  ],
1876
1697
  "addition_date": "2016/01/02"
1877
- }
1878
- ,
1698
+ },
1879
1699
  {
1880
1700
  "pattern": "OpenHoseBot",
1881
1701
  "url": "http://www.openhose.org/bot.html",
@@ -1883,8 +1703,7 @@
1883
1703
  "Mozilla/5.0 (compatible; OpenHoseBot/2.1; +http://www.openhose.org/bot.html)"
1884
1704
  ],
1885
1705
  "addition_date": "2016/01/02"
1886
- }
1887
- ,
1706
+ },
1888
1707
  {
1889
1708
  "pattern": "CapsuleChecker",
1890
1709
  "url": "http://www.capsulink.com/about",
@@ -1892,8 +1711,7 @@
1892
1711
  "CapsuleChecker (http://www.capsulink.com/)"
1893
1712
  ],
1894
1713
  "addition_date": "2016/01/02"
1895
- }
1896
- ,
1714
+ },
1897
1715
  {
1898
1716
  "pattern": "collection@infegy\\.com",
1899
1717
  "url": "http://infegy.com/",
@@ -1901,8 +1719,7 @@
1901
1719
  "Mozilla/5.0 (compatible) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/47.0.2526.73 Safari/537.36 collection@infegy.com"
1902
1720
  ],
1903
1721
  "addition_date": "2016/01/03"
1904
- }
1905
- ,
1722
+ },
1906
1723
  {
1907
1724
  "pattern": "IstellaBot",
1908
1725
  "url": "http://www.tiscali.it/",
@@ -1910,8 +1727,7 @@
1910
1727
  "Mozilla/5.0 (compatible; IstellaBot/1.23.15 +http://www.tiscali.it/)"
1911
1728
  ],
1912
1729
  "addition_date": "2016/01/09"
1913
- }
1914
- ,
1730
+ },
1915
1731
  {
1916
1732
  "pattern": "DeuSu\\/",
1917
1733
  "addition_date": "2016/01/23",
@@ -1920,14 +1736,12 @@
1920
1736
  "Mozilla/5.0 (compatible; DeuSu/0.1.0; +https://deusu.org)",
1921
1737
  "Mozilla/5.0 (compatible; DeuSu/5.0.2; +https://deusu.de/robot.html)"
1922
1738
  ]
1923
- }
1924
- ,
1739
+ },
1925
1740
  {
1926
1741
  "pattern": "betaBot",
1927
1742
  "addition_date": "2016/01/23",
1928
1743
  "instances": []
1929
- }
1930
- ,
1744
+ },
1931
1745
  {
1932
1746
  "pattern": "Cliqzbot\\/",
1933
1747
  "addition_date": "2016/01/23",
@@ -1939,8 +1753,7 @@
1939
1753
  "Mozilla/5.0 (compatible; Cliqzbot/0.1 +http://cliqz.com/company/cliqzbot)",
1940
1754
  "Mozilla/5.0 (compatible; Cliqzbot/1.0 +http://cliqz.com/company/cliqzbot)"
1941
1755
  ]
1942
- }
1943
- ,
1756
+ },
1944
1757
  {
1945
1758
  "pattern": "MojeekBot\\/",
1946
1759
  "addition_date": "2016/01/23",
@@ -1953,8 +1766,7 @@
1953
1766
  "Mozilla/5.0 (compatible; MojeekBot/0.6; +https://www.mojeek.com/bot.html)",
1954
1767
  "Mozilla/5.0 (compatible; MojeekBot/0.6; http://www.mojeek.com/bot.html)"
1955
1768
  ]
1956
- }
1957
- ,
1769
+ },
1958
1770
  {
1959
1771
  "pattern": "netEstate NE Crawler",
1960
1772
  "addition_date": "2016/01/23",
@@ -1963,8 +1775,7 @@
1963
1775
  "netEstate NE Crawler (+http://www.sengine.info/)",
1964
1776
  "netEstate NE Crawler (+http://www.website-datenbank.de/)"
1965
1777
  ]
1966
- }
1967
- ,
1778
+ },
1968
1779
  {
1969
1780
  "pattern": "SafeSearch microdata crawler",
1970
1781
  "addition_date": "2016/01/23",
@@ -1972,8 +1783,7 @@
1972
1783
  "instances": [
1973
1784
  "SafeSearch microdata crawler (https://safesearch.avira.com, safesearch-abuse@avira.com)"
1974
1785
  ]
1975
- }
1976
- ,
1786
+ },
1977
1787
  {
1978
1788
  "pattern": "Gluten Free Crawler\\/",
1979
1789
  "addition_date": "2016/01/23",
@@ -1981,8 +1791,7 @@
1981
1791
  "instances": [
1982
1792
  "Mozilla/5.0 (compatible; Gluten Free Crawler/1.0; +http://glutenfreepleasure.com/)"
1983
1793
  ]
1984
- }
1985
- ,
1794
+ },
1986
1795
  {
1987
1796
  "pattern": "Sonic",
1988
1797
  "addition_date": "2016/02/08",
@@ -1992,8 +1801,7 @@
1992
1801
  "Mozilla/5.0 (compatible; Sonic/1.0; http://www.yama.info.waseda.ac.jp/~crawler/info.html)",
1993
1802
  "Mozzila/5.0 (compatible; Sonic/1.0; http://www.yama.info.waseda.ac.jp/~crawler/info.html)"
1994
1803
  ]
1995
- }
1996
- ,
1804
+ },
1997
1805
  {
1998
1806
  "pattern": "Sysomos",
1999
1807
  "addition_date": "2016/02/08",
@@ -2001,15 +1809,13 @@
2001
1809
  "instances": [
2002
1810
  "Mozilla/5.0 (compatible; Sysomos/1.0; +http://www.sysomos.com/; Sysomos)"
2003
1811
  ]
2004
- }
2005
- ,
1812
+ },
2006
1813
  {
2007
1814
  "pattern": "Trove",
2008
1815
  "addition_date": "2016/02/08",
2009
1816
  "url": "http://www.trove.com",
2010
1817
  "instances": []
2011
- }
2012
- ,
1818
+ },
2013
1819
  {
2014
1820
  "pattern": "deadlinkchecker",
2015
1821
  "addition_date": "2016/02/08",
@@ -2019,8 +1825,7 @@
2019
1825
  "www.deadlinkchecker.com XMLHTTP/1.0",
2020
1826
  "www.deadlinkchecker.com XMLHTTP/1.0 Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/46.0.2490.86 Safari/537.36"
2021
1827
  ]
2022
- }
2023
- ,
1828
+ },
2024
1829
  {
2025
1830
  "pattern": "Slack-ImgProxy",
2026
1831
  "addition_date": "2016/04/25",
@@ -2033,8 +1838,7 @@
2033
1838
  "Slack-ImgProxy 1.138 (+https://api.slack.com/robots)",
2034
1839
  "Slack-ImgProxy 149 (+https://api.slack.com/robots)"
2035
1840
  ]
2036
- }
2037
- ,
1841
+ },
2038
1842
  {
2039
1843
  "pattern": "Embedly",
2040
1844
  "addition_date": "2016/04/25",
@@ -2044,8 +1848,7 @@
2044
1848
  "Mozilla/5.0 (compatible; Embedly/0.2; +http://support.embed.ly/)",
2045
1849
  "Mozilla/5.0 (compatible; Embedly/0.2; snap; +http://support.embed.ly/)"
2046
1850
  ]
2047
- }
2048
- ,
1851
+ },
2049
1852
  {
2050
1853
  "pattern": "RankActiveLinkBot",
2051
1854
  "addition_date": "2016/06/20",
@@ -2053,8 +1856,7 @@
2053
1856
  "instances": [
2054
1857
  "Mozilla/5.0 (compatible; RankActiveLinkBot; +https://rankactive.com/resources/rankactive-linkbot)"
2055
1858
  ]
2056
- }
2057
- ,
1859
+ },
2058
1860
  {
2059
1861
  "pattern": "iskanie",
2060
1862
  "addition_date": "2016/09/02",
@@ -2062,8 +1864,7 @@
2062
1864
  "instances": [
2063
1865
  "iskanie (+http://www.iskanie.com)"
2064
1866
  ]
2065
- }
2066
- ,
1867
+ },
2067
1868
  {
2068
1869
  "pattern": "SafeDNSBot",
2069
1870
  "addition_date": "2016/09/10",
@@ -2071,16 +1872,14 @@
2071
1872
  "instances": [
2072
1873
  "SafeDNSBot (https://www.safedns.com/searchbot)"
2073
1874
  ]
2074
- }
2075
- ,
1875
+ },
2076
1876
  {
2077
1877
  "pattern": "SkypeUriPreview",
2078
1878
  "addition_date": "2016/10/10",
2079
1879
  "instances": [
2080
1880
  "Mozilla/5.0 (Windows NT 6.1; WOW64) SkypeUriPreview Preview/0.5"
2081
1881
  ]
2082
- }
2083
- ,
1882
+ },
2084
1883
  {
2085
1884
  "pattern": "Veoozbot",
2086
1885
  "addition_date": "2016/11/03",
@@ -2088,8 +1887,7 @@
2088
1887
  "instances": [
2089
1888
  "Mozilla/5.0 (compatible; Veoozbot/1.0; +http://www.veooz.com/veoozbot.html)"
2090
1889
  ]
2091
- }
2092
- ,
1890
+ },
2093
1891
  {
2094
1892
  "pattern": "Slackbot",
2095
1893
  "addition_date": "2016/11/03",
@@ -2099,8 +1897,7 @@
2099
1897
  "Slackbot-LinkExpanding 1.0 (+https://api.slack.com/robots)",
2100
1898
  "Slackbot 1.0 (+https://api.slack.com/robots)"
2101
1899
  ]
2102
- }
2103
- ,
1900
+ },
2104
1901
  {
2105
1902
  "pattern": "redditbot",
2106
1903
  "addition_date": "2016/11/03",
@@ -2108,8 +1905,7 @@
2108
1905
  "instances": [
2109
1906
  "Mozilla/5.0 (compatible; redditbot/1.0; +http://www.reddit.com/feedback)"
2110
1907
  ]
2111
- }
2112
- ,
1908
+ },
2113
1909
  {
2114
1910
  "pattern": "datagnionbot",
2115
1911
  "addition_date": "2016/11/03",
@@ -2117,8 +1913,7 @@
2117
1913
  "instances": [
2118
1914
  "datagnionbot (+http://www.datagnion.com/bot.html)"
2119
1915
  ]
2120
- }
2121
- ,
1916
+ },
2122
1917
  {
2123
1918
  "pattern": "Google-Adwords-Instant",
2124
1919
  "addition_date": "2016/11/03",
@@ -2126,8 +1921,7 @@
2126
1921
  "instances": [
2127
1922
  "Google-Adwords-Instant (+http://www.google.com/adsbot.html)"
2128
1923
  ]
2129
- }
2130
- ,
1924
+ },
2131
1925
  {
2132
1926
  "pattern": "adbeat_bot",
2133
1927
  "addition_date": "2016/11/04",
@@ -2135,8 +1929,7 @@
2135
1929
  "Mozilla/5.0 (compatible; adbeat_bot; +support@adbeat.com; support@adbeat.com)",
2136
1930
  "adbeat_bot"
2137
1931
  ]
2138
- }
2139
- ,
1932
+ },
2140
1933
  {
2141
1934
  "pattern": "WhatsApp",
2142
1935
  "addition_date": "2016/11/15",
@@ -2168,16 +1961,14 @@
2168
1961
  "WhatsApp/2.19.308 A",
2169
1962
  "WhatsApp/2.19.330 A"
2170
1963
  ]
2171
- }
2172
- ,
1964
+ },
2173
1965
  {
2174
1966
  "pattern": "contxbot",
2175
1967
  "addition_date": "2017/02/25",
2176
1968
  "instances": [
2177
1969
  "Mozilla/5.0 (compatible;contxbot/1.0)"
2178
1970
  ]
2179
- }
2180
- ,
1971
+ },
2181
1972
  {
2182
1973
  "pattern": "pinterest\\.com\\/bot",
2183
1974
  "addition_date": "2017/03/03",
@@ -2186,8 +1977,7 @@
2186
1977
  "Pinterest/0.2 (+http://www.pinterest.com/bot.html)"
2187
1978
  ],
2188
1979
  "url": "http://www.pinterest.com/bot.html"
2189
- }
2190
- ,
1980
+ },
2191
1981
  {
2192
1982
  "pattern": "electricmonk",
2193
1983
  "addition_date": "2017/03/04",
@@ -2195,8 +1985,7 @@
2195
1985
  "Mozilla/5.0 (compatible; electricmonk/3.2.0 +https://www.duedil.com/our-crawler/)"
2196
1986
  ],
2197
1987
  "url": "https://www.duedil.com/our-crawler/"
2198
- }
2199
- ,
1988
+ },
2200
1989
  {
2201
1990
  "pattern": "GarlikCrawler",
2202
1991
  "addition_date": "2017/03/18",
@@ -2204,8 +1993,7 @@
2204
1993
  "GarlikCrawler/1.2 (http://garlik.com/, crawler@garlik.com)"
2205
1994
  ],
2206
1995
  "url": "http://garlik.com/"
2207
- }
2208
- ,
1996
+ },
2209
1997
  {
2210
1998
  "pattern": "BingPreview\\/",
2211
1999
  "addition_date": "2017/04/23",
@@ -2217,8 +2005,7 @@
2217
2005
  "Mozilla/5.0 (compatible; MSIE 9.0; Windows NT 6.1; Trident/5.0; WOW64; Trident/5.0; BingPreview/1.0b)",
2218
2006
  "Mozilla/5.0 (iPhone; CPU iPhone OS 7_0 like Mac OS X) AppleWebKit/537.51.1 (KHTML, like Gecko) Version/7.0 Mobile/11A465 Safari/9537.53 BingPreview/1.0b"
2219
2007
  ]
2220
- }
2221
- ,
2008
+ },
2222
2009
  {
2223
2010
  "pattern": "vebidoobot",
2224
2011
  "addition_date": "2017/05/08",
@@ -2226,8 +2013,7 @@
2226
2013
  "Mozilla/5.0 (compatible; vebidoobot/1.0; +https://blog.vebidoo.de/vebidoobot/"
2227
2014
  ],
2228
2015
  "url": "https://blog.vebidoo.de/vebidoobot/"
2229
- }
2230
- ,
2016
+ },
2231
2017
  {
2232
2018
  "pattern": "FemtosearchBot",
2233
2019
  "addition_date": "2017/05/16",
@@ -2235,8 +2021,7 @@
2235
2021
  "Mozilla/5.0 (compatible; FemtosearchBot/1.0; http://femtosearch.com)"
2236
2022
  ],
2237
2023
  "url": "http://femtosearch.com"
2238
- }
2239
- ,
2024
+ },
2240
2025
  {
2241
2026
  "pattern": "Yahoo Link Preview",
2242
2027
  "addition_date": "2017/06/28",
@@ -2244,8 +2029,7 @@
2244
2029
  "Mozilla/5.0 (compatible; Yahoo Link Preview; https://help.yahoo.com/kb/mail/yahoo-link-preview-SLN23615.html)"
2245
2030
  ],
2246
2031
  "url": "https://help.yahoo.com/kb/mail/yahoo-link-preview-SLN23615.html"
2247
- }
2248
- ,
2032
+ },
2249
2033
  {
2250
2034
  "pattern": "MetaJobBot",
2251
2035
  "addition_date": "2017/08/16",
@@ -2253,8 +2037,7 @@
2253
2037
  "Mozilla/5.0 (compatible; MetaJobBot; http://www.metajob.de/crawler)"
2254
2038
  ],
2255
2039
  "url": "http://www.metajob.de/the/crawler"
2256
- }
2257
- ,
2040
+ },
2258
2041
  {
2259
2042
  "pattern": "DomainStatsBot",
2260
2043
  "addition_date": "2017/08/16",
@@ -2262,8 +2045,7 @@
2262
2045
  "DomainStatsBot/1.0 (http://domainstats.io/our-bot)"
2263
2046
  ],
2264
2047
  "url": "http://domainstats.io/our-bot"
2265
- }
2266
- ,
2048
+ },
2267
2049
  {
2268
2050
  "pattern": "mindUpBot",
2269
2051
  "addition_date": "2017/08/16",
@@ -2271,8 +2053,7 @@
2271
2053
  "mindUpBot (datenbutler.de)"
2272
2054
  ],
2273
2055
  "url": "http://www.datenbutler.de/"
2274
- }
2275
- ,
2056
+ },
2276
2057
  {
2277
2058
  "pattern": "Daum\\/",
2278
2059
  "addition_date": "2017/08/16",
@@ -2280,8 +2061,7 @@
2280
2061
  "Mozilla/5.0 (compatible; Daum/4.1; +http://cs.daum.net/faq/15/4118.html?faqId=28966)"
2281
2062
  ],
2282
2063
  "url": "http://cs.daum.net/faq/15/4118.html?faqId=28966"
2283
- }
2284
- ,
2064
+ },
2285
2065
  {
2286
2066
  "pattern": "Jugendschutzprogramm-Crawler",
2287
2067
  "addition_date": "2017/08/16",
@@ -2289,8 +2069,7 @@
2289
2069
  "Jugendschutzprogramm-Crawler; Info: http://www.jugendschutzprogramm.de"
2290
2070
  ],
2291
2071
  "url": "http://www.jugendschutzprogramm.de"
2292
- }
2293
- ,
2072
+ },
2294
2073
  {
2295
2074
  "pattern": "Xenu Link Sleuth",
2296
2075
  "addition_date": "2017/08/19",
@@ -2298,8 +2077,7 @@
2298
2077
  "Xenu Link Sleuth/1.3.8"
2299
2078
  ],
2300
2079
  "url": "http://home.snafu.de/tilman/xenulink.html"
2301
- }
2302
- ,
2080
+ },
2303
2081
  {
2304
2082
  "pattern": "Pcore-HTTP",
2305
2083
  "addition_date": "2017/08/19",
@@ -2308,8 +2086,7 @@
2308
2086
  "Pcore-HTTP/v0.44.0"
2309
2087
  ],
2310
2088
  "url": "https://bitbucket.org/softvisio/pcore/overview"
2311
- }
2312
- ,
2089
+ },
2313
2090
  {
2314
2091
  "pattern": "moatbot",
2315
2092
  "addition_date": "2017/09/16",
@@ -2318,8 +2095,7 @@
2318
2095
  "Mozilla/5.0 (iPhone; CPU iPhone OS 8_0 like Mac OS X) AppleWebKit/600.1.3 (KHTML, like Gecko) Version/8.0 Mobile/12A4345d Safari/600.1.4 moatbot"
2319
2096
  ],
2320
2097
  "url": "https://moat.com"
2321
- }
2322
- ,
2098
+ },
2323
2099
  {
2324
2100
  "pattern": "KosmioBot",
2325
2101
  "addition_date": "2017/09/16",
@@ -2327,8 +2103,7 @@
2327
2103
  "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_10_2) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/44.0.2403.125 Safari/537.36 (compatible; KosmioBot/1.0; +http://kosm.io/bot.html)"
2328
2104
  ],
2329
2105
  "url": "http://kosm.io/bot.html"
2330
- }
2331
- ,
2106
+ },
2332
2107
  {
2333
2108
  "pattern": "[pP]ingdom",
2334
2109
  "addition_date": "2017/09/16",
@@ -2344,8 +2119,7 @@
2344
2119
  "Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Ubuntu Chromium/61.0.3163.100 Chrome/61.0.3163.100 Safari/537.36 PingdomPageSpeed/1.0 (pingbot/2.0; http://www.pingdom.com/)"
2345
2120
  ],
2346
2121
  "url": "http://www.pingdom.com"
2347
- }
2348
- ,
2122
+ },
2349
2123
  {
2350
2124
  "pattern": "AppInsights",
2351
2125
  "addition_date": "2019/03/09",
@@ -2353,8 +2127,7 @@
2353
2127
  "Mozilla/5.0 (compatible; MSIE 9.0; Windows NT 6.1; Trident/5.0; AppInsights)"
2354
2128
  ],
2355
2129
  "url": "https://docs.microsoft.com/en-us/azure/azure-monitor/app/app-insights-overview"
2356
- }
2357
- ,
2130
+ },
2358
2131
  {
2359
2132
  "pattern": "PhantomJS",
2360
2133
  "addition_date": "2017/09/18",
@@ -2362,8 +2135,7 @@
2362
2135
  "Mozilla/5.0 (Unknown; Linux x86_64) AppleWebKit/538.1 (KHTML, like Gecko) PhantomJS/2.1.1 Safari/538.1 bl.uk_lddc_renderbot/2.0.0 (+ http://www.bl.uk/aboutus/legaldeposit/websites/websites/faqswebmaster/index.html)"
2363
2136
  ],
2364
2137
  "url": "http://phantomjs.org/"
2365
- }
2366
- ,
2138
+ },
2367
2139
  {
2368
2140
  "pattern": "Gowikibot",
2369
2141
  "addition_date": "2017/10/26",
@@ -2371,8 +2143,7 @@
2371
2143
  "Mozilla/5.0 (compatible; Gowikibot/1.0; +http://www.gowikibot.com)"
2372
2144
  ],
2373
2145
  "url": "http://www.gowikibot.com"
2374
- }
2375
- ,
2146
+ },
2376
2147
  {
2377
2148
  "pattern": "PiplBot",
2378
2149
  "addition_date": "2017/10/30",
@@ -2381,8 +2152,7 @@
2381
2152
  "Mozilla/5.0+(compatible;+PiplBot;+http://www.pipl.com/bot/)"
2382
2153
  ],
2383
2154
  "url": "http://www.pipl.com/bot/"
2384
- }
2385
- ,
2155
+ },
2386
2156
  {
2387
2157
  "pattern": "Discordbot",
2388
2158
  "addition_date": "2017/09/22",
@@ -2390,16 +2160,14 @@
2390
2160
  "instances": [
2391
2161
  "Mozilla/5.0 (compatible; Discordbot/2.0; +https://discordapp.com)"
2392
2162
  ]
2393
- }
2394
- ,
2163
+ },
2395
2164
  {
2396
2165
  "pattern": "TelegramBot",
2397
2166
  "addition_date": "2017/10/01",
2398
2167
  "instances": [
2399
2168
  "TelegramBot (like TwitterBot)"
2400
2169
  ]
2401
- }
2402
- ,
2170
+ },
2403
2171
  {
2404
2172
  "pattern": "Jetslide",
2405
2173
  "addition_date": "2017/09/27",
@@ -2407,8 +2175,7 @@
2407
2175
  "instances": [
2408
2176
  "Mozilla/5.0 (compatible; Jetslide; +http://jetsli.de/crawler)"
2409
2177
  ]
2410
- }
2411
- ,
2178
+ },
2412
2179
  {
2413
2180
  "pattern": "newsharecounts",
2414
2181
  "addition_date": "2017/09/30",
@@ -2416,8 +2183,7 @@
2416
2183
  "instances": [
2417
2184
  "Mozilla/5.0 (compatible; NewShareCounts.com/1.0; +http://newsharecounts.com/crawler)"
2418
2185
  ]
2419
- }
2420
- ,
2186
+ },
2421
2187
  {
2422
2188
  "pattern": "James BOT",
2423
2189
  "addition_date": "2017/10/12",
@@ -2425,8 +2191,7 @@
2425
2191
  "instances": [
2426
2192
  "Mozilla/5.0 (Windows; U; Windows NT 5.1; en-US; rv:1.8.1.6) Gecko/20070725 Firefox/2.0.0.6 - James BOT - WebCrawler http://cognitiveseo.com/bot.html"
2427
2193
  ]
2428
- }
2429
- ,
2194
+ },
2430
2195
  {
2431
2196
  "pattern": "Bark[rR]owler",
2432
2197
  "addition_date": "2017/10/09",
@@ -2437,8 +2202,7 @@
2437
2202
  "BarkRowler/0.7 (+http://www.exensa.com/crawling)",
2438
2203
  "Barkrowler/0.9 (+http://www.exensa.com/crawl)"
2439
2204
  ]
2440
- }
2441
- ,
2205
+ },
2442
2206
  {
2443
2207
  "pattern": "TinEye",
2444
2208
  "addition_date": "2017/10/14",
@@ -2447,8 +2211,7 @@
2447
2211
  "Mozilla/5.0 (compatible; TinEye-bot/1.31; +http://www.tineye.com/crawler.html)",
2448
2212
  "TinEye/1.1 (http://tineye.com/crawler.html)"
2449
2213
  ]
2450
- }
2451
- ,
2214
+ },
2452
2215
  {
2453
2216
  "pattern": "SocialRankIOBot",
2454
2217
  "addition_date": "2017/10/19",
@@ -2456,8 +2219,7 @@
2456
2219
  "instances": [
2457
2220
  "SocialRankIOBot; http://socialrank.io/about"
2458
2221
  ]
2459
- }
2460
- ,
2222
+ },
2461
2223
  {
2462
2224
  "pattern": "trendictionbot",
2463
2225
  "addition_date": "2017/10/30",
@@ -2466,16 +2228,14 @@
2466
2228
  "Mozilla/5.0 (Windows; U; Windows NT 6.0; en-GB; rv:1.0; trendictionbot0.5.0; trendiction search; http://www.trendiction.de/bot; please let us know of any problems; web at trendiction.com) Gecko/20071127 Firefox/3.0.0.11",
2467
2229
  "Mozilla/5.0 (Windows NT 10.0; Win64; x64; trendictionbot0.5.0; trendiction search; http://www.trendiction.de/bot; please let us know of any problems; web at trendiction.com) Gecko/20170101 Firefox/67.0"
2468
2230
  ]
2469
- }
2470
- ,
2231
+ },
2471
2232
  {
2472
2233
  "pattern": "Ocarinabot",
2473
2234
  "addition_date": "2017/09/27",
2474
2235
  "instances": [
2475
2236
  "Ocarinabot"
2476
2237
  ]
2477
- }
2478
- ,
2238
+ },
2479
2239
  {
2480
2240
  "pattern": "epicbot",
2481
2241
  "addition_date": "2017/10/31",
@@ -2483,8 +2243,7 @@
2483
2243
  "instances": [
2484
2244
  "Mozilla/5.0 (compatible; epicbot; +http://www.epictions.com/epicbot)"
2485
2245
  ]
2486
- }
2487
- ,
2246
+ },
2488
2247
  {
2489
2248
  "pattern": "Primalbot",
2490
2249
  "addition_date": "2017/09/27",
@@ -2492,8 +2251,7 @@
2492
2251
  "instances": [
2493
2252
  "Mozilla/5.0 (compatible; Primalbot; +https://www.primal.com;)"
2494
2253
  ]
2495
- }
2496
- ,
2254
+ },
2497
2255
  {
2498
2256
  "pattern": "DuckDuckGo-Favicons-Bot",
2499
2257
  "addition_date": "2017/10/06",
@@ -2501,8 +2259,7 @@
2501
2259
  "instances": [
2502
2260
  "Mozilla/5.0 (compatible; DuckDuckGo-Favicons-Bot/1.0; +http://duckduckgo.com)"
2503
2261
  ]
2504
- }
2505
- ,
2262
+ },
2506
2263
  {
2507
2264
  "pattern": "GnowitNewsbot",
2508
2265
  "addition_date": "2017/10/30",
@@ -2510,8 +2267,7 @@
2510
2267
  "instances": [
2511
2268
  "Mozilla/5.0 (X11; Ubuntu; Linux x86_64; rv:49.0) Gecko/20100101 Firefox/49.0 / GnowitNewsbot / Contact information at http://www.gnowit.com"
2512
2269
  ]
2513
- }
2514
- ,
2270
+ },
2515
2271
  {
2516
2272
  "pattern": "Leikibot",
2517
2273
  "addition_date": "2017/09/24",
@@ -2519,16 +2275,15 @@
2519
2275
  "instances": [
2520
2276
  "Mozilla/5.0 (Windows NT 6.3;compatible; Leikibot/1.0; +http://www.leiki.com)"
2521
2277
  ]
2522
- }
2523
- ,
2278
+ },
2524
2279
  {
2525
2280
  "pattern": "LinkArchiver",
2526
2281
  "addition_date": "2017/09/24",
2282
+ "url": "https://github.com/thisisparker/linkarchiver",
2527
2283
  "instances": [
2528
2284
  "@LinkArchiver twitter bot"
2529
2285
  ]
2530
- }
2531
- ,
2286
+ },
2532
2287
  {
2533
2288
  "pattern": "YaK\\/",
2534
2289
  "addition_date": "2017/09/25",
@@ -2536,8 +2291,7 @@
2536
2291
  "instances": [
2537
2292
  "Mozilla/5.0 (compatible; YaK/1.0; http://linkfluence.com/; bot@linkfluence.com)"
2538
2293
  ]
2539
- }
2540
- ,
2294
+ },
2541
2295
  {
2542
2296
  "pattern": "PaperLiBot",
2543
2297
  "addition_date": "2017/09/25",
@@ -2545,10 +2299,8 @@
2545
2299
  "instances": [
2546
2300
  "Mozilla/5.0 (compatible; PaperLiBot/2.1; http://support.paper.li/entries/20023257-what-is-paper-li)",
2547
2301
  "Mozilla/5.0 (compatible; PaperLiBot/2.1; https://support.paper.li/entries/20023257-what-is-paper-li)"
2548
-
2549
2302
  ]
2550
- }
2551
- ,
2303
+ },
2552
2304
  {
2553
2305
  "pattern": "Digg Deeper",
2554
2306
  "addition_date": "2017/09/26",
@@ -2556,16 +2308,15 @@
2556
2308
  "instances": [
2557
2309
  "Digg Deeper/v1 (http://digg.com/about)"
2558
2310
  ]
2559
- }
2560
- ,
2311
+ },
2561
2312
  {
2562
2313
  "pattern": "dcrawl",
2563
2314
  "addition_date": "2017/09/22",
2315
+ "url": "https://github.com/kgretzky/dcrawl",
2564
2316
  "instances": [
2565
2317
  "dcrawl/1.0"
2566
2318
  ]
2567
- }
2568
- ,
2319
+ },
2569
2320
  {
2570
2321
  "pattern": "Snacktory",
2571
2322
  "addition_date": "2017/09/23",
@@ -2573,8 +2324,7 @@
2573
2324
  "instances": [
2574
2325
  "Mozilla/5.0 (compatible; Snacktory; +https://github.com/karussell/snacktory)"
2575
2326
  ]
2576
- }
2577
- ,
2327
+ },
2578
2328
  {
2579
2329
  "pattern": "AndersPinkBot",
2580
2330
  "addition_date": "2017/09/24",
@@ -2582,16 +2332,14 @@
2582
2332
  "instances": [
2583
2333
  "Mozilla/5.0 (compatible; AndersPinkBot/1.0; +http://anderspink.com/bot.html)"
2584
2334
  ]
2585
- }
2586
- ,
2335
+ },
2587
2336
  {
2588
2337
  "pattern": "Fyrebot",
2589
2338
  "addition_date": "2017/09/22",
2590
2339
  "instances": [
2591
2340
  "Fyrebot/1.0"
2592
2341
  ]
2593
- }
2594
- ,
2342
+ },
2595
2343
  {
2596
2344
  "pattern": "EveryoneSocialBot",
2597
2345
  "addition_date": "2017/09/22",
@@ -2599,8 +2347,7 @@
2599
2347
  "instances": [
2600
2348
  "Mozilla/5.0 (compatible; EveryoneSocialBot/1.0; support@everyonesocial.com http://everyonesocial.com/)"
2601
2349
  ]
2602
- }
2603
- ,
2350
+ },
2604
2351
  {
2605
2352
  "pattern": "Mediatoolkitbot",
2606
2353
  "addition_date": "2017/10/06",
@@ -2608,16 +2355,14 @@
2608
2355
  "instances": [
2609
2356
  "Mediatoolkitbot (complaints@mediatoolkit.com)"
2610
2357
  ]
2611
- }
2612
- ,
2358
+ },
2613
2359
  {
2614
2360
  "pattern": "Luminator-robots",
2615
2361
  "addition_date": "2017/09/22",
2616
2362
  "instances": [
2617
2363
  "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_8_2) AppleWebKit/537.13 (KHTML, like Gecko) Chrome/30.0.1599.66 Safari/537.13 Luminator-robots/2.0"
2618
2364
  ]
2619
- }
2620
- ,
2365
+ },
2621
2366
  {
2622
2367
  "pattern": "ExtLinksBot",
2623
2368
  "addition_date": "2017/11/02",
@@ -2625,24 +2370,21 @@
2625
2370
  "instances": [
2626
2371
  "Mozilla/5.0 (compatible; ExtLinksBot/1.5 +https://extlinks.com/Bot.html)"
2627
2372
  ]
2628
- }
2629
- ,
2373
+ },
2630
2374
  {
2631
2375
  "pattern": "SurveyBot",
2632
2376
  "addition_date": "2017/11/02",
2633
2377
  "instances": [
2634
2378
  "Mozilla/5.0 (Windows; U; Windows NT 5.1; en; rv:1.9.0.13) Gecko/2009073022 Firefox/3.5.2 (.NET CLR 3.5.30729) SurveyBot/2.3 (DomainTools)"
2635
2379
  ]
2636
- }
2637
- ,
2380
+ },
2638
2381
  {
2639
2382
  "pattern": "NING\\/",
2640
2383
  "addition_date": "2017/11/02",
2641
2384
  "instances": [
2642
2385
  "NING/1.0"
2643
2386
  ]
2644
- }
2645
- ,
2387
+ },
2646
2388
  {
2647
2389
  "pattern": "okhttp",
2648
2390
  "addition_date": "2017/11/02",
@@ -2653,16 +2395,14 @@
2653
2395
  "okhttp/3.5.0",
2654
2396
  "okhttp/4.1.0"
2655
2397
  ]
2656
- }
2657
- ,
2398
+ },
2658
2399
  {
2659
2400
  "pattern": "Nuzzel",
2660
2401
  "addition_date": "2017/11/02",
2661
2402
  "instances": [
2662
2403
  "Nuzzel"
2663
2404
  ]
2664
- }
2665
- ,
2405
+ },
2666
2406
  {
2667
2407
  "pattern": "omgili",
2668
2408
  "addition_date": "2017/11/02",
@@ -2670,8 +2410,7 @@
2670
2410
  "instances": [
2671
2411
  "omgili/0.5 +http://omgili.com"
2672
2412
  ]
2673
- }
2674
- ,
2413
+ },
2675
2414
  {
2676
2415
  "pattern": "PocketParser",
2677
2416
  "addition_date": "2017/11/02",
@@ -2679,8 +2418,7 @@
2679
2418
  "instances": [
2680
2419
  "PocketParser/2.0 (+https://getpocket.com/pocketparser_ua)"
2681
2420
  ]
2682
- }
2683
- ,
2421
+ },
2684
2422
  {
2685
2423
  "pattern": "YisouSpider",
2686
2424
  "addition_date": "2017/11/02",
@@ -2688,16 +2426,14 @@
2688
2426
  "YisouSpider",
2689
2427
  "Mozilla/5.0 (Windows NT 6.1; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/69.0.3497.81 YisouSpider/5.0 Safari/537.36"
2690
2428
  ]
2691
- }
2692
- ,
2429
+ },
2693
2430
  {
2694
2431
  "pattern": "um-LN",
2695
2432
  "addition_date": "2017/11/02",
2696
2433
  "instances": [
2697
2434
  "Mozilla/5.0 (compatible; um-LN/1.0; mailto: techinfo@ubermetrics-technologies.com)"
2698
2435
  ]
2699
- }
2700
- ,
2436
+ },
2701
2437
  {
2702
2438
  "pattern": "ToutiaoSpider",
2703
2439
  "addition_date": "2017/11/02",
@@ -2705,8 +2441,7 @@
2705
2441
  "instances": [
2706
2442
  "Mozilla/5.0 (compatible; ToutiaoSpider/1.0; http://web.toutiao.com/media_cooperation/;)"
2707
2443
  ]
2708
- }
2709
- ,
2444
+ },
2710
2445
  {
2711
2446
  "pattern": "MuckRack",
2712
2447
  "addition_date": "2017/11/02",
@@ -2714,8 +2449,7 @@
2714
2449
  "instances": [
2715
2450
  "Mozilla/5.0 (compatible; MuckRack/1.0; +http://muckrack.com)"
2716
2451
  ]
2717
- }
2718
- ,
2452
+ },
2719
2453
  {
2720
2454
  "pattern": "Jamie's Spider",
2721
2455
  "addition_date": "2017/11/02",
@@ -2723,32 +2457,29 @@
2723
2457
  "instances": [
2724
2458
  "Jamie's Spider (http://jamiembrown.com/)"
2725
2459
  ]
2726
- }
2727
- ,
2460
+ },
2728
2461
  {
2729
2462
  "pattern": "AHC\\/",
2730
2463
  "addition_date": "2017/11/02",
2464
+ "url": "https://github.com/AsyncHttpClient/async-http-client",
2731
2465
  "instances": [
2732
2466
  "AHC/2.0"
2733
2467
  ]
2734
- }
2735
- ,
2468
+ },
2736
2469
  {
2737
2470
  "pattern": "NetcraftSurveyAgent",
2738
2471
  "addition_date": "2017/11/02",
2739
2472
  "instances": [
2740
2473
  "Mozilla/5.0 (compatible; NetcraftSurveyAgent/1.0; +info@netcraft.com)"
2741
2474
  ]
2742
- }
2743
- ,
2475
+ },
2744
2476
  {
2745
2477
  "pattern": "Laserlikebot",
2746
2478
  "addition_date": "2017/11/02",
2747
2479
  "instances": [
2748
2480
  "Mozilla/5.0 (iPhone; CPU iPhone OS 8_3 like Mac OS X) AppleWebKit/600.1.4 (KHTML, like Gecko) Version/8.0 Mobile/12F70 Safari/600.1.4 (compatible; Laserlikebot/0.1)"
2749
2481
  ]
2750
- }
2751
- ,
2482
+ },
2752
2483
  {
2753
2484
  "pattern": "^Apache-HttpClient",
2754
2485
  "addition_date": "2017/11/02",
@@ -2768,8 +2499,7 @@
2768
2499
  "Apache-HttpClient/4.5.7 (Java/11.0.3)",
2769
2500
  "Apache-HttpClient/4.5.10 (Java/1.8.0_201)"
2770
2501
  ]
2771
- }
2772
- ,
2502
+ },
2773
2503
  {
2774
2504
  "pattern": "AppEngine-Google",
2775
2505
  "addition_date": "2017/11/02",
@@ -2777,24 +2507,21 @@
2777
2507
  "AppEngine-Google; (+http://code.google.com/appengine; appid: example)",
2778
2508
  "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_13_4) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/65.0.3325.181 Safari/537.36 AppEngine-Google; (+http://code.google.com/appengine; appid: s~feedly-nikon3)"
2779
2509
  ]
2780
- }
2781
- ,
2510
+ },
2782
2511
  {
2783
2512
  "pattern": "Jetty",
2784
2513
  "addition_date": "2017/11/02",
2785
2514
  "instances": [
2786
2515
  "Jetty/9.3.z-SNAPSHOT"
2787
2516
  ]
2788
- }
2789
- ,
2517
+ },
2790
2518
  {
2791
2519
  "pattern": "Upflow",
2792
2520
  "addition_date": "2017/11/02",
2793
2521
  "instances": [
2794
2522
  "Upflow/1.0"
2795
2523
  ]
2796
- }
2797
- ,
2524
+ },
2798
2525
  {
2799
2526
  "pattern": "Thinklab",
2800
2527
  "addition_date": "2017/11/02",
@@ -2802,17 +2529,15 @@
2802
2529
  "instances": [
2803
2530
  "Thinklab (thinklab.com)"
2804
2531
  ]
2805
- }
2806
- ,
2532
+ },
2807
2533
  {
2808
2534
  "pattern": "Traackr\\.com",
2809
2535
  "addition_date": "2017/11/02",
2810
- "url": "Traackr.com",
2536
+ "url": "https://www.traackr.com/",
2811
2537
  "instances": [
2812
2538
  "Traackr.com"
2813
2539
  ]
2814
- }
2815
- ,
2540
+ },
2816
2541
  {
2817
2542
  "pattern": "Twurly",
2818
2543
  "addition_date": "2017/11/02",
@@ -2820,56 +2545,49 @@
2820
2545
  "instances": [
2821
2546
  "Ruby, Twurly v1.1 (http://twurly.org)"
2822
2547
  ]
2823
- }
2824
- ,
2548
+ },
2825
2549
  {
2826
2550
  "pattern": "Mastodon",
2827
2551
  "addition_date": "2017/11/02",
2828
2552
  "instances": [
2829
2553
  "http.rb/2.2.2 (Mastodon/1.5.1; +https://example-masto-instance.org/)"
2830
2554
  ]
2831
- }
2832
- ,
2555
+ },
2833
2556
  {
2834
2557
  "pattern": "http_get",
2835
2558
  "addition_date": "2017/11/02",
2836
2559
  "instances": [
2837
2560
  "http_get"
2838
2561
  ]
2839
- }
2840
- ,
2562
+ },
2841
2563
  {
2842
2564
  "pattern": "DnyzBot",
2843
2565
  "addition_date": "2017/11/20",
2844
2566
  "instances": [
2845
2567
  "Mozilla/5.0 (compatible; DnyzBot/1.0)"
2846
2568
  ]
2847
- }
2848
- ,
2569
+ },
2849
2570
  {
2850
2571
  "pattern": "botify",
2851
2572
  "addition_date": "2018/02/01",
2852
2573
  "instances": [
2853
2574
  "Mozilla/5.0 (compatible; botify; http://botify.com)"
2854
2575
  ]
2855
- }
2856
- ,
2576
+ },
2857
2577
  {
2858
2578
  "pattern": "007ac9 Crawler",
2859
2579
  "addition_date": "2018/02/09",
2860
2580
  "instances": [
2861
2581
  "Mozilla/5.0 (compatible; 007ac9 Crawler; http://crawler.007ac9.net/)"
2862
2582
  ]
2863
- }
2864
- ,
2583
+ },
2865
2584
  {
2866
2585
  "pattern": "BehloolBot",
2867
2586
  "addition_date": "2018/02/09",
2868
2587
  "instances": [
2869
2588
  "Mozilla/5.0 (compatible; BehloolBot/beta; +http://www.webeaver.com/bot)"
2870
2589
  ]
2871
- }
2872
- ,
2590
+ },
2873
2591
  {
2874
2592
  "pattern": "BrandVerity",
2875
2593
  "addition_date": "2018/02/27",
@@ -2878,16 +2596,14 @@
2878
2596
  "Mozilla/5.0 (iPhone; CPU iPhone OS 7_0 like Mac OS X) AppleWebKit/537.51.1 (KHTML, like Gecko) Mobile/11A465 Twitter for iPhone BrandVerity/1.0 (http://www.brandverity.com/why-is-brandverity-visiting-me)"
2879
2597
  ],
2880
2598
  "url": "http://www.brandverity.com/why-is-brandverity-visiting-me"
2881
- }
2882
- ,
2599
+ },
2883
2600
  {
2884
2601
  "pattern": "check_http",
2885
2602
  "addition_date": "2018/02/09",
2886
2603
  "instances": [
2887
2604
  "check_http/v2.2.1 (nagios-plugins 2.2.1)"
2888
2605
  ]
2889
- }
2890
- ,
2606
+ },
2891
2607
  {
2892
2608
  "pattern": "BDCbot",
2893
2609
  "addition_date": "2018/02/09",
@@ -2895,24 +2611,21 @@
2895
2611
  "Mozilla/5.0 (Windows NT 6.1; compatible; BDCbot/1.0; +http://bigweb.bigdatacorp.com.br/faq.aspx) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/41.0.2272.118 Safari/537.36",
2896
2612
  "Mozilla/5.0 (Windows NT 10.0; Win64; x64; BDCbot/1.0; +http://bigweb.bigdatacorp.com.br/faq.aspx) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/69.0.3497.100 Safari/537.36"
2897
2613
  ]
2898
- }
2899
- ,
2614
+ },
2900
2615
  {
2901
2616
  "pattern": "ZumBot",
2902
2617
  "addition_date": "2018/02/09",
2903
2618
  "instances": [
2904
2619
  "Mozilla/5.0 (compatible; ZumBot/1.0; http://help.zum.com/inquiry)"
2905
2620
  ]
2906
- }
2907
- ,
2621
+ },
2908
2622
  {
2909
2623
  "pattern": "EZID",
2910
2624
  "addition_date": "2018/02/09",
2911
2625
  "instances": [
2912
2626
  "EZID (EZID link checker; https://ezid.cdlib.org/)"
2913
2627
  ]
2914
- }
2915
- ,
2628
+ },
2916
2629
  {
2917
2630
  "pattern": "ICC-Crawler",
2918
2631
  "addition_date": "2018/02/28",
@@ -2920,8 +2633,7 @@
2920
2633
  "ICC-Crawler/2.0 (Mozilla-compatible; ; http://ucri.nict.go.jp/en/icccrawler.html)"
2921
2634
  ],
2922
2635
  "url": "http://ucri.nict.go.jp/en/icccrawler.html"
2923
- }
2924
- ,
2636
+ },
2925
2637
  {
2926
2638
  "pattern": "ArchiveBot",
2927
2639
  "addition_date": "2018/02/28",
@@ -2929,8 +2641,7 @@
2929
2641
  "ArchiveTeam ArchiveBot/20170106.02 (wpull 2.0.2)"
2930
2642
  ],
2931
2643
  "url": "https://github.com/ArchiveTeam/ArchiveBot"
2932
- }
2933
- ,
2644
+ },
2934
2645
  {
2935
2646
  "pattern": "^LCC ",
2936
2647
  "addition_date": "2018/02/28",
@@ -2938,8 +2649,7 @@
2938
2649
  "LCC (+http://corpora.informatik.uni-leipzig.de/crawler_faq.html)"
2939
2650
  ],
2940
2651
  "url": "http://corpora.informatik.uni-leipzig.de/crawler_faq.html"
2941
- }
2942
- ,
2652
+ },
2943
2653
  {
2944
2654
  "pattern": "filterdb\\.iss\\.net\\/crawler",
2945
2655
  "addition_date": "2018/03/16",
@@ -2947,16 +2657,14 @@
2947
2657
  "Mozilla/5.0 (compatible; oBot/2.3.1; +http://filterdb.iss.net/crawler/)"
2948
2658
  ],
2949
2659
  "url": "http://filterdb.iss.net/crawler/"
2950
- }
2951
- ,
2660
+ },
2952
2661
  {
2953
2662
  "pattern": "BLP_bbot",
2954
2663
  "addition_date": "2018/03/27",
2955
2664
  "instances": [
2956
2665
  "BLP_bbot/0.1"
2957
2666
  ]
2958
- }
2959
- ,
2667
+ },
2960
2668
  {
2961
2669
  "pattern": "BomboraBot",
2962
2670
  "addition_date": "2018/03/27",
@@ -2964,8 +2672,7 @@
2964
2672
  "Mozilla/5.0 (compatible; BomboraBot/1.0; +http://www.bombora.com/bot)"
2965
2673
  ],
2966
2674
  "url": "http://www.bombora.com/bot"
2967
- }
2968
- ,
2675
+ },
2969
2676
  {
2970
2677
  "pattern": "Buck\\/",
2971
2678
  "addition_date": "2018/03/27",
@@ -2973,8 +2680,7 @@
2973
2680
  "Buck/2.2; (+https://app.hypefactors.com/media-monitoring/about.html)"
2974
2681
  ],
2975
2682
  "url": "https://app.hypefactors.com/media-monitoring/about.html"
2976
- }
2977
- ,
2683
+ },
2978
2684
  {
2979
2685
  "pattern": "Companybook-Crawler",
2980
2686
  "addition_date": "2018/03/27",
@@ -2982,8 +2688,7 @@
2982
2688
  "Companybook-Crawler (+https://www.companybooknetworking.com/)"
2983
2689
  ],
2984
2690
  "url": "https://www.companybooknetworking.com/"
2985
- }
2986
- ,
2691
+ },
2987
2692
  {
2988
2693
  "pattern": "Genieo",
2989
2694
  "addition_date": "2018/03/27",
@@ -2991,8 +2696,7 @@
2991
2696
  "Mozilla/5.0 (compatible; Genieo/1.0 http://www.genieo.com/webfilter.html)"
2992
2697
  ],
2993
2698
  "url": "http://www.genieo.com/webfilter.html"
2994
- }
2995
- ,
2699
+ },
2996
2700
  {
2997
2701
  "pattern": "magpie-crawler",
2998
2702
  "addition_date": "2018/03/27",
@@ -3000,8 +2704,7 @@
3000
2704
  "magpie-crawler/1.1 (U; Linux amd64; en-GB; +http://www.brandwatch.net)"
3001
2705
  ],
3002
2706
  "url": "http://www.brandwatch.net"
3003
- }
3004
- ,
2707
+ },
3005
2708
  {
3006
2709
  "pattern": "MeltwaterNews",
3007
2710
  "addition_date": "2018/03/27",
@@ -3009,8 +2712,7 @@
3009
2712
  "MeltwaterNews www.meltwater.com"
3010
2713
  ],
3011
2714
  "url": "http://www.meltwater.com"
3012
- }
3013
- ,
2715
+ },
3014
2716
  {
3015
2717
  "pattern": "Moreover",
3016
2718
  "addition_date": "2018/03/27",
@@ -3018,8 +2720,7 @@
3018
2720
  "Mozilla/5.0 Moreover/5.1 (+http://www.moreover.com)"
3019
2721
  ],
3020
2722
  "url": "http://www.moreover.com"
3021
- }
3022
- ,
2723
+ },
3023
2724
  {
3024
2725
  "pattern": "newspaper\\/",
3025
2726
  "addition_date": "2018/03/27",
@@ -3029,8 +2730,7 @@
3029
2730
  "newspaper/0.2.6",
3030
2731
  "newspaper/0.2.8"
3031
2732
  ]
3032
- }
3033
- ,
2733
+ },
3034
2734
  {
3035
2735
  "pattern": "ScoutJet",
3036
2736
  "addition_date": "2018/03/27",
@@ -3038,8 +2738,7 @@
3038
2738
  "Mozilla/5.0 (compatible; ScoutJet; +http://www.scoutjet.com/)"
3039
2739
  ],
3040
2740
  "url": "http://www.scoutjet.com/"
3041
- }
3042
- ,
2741
+ },
3043
2742
  {
3044
2743
  "pattern": "(^| )sentry\\/",
3045
2744
  "addition_date": "2018/03/27",
@@ -3047,8 +2746,7 @@
3047
2746
  "sentry/8.22.0 (https://sentry.io)"
3048
2747
  ],
3049
2748
  "url": "https://sentry.io"
3050
- }
3051
- ,
2749
+ },
3052
2750
  {
3053
2751
  "pattern": "StorygizeBot",
3054
2752
  "addition_date": "2018/03/27",
@@ -3056,8 +2754,7 @@
3056
2754
  "Mozilla/5.0 (compatible; StorygizeBot; http://www.storygize.com)"
3057
2755
  ],
3058
2756
  "url": "http://www.storygize.com"
3059
- }
3060
- ,
2757
+ },
3061
2758
  {
3062
2759
  "pattern": "UptimeRobot",
3063
2760
  "addition_date": "2018/03/27",
@@ -3065,8 +2762,7 @@
3065
2762
  "Mozilla/5.0+(compatible; UptimeRobot/2.0; http://www.uptimerobot.com/)"
3066
2763
  ],
3067
2764
  "url": "http://www.uptimerobot.com/"
3068
- }
3069
- ,
2765
+ },
3070
2766
  {
3071
2767
  "pattern": "OutclicksBot",
3072
2768
  "addition_date": "2018/04/21",
@@ -3077,8 +2773,7 @@
3077
2773
  "OutclicksBot/2 +https://www.outclicks.net/agent/p2i4sNUh7eylJF1S6SGgRs5mP40ExlYvsr9GBxVQG6h"
3078
2774
  ],
3079
2775
  "url": "https://www.outclicks.net"
3080
- }
3081
- ,
2776
+ },
3082
2777
  {
3083
2778
  "pattern": "seoscanners",
3084
2779
  "addition_date": "2018/05/27",
@@ -3086,8 +2781,7 @@
3086
2781
  "Mozilla/5.0 (compatible; seoscanners.net/1; +spider@seoscanners.net)"
3087
2782
  ],
3088
2783
  "url": "http://www.seoscanners.net/"
3089
- }
3090
- ,
2784
+ },
3091
2785
  {
3092
2786
  "pattern": "Hatena",
3093
2787
  "addition_date": "2018/05/29",
@@ -3099,8 +2793,7 @@
3099
2793
  "HatenaBookmark/4.0 (Hatena::Bookmark; Analyzer)",
3100
2794
  "Hatena::Fetcher/0.01 (master) Furl/3.13"
3101
2795
  ]
3102
- }
3103
- ,
2796
+ },
3104
2797
  {
3105
2798
  "pattern": "Google Web Preview",
3106
2799
  "addition_date": "2018/05/31",
@@ -3108,16 +2801,14 @@
3108
2801
  "Mozilla/5.0 (Linux; U; Android 2.3.4; generic) AppleWebKit/537.36 (KHTML, like Gecko; Google Web Preview) Version/4.0 Mobile Safari/537.36",
3109
2802
  "Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko; Google Web Preview) Chrome/27.0.1453 Safari/537.36"
3110
2803
  ]
3111
- }
3112
- ,
2804
+ },
3113
2805
  {
3114
2806
  "pattern": "MauiBot",
3115
2807
  "addition_date": "2018/06/06",
3116
2808
  "instances": [
3117
2809
  "MauiBot (crawler.feedback+wc@gmail.com)"
3118
2810
  ]
3119
- }
3120
- ,
2811
+ },
3121
2812
  {
3122
2813
  "pattern": "AlphaBot",
3123
2814
  "addition_date": "2018/05/27",
@@ -3125,8 +2816,7 @@
3125
2816
  "Mozilla/5.0 (compatible; AlphaBot/3.2; +http://alphaseobot.com/bot.html)"
3126
2817
  ],
3127
2818
  "url": "http://alphaseobot.com/bot.html"
3128
- }
3129
- ,
2819
+ },
3130
2820
  {
3131
2821
  "pattern": "SBL-BOT",
3132
2822
  "addition_date": "2018/06/06",
@@ -3134,9 +2824,8 @@
3134
2824
  "SBL-BOT (http://sbl.net)"
3135
2825
  ],
3136
2826
  "url": "http://sbl.net",
3137
- "description" : "Bot of SoftByte BlackWidow"
3138
- }
3139
- ,
2827
+ "description": "Bot of SoftByte BlackWidow"
2828
+ },
3140
2829
  {
3141
2830
  "pattern": "IAS crawler",
3142
2831
  "addition_date": "2018/06/06",
@@ -3144,17 +2833,15 @@
3144
2833
  "IAS crawler (ias_crawler; http://integralads.com/site-indexing-policy/)"
3145
2834
  ],
3146
2835
  "url": "http://integralads.com/site-indexing-policy/",
3147
- "description" : "Bot of Integral Ad Science, Inc."
3148
- }
3149
- ,
2836
+ "description": "Bot of Integral Ad Science, Inc."
2837
+ },
3150
2838
  {
3151
2839
  "pattern": "adscanner",
3152
2840
  "addition_date": "2018/06/24",
3153
2841
  "instances": [
3154
2842
  "Mozilla/5.0 (compatible; adscanner/)"
3155
2843
  ]
3156
- }
3157
- ,
2844
+ },
3158
2845
  {
3159
2846
  "pattern": "Netvibes",
3160
2847
  "addition_date": "2018/06/24",
@@ -3163,8 +2850,7 @@
3163
2850
  "Netvibes (crawler; http://www.netvibes.com)"
3164
2851
  ],
3165
2852
  "url": "http://www.netvibes.com"
3166
- }
3167
- ,
2853
+ },
3168
2854
  {
3169
2855
  "pattern": "acapbot",
3170
2856
  "addition_date": "2018/06/27",
@@ -3172,8 +2858,7 @@
3172
2858
  "Mozilla/5.0 (compatible;acapbot/0.1;treat like Googlebot)",
3173
2859
  "Mozilla/5.0 (compatible;acapbot/0.1.;treat like Googlebot)"
3174
2860
  ]
3175
- }
3176
- ,
2861
+ },
3177
2862
  {
3178
2863
  "pattern": "Baidu-YunGuanCe",
3179
2864
  "addition_date": "2018/06/27",
@@ -3186,8 +2871,7 @@
3186
2871
  ],
3187
2872
  "url": "https://ce.baidu.com/topic/topic20150908",
3188
2873
  "description": "Baidu Cloud Watch"
3189
- }
3190
- ,
2874
+ },
3191
2875
  {
3192
2876
  "pattern": "bitlybot",
3193
2877
  "addition_date": "2018/06/27",
@@ -3197,8 +2881,7 @@
3197
2881
  "bitlybot"
3198
2882
  ],
3199
2883
  "url": "http://bit.ly/"
3200
- }
3201
- ,
2884
+ },
3202
2885
  {
3203
2886
  "pattern": "blogmuraBot",
3204
2887
  "addition_date": "2018/06/27",
@@ -3207,8 +2890,7 @@
3207
2890
  ],
3208
2891
  "url": "http://www.blogmura.com",
3209
2892
  "description": "A blog ranking site which links to blogs on just about every theme possible."
3210
- }
3211
- ,
2893
+ },
3212
2894
  {
3213
2895
  "pattern": "Bot\\.AraTurka\\.com",
3214
2896
  "addition_date": "2018/06/27",
@@ -3216,16 +2898,14 @@
3216
2898
  "Bot.AraTurka.com/0.0.1"
3217
2899
  ],
3218
2900
  "url": "http://www.araturka.com"
3219
- }
3220
- ,
2901
+ },
3221
2902
  {
3222
2903
  "pattern": "bot-pge\\.chlooe\\.com",
3223
2904
  "addition_date": "2018/06/27",
3224
2905
  "instances": [
3225
2906
  "bot-pge.chlooe.com/1.0.0 (+http://www.chlooe.com/)"
3226
2907
  ]
3227
- }
3228
- ,
2908
+ },
3229
2909
  {
3230
2910
  "pattern": "BoxcarBot",
3231
2911
  "addition_date": "2018/06/27",
@@ -3233,8 +2913,7 @@
3233
2913
  "Mozilla/5.0 (compatible; BoxcarBot/1.1; +awesome@boxcar.io)"
3234
2914
  ],
3235
2915
  "url": "https://boxcar.io/"
3236
- }
3237
- ,
2916
+ },
3238
2917
  {
3239
2918
  "pattern": "BTWebClient",
3240
2919
  "addition_date": "2018/06/27",
@@ -3243,8 +2922,7 @@
3243
2922
  ],
3244
2923
  "url": "http://www.utorrent.com/",
3245
2924
  "description": "µTorrent BitTorrent Client"
3246
- }
3247
- ,
2925
+ },
3248
2926
  {
3249
2927
  "pattern": "ContextAd Bot",
3250
2928
  "addition_date": "2018/06/27",
@@ -3252,8 +2930,7 @@
3252
2930
  "Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.0;.NET CLR 1.0.3705; ContextAd Bot 1.0)",
3253
2931
  "ContextAd Bot 1.0"
3254
2932
  ]
3255
- }
3256
- ,
2933
+ },
3257
2934
  {
3258
2935
  "pattern": "Digincore bot",
3259
2936
  "addition_date": "2018/06/27",
@@ -3261,8 +2938,7 @@
3261
2938
  "Mozilla/5.0 (compatible; Digincore bot; https://www.digincore.com/crawler.html for rules and instructions.)"
3262
2939
  ],
3263
2940
  "url": "http://www.digincore.com/crawler.html"
3264
- }
3265
- ,
2941
+ },
3266
2942
  {
3267
2943
  "pattern": "Disqus",
3268
2944
  "addition_date": "2018/06/27",
@@ -3271,8 +2947,7 @@
3271
2947
  ],
3272
2948
  "url": "https://disqus.com/",
3273
2949
  "description": "validate and quality check pages."
3274
- }
3275
- ,
2950
+ },
3276
2951
  {
3277
2952
  "pattern": "Feedly",
3278
2953
  "addition_date": "2018/06/27",
@@ -3282,16 +2957,14 @@
3282
2957
  ],
3283
2958
  "url": "https://www.feedly.com/fetcher.html",
3284
2959
  "description": "Feedly Fetcher is how Feedly grabs RSS or Atom feeds when users choose to add them to their Feedly or any of the other applications built on top of the feedly cloud."
3285
- }
3286
- ,
2960
+ },
3287
2961
  {
3288
2962
  "pattern": "Fetch\\/",
3289
2963
  "addition_date": "2018/06/27",
3290
2964
  "instances": [
3291
2965
  "Fetch/2.0a (CMS Detection/Web/SEO analysis tool, see http://guess.scritch.org)"
3292
2966
  ]
3293
- }
3294
- ,
2967
+ },
3295
2968
  {
3296
2969
  "pattern": "Fever",
3297
2970
  "addition_date": "2018/06/27",
@@ -3299,16 +2972,14 @@
3299
2972
  "Fever/1.38 (Feed Parser; http://feedafever.com; Allow like Gecko)"
3300
2973
  ],
3301
2974
  "url": "http://feedafever.com"
3302
- }
3303
- ,
2975
+ },
3304
2976
  {
3305
2977
  "pattern": "Flamingo_SearchEngine",
3306
2978
  "addition_date": "2018/06/27",
3307
2979
  "instances": [
3308
2980
  "Flamingo_SearchEngine (+http://www.flamingosearch.com/bot)"
3309
2981
  ]
3310
- }
3311
- ,
2982
+ },
3312
2983
  {
3313
2984
  "pattern": "FlipboardProxy",
3314
2985
  "addition_date": "2018/06/27",
@@ -3321,8 +2992,7 @@
3321
2992
  ],
3322
2993
  "url": "https://about.flipboard.com/browserproxy/",
3323
2994
  "description": "a proxy service to fetch, validate, and prepare certain elements of websites for presentation through the Flipboard Application"
3324
- }
3325
- ,
2995
+ },
3326
2996
  {
3327
2997
  "pattern": "g2reader-bot",
3328
2998
  "addition_date": "2018/06/27",
@@ -3330,8 +3000,7 @@
3330
3000
  "g2reader-bot/1.0 (+http://www.g2reader.com/)"
3331
3001
  ],
3332
3002
  "url": "http://www.g2reader.com/"
3333
- }
3334
- ,
3003
+ },
3335
3004
  {
3336
3005
  "pattern": "G2 Web Services",
3337
3006
  "addition_date": "2019/03/01",
@@ -3339,8 +3008,7 @@
3339
3008
  "G2 Web Services/1.0 (built with StormCrawler Archetype 1.8; https://www.g2webservices.com/; developers@g2llc.com)"
3340
3009
  ],
3341
3010
  "url": "https://www.g2webservices.com/"
3342
- }
3343
- ,
3011
+ },
3344
3012
  {
3345
3013
  "pattern": "imrbot",
3346
3014
  "addition_date": "2018/06/27",
@@ -3348,8 +3016,7 @@
3348
3016
  "Mozilla/5.0 (compatible; imrbot/1.10.8 +http://www.mignify.com)"
3349
3017
  ],
3350
3018
  "url": "http://www.mignify.com"
3351
- }
3352
- ,
3019
+ },
3353
3020
  {
3354
3021
  "pattern": "K7MLWCBot",
3355
3022
  "addition_date": "2018/06/27",
@@ -3358,8 +3025,7 @@
3358
3025
  ],
3359
3026
  "url": "http://www.k7computing.com",
3360
3027
  "description": "Virus scanner"
3361
- }
3362
- ,
3028
+ },
3363
3029
  {
3364
3030
  "pattern": "Kemvibot",
3365
3031
  "addition_date": "2018/06/27",
@@ -3367,8 +3033,7 @@
3367
3033
  "Kemvibot/1.0 (http://kemvi.com, marco@kemvi.com)"
3368
3034
  ],
3369
3035
  "url": "http://kemvi.com"
3370
- }
3371
- ,
3036
+ },
3372
3037
  {
3373
3038
  "pattern": "Landau-Media-Spider",
3374
3039
  "addition_date": "2018/06/27",
@@ -3376,8 +3041,7 @@
3376
3041
  "Landau-Media-Spider/1.0(http://bots.landaumedia.de/bot.html)"
3377
3042
  ],
3378
3043
  "url": "http://bots.landaumedia.de/bot.html"
3379
- }
3380
- ,
3044
+ },
3381
3045
  {
3382
3046
  "pattern": "linkapediabot",
3383
3047
  "addition_date": "2018/06/27",
@@ -3385,8 +3049,7 @@
3385
3049
  "linkapediabot (+http://www.linkapedia.com)"
3386
3050
  ],
3387
3051
  "url": "http://www.linkapedia.com"
3388
- }
3389
- ,
3052
+ },
3390
3053
  {
3391
3054
  "pattern": "vkShare",
3392
3055
  "addition_date": "2018/07/02",
@@ -3394,8 +3057,7 @@
3394
3057
  "Mozilla/5.0 (compatible; vkShare; +http://vk.com/dev/Share)"
3395
3058
  ],
3396
3059
  "url": "http://vk.com/dev/Share"
3397
- }
3398
- ,
3060
+ },
3399
3061
  {
3400
3062
  "pattern": "Siteimprove\\.com",
3401
3063
  "addition_date": "2018/06/22",
@@ -3405,121 +3067,109 @@
3405
3067
  "Mozilla/5.0 (compatible; MSIE 10.0; Windows NT 6.1; Trident/6.0) SiteCheck-sitecrawl by Siteimprove.com",
3406
3068
  "Mozilla/4.0 (compatible; MSIE 7.0; Windows NT 5.0) LinkCheck by Siteimprove.com"
3407
3069
  ]
3408
- }
3409
- ,
3410
- {
3411
- "pattern": "BLEXBot\\/",
3412
- "addition_date": "2018/07/07",
3413
- "instances": [
3414
- "Mozilla/5.0 (compatible; BLEXBot/1.0; +http://webmeup-crawler.com/)"
3415
- ],
3416
- "url": "http://webmeup-crawler.com"
3417
- }
3418
- ,
3419
- {
3420
- "pattern": "DareBoost",
3421
- "addition_date": "2018/07/07",
3422
- "instances": [
3423
- "Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/62.0.3202.75 Safari/537.36 DareBoost"
3424
- ],
3425
- "url": "https://www.dareboost.com/",
3426
- "description": "Bot to test, Analyze and Optimize website"
3427
- }
3428
- ,
3070
+ },
3429
3071
  {
3430
- "pattern": "ZuperlistBot\\/",
3431
- "addition_date": "2018/07/07",
3432
- "instances": [
3433
- "Mozilla/5.0 (compatible; ZuperlistBot/1.0)"
3434
- ]
3435
- }
3436
- ,
3437
- {
3438
- "pattern": "Miniflux\\/",
3439
- "addition_date": "2018/07/07",
3440
- "instances": [
3441
- "Mozilla/5.0 (compatible; Miniflux/2.0.x-dev; +https://miniflux.net)",
3442
- "Mozilla/5.0 (compatible; Miniflux/2.0.3; +https://miniflux.net)",
3443
- "Mozilla/5.0 (compatible; Miniflux/2.0.7; +https://miniflux.net)",
3444
- "Mozilla/5.0 (compatible; Miniflux/2.0.10; +https://miniflux.net)",
3445
- "Mozilla/5.0 (compatibl$; Miniflux/2.0.x-dev; +https://miniflux.app)",
3446
- "Mozilla/5.0 (compatible; Miniflux/2.0.11; +https://miniflux.app)",
3447
- "Mozilla/5.0 (compatible; Miniflux/2.0.12; +https://miniflux.app)",
3448
- "Mozilla/5.0 (compatible; Miniflux/ae1dc1a; +https://miniflux.app)",
3449
- "Mozilla/5.0 (compatible; Miniflux/3b6e44c; +https://miniflux.app)"
3450
- ],
3451
- "url": "https://miniflux.net",
3452
- "description": "Miniflux is a minimalist and opinionated feed reader."
3453
- }
3454
- ,
3455
- {
3456
- "pattern": "Feedspot",
3457
- "addition_date": "2018/07/07",
3458
- "instances": [
3459
- "Mozilla/5.0 (compatible; Feedspotbot/1.0; +http://www.feedspot.com/fs/bot)",
3460
- "Mozilla/5.0 (compatible; Feedspot/1.0 (+https://www.feedspot.com/fs/fetcher; like FeedFetcher-Google)"
3461
- ],
3462
- "url": "http://www.feedspot.com/fs/bot"
3463
- }
3464
- ,
3465
- {
3466
- "pattern": "Diffbot\\/",
3467
- "addition_date": "2018/07/07",
3468
- "instances": [
3469
- "Mozilla/5.0 (Windows; U; Windows NT 5.1; en-US; rv:1.9.1.2) Gecko/20090729 Firefox/3.5.2 (.NET CLR 3.5.30729; Diffbot/0.1; +http://www.diffbot.com)"
3470
- ],
3471
- "url": "http://www.diffbot.com"
3472
- }
3473
- ,
3474
- {
3475
- "pattern": "SEOkicks",
3476
- "addition_date": "2018/08/22",
3477
- "instances": [
3478
- "Mozilla/5.0 (compatible; SEOkicks; +https://www.seokicks.de/robot.html)"
3479
- ],
3480
- "url": "https://www.seokicks.de/robot.html"
3481
- }
3482
- ,
3072
+ "pattern": "BLEXBot\\/",
3073
+ "addition_date": "2018/07/07",
3074
+ "instances": [
3075
+ "Mozilla/5.0 (compatible; BLEXBot/1.0; +http://webmeup-crawler.com/)"
3076
+ ],
3077
+ "url": "http://webmeup-crawler.com"
3078
+ },
3483
3079
  {
3484
- "pattern": "tracemyfile",
3485
- "addition_date": "2018/08/23",
3486
- "instances": [
3487
- "Mozilla/5.0 (compatible; tracemyfile/1.0; +bot@tracemyfile.com)"
3488
- ]
3489
- }
3490
- ,
3080
+ "pattern": "DareBoost",
3081
+ "addition_date": "2018/07/07",
3082
+ "instances": [
3083
+ "Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/62.0.3202.75 Safari/537.36 DareBoost"
3084
+ ],
3085
+ "url": "https://www.dareboost.com/",
3086
+ "description": "Bot to test, Analyze and Optimize website"
3087
+ },
3491
3088
  {
3492
- "pattern": "Nimbostratus-Bot",
3493
- "addition_date": "2018/08/29",
3494
- "instances": [
3495
- "Mozilla/5.0 (compatible; Nimbostratus-Bot/v1.3.2; http://cloudsystemnetworks.com)"
3496
- ]
3497
- }
3498
- ,
3499
- {
3500
- "pattern": "zgrab",
3501
- "addition_date": "2018/08/30",
3502
- "instances": [
3503
- "Mozilla/5.0 zgrab/0.x"
3504
- ],
3505
- "url": "https://zmap.io/"
3506
- }
3507
- ,
3089
+ "pattern": "ZuperlistBot\\/",
3090
+ "addition_date": "2018/07/07",
3091
+ "instances": [
3092
+ "Mozilla/5.0 (compatible; ZuperlistBot/1.0)"
3093
+ ]
3094
+ },
3095
+ {
3096
+ "pattern": "Miniflux\\/",
3097
+ "addition_date": "2018/07/07",
3098
+ "instances": [
3099
+ "Mozilla/5.0 (compatible; Miniflux/2.0.x-dev; +https://miniflux.net)",
3100
+ "Mozilla/5.0 (compatible; Miniflux/2.0.3; +https://miniflux.net)",
3101
+ "Mozilla/5.0 (compatible; Miniflux/2.0.7; +https://miniflux.net)",
3102
+ "Mozilla/5.0 (compatible; Miniflux/2.0.10; +https://miniflux.net)",
3103
+ "Mozilla/5.0 (compatibl$; Miniflux/2.0.x-dev; +https://miniflux.app)",
3104
+ "Mozilla/5.0 (compatible; Miniflux/2.0.11; +https://miniflux.app)",
3105
+ "Mozilla/5.0 (compatible; Miniflux/2.0.12; +https://miniflux.app)",
3106
+ "Mozilla/5.0 (compatible; Miniflux/ae1dc1a; +https://miniflux.app)",
3107
+ "Mozilla/5.0 (compatible; Miniflux/3b6e44c; +https://miniflux.app)"
3108
+ ],
3109
+ "url": "https://miniflux.net",
3110
+ "description": "Miniflux is a minimalist and opinionated feed reader."
3111
+ },
3112
+ {
3113
+ "pattern": "Feedspot",
3114
+ "addition_date": "2018/07/07",
3115
+ "instances": [
3116
+ "Mozilla/5.0 (compatible; Feedspotbot/1.0; +http://www.feedspot.com/fs/bot)",
3117
+ "Mozilla/5.0 (compatible; Feedspot/1.0 (+https://www.feedspot.com/fs/fetcher; like FeedFetcher-Google)"
3118
+ ],
3119
+ "url": "http://www.feedspot.com/fs/bot"
3120
+ },
3121
+ {
3122
+ "pattern": "Diffbot\\/",
3123
+ "addition_date": "2018/07/07",
3124
+ "instances": [
3125
+ "Mozilla/5.0 (Windows; U; Windows NT 5.1; en-US; rv:1.9.1.2) Gecko/20090729 Firefox/3.5.2 (.NET CLR 3.5.30729; Diffbot/0.1; +http://www.diffbot.com)"
3126
+ ],
3127
+ "url": "http://www.diffbot.com"
3128
+ },
3129
+ {
3130
+ "pattern": "SEOkicks",
3131
+ "addition_date": "2018/08/22",
3132
+ "instances": [
3133
+ "Mozilla/5.0 (compatible; SEOkicks; +https://www.seokicks.de/robot.html)"
3134
+ ],
3135
+ "url": "https://www.seokicks.de/robot.html"
3136
+ },
3508
3137
  {
3509
- "pattern": "PR-CY\\.RU",
3510
- "addition_date": "2018/08/30",
3511
- "instances": [
3512
- "Mozilla/5.0 (compatible; PR-CY.RU; + https://a.pr-cy.ru)"
3513
- ],
3138
+ "pattern": "tracemyfile",
3139
+ "addition_date": "2018/08/23",
3140
+ "instances": [
3141
+ "Mozilla/5.0 (compatible; tracemyfile/1.0; +bot@tracemyfile.com)"
3142
+ ]
3143
+ },
3144
+ {
3145
+ "pattern": "Nimbostratus-Bot",
3146
+ "addition_date": "2018/08/29",
3147
+ "instances": [
3148
+ "Mozilla/5.0 (compatible; Nimbostratus-Bot/v1.3.2; http://cloudsystemnetworks.com)"
3149
+ ]
3150
+ },
3151
+ {
3152
+ "pattern": "zgrab",
3153
+ "addition_date": "2018/08/30",
3154
+ "instances": [
3155
+ "Mozilla/5.0 zgrab/0.x"
3156
+ ],
3157
+ "url": "https://github.com/zmap/zgrab2"
3158
+ },
3159
+ {
3160
+ "pattern": "PR-CY\\.RU",
3161
+ "addition_date": "2018/08/30",
3162
+ "instances": [
3163
+ "Mozilla/5.0 (compatible; PR-CY.RU; + https://a.pr-cy.ru)"
3164
+ ],
3514
3165
  "url": "https://a.pr-cy.ru/"
3515
- }
3516
- ,
3166
+ },
3517
3167
  {
3518
- "pattern": "AdsTxtCrawler",
3519
- "addition_date": "2018/08/30",
3520
- "instances": [
3521
- "AdsTxtCrawler/1.0"
3522
- ]
3168
+ "pattern": "AdsTxtCrawler",
3169
+ "addition_date": "2018/08/30",
3170
+ "instances": [
3171
+ "AdsTxtCrawler/1.0"
3172
+ ]
3523
3173
  },
3524
3174
  {
3525
3175
  "pattern": "Datafeedwatch",
@@ -3528,8 +3178,7 @@
3528
3178
  "Datafeedwatch/2.1.x"
3529
3179
  ],
3530
3180
  "url": "https://www.datafeedwatch.com/"
3531
- }
3532
- ,
3181
+ },
3533
3182
  {
3534
3183
  "pattern": "Zabbix",
3535
3184
  "addition_date": "2018/09/05",
@@ -3537,8 +3186,7 @@
3537
3186
  "Zabbix"
3538
3187
  ],
3539
3188
  "url": "https://www.zabbix.com/documentation/3.4/manual/web_monitoring"
3540
- }
3541
- ,
3189
+ },
3542
3190
  {
3543
3191
  "pattern": "TangibleeBot",
3544
3192
  "addition_date": "2018/09/05",
@@ -3546,8 +3194,7 @@
3546
3194
  "TangibleeBot/1.0.0.0 (http://tangiblee.com/bot)"
3547
3195
  ],
3548
3196
  "url": "http://tangiblee.com/bot"
3549
- }
3550
- ,
3197
+ },
3551
3198
  {
3552
3199
  "pattern": "google-xrawler",
3553
3200
  "addition_date": "2018/09/05",
@@ -3555,8 +3202,7 @@
3555
3202
  "google-xrawler"
3556
3203
  ],
3557
3204
  "url": "https://webmasters.stackexchange.com/questions/105560/what-is-the-google-xrawler-user-agent-used-for"
3558
- }
3559
- ,
3205
+ },
3560
3206
  {
3561
3207
  "pattern": "axios",
3562
3208
  "addition_date": "2018/09/06",
@@ -3565,8 +3211,7 @@
3565
3211
  "axios/0.19.0"
3566
3212
  ],
3567
3213
  "url": "https://github.com/axios/axios"
3568
- }
3569
- ,
3214
+ },
3570
3215
  {
3571
3216
  "pattern": "Amazon CloudFront",
3572
3217
  "addition_date": "2018/09/07",
@@ -3574,16 +3219,14 @@
3574
3219
  "Amazon CloudFront"
3575
3220
  ],
3576
3221
  "url": "https://aws.amazon.com/cloudfront/"
3577
- }
3578
- ,
3222
+ },
3579
3223
  {
3580
3224
  "pattern": "Pulsepoint",
3581
3225
  "addition_date": "2018/09/24",
3582
3226
  "instances": [
3583
3227
  "Pulsepoint XT3 web scraper"
3584
3228
  ]
3585
- }
3586
- ,
3229
+ },
3587
3230
  {
3588
3231
  "pattern": "CloudFlare-AlwaysOnline",
3589
3232
  "addition_date": "2018/09/27",
@@ -3591,27 +3234,24 @@
3591
3234
  "Mozilla/5.0 (compatible; CloudFlare-AlwaysOnline/1.0; +http://www.cloudflare.com/always-online) AppleWebKit/534.34",
3592
3235
  "Mozilla/5.0 (compatible; CloudFlare-AlwaysOnline/1.0; +https://www.cloudflare.com/always-online) AppleWebKit/534.34"
3593
3236
  ],
3594
- "url" : "https://www.cloudflare.com/always-online/"
3595
- }
3596
- ,
3237
+ "url": "https://www.cloudflare.com/always-online/"
3238
+ },
3597
3239
  {
3598
- "pattern": "Google-Structured-Data-Testing-Tool",
3240
+ "pattern": "Google-Structured-Data-Testing-Tool",
3599
3241
  "addition_date": "2018/10/02",
3600
3242
  "instances": [
3601
3243
  "Mozilla/5.0 (compatible; Google-Structured-Data-Testing-Tool +https://search.google.com/structured-data/testing-tool)",
3602
3244
  "Mozilla/5.0 (compatible; Google-Structured-Data-Testing-Tool +http://developers.google.com/structured-data/testing-tool/)"
3603
3245
  ],
3604
3246
  "url": "https://search.google.com/structured-data/testing-tool"
3605
- }
3606
- ,
3247
+ },
3607
3248
  {
3608
- "pattern": "WordupInfoSearch",
3249
+ "pattern": "WordupInfoSearch",
3609
3250
  "addition_date": "2018/10/07",
3610
3251
  "instances": [
3611
3252
  "WordupInfoSearch/1.0"
3612
3253
  ]
3613
- }
3614
- ,
3254
+ },
3615
3255
  {
3616
3256
  "pattern": "WebDataStats",
3617
3257
  "addition_date": "2018/10/08",
@@ -3619,16 +3259,14 @@
3619
3259
  "Mozilla/5.0 (compatible; WebDataStats/1.0 ; +https://webdatastats.com/policy.html)"
3620
3260
  ],
3621
3261
  "url": "https://webdatastats.com/"
3622
- }
3623
- ,
3262
+ },
3624
3263
  {
3625
3264
  "pattern": "HttpUrlConnection",
3626
3265
  "addition_date": "2018/10/08",
3627
3266
  "instances": [
3628
3267
  "Jersey/2.25.1 (HttpUrlConnection 1.8.0_141)"
3629
3268
  ]
3630
- }
3631
- ,
3269
+ },
3632
3270
  {
3633
3271
  "pattern": "ZoomBot",
3634
3272
  "addition_date": "2018/10/10",
@@ -3636,24 +3274,22 @@
3636
3274
  "ZoomBot (Linkbot 1.0 http://suite.seozoom.it/bot.html)"
3637
3275
  ],
3638
3276
  "url": "http://suite.seozoom.it/bot.html"
3639
- }
3640
- ,
3277
+ },
3641
3278
  {
3642
3279
  "pattern": "VelenPublicWebCrawler",
3643
3280
  "addition_date": "2018/10/09",
3281
+ "url": "https://velen.io/",
3644
3282
  "instances": [
3645
3283
  "VelenPublicWebCrawler (velen.io)"
3646
3284
  ]
3647
- }
3648
- ,
3285
+ },
3649
3286
  {
3650
3287
  "pattern": "MoodleBot",
3651
3288
  "addition_date": "2018/10/10",
3652
3289
  "instances": [
3653
3290
  "MoodleBot/1.0"
3654
3291
  ]
3655
- }
3656
- ,
3292
+ },
3657
3293
  {
3658
3294
  "pattern": "jpg-newsbot",
3659
3295
  "addition_date": "2018/10/10",
@@ -3661,8 +3297,7 @@
3661
3297
  "jpg-newsbot/2.0; (+https://vipnytt.no/bots/)"
3662
3298
  ],
3663
3299
  "url": "https://vipnytt.no/bots/"
3664
- }
3665
- ,
3300
+ },
3666
3301
  {
3667
3302
  "pattern": "outbrain",
3668
3303
  "addition_date": "2018/10/14",
@@ -3670,8 +3305,7 @@
3670
3305
  "Mozilla/5.0 (Java) outbrain"
3671
3306
  ],
3672
3307
  "url": "https://www.outbrain.com/help/advertisers/invalid-url/"
3673
- }
3674
- ,
3308
+ },
3675
3309
  {
3676
3310
  "pattern": "W3C_Validator",
3677
3311
  "addition_date": "2018/10/14",
@@ -3679,8 +3313,7 @@
3679
3313
  "W3C_Validator/1.3"
3680
3314
  ],
3681
3315
  "url": "https://validator.w3.org/services"
3682
- }
3683
- ,
3316
+ },
3684
3317
  {
3685
3318
  "pattern": "Validator\\.nu",
3686
3319
  "addition_date": "2018/10/14",
@@ -3688,12 +3321,13 @@
3688
3321
  "Validator.nu/LV"
3689
3322
  ],
3690
3323
  "url": "https://validator.w3.org/services"
3691
- }
3692
- ,
3324
+ },
3693
3325
  {
3694
3326
  "pattern": "W3C-checklink",
3695
3327
  "addition_date": "2018/10/14",
3696
- "depends_on": ["libwww-perl"],
3328
+ "depends_on": [
3329
+ "libwww-perl"
3330
+ ],
3697
3331
  "instances": [
3698
3332
  "W3C-checklink/2.90 libwww-perl/5.64",
3699
3333
  "W3C-checklink/3.6.2.3 libwww-perl/5.64",
@@ -3706,8 +3340,7 @@
3706
3340
  "W3C-checklink/4.5 [4.160] libwww-perl/5.823"
3707
3341
  ],
3708
3342
  "url": "https://validator.w3.org/services"
3709
- }
3710
- ,
3343
+ },
3711
3344
  {
3712
3345
  "pattern": "W3C-mobileOK",
3713
3346
  "addition_date": "2018/10/14",
@@ -3715,8 +3348,7 @@
3715
3348
  "W3C-mobileOK/DDC-1.0"
3716
3349
  ],
3717
3350
  "url": "https://validator.w3.org/services"
3718
- }
3719
- ,
3351
+ },
3720
3352
  {
3721
3353
  "pattern": "W3C_I18n-Checker",
3722
3354
  "addition_date": "2018/10/14",
@@ -3724,8 +3356,7 @@
3724
3356
  "W3C_I18n-Checker/1.0"
3725
3357
  ],
3726
3358
  "url": "https://validator.w3.org/services"
3727
- }
3728
- ,
3359
+ },
3729
3360
  {
3730
3361
  "pattern": "FeedValidator",
3731
3362
  "addition_date": "2018/10/14",
@@ -3733,8 +3364,7 @@
3733
3364
  "FeedValidator/1.3"
3734
3365
  ],
3735
3366
  "url": "https://validator.w3.org/services"
3736
- }
3737
- ,
3367
+ },
3738
3368
  {
3739
3369
  "pattern": "W3C_CSS_Validator",
3740
3370
  "addition_date": "2018/10/14",
@@ -3742,8 +3372,7 @@
3742
3372
  "Jigsaw/2.3.0 W3C_CSS_Validator_JFouffa/2.0"
3743
3373
  ],
3744
3374
  "url": "https://validator.w3.org/services"
3745
- }
3746
- ,
3375
+ },
3747
3376
  {
3748
3377
  "pattern": "W3C_Unicorn",
3749
3378
  "addition_date": "2018/10/14",
@@ -3751,16 +3380,14 @@
3751
3380
  "W3C_Unicorn/1.0"
3752
3381
  ],
3753
3382
  "url": "https://validator.w3.org/services"
3754
- }
3755
- ,
3383
+ },
3756
3384
  {
3757
3385
  "pattern": "Google-PhysicalWeb",
3758
3386
  "addition_date": "2018/10/21",
3759
3387
  "instances": [
3760
3388
  "Mozilla/5.0 (Google-PhysicalWeb)"
3761
3389
  ]
3762
- }
3763
- ,
3390
+ },
3764
3391
  {
3765
3392
  "pattern": "Blackboard",
3766
3393
  "addition_date": "2018/10/28",
@@ -3840,8 +3467,7 @@
3840
3467
  "Mozilla/5.0 (compatible; theoldreader.com)"
3841
3468
  ],
3842
3469
  "url": "https://www.theoldreader.com/"
3843
- }
3844
- ,
3470
+ },
3845
3471
  {
3846
3472
  "pattern": "AnyEvent",
3847
3473
  "addition_date": "2018/12/07",
@@ -3849,8 +3475,7 @@
3849
3475
  "Mozilla/5.0 (compatible; U; AnyEvent-HTTP/2.24; +http://software.schmorp.de/pkg/AnyEvent)"
3850
3476
  ],
3851
3477
  "url": "http://software.schmorp.de/pkg/AnyEvent.html"
3852
- }
3853
- ,
3478
+ },
3854
3479
  {
3855
3480
  "pattern": "Uptimebot\\.org",
3856
3481
  "addition_date": "2019/01/17",
@@ -3858,8 +3483,7 @@
3858
3483
  "Uptimebot.org - Free website monitoring"
3859
3484
  ],
3860
3485
  "url": "http://uptimebot.org/"
3861
- }
3862
- ,
3486
+ },
3863
3487
  {
3864
3488
  "pattern": "Nmap Scripting Engine",
3865
3489
  "addition_date": "2019/02/04",
@@ -3867,8 +3491,7 @@
3867
3491
  "Mozilla/5.0 (compatible; Nmap Scripting Engine; https://nmap.org/book/nse.html)"
3868
3492
  ],
3869
3493
  "url": "https://nmap.org/book/nse.html"
3870
- }
3871
- ,
3494
+ },
3872
3495
  {
3873
3496
  "pattern": "2ip\\.ru",
3874
3497
  "addition_date": "2019/02/12",
@@ -3958,9 +3581,9 @@
3958
3581
  "url": "https://developers.google.com/web/updates/2017/04/headless-chrome",
3959
3582
  "addition_date": "2019/06/17",
3960
3583
  "instances": [
3961
- "Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) HeadlessChrome/74.0.3729.169 Safari/537.36",
3962
- "Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) HeadlessChrome/69.0.3494.0 Safari/537.36",
3963
- "Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) HeadlessChrome/76.0.3803.0 Safari/537.36"
3584
+ "Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) HeadlessChrome/74.0.3729.169 Safari/537.36",
3585
+ "Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) HeadlessChrome/69.0.3494.0 Safari/537.36",
3586
+ "Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) HeadlessChrome/76.0.3803.0 Safari/537.36"
3964
3587
  ]
3965
3588
  },
3966
3589
  {
@@ -3978,8 +3601,7 @@
3978
3601
  "Mozilla/5.0 (compatible; Uptimebot/1.0; +http://www.uptime.com/uptimebot)"
3979
3602
  ],
3980
3603
  "url": "http://www.uptime.com/uptimebot"
3981
- }
3982
- ,
3604
+ },
3983
3605
  {
3984
3606
  "pattern": "Streamline3Bot\\/",
3985
3607
  "addition_date": "2019/07/21",
@@ -3988,8 +3610,7 @@
3988
3610
  "Mozilla/5.0 (Windows NT 6.1; Win64; x64; +https://www.ubtsupport.com/legal/Streamline3Bot.php) Streamline3Bot/1.0"
3989
3611
  ],
3990
3612
  "url": "https://www.ubtsupport.com/legal/Streamline3Bot.php"
3991
- }
3992
- ,
3613
+ },
3993
3614
  {
3994
3615
  "pattern": "serpstatbot\\/",
3995
3616
  "addition_date": "2019/07/25",
@@ -3998,8 +3619,7 @@
3998
3619
  "serpstatbot/1.0 (advanced backlink tracking bot; curl/7.58.0; http://serpstatbot.com/; abuse@serpstatbot.com)"
3999
3620
  ],
4000
3621
  "url": "http://serpstatbot.com"
4001
- }
4002
- ,
3622
+ },
4003
3623
  {
4004
3624
  "pattern": "MixnodeCache\\/",
4005
3625
  "addition_date": "2019/08/04",
@@ -4007,8 +3627,7 @@
4007
3627
  "MixnodeCache/1.8(+https://cache.mixnode.com/)"
4008
3628
  ],
4009
3629
  "url": "https://cache.mixnode.com/"
4010
- }
4011
- ,
3630
+ },
4012
3631
  {
4013
3632
  "pattern": "^curl",
4014
3633
  "addition_date": "2019/08/15",
@@ -4023,8 +3642,7 @@
4023
3642
  "curl/7.65.3"
4024
3643
  ],
4025
3644
  "url": "https://curl.haxx.se/"
4026
- }
4027
- ,
3645
+ },
4028
3646
  {
4029
3647
  "pattern": "SimpleScraper",
4030
3648
  "addition_date": "2019/08/16",
@@ -4032,8 +3650,7 @@
4032
3650
  "Mozilla/5.0 (compatible; SimpleScraper)"
4033
3651
  ],
4034
3652
  "url": "https://github.com/ramonkcom/simple-scraper/"
4035
- }
4036
- ,
3653
+ },
4037
3654
  {
4038
3655
  "pattern": "RSSingBot",
4039
3656
  "addition_date": "2019/09/15",
@@ -4041,8 +3658,7 @@
4041
3658
  "RSSingBot (http://www.rssing.com)"
4042
3659
  ],
4043
3660
  "url": "http://www.rssing.com"
4044
- }
4045
- ,
3661
+ },
4046
3662
  {
4047
3663
  "pattern": "Jooblebot",
4048
3664
  "addition_date": "2019/09/25",
@@ -4050,8 +3666,7 @@
4050
3666
  "Mozilla/5.0 (compatible; Jooblebot/2.0; Windows NT 6.1; WOW64; +http://jooble.org/jooble-bot) AppleWebKit/537.36 (KHTML, like Gecko) Safari/537.36"
4051
3667
  ],
4052
3668
  "url": "http://jooble.org/jooble-bot"
4053
- }
4054
- ,
3669
+ },
4055
3670
  {
4056
3671
  "pattern": "fedoraplanet",
4057
3672
  "addition_date": "2019/09/28",
@@ -4059,8 +3674,7 @@
4059
3674
  "venus/fedoraplanet"
4060
3675
  ],
4061
3676
  "url": "http://fedoraplanet.org/"
4062
- }
4063
- ,
3677
+ },
4064
3678
  {
4065
3679
  "pattern": "Friendica",
4066
3680
  "addition_date": "2019/09/28",
@@ -4068,8 +3682,7 @@
4068
3682
  "Friendica 'The Tazmans Flax-lily' 2019.01-1293; https://hoyer.xyz"
4069
3683
  ],
4070
3684
  "url": "https://hoyer.xyz"
4071
- }
4072
- ,
3685
+ },
4073
3686
  {
4074
3687
  "pattern": "NextCloud",
4075
3688
  "addition_date": "2019/09/30",
@@ -4077,8 +3690,7 @@
4077
3690
  "NextCloud-News/1.0"
4078
3691
  ],
4079
3692
  "url": "https://nextcloud.com/"
4080
- }
4081
- ,
3693
+ },
4082
3694
  {
4083
3695
  "pattern": "Tiny Tiny RSS",
4084
3696
  "addition_date": "2019/10/04",
@@ -4089,8 +3701,7 @@
4089
3701
  "Tiny Tiny RSS/19.8 (http://tt-rss.org/)"
4090
3702
  ],
4091
3703
  "url": "http://tt-rss.org/"
4092
- }
4093
- ,
3704
+ },
4094
3705
  {
4095
3706
  "pattern": "RegionStuttgartBot",
4096
3707
  "addition_date": "2019/10/17",
@@ -4098,35 +3709,33 @@
4098
3709
  "Mozilla/5.0 (compatible; RegionStuttgartBot/1.0; +http://it.region-stuttgart.de/competenzatlas/unternehmen-suchen/)"
4099
3710
  ],
4100
3711
  "url": "http://it.region-stuttgart.de/competenzatlas/unternehmen-suchen/"
4101
- }
4102
- ,
3712
+ },
4103
3713
  {
4104
3714
  "pattern": "Bytespider",
4105
3715
  "addition_date": "2019/11/11",
4106
3716
  "instances": [
4107
- "Mozilla/5.0 (iPhone; CPU iPhone OS 11_0 like Mac OS X) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/40.0.3754.1902 Mobile Safari/537.36; Bytespider",
4108
- "Mozilla/5.0 (iPhone; CPU iPhone OS 11_0 like Mac OS X) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/41.0.4454.1745 Mobile Safari/537.36; Bytespider",
4109
- "Mozilla/5.0 (iPhone; CPU iPhone OS 11_0 like Mac OS X) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/43.0.7597.1164 Mobile Safari/537.36; Bytespider;bytespider@bytedance.com",
4110
- "Mozilla/5.0 (iPhone; CPU iPhone OS 11_0 like Mac OS X) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/46.0.2988.1545 Mobile Safari/537.36; Bytespider",
4111
- "Mozilla/5.0 (iPhone; CPU iPhone OS 11_0 like Mac OS X) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/51.0.4141.1682 Mobile Safari/537.36; Bytespider",
4112
- "Mozilla/5.0 (iPhone; CPU iPhone OS 11_0 like Mac OS X) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/54.0.3478.1649 Mobile Safari/537.36; Bytespider",
4113
- "Mozilla/5.0 (Linux; Android 5.0; SM-G900P Build/LRX21T) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/47.0.5267.1259 Mobile Safari/537.36; Bytespider",
4114
- "Mozilla/5.0 (Linux; Android 5.0; SM-G900P Build/LRX21T) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/58.0.7990.1979 Mobile Safari/537.36; Bytespider",
4115
- "Mozilla/5.0 (Linux; Android 5.0; SM-G900P Build/LRX21T) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/60.0.2268.1523 Mobile Safari/537.36; Bytespider",
4116
- "Mozilla/5.0 (Linux; Android 6.0; Nexus 5 Build/MRA58N) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/40.0.2576.1836 Mobile Safari/537.36; Bytespider",
4117
- "Mozilla/5.0 (Linux; Android 6.0; Nexus 5 Build/MRA58N) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/43.0.9681.1227 Mobile Safari/537.36; Bytespider",
4118
- "Mozilla/5.0 (Linux; Android 6.0; Nexus 5 Build/MRA58N) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/44.0.6023.1635 Mobile Safari/537.36; Bytespider",
4119
- "Mozilla/5.0 (Linux; Android 6.0; Nexus 5 Build/MRA58N) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/50.0.4944.1981 Mobile Safari/537.36; Bytespider",
4120
- "Mozilla/5.0 (Linux; Android 6.0; Nexus 5 Build/MRA58N) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/51.0.3613.1739 Mobile Safari/537.36; Bytespider",
4121
- "Mozilla/5.0 (Linux; Android 6.0; Nexus 5 Build/MRA58N) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/51.0.4022.1033 Mobile Safari/537.36; Bytespider",
4122
- "Mozilla/5.0 (Linux; Android 6.0; Nexus 5 Build/MRA58N) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/52.0.3248.1547 Mobile Safari/537.36; Bytespider",
4123
- "Mozilla/5.0 (Linux; Android 6.0; Nexus 5 Build/MRA58N) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/57.0.5527.1507 Mobile Safari/537.36; Bytespider",
4124
- "Mozilla/5.0 (Linux; Android 8.0; Pixel 2 Build/OPD3.170816.012) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/54.0.5216.1326 Mobile Safari/537.36; Bytespider",
4125
- "Mozilla/5.0 (Linux; Android 8.0; Pixel 2 Build/OPD3.170816.012) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/58.0.9038.1080 Mobile Safari/537.36; Bytespider"
3717
+ "Mozilla/5.0 (iPhone; CPU iPhone OS 11_0 like Mac OS X) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/40.0.3754.1902 Mobile Safari/537.36; Bytespider",
3718
+ "Mozilla/5.0 (iPhone; CPU iPhone OS 11_0 like Mac OS X) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/41.0.4454.1745 Mobile Safari/537.36; Bytespider",
3719
+ "Mozilla/5.0 (iPhone; CPU iPhone OS 11_0 like Mac OS X) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/43.0.7597.1164 Mobile Safari/537.36; Bytespider;bytespider@bytedance.com",
3720
+ "Mozilla/5.0 (iPhone; CPU iPhone OS 11_0 like Mac OS X) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/46.0.2988.1545 Mobile Safari/537.36; Bytespider",
3721
+ "Mozilla/5.0 (iPhone; CPU iPhone OS 11_0 like Mac OS X) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/51.0.4141.1682 Mobile Safari/537.36; Bytespider",
3722
+ "Mozilla/5.0 (iPhone; CPU iPhone OS 11_0 like Mac OS X) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/54.0.3478.1649 Mobile Safari/537.36; Bytespider",
3723
+ "Mozilla/5.0 (Linux; Android 5.0; SM-G900P Build/LRX21T) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/47.0.5267.1259 Mobile Safari/537.36; Bytespider",
3724
+ "Mozilla/5.0 (Linux; Android 5.0; SM-G900P Build/LRX21T) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/58.0.7990.1979 Mobile Safari/537.36; Bytespider",
3725
+ "Mozilla/5.0 (Linux; Android 5.0; SM-G900P Build/LRX21T) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/60.0.2268.1523 Mobile Safari/537.36; Bytespider",
3726
+ "Mozilla/5.0 (Linux; Android 6.0; Nexus 5 Build/MRA58N) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/40.0.2576.1836 Mobile Safari/537.36; Bytespider",
3727
+ "Mozilla/5.0 (Linux; Android 6.0; Nexus 5 Build/MRA58N) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/43.0.9681.1227 Mobile Safari/537.36; Bytespider",
3728
+ "Mozilla/5.0 (Linux; Android 6.0; Nexus 5 Build/MRA58N) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/44.0.6023.1635 Mobile Safari/537.36; Bytespider",
3729
+ "Mozilla/5.0 (Linux; Android 6.0; Nexus 5 Build/MRA58N) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/50.0.4944.1981 Mobile Safari/537.36; Bytespider",
3730
+ "Mozilla/5.0 (Linux; Android 6.0; Nexus 5 Build/MRA58N) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/51.0.3613.1739 Mobile Safari/537.36; Bytespider",
3731
+ "Mozilla/5.0 (Linux; Android 6.0; Nexus 5 Build/MRA58N) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/51.0.4022.1033 Mobile Safari/537.36; Bytespider",
3732
+ "Mozilla/5.0 (Linux; Android 6.0; Nexus 5 Build/MRA58N) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/52.0.3248.1547 Mobile Safari/537.36; Bytespider",
3733
+ "Mozilla/5.0 (Linux; Android 6.0; Nexus 5 Build/MRA58N) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/57.0.5527.1507 Mobile Safari/537.36; Bytespider",
3734
+ "Mozilla/5.0 (Linux; Android 8.0; Pixel 2 Build/OPD3.170816.012) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/54.0.5216.1326 Mobile Safari/537.36; Bytespider",
3735
+ "Mozilla/5.0 (Linux; Android 8.0; Pixel 2 Build/OPD3.170816.012) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/58.0.9038.1080 Mobile Safari/537.36; Bytespider"
4126
3736
  ],
4127
3737
  "url": "https://stackoverflow.com/questions/57908900/what-is-the-bytespider-user-agent"
4128
- }
4129
- ,
3738
+ },
4130
3739
  {
4131
3740
  "pattern": "Datanyze",
4132
3741
  "addition_date": "2019/11/17",
@@ -4134,8 +3743,7 @@
4134
3743
  "Mozilla/5.0 (X11; Datanyze; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/65.0.3325.181 Safari/537.36"
4135
3744
  ],
4136
3745
  "url": "https://www.datanyze.com/dnyzbot/"
4137
- }
4138
- ,
3746
+ },
4139
3747
  {
4140
3748
  "pattern": "Google-Site-Verification",
4141
3749
  "addition_date": "2019/12/11",
@@ -4143,8 +3751,7 @@
4143
3751
  "Mozilla/5.0 (compatible; Google-Site-Verification/1.0)"
4144
3752
  ],
4145
3753
  "url": "https://support.google.com/webmasters/answer/9008080"
4146
- }
4147
- ,
3754
+ },
4148
3755
  {
4149
3756
  "pattern": "TrendsmapResolver",
4150
3757
  "addition_date": "2020/02/24",
@@ -4152,8 +3759,7 @@
4152
3759
  "Mozilla/5.0 (compatible; TrendsmapResolver/0.1)"
4153
3760
  ],
4154
3761
  "url": "https://www.trendsmap.com/"
4155
- }
4156
- ,
3762
+ },
4157
3763
  {
4158
3764
  "pattern": "tweetedtimes",
4159
3765
  "addition_date": "2020/02/24",
@@ -4335,7 +3941,7 @@
4335
3941
  "instances": [
4336
3942
  "SentiBot www.sentibot.eu (compatible with Googlebot)"
4337
3943
  ],
4338
- "url": "https://www.sentibot.eu"
3944
+ "url": "https://sites.google.com/senti1.com/sentibot-eu/home"
4339
3945
  },
4340
3946
  {
4341
3947
  "pattern": "Domains Project\\/",
@@ -4421,7 +4027,7 @@
4421
4027
  "instances": [
4422
4028
  "rssbot/1.4.3 (+https://t.me/RustRssBot)"
4423
4029
  ],
4424
- "url": "https://t.me/RustRssBot"
4030
+ "url": "https://github.com/iovxw/rssbot"
4425
4031
  },
4426
4032
  {
4427
4033
  "pattern": "startmebot\\/",
@@ -4485,7 +4091,7 @@
4485
4091
  "Mozilla/5.0 (compatible; RidderBot/1.0; bot@ridder.co)",
4486
4092
  "Mozilla/5.0 (compatible; RidderBot/1.0; bot@ridder.co) (iPhone; CPU iPhone OS 8_4_1 like Mac OS X) Mobile/12H321"
4487
4093
  ],
4488
- "url": "http://brandonmedia.net"
4094
+ "url": "https://ridder.co/"
4489
4095
  },
4490
4096
  {
4491
4097
  "pattern": "Taboolabot",
@@ -4609,8 +4215,7 @@
4609
4215
  "addition_date": "2022/04/26",
4610
4216
  "instances": [
4611
4217
  "Mozilla/5.0 (compatible; Go-http-client/1.1; +centurybot9@gmail.com)"
4612
- ],
4613
- "url": "unknown"
4218
+ ]
4614
4219
  },
4615
4220
  {
4616
4221
  "pattern": "Viber",
@@ -4623,6 +4228,7 @@
4623
4228
  {
4624
4229
  "pattern": "e\\.ventures Investment Crawler",
4625
4230
  "addition_date": "2021/06/05",
4231
+ "url": "https://www.eventures.vc/",
4626
4232
  "instances": [
4627
4233
  "e.ventures Investment Crawler (eventures.vc)"
4628
4234
  ]
@@ -4630,6 +4236,7 @@
4630
4236
  {
4631
4237
  "pattern": "evc-batch",
4632
4238
  "addition_date": "2021/06/07",
4239
+ "url": "https://www.eventures.vc/",
4633
4240
  "instances": [
4634
4241
  "Mozilla/5.0 (compatible; evc-batch/2.0)"
4635
4242
  ]
@@ -4647,8 +4254,8 @@
4647
4254
  "pattern": "virustotal",
4648
4255
  "addition_date": "2021/09/22",
4649
4256
  "instances": [
4650
- "Mozilla\/5.0 (Windows; U; MSIE 9.0; Windows NT 9.0; en-US) AppEngine-Google; (+http:\/\/code.google.com\/appengine; appid: s~virustotalcloud)",
4651
- "AppEngine-Google; (+http:\/\/code.google.com\/appengine; appid: s~virustotalcloud)"
4257
+ "Mozilla/5.0 (Windows; U; MSIE 9.0; Windows NT 9.0; en-US) AppEngine-Google; (+http://code.google.com/appengine; appid: s~virustotalcloud)",
4258
+ "AppEngine-Google; (+http://code.google.com/appengine; appid: s~virustotalcloud)"
4652
4259
  ],
4653
4260
  "url": "https://www.virustotal.com/gui/home/url"
4654
4261
  },
@@ -4677,14 +4284,14 @@
4677
4284
  "Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko; compatible; Cookiebot/1.0; +http://cookiebot.com/) Chrome/97.0.4692.71 Safari/537.36"
4678
4285
  ]
4679
4286
  },
4680
- {
4681
- "pattern": "trovitBot",
4682
- "addition_date": "2022/06/08",
4683
- "url": "http://www.trovit.com/bot.html",
4684
- "instances": [
4685
- "Mozilla/5.0 (compatible; trovitBot 1.0; +http://www.trovit.com/bot.html)"
4686
- ]
4687
- },
4287
+ {
4288
+ "pattern": "trovitBot",
4289
+ "addition_date": "2022/06/08",
4290
+ "url": "http://www.trovit.com/bot.html",
4291
+ "instances": [
4292
+ "Mozilla/5.0 (compatible; trovitBot 1.0; +http://www.trovit.com/bot.html)"
4293
+ ]
4294
+ },
4688
4295
  {
4689
4296
  "pattern": "seostar\\.co",
4690
4297
  "addition_date": "2022/08/04",
@@ -4762,7 +4369,9 @@
4762
4369
  "pattern": "RuxitSynthetic",
4763
4370
  "addition_date": "2023/02/16",
4764
4371
  "url": "https://www.dynatrace.com/support/help/platform-modules/digital-experience/synthetic-monitoring/browser-monitors/configure-browser-monitors#expand--default-user-agent",
4765
- "instances" : ["RuxitSynthetic/1.0"]
4372
+ "instances": [
4373
+ "RuxitSynthetic/1.0"
4374
+ ]
4766
4375
  },
4767
4376
  {
4768
4377
  "pattern": "Google-Read-Aloud",
@@ -4785,7 +4394,7 @@
4785
4394
  "addition_date": "2023/05/24",
4786
4395
  "instances": [
4787
4396
  "OdklBot/1.0 (share@odnoklassniki.ru)",
4788
- "Mozilla/5.0 (compatible; OdklBot/1.0 like Linux; klass@odnoklassniki.ru)"
4397
+ "Mozilla/5.0 (compatible; OdklBot/1.0 like Linux; klass@odnoklassniki.ru)"
4789
4398
  ],
4790
4399
  "url": "https://odnoklassniki.ru/"
4791
4400
  },
@@ -4876,7 +4485,7 @@
4876
4485
  "addition_date": "2023/08/24",
4877
4486
  "instances": [
4878
4487
  "Mozilla/5.0 (compatible; Linespider/1.1; +https://lin.ee/4dwXkTH)",
4879
- "Mozilla/5.0 AppleWebKit/537.36 (KHTML, like Gecko; compatible; Linespider/1.1; +https://lin.ee/4dwXkTH) Chrome/W.X.Y.Z Safari/537.36"
4488
+ "Mozilla/5.0 AppleWebKit/537.36 (KHTML, like Gecko; compatible; Linespider/1.1; +https://lin.ee/4dwXkTH) Chrome/W.X.Y.Z Safari/537.36"
4880
4489
  ],
4881
4490
  "url": "https://help2.line.me/linesearchbot/web/?contentId=50006055&lang=en"
4882
4491
  },
@@ -5238,7 +4847,7 @@
5238
4847
  "instances": [
5239
4848
  "Mozilla/5.0 (compatible; ImagesiftBot; +imagesift.com)"
5240
4849
  ],
5241
- "url": "https://imagesift.com"
4850
+ "url": "https://imagesift.com/about"
5242
4851
  },
5243
4852
  {
5244
4853
  "pattern": "Expanse",
@@ -5304,19 +4913,25 @@
5304
4913
  {
5305
4914
  "pattern": "Monsidobot",
5306
4915
  "addition_date": "2024/05/14",
5307
- "instances": ["Mozilla/5.0 (compatible; Monsidobot/2.2; +http://monsido.com/bot.html; info@monsido.com)"],
4916
+ "instances": [
4917
+ "Mozilla/5.0 (compatible; Monsidobot/2.2; +http://monsido.com/bot.html; info@monsido.com)"
4918
+ ],
5308
4919
  "url": "http://monsido.com/bot.html"
5309
4920
  },
5310
4921
  {
5311
4922
  "pattern": "GroupMeBot",
5312
4923
  "addition_date": "2024/05/19",
5313
- "instances": ["GroupMeBot/1.0"],
4924
+ "instances": [
4925
+ "GroupMeBot/1.0"
4926
+ ],
5314
4927
  "url": "https://groupme.com/"
5315
4928
  },
5316
4929
  {
5317
4930
  "pattern": "Vercelbot",
5318
4931
  "addition_date": "2024/08/30",
5319
- "instances": ["Vercelbot (+https://vercel.com)"],
4932
+ "instances": [
4933
+ "Vercelbot (+https://vercel.com)"
4934
+ ],
5320
4935
  "url": "https://github.com/vercel/vercel/discussions/5095#discussioncomment-58705"
5321
4936
  },
5322
4937
  {