device_detector 1.0.5 → 1.0.6

Sign up to get free protection for your applications and to get access to all the features.
Files changed (90) hide show
  1. checksums.yaml +4 -4
  2. data/README.md +7 -6
  3. data/lib/device_detector/browser.rb +364 -0
  4. data/lib/device_detector/client.rb +8 -0
  5. data/lib/device_detector/device.rb +1124 -4
  6. data/lib/device_detector/os.rb +36 -11
  7. data/lib/device_detector/version.rb +1 -1
  8. data/lib/device_detector/version_extractor.rb +9 -0
  9. data/lib/device_detector.rb +57 -13
  10. data/regexes/bots.yml +551 -58
  11. data/regexes/client/browser_engine.yml +7 -1
  12. data/regexes/client/browsers.yml +594 -71
  13. data/regexes/client/feed_readers.yml +4 -10
  14. data/regexes/client/libraries.yml +47 -2
  15. data/regexes/client/mediaplayers.yml +25 -1
  16. data/regexes/client/mobile_apps.yml +447 -77
  17. data/regexes/client/pim.yml +49 -1
  18. data/regexes/device/cameras.yml +5 -5
  19. data/regexes/device/car_browsers.yml +16 -0
  20. data/regexes/device/consoles.yml +6 -0
  21. data/regexes/device/mobiles.yml +12905 -4561
  22. data/regexes/device/portable_media_player.yml +20 -3
  23. data/regexes/device/shell_tv.yml +117 -0
  24. data/regexes/device/televisions.yml +426 -35
  25. data/regexes/oss.yml +567 -139
  26. data/spec/device_detector/concrete_user_agent_spec.rb +30 -42
  27. data/spec/device_detector/detector_fixtures_spec.rb +9 -5
  28. data/spec/device_detector/device_spec.rb +26 -10
  29. data/spec/fixtures/client/browser.yml +1463 -391
  30. data/spec/fixtures/client/feed_reader.yml +0 -12
  31. data/spec/fixtures/client/library.yml +91 -37
  32. data/spec/fixtures/client/mediaplayer.yml +30 -0
  33. data/spec/fixtures/client/mobile_app.yml +498 -45
  34. data/spec/fixtures/client/pim.yml +60 -0
  35. data/spec/fixtures/detector/bots.yml +1189 -568
  36. data/spec/fixtures/detector/camera.yml +12 -26
  37. data/spec/fixtures/detector/car_browser.yml +151 -15
  38. data/spec/fixtures/detector/console.yml +70 -48
  39. data/spec/fixtures/detector/desktop.yml +2041 -916
  40. data/spec/fixtures/detector/feature_phone.yml +895 -189
  41. data/spec/fixtures/detector/feed_reader.yml +50 -77
  42. data/spec/fixtures/detector/mediaplayer.yml +79 -26
  43. data/spec/fixtures/detector/mobile_apps.yml +726 -72
  44. data/spec/fixtures/detector/peripheral.yml +271 -0
  45. data/spec/fixtures/detector/phablet.yml +3635 -1596
  46. data/spec/fixtures/detector/portable_media_player.yml +355 -46
  47. data/spec/fixtures/detector/smart_display.yml +183 -9
  48. data/spec/fixtures/detector/smart_speaker.yml +13 -8
  49. data/spec/fixtures/detector/smartphone-1.yml +4002 -4286
  50. data/spec/fixtures/detector/smartphone-10.yml +3771 -4763
  51. data/spec/fixtures/detector/smartphone-11.yml +3615 -4692
  52. data/spec/fixtures/detector/smartphone-12.yml +3856 -4764
  53. data/spec/fixtures/detector/smartphone-13.yml +4213 -4713
  54. data/spec/fixtures/detector/smartphone-14.yml +4039 -4497
  55. data/spec/fixtures/detector/smartphone-15.yml +5642 -2956
  56. data/spec/fixtures/detector/smartphone-16.yml +4739 -5082
  57. data/spec/fixtures/detector/smartphone-17.yml +4832 -4275
  58. data/spec/fixtures/detector/smartphone-18.yml +9806 -0
  59. data/spec/fixtures/detector/smartphone-19.yml +9965 -0
  60. data/spec/fixtures/detector/smartphone-2.yml +4842 -2589
  61. data/spec/fixtures/detector/smartphone-20.yml +9710 -0
  62. data/spec/fixtures/detector/smartphone-21.yml +8693 -0
  63. data/spec/fixtures/detector/smartphone-22.yml +10178 -0
  64. data/spec/fixtures/detector/smartphone-23.yml +9453 -0
  65. data/spec/fixtures/detector/smartphone-24.yml +9843 -0
  66. data/spec/fixtures/detector/smartphone-25.yml +9703 -0
  67. data/spec/fixtures/detector/smartphone-26.yml +10007 -0
  68. data/spec/fixtures/detector/smartphone-27.yml +4927 -0
  69. data/spec/fixtures/detector/smartphone-3.yml +4387 -4427
  70. data/spec/fixtures/detector/smartphone-4.yml +3597 -4582
  71. data/spec/fixtures/detector/smartphone-5.yml +4066 -5022
  72. data/spec/fixtures/detector/smartphone-6.yml +3455 -4621
  73. data/spec/fixtures/detector/smartphone-7.yml +3574 -4574
  74. data/spec/fixtures/detector/smartphone-8.yml +4617 -4704
  75. data/spec/fixtures/detector/smartphone-9.yml +4080 -5035
  76. data/spec/fixtures/detector/smartphone.yml +3244 -4234
  77. data/spec/fixtures/detector/tablet-1.yml +4652 -4492
  78. data/spec/fixtures/detector/tablet-2.yml +3515 -4434
  79. data/spec/fixtures/detector/tablet-3.yml +3418 -4351
  80. data/spec/fixtures/detector/tablet-4.yml +5149 -3200
  81. data/spec/fixtures/detector/tablet-5.yml +9273 -0
  82. data/spec/fixtures/detector/tablet-6.yml +4588 -0
  83. data/spec/fixtures/detector/tablet.yml +1621 -2613
  84. data/spec/fixtures/detector/tv-1.yml +2501 -0
  85. data/spec/fixtures/detector/tv.yml +7826 -3114
  86. data/spec/fixtures/detector/unknown.yml +370 -531
  87. data/spec/fixtures/detector/wearable.yml +863 -9
  88. data/spec/fixtures/parser/oss.yml +1350 -21
  89. data/spec/fixtures/parser/vendorfragments.yml +53 -53
  90. metadata +35 -5
@@ -1,45 +1,51 @@
1
1
  ---
2
- -
2
+ -
3
3
  user_agent: 360spider-image
4
4
  bot:
5
5
  name: 360Spider
6
6
  category: Search bot
7
- url: http://www.so.com/help/help_3_2.html
7
+ url: https://www.so.com/help/help_3_2.html
8
8
  producer:
9
9
  name: Online Media Group, Inc.
10
10
  url: ""
11
- -
11
+ -
12
12
  user_agent: Mozilla/4.0 (compatible; MSIE 8.0; Windows NT 6.1; Trident/4.0; SLCC2; .NET CLR 2.0.50727; .NET CLR 3.5.30729; .NET CLR 3.0.30729; Media Center PC 6.0; MDDR; .NET4.0C; .NET4.0E; .NET CLR 1.1.4322; Tablet PC 2.0); 360Spider
13
13
  bot:
14
14
  name: 360Spider
15
15
  category: Search bot
16
- url: http://www.so.com/help/help_3_2.html
16
+ url: https://www.so.com/help/help_3_2.html
17
17
  producer:
18
18
  name: Online Media Group, Inc.
19
19
  url: ""
20
- -
20
+ -
21
21
  user_agent: Mozilla/5.0 (compatible; MSIE 9.0; Windows NT 6.1; Trident/5.0); 360Spider
22
22
  bot:
23
23
  name: 360Spider
24
24
  category: Search bot
25
- url: http://www.so.com/help/help_3_2.html
25
+ url: https://www.so.com/help/help_3_2.html
26
26
  producer:
27
27
  name: Online Media Group, Inc.
28
28
  url: ""
29
- -
29
+ -
30
30
  user_agent: Mozilla/5.0 (Windows NT 6.1) AppleWebKit/537.1 (KHTML, like Gecko) Chrome/21.0.1180.89 Safari/537.1; 360Spider
31
31
  bot:
32
32
  name: 360Spider
33
33
  category: Search bot
34
- url: http://www.so.com/help/help_3_2.html
34
+ url: https://www.so.com/help/help_3_2.html
35
35
  producer:
36
36
  name: Online Media Group, Inc.
37
37
  url: ""
38
- -
38
+ -
39
39
  user_agent: 'ADmantX Platform Semantic Analyzer - ADmantX Inc. - www.admantx.com - support@admantx.com'
40
40
  bot:
41
41
  name: ADMantX
42
- -
42
+ -
43
+ user_agent: ias-va/3.1 (+https://www.admantx.com/service-fetcher.html)
44
+ bot:
45
+ name: ADmantX Service Fetcher
46
+ category: Service bot
47
+ url: https://www.admantx.com/service-fetcher.html
48
+ -
43
49
  user_agent: Aboundex/0.3 (http://www.aboundex.com/crawler/)
44
50
  bot:
45
51
  name: Aboundexbot
@@ -48,7 +54,7 @@
48
54
  producer:
49
55
  name: Aboundex.com
50
56
  url: http://www.aboundex.com
51
- -
57
+ -
52
58
  user_agent: Mozilla/5.0 (compatible; AcoonBot/4.11.1; +http://www.acoon.de/robot.asp)
53
59
  bot:
54
60
  name: Acoon
@@ -57,7 +63,7 @@
57
63
  producer:
58
64
  name: Acoon GmbH
59
65
  url: http://www.acoon.de
60
- -
66
+ -
61
67
  user_agent: AddThis.com robot tech.support@clearspring.com
62
68
  bot:
63
69
  name: AddThis.com
@@ -66,25 +72,34 @@
66
72
  producer:
67
73
  name: Clearspring Technologies, Inc.
68
74
  url: http://www.clearspring.com
69
- -
75
+ -
70
76
  user_agent: ia_archiver (+http://www.alexa.com/site/help/webmasters; crawler@alexa.com)
71
77
  bot:
72
78
  name: Alexa Crawler
73
79
  category: Search bot
74
- url: https://alexa.zendesk.com/hc/en-us/sections/200100794-Crawlers
80
+ url: https://support.alexa.com/hc/en-us/sections/200100794-Crawlers
75
81
  producer:
76
82
  name: Alexa Internet
77
- url: http://www.alexa.com
78
- -
83
+ url: https://www.alexa.com
84
+ -
79
85
  user_agent: Mozilla/5.0 (compatible; alexa site audit/1.0; http://www.alexa.com/help/webmasters; )
80
86
  bot:
81
87
  name: Alexa Site Audit
82
88
  category: Site Monitor
83
- url: http://www.alexa.com/help/webmasters
89
+ url: https://support.alexa.com/hc/en-us/articles/200450194
84
90
  producer:
85
91
  name: Alexa Internet
86
- url: http://www.alexa.com
87
- -
92
+ url: https://www.alexa.com
93
+ -
94
+ user_agent: Mozilla/5.0 (Macintosh; Intel Mac OS X 10_10_1) AppleWebKit/600.2.5 (KHTML, like Gecko) Version/8.0.2 Safari/600.2.5 (Amazonbot/0.1; +https://developer.amazon.com/support/amazonbot)
95
+ bot:
96
+ name: Amazon Bot
97
+ category: Crawler
98
+ url: https://developer.amazon.com/support/amazonbot
99
+ producer:
100
+ name: Amazon.com, Inc.
101
+ url: https://www.amazon.com/
102
+ -
88
103
  user_agent: Amazon Route 53 Health Check Service; ref:xxxxxxxx-xxxx-xxxxxxxxx-xxxxxxxxxxxx; report http://amzn.to/xxxxxxx
89
104
  bot:
90
105
  name: Amazon Route53 Health Check
@@ -92,7 +107,7 @@
92
107
  producer:
93
108
  name: Amazon Web Services
94
109
  url: https://aws.amazon.com/
95
- -
110
+ -
96
111
  user_agent: Amazon-Route53-Health-Check-Service (ref b0eb04d5-cb5e-40e7-839b-558e52fc3f0d; report http://amzn.to/1vsZADi)
97
112
  bot:
98
113
  name: Amazon Route53 Health Check
@@ -100,7 +115,7 @@
100
115
  producer:
101
116
  name: Amazon Web Services
102
117
  url: https://aws.amazon.com/
103
- -
118
+ -
104
119
  user_agent: AmorankSpider/0.1; +http://amorank.com/webcrawler.html
105
120
  bot:
106
121
  name: Amorank Spider
@@ -109,7 +124,7 @@
109
124
  producer:
110
125
  name: Amorank
111
126
  url: http://www.amorank.com
112
- -
127
+ -
113
128
  user_agent: 'Curious George - www.analyticsseo.com/crawler'
114
129
  bot:
115
130
  name: Analytics SEO Crawler
@@ -118,7 +133,7 @@
118
133
  producer:
119
134
  name: Analytics SEO
120
135
  url: http://www.analyticsseo.com
121
- -
136
+ -
122
137
  user_agent: ApacheBench/2.3
123
138
  bot:
124
139
  name: ApacheBench
@@ -126,35 +141,44 @@
126
141
  url: https://httpd.apache.org/docs/2.4/programs/ab.html
127
142
  producer:
128
143
  name: The Apache Software Foundation
129
- url: http://www.apache.org/foundation/
130
- -
144
+ url: https://www.apache.org/foundation/
145
+ -
131
146
  user_agent: Mozilla/5.0 (Macintosh; Intel Mac OS X 10_10 _1) AppleWebKit/600.2.5 (KHTML, like Gecko) Version/8.0.2 Safari/600.2.5 (Applebot/0.1; +http://www.apple.com/go/applebot)
132
147
  bot:
133
148
  name: Applebot
134
149
  category: Crawler
135
- url: http://www.apple.com/go/applebot
150
+ url: https://support.apple.com/en-us/HT204683
136
151
  producer:
137
152
  name: Apple Inc
138
- url: http://www.apple.com
139
- -
153
+ url: https://www.apple.com
154
+ -
155
+ user_agent: AppSignalBot/1.0 (+https://appsignal.com)
156
+ bot:
157
+ name: AppSignalBot
158
+ category: Site Monitor
159
+ url: https://docs.appsignal.com/uptime-monitoring/
160
+ producer:
161
+ name: AppSignal
162
+ url: https://appsignal.com/
163
+ -
140
164
  user_agent: Mozilla/5.0 (Macintosh; Intel Mac OS X 10_10_1) AppleWebKit/600.2.5 (KHTML, like Gecko) Version/8.0.2 Safari/600.2.5 (Applebot/0.1)
141
165
  bot:
142
166
  name: Applebot
143
167
  category: Crawler
144
- url: http://www.apple.com/go/applebot
168
+ url: https://support.apple.com/en-us/HT204683
145
169
  producer:
146
170
  name: Apple Inc
147
- url: http://www.apple.com
148
- -
171
+ url: https://www.apple.com
172
+ -
149
173
  user_agent: Arachni/v1.5.1
150
174
  bot:
151
175
  name: Arachni
152
176
  category: Security Checker
153
- url: http://www.arachni-scanner.com
177
+ url: https://www.arachni-scanner.com/
154
178
  producer:
155
179
  name: Sarosys LLC
156
- url: http://www.sarosys.com/
157
- -
180
+ url: https://www.sarosys.com/
181
+ -
158
182
  user_agent: Mozilla/2.0 (compatible; Ask Jeeves/Teoma)
159
183
  bot:
160
184
  name: Ask Jeeves
@@ -163,7 +187,7 @@
163
187
  producer:
164
188
  name: Ask Jeeves Inc.
165
189
  url: http://www.ask.com
166
- -
190
+ -
167
191
  user_agent: Mozilla/5.0 (compatible;AspiegelBot)
168
192
  bot:
169
193
  name: AspiegelBot
@@ -172,7 +196,7 @@
172
196
  producer:
173
197
  name: Huawei
174
198
  url: https://www.huawei.com/
175
- -
199
+ -
176
200
  user_agent: Mozilla/5.0 (Linux; Android 7.0;) AppleWebKit/537.36 (KHTML, like Gecko) Mobile Safari/537.36 (compatible; AspiegelBot)
177
201
  bot:
178
202
  name: AspiegelBot
@@ -181,7 +205,7 @@
181
205
  producer:
182
206
  name: Huawei
183
207
  url: https://www.huawei.com/
184
- -
208
+ -
185
209
  user_agent: AwarioRssBot/1.0 (+https://awario.com/bots.html; bots@awario.com)
186
210
  bot:
187
211
  name: Awario
@@ -190,7 +214,7 @@
190
214
  producer:
191
215
  name: Awario
192
216
  url: https://awario.com/
193
- -
217
+ -
194
218
  user_agent: AwarioSmartBot/1.0 (+https://awario.com/bots.html; bots@awario.com)
195
219
  bot:
196
220
  name: Awario
@@ -199,7 +223,7 @@
199
223
  producer:
200
224
  name: Awario
201
225
  url: https://awario.com/
202
- -
226
+ -
203
227
  user_agent: Mozilla/5.0 (compatible; BLEXBot/1.0; +http://webmeup-crawler.com/)
204
228
  bot:
205
229
  name: BLEXBot Crawler
@@ -208,7 +232,7 @@
208
232
  producer:
209
233
  name: WebMeUp
210
234
  url: http://webmeup.com
211
- -
235
+ -
212
236
  user_agent: BUbiNG (+http://law.di.unimi.it/BUbiNG.html)
213
237
  bot:
214
238
  name: BUbiNG
@@ -217,7 +241,7 @@
217
241
  producer:
218
242
  name: The Laboratory for Web Algorithmics (LAW)
219
243
  url: 'http://law.di.unimi.it/software.php#buging'
220
- -
244
+ -
221
245
  user_agent: Backlink-Check.de (+http://www.backlink-check.de/bot.html)
222
246
  bot:
223
247
  name: Backlink-Check.de
@@ -226,7 +250,7 @@
226
250
  producer:
227
251
  name: Mediagreen Medienservice
228
252
  url: http://www.backlink-check.de
229
- -
253
+ -
230
254
  user_agent: BacklinkCrawler (http://www.backlinktest.com/crawler.html)
231
255
  bot:
232
256
  name: BacklinkCrawler
@@ -235,7 +259,7 @@
235
259
  producer:
236
260
  name: 2.0Promotion GbR
237
261
  url: http://www.backlinktest.com
238
- -
262
+ -
239
263
  user_agent: Baiduspider+(+http://www.baidu.com/search/spider.htm)
240
264
  bot:
241
265
  name: Baidu Spider
@@ -244,7 +268,7 @@
244
268
  producer:
245
269
  name: Baidu
246
270
  url: http://www.baidu.com
247
- -
271
+ -
248
272
  user_agent: Baiduspider-image+(+http://www.baidu.com/search/spider.htm)
249
273
  bot:
250
274
  name: Baidu Spider
@@ -253,7 +277,7 @@
253
277
  producer:
254
278
  name: Baidu
255
279
  url: http://www.baidu.com
256
- -
280
+ -
257
281
  user_agent: Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.0; baidu Transcoder;)
258
282
  bot:
259
283
  name: Baidu Spider
@@ -262,7 +286,7 @@
262
286
  producer:
263
287
  name: Baidu
264
288
  url: http://www.baidu.com
265
- -
289
+ -
266
290
  user_agent: Mozilla/5.0 (compatible; Baiduspider/2.0; +http://www.baidu.com/search
267
291
  bot:
268
292
  name: Baidu Spider
@@ -271,7 +295,7 @@
271
295
  producer:
272
296
  name: Baidu
273
297
  url: http://www.baidu.com
274
- -
298
+ -
275
299
  user_agent: Mozilla/5.0 (compatible; Baiduspider/2.0; +http://www.baidu.com/search/spider.html)
276
300
  bot:
277
301
  name: Baidu Spider
@@ -280,7 +304,7 @@
280
304
  producer:
281
305
  name: Baidu
282
306
  url: http://www.baidu.com
283
- -
307
+ -
284
308
  user_agent: Mozilla/5.0 (Linux;u;Android 2.3.7;zh-cn;) AppleWebKit/533.1 (KHTML,like Gecko) Version/4.0 Mobile Safari/533.1 (compatible; +http://www.baidu.com/search/spider.html)
285
309
  bot:
286
310
  name: Baidu Spider
@@ -289,7 +313,7 @@
289
313
  producer:
290
314
  name: Baidu
291
315
  url: http://www.baidu.com
292
- -
316
+ -
293
317
  user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1; zh-CN; rv:1.9.2.8;baidu Transcoder) Gecko/20100722 Firefox/3.6.8 ( .NET CLR 3.5.30729)
294
318
  bot:
295
319
  name: Baidu Spider
@@ -298,7 +322,13 @@
298
322
  producer:
299
323
  name: Baidu
300
324
  url: http://www.baidu.com
301
- -
325
+ -
326
+ user_agent: Barkrowler/0.9 (+http://www.exensa.com/crawl)
327
+ bot:
328
+ name: Barkrowler
329
+ category: Crawler
330
+ url: http://www.exensa.com/crawl
331
+ -
302
332
  user_agent: Mozilla/5.0 (compatible; BazQux/2.4; +https://bazqux.com/fetcher; 2 subscribers)
303
333
  bot:
304
334
  name: BazQux Reader
@@ -307,7 +337,7 @@
307
337
  producer:
308
338
  name: ""
309
339
  url: ""
310
- -
340
+ -
311
341
  user_agent: Mozilla/5.0 (compatible; bingbot/2.0; +http://www.bing.com/bingbot.htm)
312
342
  bot:
313
343
  name: BingBot
@@ -316,7 +346,7 @@
316
346
  producer:
317
347
  name: Microsoft Corporation
318
348
  url: http://www.microsoft.com
319
- -
349
+ -
320
350
  user_agent: Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/534+ (KHTML, like Gecko) BingPreview/1.0b
321
351
  bot:
322
352
  name: BingBot
@@ -325,7 +355,7 @@
325
355
  producer:
326
356
  name: Microsoft Corporation
327
357
  url: http://www.microsoft.com
328
- -
358
+ -
329
359
  user_agent: msnbot-media/1.1 (+http://search.msn.com/msnbot.htm)
330
360
  bot:
331
361
  name: BingBot
@@ -334,7 +364,7 @@
334
364
  producer:
335
365
  name: Microsoft Corporation
336
366
  url: http://www.microsoft.com
337
- -
367
+ -
338
368
  user_agent: msnbot-NewsBlogs/2.0b (+http://search.msn.com/msnbot.htm)
339
369
  bot:
340
370
  name: BingBot
@@ -343,7 +373,7 @@
343
373
  producer:
344
374
  name: Microsoft Corporation
345
375
  url: http://www.microsoft.com
346
- -
376
+ -
347
377
  user_agent: msnbot/1.1 (+http://search.msn.com/msnbot.htm)
348
378
  bot:
349
379
  name: BingBot
@@ -352,7 +382,7 @@
352
382
  producer:
353
383
  name: Microsoft Corporation
354
384
  url: http://www.microsoft.com
355
- -
385
+ -
356
386
  user_agent: msnbot/2.0b (+http://search.msn.com/msnbot.htm)
357
387
  bot:
358
388
  name: BingBot
@@ -361,7 +391,7 @@
361
391
  producer:
362
392
  name: Microsoft Corporation
363
393
  url: http://www.microsoft.com
364
- -
394
+ -
365
395
  user_agent: msnbot/2.0b v1394720947.6703
366
396
  bot:
367
397
  name: BingBot
@@ -370,7 +400,7 @@
370
400
  producer:
371
401
  name: Microsoft Corporation
372
402
  url: http://www.microsoft.com
373
- -
403
+ -
374
404
  user_agent: MSNBot/Nutch-1.5.1
375
405
  bot:
376
406
  name: BingBot
@@ -379,7 +409,7 @@
379
409
  producer:
380
410
  name: Microsoft Corporation
381
411
  url: http://www.microsoft.com
382
- -
412
+ -
383
413
  user_agent: bitlybot/3.0
384
414
  bot:
385
415
  name: BitlyBot
@@ -388,7 +418,7 @@
388
418
  producer:
389
419
  name: Bitly, Inc.
390
420
  url: https://bitly.com
391
- -
421
+ -
392
422
  user_agent: Mozilla/5.0 (compatible; Blekkobot; ScoutJet; +http://blekko.com/about/blekkobot)
393
423
  bot:
394
424
  name: Blekkobot
@@ -397,7 +427,7 @@
397
427
  producer:
398
428
  name: Blekko
399
429
  url: http://blekko.com
400
- -
430
+ -
401
431
  user_agent: Bloglovin/1.0 (http://www.bloglovin.com; 1 subscribers)
402
432
  bot:
403
433
  name: Bloglovin
@@ -406,7 +436,7 @@
406
436
  producer:
407
437
  name: ""
408
438
  url: ""
409
- -
439
+ -
410
440
  user_agent: Blogtrottr/2.0
411
441
  bot:
412
442
  name: Blogtrottr
@@ -415,24 +445,24 @@
415
445
  producer:
416
446
  name: Blogtrottr Ltd
417
447
  url: https://blogtrottr.com/
418
- -
448
+ -
419
449
  user_agent: BoardReader Favicon Fetcher /1.0 info@boardreader.com
420
450
  bot:
421
451
  name: BoardReader
422
452
  category: Search bot
423
- url: http://boardreader.com/
453
+ url: https://boardreader.com/
424
454
  producer:
425
455
  name: Effyis Inc
426
- url: http://boardreader.com/
427
- -
456
+ url: https://boardreader.com/
457
+ -
428
458
  user_agent: BoardReader Blog Indexer(http://boardreader.com)
429
459
  bot:
430
460
  name: BoardReader Blog Indexer
431
461
  category: Crawler
432
462
  producer:
433
463
  name: BoardReader
434
- url: http://boardreader.com/
435
- -
464
+ url: https://boardreader.com/
465
+ -
436
466
  user_agent: Mozilla/5.0 (compatible; BountiiBot/1.1; +http://bountii.com/contact.php)
437
467
  bot:
438
468
  name: Bountii Bot
@@ -441,7 +471,7 @@
441
471
  producer:
442
472
  name: Bountii Inc.
443
473
  url: http://bountii.com
444
- -
474
+ -
445
475
  user_agent: Mozilla/5.0 (Macintosh; Intel Mac OS X 10.10; rv:41.0) Gecko/20100101 Firefox/55.0 BrandVerity/1.0 (http://www.brandverity.com/why-is-brandverity-visiting-me)
446
476
  bot:
447
477
  name: BrandVerity
@@ -450,7 +480,7 @@
450
480
  producer:
451
481
  name: BrandVerity, Inc.
452
482
  url: https://www.brandverity.com/
453
- -
483
+ -
454
484
  user_agent: Browsershots
455
485
  bot:
456
486
  name: Browsershots
@@ -459,7 +489,7 @@
459
489
  producer:
460
490
  name: Browsershots.org
461
491
  url: http://browsershots.org
462
- -
492
+ -
463
493
  user_agent: Buck/2.2; (+https://app.hypefactors.com/media-monitoring/about.html)
464
494
  bot:
465
495
  name: Buck
@@ -468,7 +498,7 @@
468
498
  producer:
469
499
  name: Hypefactors A/S
470
500
  url: https://hypefactors.com/
471
- -
501
+ -
472
502
  user_agent: Mozilla/5.0 (compatible; Butterfly/1.0; +http://labs.topsy.com/butterfly/) Gecko/2009032608 Firefox/3.0.8
473
503
  bot:
474
504
  name: Butterfly Robot
@@ -477,7 +507,7 @@
477
507
  producer:
478
508
  name: Topsy Labs
479
509
  url: http://labs.topsy.com
480
- -
510
+ -
481
511
  user_agent: Mozilla/5.0 (Macintosh; Butterfly/1.0; +http://labs.topsy.com/butterfly/) Gecko/2009032608 Firefox/3.0.8
482
512
  bot:
483
513
  name: Butterfly Robot
@@ -486,7 +516,7 @@
486
516
  producer:
487
517
  name: Topsy Labs
488
518
  url: http://labs.topsy.com
489
- -
519
+ -
490
520
  user_agent: Mozilla/5.0 (Linux; Android 6.0; Nexus 5 Build/MRA58N) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/51.0.5668.1446 Mobile Safari/537.36; Bytespider;bytespider@bytedance.com
491
521
  bot:
492
522
  name: Bytespider
@@ -495,7 +525,7 @@
495
525
  producer:
496
526
  name: ByteDance Ltd.
497
527
  url: https://bytedance.com/
498
- -
528
+ -
499
529
  user_agent: CATExplorador/1.0beta (sistemes at domini dot cat; http://domini.cat/catexplorador.html)
500
530
  bot:
501
531
  name: CATExplorador
@@ -504,7 +534,7 @@
504
534
  producer:
505
535
  name: Fundació puntCAT
506
536
  url: https://fundacio.cat/ca/domini/
507
- -
537
+ -
508
538
  user_agent: Mozilla/5.0 (compatible; CareerBot/1.1; +http://www.career-x.de/bot.html)
509
539
  bot:
510
540
  name: CareerBot
@@ -513,7 +543,7 @@
513
543
  producer:
514
544
  name: career-x GmbH
515
545
  url: http://www.career-x.de
516
- -
546
+ -
517
547
  user_agent: Castro 2, Episode Duration Lookup
518
548
  bot:
519
549
  name: Castro 2
@@ -522,7 +552,7 @@
522
552
  producer:
523
553
  name: Supertop
524
554
  url: http://supertop.co
525
- -
555
+ -
526
556
  user_agent: Cliqzbot/0.1 (+http://cliqz.com/company/cliqzbot)
527
557
  bot:
528
558
  name: Cliqzbot
@@ -531,7 +561,7 @@
531
561
  producer:
532
562
  name: 10betterpages GmbH
533
563
  url: http://cliqz.com
534
- -
564
+ -
535
565
  user_agent: Mozilla/5.0 (compatible; Cloudflare-AMP/1.0; +https://amp.cloudflare.com/doc/fetcher.html) AppleWebKit/534.34
536
566
  bot:
537
567
  name: CloudFlare AMP Fetcher
@@ -540,7 +570,7 @@
540
570
  producer:
541
571
  name: CloudFlare
542
572
  url: http://www.cloudflare.com
543
- -
573
+ -
544
574
  user_agent: Mozilla/5.0 (compatible; CloudFlare-AlwaysOnline/1.0; +http://www.cloudflare.com/always-online) AppleWebKit/534.34
545
575
  bot:
546
576
  name: CloudFlare Always Online
@@ -549,7 +579,7 @@
549
579
  producer:
550
580
  name: CloudFlare
551
581
  url: http://www.cloudflare.com
552
- -
582
+ -
553
583
  user_agent: collectd/5.5.1
554
584
  bot:
555
585
  name: Collectd
@@ -558,7 +588,7 @@
558
588
  producer:
559
589
  name: Collectd
560
590
  url: https://collectd.org/
561
- -
591
+ -
562
592
  user_agent: CommaFeed/1.0 (http://www.commafeed.com)
563
593
  bot:
564
594
  name: CommaFeed
@@ -567,79 +597,79 @@
567
597
  producer:
568
598
  name: ""
569
599
  url: ""
570
- -
600
+ -
571
601
  user_agent: coccocbot-web/1.0 (+http://help.coccoc.com/searchengine)
572
602
  bot:
573
603
  name: Cốc Cốc Bot
574
- category: Search bot
575
604
  url: https://help.coccoc.com/en/search-engine/coccoc-robots
605
+ category: Search bot
576
606
  producer:
577
607
  name: Cốc Cốc
578
608
  url: https://coccoc.com/
579
- -
609
+ -
580
610
  user_agent: Mozilla/5.0 (compatible; coccoc/1.0; +http://help.coccoc.com/)
581
611
  bot:
582
612
  name: Cốc Cốc Bot
583
- category: Search bot
584
613
  url: https://help.coccoc.com/en/search-engine/coccoc-robots
614
+ category: Search bot
585
615
  producer:
586
616
  name: Cốc Cốc
587
617
  url: https://coccoc.com/
588
- -
618
+ -
589
619
  user_agent: Mozilla/5.0 (compatible; coccocbot-ads/1.0; +http://help.coccoc.com/searchengine)
590
620
  bot:
591
621
  name: Cốc Cốc Bot
592
- category: Search bot
593
622
  url: https://help.coccoc.com/en/search-engine/coccoc-robots
623
+ category: Search bot
594
624
  producer:
595
625
  name: Cốc Cốc
596
626
  url: https://coccoc.com/
597
- -
627
+ -
598
628
  user_agent: Mozilla/5.0 (compatible; coccocbot-fast/1.0; +http://help.coccoc.com/searchengine)
599
629
  bot:
600
630
  name: Cốc Cốc Bot
601
- category: Search bot
602
631
  url: https://help.coccoc.com/en/search-engine/coccoc-robots
632
+ category: Search bot
603
633
  producer:
604
634
  name: Cốc Cốc
605
635
  url: https://coccoc.com/
606
- -
636
+ -
607
637
  user_agent: Mozilla/5.0 (compatible; coccocbot-image/1.0; +http://help.coccoc.com/searchengine)
608
638
  bot:
609
639
  name: Cốc Cốc Bot
610
- category: Search bot
611
640
  url: https://help.coccoc.com/en/search-engine/coccoc-robots
641
+ category: Search bot
612
642
  producer:
613
643
  name: Cốc Cốc
614
644
  url: https://coccoc.com/
615
- -
645
+ -
616
646
  user_agent: Mozilla/5.0 (compatible; coccocbot-shopping/1.0; +http://help.coccoc.com/searchengine)
617
647
  bot:
618
648
  name: Cốc Cốc Bot
619
- category: Search bot
620
649
  url: https://help.coccoc.com/en/search-engine/coccoc-robots
650
+ category: Search bot
621
651
  producer:
622
652
  name: Cốc Cốc
623
653
  url: https://coccoc.com/
624
- -
654
+ -
625
655
  user_agent: Mozilla/5.0 (compatible; coccocbot-web/1.0; +http://help.coccoc.com/searchengine)
626
656
  bot:
627
657
  name: Cốc Cốc Bot
628
- category: Search bot
629
658
  url: https://help.coccoc.com/en/search-engine/coccoc-robots
659
+ category: Search bot
630
660
  producer:
631
661
  name: Cốc Cốc
632
662
  url: https://coccoc.com/
633
- -
663
+ -
634
664
  user_agent: Mozilla/5.0 (compatible; coccocbot/1.0; +http://help.coccoc.com/searchengine)
635
665
  bot:
636
666
  name: Cốc Cốc Bot
637
- category: Search bot
638
667
  url: https://help.coccoc.com/en/search-engine/coccoc-robots
668
+ category: Search bot
639
669
  producer:
640
670
  name: Cốc Cốc
641
671
  url: https://coccoc.com/
642
- -
672
+ -
643
673
  user_agent: Datadog Agent/5.10.1
644
674
  bot:
645
675
  name: Datadog Agent
@@ -648,7 +678,7 @@
648
678
  producer:
649
679
  name: Datadog
650
680
  url: https://www.datadoghq.com/
651
- -
681
+ -
652
682
  user_agent: Mozilla/5.0 (X11; Datanyze; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/65.0.3325.181 Safari/537.36
653
683
  bot:
654
684
  name: Datanyze
@@ -657,7 +687,7 @@
657
687
  producer:
658
688
  name: Datanyze
659
689
  url: https://www.datanyze.com
660
- -
690
+ -
661
691
  user_agent: Mozilla/5.0 (compatible; Dataprovider/6.92; +https://www.dataprovider.com/)
662
692
  bot:
663
693
  name: Dataprovider
@@ -666,7 +696,7 @@
666
696
  producer:
667
697
  name: Dataprovider B.V.
668
698
  url: https://www.dataprovider.com/
669
- -
699
+ -
670
700
  user_agent: Mozilla/5.0 (compatible; MSIE or Firefox mutant; not on Windows server;) Daumoa/4.0;
671
701
  bot:
672
702
  name: Daum
@@ -675,7 +705,7 @@
675
705
  producer:
676
706
  name: Daum Communications Corp.
677
707
  url: http://www.kakaocorp.com/main
678
- -
708
+ -
679
709
  user_agent: Mozilla/5.0 (compatible; MSIE or Firefox mutant;) Daum 4.1
680
710
  bot:
681
711
  name: Daum
@@ -684,7 +714,7 @@
684
714
  producer:
685
715
  name: Daum Communications Corp.
686
716
  url: http://www.kakaocorp.com/main
687
- -
717
+ -
688
718
  user_agent: Mozilla/5.0 (compatible; Dazoobot/0.1; +http://dazoo.fr)
689
719
  bot:
690
720
  name: Dazoobot
@@ -693,7 +723,7 @@
693
723
  producer:
694
724
  name: DAZOO.FR
695
725
  url: http://dazoo.fr
696
- -
726
+ -
697
727
  user_agent: Mozilla/5.0 (compatible; discobot/1.0; +http://discoveryengine.com/discobot.html)
698
728
  bot:
699
729
  name: Discobot
@@ -702,7 +732,7 @@
702
732
  producer:
703
733
  name: Discovery Engine
704
734
  url: http://discoveryengine.com
705
- -
735
+ -
706
736
  user_agent: 'Domain Re-Animator Bot (http://domainreanimator.com) - support@domainreanimator.com'
707
737
  bot:
708
738
  name: Domain Re-Animator Bot
@@ -711,7 +741,7 @@
711
741
  producer:
712
742
  name: Domain Re-Animator, LLC
713
743
  url: http://domainreanimator.com
714
- -
744
+ -
715
745
  user_agent: support@domainreanimator.com
716
746
  bot:
717
747
  name: Domain Re-Animator Bot
@@ -720,7 +750,13 @@
720
750
  producer:
721
751
  name: Domain Re-Animator, LLC
722
752
  url: http://domainreanimator.com
723
- -
753
+ -
754
+ user_agent: Mozilla/5.0 (compatible; Domains Project/1.1.0; +https://domainsproject.org)
755
+ bot:
756
+ name: Domains Project
757
+ category: Crawler
758
+ url: https://domainsproject.org
759
+ -
724
760
  user_agent: dotbot
725
761
  bot:
726
762
  name: DotBot
@@ -729,7 +765,7 @@
729
765
  producer:
730
766
  name: SEOmoz, Inc.
731
767
  url: http://moz.com/
732
- -
768
+ -
733
769
  user_agent: DuckDuckBot/1.0; (+http://duckduckgo.com/duckduckbot.html)
734
770
  bot:
735
771
  name: DuckDuckGo Bot
@@ -738,7 +774,7 @@
738
774
  producer:
739
775
  name: DuckDuckGo
740
776
  url: https://duckduckgo.com/
741
- -
777
+ -
742
778
  user_agent: Mozilla/5.0 (compatible; DuckDuckGo-Favicons-Bot/1.0; +http://duckduckgo.com)
743
779
  bot:
744
780
  name: DuckDuckGo Bot
@@ -747,7 +783,7 @@
747
783
  producer:
748
784
  name: DuckDuckGo
749
785
  url: https://duckduckgo.com/
750
- -
786
+ -
751
787
  user_agent: EMail Exractor
752
788
  bot:
753
789
  name: EMail Exractor
@@ -756,7 +792,7 @@
756
792
  producer:
757
793
  name: ""
758
794
  url: ""
759
- -
795
+ -
760
796
  user_agent: Mozilla/5.0 (compatible; EasouSpider; +http://www.easou.com/search/spider.html)
761
797
  bot:
762
798
  name: Easou Spider
@@ -765,7 +801,7 @@
765
801
  producer:
766
802
  name: easou ICP
767
803
  url: http://www.easou.com
768
- -
804
+ -
769
805
  user_agent: Mozilla/5.0 (iPhone; U; CPU iPhone OS 3_0 like Mac OS X; en-us; EasouSpider; +http://www.easou.com/search/spider.html)
770
806
  bot:
771
807
  name: Easou Spider
@@ -774,7 +810,7 @@
774
810
  producer:
775
811
  name: easou ICP
776
812
  url: http://www.easou.com
777
- -
813
+ -
778
814
  user_agent: Mozilla/5.0 (compatible; Embedly/0.2; +http://support.embed.ly/)
779
815
  bot:
780
816
  name: Embedly
@@ -783,7 +819,7 @@
783
819
  producer:
784
820
  name: A Medium, Corp.
785
821
  url: https://medium.com/
786
- -
822
+ -
787
823
  user_agent: Mozilla/5.0 (compatible; Exabot/3.0 (BiggerBetter); +http://www.exabot.com/go/robot)
788
824
  bot:
789
825
  name: ExaBot
@@ -792,7 +828,7 @@
792
828
  producer:
793
829
  name: Dassault Systèmes
794
830
  url: http://www.3ds.com
795
- -
831
+ -
796
832
  user_agent: Mozilla/5.0 (compatible; Exabot/3.0; +http://www.exabot.com/go/robot)
797
833
  bot:
798
834
  name: ExaBot
@@ -801,7 +837,7 @@
801
837
  producer:
802
838
  name: Dassault Systèmes
803
839
  url: http://www.3ds.com
804
- -
840
+ -
805
841
  user_agent: Mozilla/5.0 (compatible; Konqueror/3.5; Linux) KHTML/3.5.5 (like Gecko) (Exabot-Thumbnails)
806
842
  bot:
807
843
  name: ExaBot
@@ -810,7 +846,7 @@
810
846
  producer:
811
847
  name: Dassault Systèmes
812
848
  url: http://www.3ds.com
813
- -
849
+ -
814
850
  user_agent: ExactSeek Crawler (nutch 1.4)/Nutch-1.4 (ExactSeek Crawler; http://www.exactseek.com)
815
851
  bot:
816
852
  name: ExactSeek Crawler
@@ -819,7 +855,7 @@
819
855
  producer:
820
856
  name: Jayde Online, Inc.
821
857
  url: http://www.jaydeonlineinc.com
822
- -
858
+ -
823
859
  user_agent: Mozilla/5.0 (compatible; Ezooms/1.0; help@moz.com)
824
860
  bot:
825
861
  name: Ezooms
@@ -828,7 +864,7 @@
828
864
  producer:
829
865
  name: SEOmoz, Inc.
830
866
  url: http://moz.com/
831
- -
867
+ -
832
868
  user_agent: facebookexternalhit/1.1 (+http://www.facebook.com/externalhit_uatext.php)
833
869
  bot:
834
870
  name: Facebook External Hit
@@ -837,7 +873,7 @@
837
873
  producer:
838
874
  name: Facebook
839
875
  url: http://www.facebook.com
840
- -
876
+ -
841
877
  user_agent: facebookexternalua
842
878
  bot:
843
879
  name: Facebook External Hit
@@ -846,7 +882,7 @@
846
882
  producer:
847
883
  name: Facebook
848
884
  url: http://www.facebook.com
849
- -
885
+ -
850
886
  user_agent: facebookplatform/1.0 (+http://developers.facebook.com)
851
887
  bot:
852
888
  name: Facebook External Hit
@@ -855,7 +891,7 @@
855
891
  producer:
856
892
  name: Facebook
857
893
  url: http://www.facebook.com
858
- -
894
+ -
859
895
  user_agent: Feed Wrangler/1.0 (3 subscribers; feed-id=248559; http://feedwrangler.net; Allow like Gecko)
860
896
  bot:
861
897
  name: Feed Wrangler
@@ -864,7 +900,7 @@
864
900
  producer:
865
901
  name: 'David Smith & Developing Perspective, LLC'
866
902
  url: https://david-smith.org
867
- -
903
+ -
868
904
  user_agent: FeedBurner/1.0 (http://www.FeedBurner.com)
869
905
  bot:
870
906
  name: FeedBurner
@@ -873,7 +909,7 @@
873
909
  producer:
874
910
  name: ""
875
911
  url: ""
876
- -
912
+ -
877
913
  user_agent: 'Feedbin - 9 subscribers'
878
914
  bot:
879
915
  name: Feedbin
@@ -882,7 +918,7 @@
882
918
  producer:
883
919
  name: ""
884
920
  url: ""
885
- -
921
+ -
886
922
  user_agent: Feedly/1.0 (+http://www.feedly.com/fetcher.html; like FeedFetcher-Google)
887
923
  bot:
888
924
  name: Feedly
@@ -891,7 +927,7 @@
891
927
  producer:
892
928
  name: ""
893
929
  url: ""
894
- -
930
+ -
895
931
  user_agent: FeedlyApp/1.0 (http://www.feedly.com)
896
932
  bot:
897
933
  name: Feedly
@@ -900,7 +936,7 @@
900
936
  producer:
901
937
  name: ""
902
938
  url: ""
903
- -
939
+ -
904
940
  user_agent: FeedlyBot/1.0 (http://feedly.com)
905
941
  bot:
906
942
  name: Feedly
@@ -909,7 +945,7 @@
909
945
  producer:
910
946
  name: ""
911
947
  url: ""
912
- -
948
+ -
913
949
  user_agent: MetaFeedly/1.0 (http://www.feedly.com)
914
950
  bot:
915
951
  name: Feedly
@@ -918,7 +954,7 @@
918
954
  producer:
919
955
  name: ""
920
956
  url: ""
921
- -
957
+ -
922
958
  user_agent: Feedspot http://www.feedspot.com
923
959
  bot:
924
960
  name: Feedspot
@@ -927,7 +963,7 @@
927
963
  producer:
928
964
  name: ""
929
965
  url: ""
930
- -
966
+ -
931
967
  user_agent: Fever/1.38 (Feed Parser; http://feedafever.com; Allow like Gecko)
932
968
  bot:
933
969
  name: Fever
@@ -936,13 +972,13 @@
936
972
  producer:
937
973
  name: ""
938
974
  url: ""
939
- -
975
+ -
940
976
  user_agent: Mozilla/5.0 (compatible; Findxbot/1.0; +http://www.findxbot.com)
941
977
  bot:
942
978
  name: Findxbot
943
979
  category: Crawler
944
980
  url: http://www.findxbot.com
945
- -
981
+ -
946
982
  user_agent: Mozilla/5.0 (compatible; FlipboardProxy/1.2; +http://flipboard.com/browserproxy)
947
983
  bot:
948
984
  name: Flipboard
@@ -951,7 +987,7 @@
951
987
  producer:
952
988
  name: Flipboard
953
989
  url: http://flipboard.com/
954
- -
990
+ -
955
991
  user_agent: Mozilla/5.0 (compatible; FlipboardRSS/1.2; +http://flipboard.com/browserproxy)
956
992
  bot:
957
993
  name: Flipboard
@@ -960,19 +996,19 @@
960
996
  producer:
961
997
  name: Flipboard
962
998
  url: http://flipboard.com/
963
- -
999
+ -
964
1000
  user_agent: freshrss/0.8-dev (Linux; http://freshrss.org) SimplePie/1.4-dev-FreshRSS
965
1001
  bot:
966
1002
  name: FreshRSS
967
1003
  category: Feed Fetcher
968
1004
  url: https://freshrss.org/
969
- -
1005
+ -
970
1006
  user_agent: FreshRSS/1.12.0 (Linux; https://freshrss.org)
971
1007
  bot:
972
1008
  name: FreshRSS
973
1009
  category: Feed Fetcher
974
1010
  url: https://freshrss.org/
975
- -
1011
+ -
976
1012
  user_agent: Mozilla/5.0 (X11; Linux x86_64; GTmetrix https://gtmetrix.com/) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/75.0.3770.100 Safari/537.36
977
1013
  bot:
978
1014
  name: GTmetrix
@@ -981,55 +1017,55 @@
981
1017
  producer:
982
1018
  name: Carbon60 Operating Co. Ltd.
983
1019
  url: https://www.carbon60.com/
984
- -
1020
+ -
985
1021
  user_agent: 7Siters/1.07 (+https://7ooo.ru/siters/)
986
1022
  bot:
987
1023
  name: Generic Bot
988
- -
1024
+ -
989
1025
  user_agent: COMODO SSL Checker
990
1026
  bot:
991
1027
  name: Generic Bot
992
- -
1028
+ -
993
1029
  user_agent: help@dataminr.com
994
1030
  bot:
995
1031
  name: Generic Bot
996
- -
1032
+ -
997
1033
  user_agent: 'HybridBot (hybrid.ru/about. If our bot caused problems please contact us. Contact email: m.lyashkov@targetix.net)'
998
1034
  bot:
999
1035
  name: Generic Bot
1000
- -
1036
+ -
1001
1037
  user_agent: 'Mozilla/5.0 (compatible; +centuryb.o.t9[at]gmail.com)'
1002
1038
  bot:
1003
1039
  name: Generic Bot
1004
- -
1040
+ -
1005
1041
  user_agent: Mozilla/5.0 (compatible; +http://tweetedtimes.com)
1006
1042
  bot:
1007
1043
  name: Generic Bot
1008
- -
1044
+ -
1009
1045
  user_agent: Mozilla/5.0 (compatible; Shareaholicbot/2.0; +http://www.shareaholic.com/bot)
1010
1046
  bot:
1011
1047
  name: Generic Bot
1012
- -
1048
+ -
1013
1049
  user_agent: Mozilla/5.0 (compatible; TrendsmapResolver/0.1)
1014
1050
  bot:
1015
1051
  name: Generic Bot
1016
- -
1052
+ -
1017
1053
  user_agent: niki-bot
1018
1054
  bot:
1019
1055
  name: Generic Bot
1020
- -
1056
+ -
1021
1057
  user_agent: PHPCrawl
1022
1058
  bot:
1023
1059
  name: Generic Bot
1024
- -
1060
+ -
1025
1061
  user_agent: robots
1026
1062
  bot:
1027
1063
  name: Generic Bot
1028
- -
1064
+ -
1029
1065
  user_agent: SeopultContentAnalyzer/1.0
1030
1066
  bot:
1031
1067
  name: Generic Bot
1032
- -
1068
+ -
1033
1069
  user_agent: Mozilla/5.0 (compatible; Genieo/1.0 http://www.genieo.com/webfilter.html)
1034
1070
  bot:
1035
1071
  name: Genieo Web filter
@@ -1038,7 +1074,7 @@
1038
1074
  producer:
1039
1075
  name: Genieo
1040
1076
  url: http://www.genieo.com
1041
- -
1077
+ -
1042
1078
  user_agent: GigablastOpenSource/1.0
1043
1079
  bot:
1044
1080
  name: Gigablast
@@ -1047,7 +1083,7 @@
1047
1083
  producer:
1048
1084
  name: Matt Wells
1049
1085
  url: http://www.gigablast.com/faq.html
1050
- -
1086
+ -
1051
1087
  user_agent: Mozilla/5.0 (compatible; Gluten Free Crawler/1.0; +http://glutenfreepleasure.com/)
1052
1088
  bot:
1053
1089
  name: Gluten Free Crawler
@@ -1056,7 +1092,7 @@
1056
1092
  producer:
1057
1093
  name: ""
1058
1094
  url: ""
1059
- -
1095
+ -
1060
1096
  user_agent: Mozilla/5.0 (Windows NT 5.1; rv:11.0) Gecko Firefox/11.0 (via ggpht.com GoogleImageProxy)
1061
1097
  bot:
1062
1098
  name: Gmail Image Proxy
@@ -1065,7 +1101,7 @@
1065
1101
  producer:
1066
1102
  name: Google Inc.
1067
1103
  url: http://www.google.com
1068
- -
1104
+ -
1069
1105
  user_agent: DoCoMo/2.0 P900i(c100;TB;W24H11) (compatible; ichiro/mobile goo; +http://search.goo.ne.jp/option/use/sub4/sub4-1/)
1070
1106
  bot:
1071
1107
  name: Goo
@@ -1074,12 +1110,12 @@
1074
1110
  producer:
1075
1111
  name: NTT Resonant
1076
1112
  url: http://goo.ne.jp
1077
- -
1113
+ -
1078
1114
  user_agent: Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/49.0.2623.75 Safari/537.36 Google Favicon
1079
1115
  bot:
1080
1116
  name: Google Favicon
1081
1117
  category: Crawler
1082
- -
1118
+ -
1083
1119
  user_agent: Mozilla/5.0 (iPhone; U; CPU iPhone OS 4_0_1 like Mac OS X; en-us) AppleWebKit/537.4 (KHTML, like Gecko; Google Page Speed Insights) Version/4.0.5 Mobile/8A306 Safari/6531.22.7
1084
1120
  bot:
1085
1121
  name: Google PageSpeed Insights
@@ -1088,7 +1124,7 @@
1088
1124
  producer:
1089
1125
  name: Google Inc.
1090
1126
  url: http://www.google.com
1091
- -
1127
+ -
1092
1128
  user_agent: Mozilla/5.0 (Windows NT 5.1) AppleWebKit/535.1 (KHTML, like Gecko) Chrome/14.0.835.202 Safari/535.1 google_partner_monitoring FWSzVTDDBz14547302713138T
1093
1129
  bot:
1094
1130
  name: Google Partner Monitoring
@@ -1097,7 +1133,7 @@
1097
1133
  producer:
1098
1134
  name: Google Inc.
1099
1135
  url: http://www.google.com
1100
- -
1136
+ -
1101
1137
  user_agent: Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko; Google Search Console) Chrome/41.0.2272.118 Safari/537.36
1102
1138
  bot:
1103
1139
  name: Google Search Console
@@ -1106,7 +1142,7 @@
1106
1142
  producer:
1107
1143
  name: Google Inc.
1108
1144
  url: http://www.google.com
1109
- -
1145
+ -
1110
1146
  user_agent: Google-Structured-Data-Testing-Tool +https://search.google.com/structured-data/testing-tool)
1111
1147
  bot:
1112
1148
  name: Google Structured Data Testing Tool
@@ -1115,7 +1151,7 @@
1115
1151
  producer:
1116
1152
  name: Google Inc.
1117
1153
  url: http://www.google.com
1118
- -
1154
+ -
1119
1155
  user_agent: AdsBot-Google (+http://www.google.com/adsbot.html)
1120
1156
  bot:
1121
1157
  name: Googlebot
@@ -1124,7 +1160,7 @@
1124
1160
  producer:
1125
1161
  name: Google Inc.
1126
1162
  url: http://www.google.com
1127
- -
1163
+ -
1128
1164
  user_agent: AdsBot-Google-Mobile (+http://www.google.com/mobile/adsbot.html) Mozilla (iPhone; U; CPU iPhone OS 3 0 like Mac OS X) AppleWebKit (KHTML, like Gecko) Mobile Safari
1129
1165
  bot:
1130
1166
  name: Googlebot
@@ -1133,7 +1169,7 @@
1133
1169
  producer:
1134
1170
  name: Google Inc.
1135
1171
  url: http://www.google.com
1136
- -
1172
+ -
1137
1173
  user_agent: APIs-Google (+https://developers.google.com/webmasters/APIs-Google.html)
1138
1174
  bot:
1139
1175
  name: Googlebot
@@ -1142,7 +1178,7 @@
1142
1178
  producer:
1143
1179
  name: Google Inc.
1144
1180
  url: http://www.google.com
1145
- -
1181
+ -
1146
1182
  user_agent: DoCoMo/2.0 N905i(c100;TB;W24H16) (compatible; Googlebot-Mobile/2.1; +http://www.google.com/bot.html)
1147
1183
  bot:
1148
1184
  name: Googlebot
@@ -1151,7 +1187,7 @@
1151
1187
  producer:
1152
1188
  name: Google Inc.
1153
1189
  url: http://www.google.com
1154
- -
1190
+ -
1155
1191
  user_agent: Feedfetcher-Google; (+http://www.google.com/feedfetcher.html; 19 subscribers; feed-id=13965549748850348809)
1156
1192
  bot:
1157
1193
  name: Googlebot
@@ -1160,7 +1196,7 @@
1160
1196
  producer:
1161
1197
  name: Google Inc.
1162
1198
  url: http://www.google.com
1163
- -
1199
+ -
1164
1200
  user_agent: Feedfetcher-Google; (+http://www.google.com/feedfetcher.html; 2 subscribers; feed-id=17860707833818568603)
1165
1201
  bot:
1166
1202
  name: Googlebot
@@ -1169,7 +1205,7 @@
1169
1205
  producer:
1170
1206
  name: Google Inc.
1171
1207
  url: http://www.google.com
1172
- -
1208
+ -
1173
1209
  user_agent: Feedfetcher-Google; (+http://www.google.com/feedfetcher.html; 375 subscribers; feed-id=15381863289700640853)
1174
1210
  bot:
1175
1211
  name: Googlebot
@@ -1178,7 +1214,7 @@
1178
1214
  producer:
1179
1215
  name: Google Inc.
1180
1216
  url: http://www.google.com
1181
- -
1217
+ -
1182
1218
  user_agent: Google-AdWords-Express
1183
1219
  bot:
1184
1220
  name: Googlebot
@@ -1187,7 +1223,7 @@
1187
1223
  producer:
1188
1224
  name: Google Inc.
1189
1225
  url: http://www.google.com
1190
- -
1226
+ -
1191
1227
  user_agent: Google-Adwords-Instant (+http://www.google.com/adsbot.html)
1192
1228
  bot:
1193
1229
  name: Googlebot
@@ -1196,7 +1232,7 @@
1196
1232
  producer:
1197
1233
  name: Google Inc.
1198
1234
  url: http://www.google.com
1199
- -
1235
+ -
1200
1236
  user_agent: Google-speakr
1201
1237
  bot:
1202
1238
  name: Googlebot
@@ -1205,7 +1241,7 @@
1205
1241
  producer:
1206
1242
  name: Google Inc.
1207
1243
  url: http://www.google.com
1208
- -
1244
+ -
1209
1245
  user_agent: Googlebot (gocrawl v0.4)
1210
1246
  bot:
1211
1247
  name: Googlebot
@@ -1214,7 +1250,7 @@
1214
1250
  producer:
1215
1251
  name: Google Inc.
1216
1252
  url: http://www.google.com
1217
- -
1253
+ -
1218
1254
  user_agent: Googlebot-Image/1.0
1219
1255
  bot:
1220
1256
  name: Googlebot
@@ -1223,7 +1259,7 @@
1223
1259
  producer:
1224
1260
  name: Google Inc.
1225
1261
  url: http://www.google.com
1226
- -
1262
+ -
1227
1263
  user_agent: Googlebot-News (2.3.3, ruby 1.9.3 (2013-11-22))
1228
1264
  bot:
1229
1265
  name: Googlebot
@@ -1232,7 +1268,7 @@
1232
1268
  producer:
1233
1269
  name: Google Inc.
1234
1270
  url: http://www.google.com
1235
- -
1271
+ -
1236
1272
  user_agent: Googlebot-Video/1.0
1237
1273
  bot:
1238
1274
  name: Googlebot
@@ -1241,7 +1277,7 @@
1241
1277
  producer:
1242
1278
  name: Google Inc.
1243
1279
  url: http://www.google.com
1244
- -
1280
+ -
1245
1281
  user_agent: Googlebot/2.1 (http://www.googlebot.com/bot.html)
1246
1282
  bot:
1247
1283
  name: Googlebot
@@ -1250,7 +1286,7 @@
1250
1286
  producer:
1251
1287
  name: Google Inc.
1252
1288
  url: http://www.google.com
1253
- -
1289
+ -
1254
1290
  user_agent: Googlebot/Nutch-1.7
1255
1291
  bot:
1256
1292
  name: Googlebot
@@ -1259,7 +1295,7 @@
1259
1295
  producer:
1260
1296
  name: Google Inc.
1261
1297
  url: http://www.google.com
1262
- -
1298
+ -
1263
1299
  user_agent: GoogleProducer; (+http://goo.gl/7y4SX)
1264
1300
  bot:
1265
1301
  name: Googlebot
@@ -1268,7 +1304,7 @@
1268
1304
  producer:
1269
1305
  name: Google Inc.
1270
1306
  url: http://www.google.com
1271
- -
1307
+ -
1272
1308
  user_agent: Mediapartners-Google
1273
1309
  bot:
1274
1310
  name: Googlebot
@@ -1277,7 +1313,7 @@
1277
1313
  producer:
1278
1314
  name: Google Inc.
1279
1315
  url: http://www.google.com
1280
- -
1316
+ -
1281
1317
  user_agent: Mozilla/5.0 (compatible) Feedfetcher-Google;(+http://www.google.com/feedfetcher.html)
1282
1318
  bot:
1283
1319
  name: Googlebot
@@ -1286,7 +1322,7 @@
1286
1322
  producer:
1287
1323
  name: Google Inc.
1288
1324
  url: http://www.google.com
1289
- -
1325
+ -
1290
1326
  user_agent: Mozilla/5.0 (compatible; Google-Youtube-Links)
1291
1327
  bot:
1292
1328
  name: Googlebot
@@ -1295,7 +1331,7 @@
1295
1331
  producer:
1296
1332
  name: Google Inc.
1297
1333
  url: http://www.google.com
1298
- -
1334
+ -
1299
1335
  user_agent: Mozilla/5.0 (compatible; Googlebot/2.1; +http://www.google.com/bot.html)
1300
1336
  bot:
1301
1337
  name: Googlebot
@@ -1304,7 +1340,7 @@
1304
1340
  producer:
1305
1341
  name: Google Inc.
1306
1342
  url: http://www.google.com
1307
- -
1343
+ -
1308
1344
  user_agent: Mozilla/5.0 (en-US) AppleWebKit/537.36 (KHTML, like Gecko; Google-Assess) Chrome/34.0.1847.116 Safari/537.36
1309
1345
  bot:
1310
1346
  name: Googlebot
@@ -1313,7 +1349,7 @@
1313
1349
  producer:
1314
1350
  name: Google Inc.
1315
1351
  url: http://www.google.com
1316
- -
1352
+ -
1317
1353
  user_agent: Mozilla/5.0 (en-us) AppleWebKit/537.36(KHTML, like Gecko; Google-Adwords-DisplayAds-WebRender;) Chrome/41.0.2272.118Safari/537.36
1318
1354
  bot:
1319
1355
  name: Googlebot
@@ -1322,7 +1358,7 @@
1322
1358
  producer:
1323
1359
  name: Google Inc.
1324
1360
  url: http://www.google.com
1325
- -
1361
+ -
1326
1362
  user_agent: Mozilla/5.0 (iPhone; CPU iPhone OS 6_0 like Mac OS X) AppleWebKit/536.26 (KHTML, like Gecko) Version/6.0 Mobile/10A5376e Safari/8536.25 (compatible; Googlebot-Mobile/2.1; +http://www.google.com/bot.html)
1327
1363
  bot:
1328
1364
  name: Googlebot
@@ -1331,7 +1367,7 @@
1331
1367
  producer:
1332
1368
  name: Google Inc.
1333
1369
  url: http://www.google.com
1334
- -
1370
+ -
1335
1371
  user_agent: Mozilla/5.0 (Linux; Android 4.0.4; Galaxy Nexus Build/IMM76B) AppleWebKit/537.36 (KHTML, like Gecko; Google-Publisher-Plugin) Chrome/27.0.1453 Mobile Safari/537.36
1336
1372
  bot:
1337
1373
  name: Googlebot
@@ -1340,7 +1376,7 @@
1340
1376
  producer:
1341
1377
  name: Google Inc.
1342
1378
  url: http://www.google.com
1343
- -
1379
+ -
1344
1380
  user_agent: Mozilla/5.0 (Linux; Android 6.0.1; Nexus 5X Build/MMB29P) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/41.0.2272.96 Mobile Safari/537.36 (compatible; Google-AMPHTML)
1345
1381
  bot:
1346
1382
  name: Googlebot
@@ -1349,7 +1385,7 @@
1349
1385
  producer:
1350
1386
  name: Google Inc.
1351
1387
  url: http://www.google.com
1352
- -
1388
+ -
1353
1389
  user_agent: Mozilla/5.0 (Linux; Android 6.0.1; Nexus 5X Build/MMB29P) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/41.0.2272.96 Mobile Safari/537.36 (compatible; Google-Read-Aloud; +https://support.google.com/webmasters/answer/1061943)
1354
1390
  bot:
1355
1391
  name: Googlebot
@@ -1358,7 +1394,7 @@
1358
1394
  producer:
1359
1395
  name: Google Inc.
1360
1396
  url: http://www.google.com
1361
- -
1397
+ -
1362
1398
  user_agent: Mozilla/5.0 (Linux; Android 8.0; Pixel 2 Build/OPD3.170816.012; DuplexWeb-Google/1.0) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/74.0.3729.131 Mobile Safari/537.36
1363
1399
  bot:
1364
1400
  name: Googlebot
@@ -1367,7 +1403,7 @@
1367
1403
  producer:
1368
1404
  name: Google Inc.
1369
1405
  url: http://www.google.com
1370
- -
1406
+ -
1371
1407
  user_agent: Mozilla/5.0 (Windows NT 6.1; rv:6.0) Gecko/20110814 Firefox/6.0 Google (+https://developers.google.com/+/web/snippet/)
1372
1408
  bot:
1373
1409
  name: Googlebot
@@ -1376,7 +1412,7 @@
1376
1412
  producer:
1377
1413
  name: Google Inc.
1378
1414
  url: http://www.google.com
1379
- -
1415
+ -
1380
1416
  user_agent: Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/27.0.1453 Safari/537.36 (compatible; Google-HotelAdsVerifier/2.0)
1381
1417
  bot:
1382
1418
  name: Googlebot
@@ -1385,7 +1421,7 @@
1385
1421
  producer:
1386
1422
  name: Google Inc.
1387
1423
  url: http://www.google.com
1388
- -
1424
+ -
1389
1425
  user_agent: Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko; Google Web Preview) Chrome/27.0.1453 Safari/537.36
1390
1426
  bot:
1391
1427
  name: Googlebot
@@ -1394,7 +1430,7 @@
1394
1430
  producer:
1395
1431
  name: Google Inc.
1396
1432
  url: http://www.google.com
1397
- -
1433
+ -
1398
1434
  user_agent: Mozilla/5.0 AppleWebKit/537.36 (KHTML, like Gecko) Chrome/41.0.2272.118 Safari/537.36 (compatible; Google-Shopping-Quality +http://www.google.com/merchants/tos/extend/DE/tos.html)
1399
1435
  bot:
1400
1436
  name: Googlebot
@@ -1403,7 +1439,7 @@
1403
1439
  producer:
1404
1440
  name: Google Inc.
1405
1441
  url: http://www.google.com
1406
- -
1442
+ -
1407
1443
  user_agent: Mozilla/5.0 AppleWebKit/537.36 (KHTML, like Gecko; compatible; Googlebot/2.1; +http://www.google.com/bot.html) Safari/537.36
1408
1444
  bot:
1409
1445
  name: Googlebot
@@ -1412,7 +1448,7 @@
1412
1448
  producer:
1413
1449
  name: Google Inc.
1414
1450
  url: http://www.google.com
1415
- -
1451
+ -
1416
1452
  user_agent: SAMSUNG-SGH-E250/1.0 Profile/MIDP-2.0 Configuration/CLDC-1.1 UP.Browser/6.2.3.3.c.1.101 (GUI) MMP/2.0 (compatible; Googlebot-Mobile/2.1; +http://www.google.com/bot.html)
1417
1453
  bot:
1418
1454
  name: Googlebot
@@ -1421,7 +1457,13 @@
1421
1457
  producer:
1422
1458
  name: Google Inc.
1423
1459
  url: http://www.google.com
1424
- -
1460
+ -
1461
+ user_agent: Grammarly/1.0 (http://www.grammarly.com)
1462
+ bot:
1463
+ name: Grammarly
1464
+ category: Service bot
1465
+ url: https://www.grammarly.com
1466
+ -
1425
1467
  user_agent: Mozilla/5.0 (compatible; GrapeshotCrawler/2.0; +https://www.grapeshot.com/crawler/)
1426
1468
  bot:
1427
1469
  name: Grapeshot
@@ -1430,7 +1472,7 @@
1430
1472
  producer:
1431
1473
  name: Grapeshot
1432
1474
  url: https://www.grapeshot.com
1433
- -
1475
+ -
1434
1476
  user_agent: Mozilla/5.0 (iPhone; CPU iPhone OS 8_3 like Mac OS X) AppleWebKit/600.1.4 (KHTML, like Gecko) Version/8.0 Mobile/12F70 Safari/600.1. 4 (compatible; GrapeshotCrawler/2.0; +https://www.grapeshot.com/crawler/)
1435
1477
  bot:
1436
1478
  name: Grapeshot
@@ -1439,7 +1481,7 @@
1439
1481
  producer:
1440
1482
  name: Grapeshot
1441
1483
  url: https://www.grapeshot.com
1442
- -
1484
+ -
1443
1485
  user_agent: HTTPMon/1.0b (http://www.httpmon.com)
1444
1486
  bot:
1445
1487
  name: HTTPMon
@@ -1448,7 +1490,7 @@
1448
1490
  producer:
1449
1491
  name: towards GmbH
1450
1492
  url: http://www.towards.ch/
1451
- -
1493
+ -
1452
1494
  user_agent: 'flieder - neofonie heritrix/1.14.3 (+http://spider.neofonie.de)'
1453
1495
  bot:
1454
1496
  name: Heritrix
@@ -1456,8 +1498,8 @@
1456
1498
  url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
1457
1499
  producer:
1458
1500
  name: The Internet Archive
1459
- url: http://www.archive.org
1460
- -
1501
+ url: https://archive.org
1502
+ -
1461
1503
  user_agent: Mozilla/5.0 (compatible; heritrix/1.14.4 +http://webarhive.nlc.gov.cn)
1462
1504
  bot:
1463
1505
  name: Heritrix
@@ -1465,8 +1507,8 @@
1465
1507
  url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
1466
1508
  producer:
1467
1509
  name: The Internet Archive
1468
- url: http://www.archive.org
1469
- -
1510
+ url: https://archive.org
1511
+ -
1470
1512
  user_agent: Mozilla/5.0 (compatible; heritrix/1.14.4 +http://www.dla-marbach.de)
1471
1513
  bot:
1472
1514
  name: Heritrix
@@ -1474,8 +1516,8 @@
1474
1516
  url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
1475
1517
  producer:
1476
1518
  name: The Internet Archive
1477
- url: http://www.archive.org
1478
- -
1519
+ url: https://archive.org
1520
+ -
1479
1521
  user_agent: mozilla/5.0 (compatible; heritrix/1.3.0 http://archive.crawler.org)
1480
1522
  bot:
1481
1523
  name: Heritrix
@@ -1483,8 +1525,8 @@
1483
1525
  url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
1484
1526
  producer:
1485
1527
  name: The Internet Archive
1486
- url: http://www.archive.org
1487
- -
1528
+ url: https://archive.org
1529
+ -
1488
1530
  user_agent: Mozilla/5.0 (compatible; heritrix/3.1.1 +http://www.baidu.com)
1489
1531
  bot:
1490
1532
  name: Heritrix
@@ -1492,8 +1534,8 @@
1492
1534
  url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
1493
1535
  producer:
1494
1536
  name: The Internet Archive
1495
- url: http://www.archive.org
1496
- -
1537
+ url: https://archive.org
1538
+ -
1497
1539
  user_agent: Mozilla/5.0 (compatible; heritrix/3.1.1 +http://www.run4dom.com)
1498
1540
  bot:
1499
1541
  name: Heritrix
@@ -1501,8 +1543,8 @@
1501
1543
  url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
1502
1544
  producer:
1503
1545
  name: The Internet Archive
1504
- url: http://www.archive.org
1505
- -
1546
+ url: https://archive.org
1547
+ -
1506
1548
  user_agent: Mozilla/5.0 (compatible; heritrix/3.1.2-SNAPSHOT-20130207.001528 +http://webarchiv.cz/kontakty/)
1507
1549
  bot:
1508
1550
  name: Heritrix
@@ -1510,8 +1552,8 @@
1510
1552
  url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
1511
1553
  producer:
1512
1554
  name: The Internet Archive
1513
- url: http://www.archive.org
1514
- -
1555
+ url: https://archive.org
1556
+ -
1515
1557
  user_agent: Mozilla/5.0 (compatible; worio bot heritrix/1.10.0 +http://worio.com)
1516
1558
  bot:
1517
1559
  name: Heritrix
@@ -1519,8 +1561,8 @@
1519
1561
  url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
1520
1562
  producer:
1521
1563
  name: The Internet Archive
1522
- url: http://www.archive.org
1523
- -
1564
+ url: https://archive.org
1565
+ -
1524
1566
  user_agent: Heurekabot-Feed/1.0 (+https://sluzby.heureka.cz/napoveda/heurekabot/)
1525
1567
  bot:
1526
1568
  name: Heureka Feed
@@ -1529,16 +1571,16 @@
1529
1571
  producer:
1530
1572
  name: Heureka.cz, a.s.
1531
1573
  url: https://www.heureka.cz/
1532
- -
1574
+ -
1533
1575
  user_agent: HubPages V0.2.2 (http://hubpages.com/help/crawlingpolicy)
1534
1576
  bot:
1535
1577
  name: HubPages
1536
1578
  category: Crawler
1537
- url: http://hubpages.com/help/crawlingpolicy
1579
+ url: https://hubpages.com/help/crawlingpolicy
1538
1580
  producer:
1539
- name: HubPages
1540
- url: http://hubpages.com/
1541
- -
1581
+ name: HubPages, Inc.
1582
+ url: https://discover.hubpages.com/
1583
+ -
1542
1584
  user_agent: HubSpot Website Grader (web-crawlers@hubspot.com)
1543
1585
  bot:
1544
1586
  name: HubSpot
@@ -1546,7 +1588,7 @@
1546
1588
  producer:
1547
1589
  name: HubSpot Inc.
1548
1590
  url: https://www.hubspot.com
1549
- -
1591
+ -
1550
1592
  user_agent: ICC-Crawler/2.0 (Mozilla-compatible; ; http://www.nict.go.jp/en/univ-com/plan/crawl.html)
1551
1593
  bot:
1552
1594
  name: ICC-Crawler
@@ -1555,7 +1597,7 @@
1555
1597
  producer:
1556
1598
  name: ""
1557
1599
  url: ""
1558
- -
1600
+ -
1559
1601
  user_agent: IDG/IT (http://spaziodati.eu/)
1560
1602
  bot:
1561
1603
  name: IDG/IT
@@ -1564,7 +1606,7 @@
1564
1606
  producer:
1565
1607
  name: SpazioDati S.r.l.
1566
1608
  url: https://spaziodati.eu/
1567
- -
1609
+ -
1568
1610
  user_agent: iisbot/1.0 (+http://www.iis.net/iisbot.html)
1569
1611
  bot:
1570
1612
  name: IIS Site Analysis
@@ -1573,7 +1615,7 @@
1573
1615
  producer:
1574
1616
  name: Microsoft Corporation
1575
1617
  url: http://www.microsoft.com
1576
- -
1618
+ -
1577
1619
  user_agent: IP-Guide.com Crawler/1.0 (https://ip-guide.com)
1578
1620
  bot:
1579
1621
  name: IP-Guide Crawler
@@ -1582,15 +1624,15 @@
1582
1624
  producer:
1583
1625
  name: ""
1584
1626
  url: https://ip-guide.com
1585
- -
1627
+ -
1586
1628
  user_agent: Mozilla/5.0 (compatible; ips-agent)
1587
1629
  bot:
1588
1630
  name: IPS Agent
1589
- category: crawler
1631
+ category: Crawler
1590
1632
  producer:
1591
1633
  name: VeriSign, Inc
1592
1634
  url: http://www.verisign.com/
1593
- -
1635
+ -
1594
1636
  user_agent: Kaspersky Lab CFR link resolver cfradmins@kaspersky.com
1595
1637
  bot:
1596
1638
  name: Kaspersky
@@ -1599,7 +1641,7 @@
1599
1641
  producer:
1600
1642
  name: AO Kaspersky Lab
1601
1643
  url: https://www.kaspersky.com/
1602
- -
1644
+ -
1603
1645
  user_agent: kouio.com RSS reader
1604
1646
  bot:
1605
1647
  name: Kouio
@@ -1608,7 +1650,7 @@
1608
1650
  producer:
1609
1651
  name: ""
1610
1652
  url: ""
1611
- -
1653
+ -
1612
1654
  user_agent: 'kouio.com RSS reader - 6 subscribers'
1613
1655
  bot:
1614
1656
  name: Kouio
@@ -1617,7 +1659,7 @@
1617
1659
  producer:
1618
1660
  name: ""
1619
1661
  url: ""
1620
- -
1662
+ -
1621
1663
  user_agent: LCC (+http://corpora.informatik.uni-leipzig.de/crawler_faq.html)
1622
1664
  bot:
1623
1665
  name: LCC
@@ -1626,7 +1668,7 @@
1626
1668
  producer:
1627
1669
  name: Universität Leipzig
1628
1670
  url: https://www.uni-leipzig.de/
1629
- -
1671
+ -
1630
1672
  user_agent: 'ltx71 - (http://ltx71.com/)'
1631
1673
  bot:
1632
1674
  name: LTX71
@@ -1634,7 +1676,7 @@
1634
1676
  producer:
1635
1677
  name: ""
1636
1678
  url: ""
1637
- -
1679
+ -
1638
1680
  user_agent: larbin_2.6.3 larbin2.6.3@unspecified.mail
1639
1681
  bot:
1640
1682
  name: Larbin web crawler
@@ -1643,7 +1685,7 @@
1643
1685
  producer:
1644
1686
  name: ""
1645
1687
  url: ""
1646
- -
1688
+ -
1647
1689
  user_agent: "Mozilla/5.0 (compatible; Let's Encrypt validation server; +https://www.letsencrypt.org)"
1648
1690
  bot:
1649
1691
  name: "Let's Encrypt Validation"
@@ -1652,7 +1694,7 @@
1652
1694
  producer:
1653
1695
  name: "Let's Encrypt"
1654
1696
  url: https://letsencrypt.org
1655
- -
1697
+ -
1656
1698
  user_agent: Mozilla/5.0 (Linux; Android 6.0.1; Nexus 5 Build/MRA58N) AppleWebKit/537.36(KHTML, like Gecko) Chrome/61.0.3116.0 Mobile Safari/537.36 Chrome-Lighthouse
1657
1699
  bot:
1658
1700
  name: Lighthouse
@@ -1661,7 +1703,7 @@
1661
1703
  producer:
1662
1704
  name: Lighthouse
1663
1705
  url: https://developers.google.com/web/tools/lighthouse
1664
- -
1706
+ -
1665
1707
  user_agent: linkdex.com/v2.0 and linkdex.com/v2.1
1666
1708
  bot:
1667
1709
  name: Linkdex Bot
@@ -1670,7 +1712,7 @@
1670
1712
  producer:
1671
1713
  name: Mojeek Ltd.
1672
1714
  url: http://www.mojeek.com
1673
- -
1715
+ -
1674
1716
  user_agent: Mozilla/5.0 (compatible; linkdexbot/2.0; +http://www.linkdex.com/about/bots/)
1675
1717
  bot:
1676
1718
  name: Linkdex Bot
@@ -1679,7 +1721,7 @@
1679
1721
  producer:
1680
1722
  name: Mojeek Ltd.
1681
1723
  url: http://www.mojeek.com
1682
- -
1724
+ -
1683
1725
  user_agent: Mozilla/5.0 (iPhone; U; CPU iPhone OS 4_1 like Mac OS X; en-us) AppleWebKit/532.9 (KHTML, like Gecko) Version/4.0.5 Mobile/8B117 Safari/6531.22.7 (compatible; linkdexbot-mobile/2.1; +http://www.linkdex.com/about/bots/)
1684
1726
  bot:
1685
1727
  name: Linkdex Bot
@@ -1688,7 +1730,7 @@
1688
1730
  producer:
1689
1731
  name: Mojeek Ltd.
1690
1732
  url: http://www.mojeek.com
1691
- -
1733
+ -
1692
1734
  user_agent: LinkedInBot/1.0 (compatible; Mozilla/5.0; Jakarta Commons-HttpClient/3.1 +http://www.linkedin.com)
1693
1735
  bot:
1694
1736
  name: LinkedIn Bot
@@ -1697,7 +1739,7 @@
1697
1739
  producer:
1698
1740
  name: LinkedIn
1699
1741
  url: http://www.linkedin.com
1700
- -
1742
+ -
1701
1743
  user_agent: Mozilla/5.0 (compatible; MJ12bot/v1.4.4; http://www.majestic12.co.uk/bot.php?+)
1702
1744
  bot:
1703
1745
  name: MJ12 Bot
@@ -1706,7 +1748,7 @@
1706
1748
  producer:
1707
1749
  name: Majestic-12
1708
1750
  url: http://majestic12.co.uk
1709
- -
1751
+ -
1710
1752
  user_agent: magpie-crawler/1.1 (U; Linux amd64; en-GB; +http://www.brandwatch.net)
1711
1753
  bot:
1712
1754
  name: Magpie-Crawler
@@ -1715,7 +1757,7 @@
1715
1757
  producer:
1716
1758
  name: Brandwatch
1717
1759
  url: http://www.brandwatch.com
1718
- -
1760
+ -
1719
1761
  user_agent: MagpieRSS/0.72 (+http://magpierss.sf.net)
1720
1762
  bot:
1721
1763
  name: MagpieRSS
@@ -1724,7 +1766,7 @@
1724
1766
  producer:
1725
1767
  name: ""
1726
1768
  url: ""
1727
- -
1769
+ -
1728
1770
  user_agent: Mozilla/5.0 (compatible; Linux x86_64; Mail.RU_Bot/2.0; +http://go.mail.ru/help/robots)
1729
1771
  bot:
1730
1772
  name: Mail.Ru Bot
@@ -1733,7 +1775,7 @@
1733
1775
  producer:
1734
1776
  name: Mail.Ru Group
1735
1777
  url: http://corp.mail.ru
1736
- -
1778
+ -
1737
1779
  user_agent: Mozilla/5.0 (compatible; Linux x86_64; Mail.RU_Bot/Fast/2.0; +http://go.mail.ru/help/robots)
1738
1780
  bot:
1739
1781
  name: Mail.Ru Bot
@@ -1742,17 +1784,17 @@
1742
1784
  producer:
1743
1785
  name: Mail.Ru Group
1744
1786
  url: http://corp.mail.ru
1745
- -
1787
+ -
1746
1788
  user_agent: http.rb/2.2.2 (Mastodon/1.6.1; +https://mathtod.online/)
1747
1789
  bot:
1748
1790
  name: Mastodon Bot
1749
1791
  category: Social Media Agent
1750
- -
1792
+ -
1751
1793
  user_agent: http.rb/3.2.0 (Mastodon/2.4.3; +https://uwu.social/)
1752
1794
  bot:
1753
1795
  name: Mastodon Bot
1754
1796
  category: Social Media Agent
1755
- -
1797
+ -
1756
1798
  user_agent: Mozilla/5.0 (compatible; meanpathbot/1.0; +http://www.meanpath.com/meanpathbot.html)
1757
1799
  bot:
1758
1800
  name: Meanpath Bot
@@ -1761,13 +1803,13 @@
1761
1803
  producer:
1762
1804
  name: Meanpath
1763
1805
  url: http://www.meanpath.com
1764
- -
1806
+ -
1765
1807
  user_agent: MetaInspector/5.4.0 (+https://github.com/jaimeiniesta/metainspector)
1766
1808
  bot:
1767
1809
  name: MetaInspector
1768
1810
  category: Crawler
1769
1811
  url: https://github.com/jaimeiniesta/metainspector
1770
- -
1812
+ -
1771
1813
  user_agent: Mozilla/5.0 (compatible; MetaJobBot; http://www.metajob.de/crawler)
1772
1814
  bot:
1773
1815
  name: MetaJobBot
@@ -1776,7 +1818,7 @@
1776
1818
  producer:
1777
1819
  name: MetaJob
1778
1820
  url: http://www.metajob.at
1779
- -
1821
+ -
1780
1822
  user_agent: Mozilla/5.0 (compatible; MixrankBot; crawler@mixrank.com)
1781
1823
  bot:
1782
1824
  name: Mixrank Bot
@@ -1785,7 +1827,7 @@
1785
1827
  producer:
1786
1828
  name: Online Media Group, Inc.
1787
1829
  url: ""
1788
- -
1830
+ -
1789
1831
  user_agent: Mnogosearch-3.1.21
1790
1832
  bot:
1791
1833
  name: Mnogosearch
@@ -1794,7 +1836,7 @@
1794
1836
  producer:
1795
1837
  name: Lavtech.Com Corp.
1796
1838
  url: ""
1797
- -
1839
+ -
1798
1840
  user_agent: Mozilla/5.0 (compatible; MojeekBot/0.6; http://www.mojeek.com/bot.html)
1799
1841
  bot:
1800
1842
  name: MojeekBot
@@ -1803,7 +1845,7 @@
1803
1845
  producer:
1804
1846
  name: Mojeek Ltd.
1805
1847
  url: http://www.mojeek.com
1806
- -
1848
+ -
1807
1849
  user_agent: 'Mozilla/5.0 (compatible; www.monitor.us - free monitoring service; http://www.monitor.us)'
1808
1850
  bot:
1809
1851
  name: Monitor.Us
@@ -1812,7 +1854,7 @@
1812
1854
  producer:
1813
1855
  name: Monitor.Us
1814
1856
  url: http://www.monitor.us
1815
- -
1857
+ -
1816
1858
  user_agent: munin/2.0.30-1 (libwww-perl/6.15)
1817
1859
  bot:
1818
1860
  name: Munin
@@ -1821,7 +1863,7 @@
1821
1863
  producer:
1822
1864
  name: Munin
1823
1865
  url: http://munin-monitoring.org/
1824
- -
1866
+ -
1825
1867
  user_agent: munin/http_loadtime
1826
1868
  bot:
1827
1869
  name: Munin
@@ -1830,7 +1872,7 @@
1830
1872
  producer:
1831
1873
  name: Munin
1832
1874
  url: http://munin-monitoring.org/
1833
- -
1875
+ -
1834
1876
  user_agent: nlcrawler/1.0 (+http://northernlight.com/)
1835
1877
  bot:
1836
1878
  name: NLCrawler
@@ -1839,7 +1881,7 @@
1839
1881
  producer:
1840
1882
  name: Northern Light
1841
1883
  url: http://northernlight.com
1842
- -
1884
+ -
1843
1885
  user_agent: check_http/v1.5 (nagios-plugins 1.5)
1844
1886
  bot:
1845
1887
  name: Nagios check_http
@@ -1848,7 +1890,7 @@
1848
1890
  producer:
1849
1891
  name: Nagios Plugins Development Team
1850
1892
  url: https://nagios.org
1851
- -
1893
+ -
1852
1894
  user_agent: NalezenCzBot/1.0 (http://www.nalezen.cz/about-crawler)
1853
1895
  bot:
1854
1896
  name: NalezenCzBot
@@ -1857,11 +1899,11 @@
1857
1899
  producer:
1858
1900
  name: Jaroslav Kuboš
1859
1901
  url: ""
1860
- -
1902
+ -
1861
1903
  user_agent: NetLyzer FastProbe
1862
1904
  bot:
1863
1905
  name: NetLyzer FastProbe
1864
- -
1906
+ -
1865
1907
  user_agent: Mozilla/4.0 (compatible; Netcraft Web Server Survey)
1866
1908
  bot:
1867
1909
  name: Netcraft Survey Bot
@@ -1870,7 +1912,7 @@
1870
1912
  producer:
1871
1913
  name: Netcraft
1872
1914
  url: http://www.netcraft.com
1873
- -
1915
+ -
1874
1916
  user_agent: Mozilla/5.0 (compatible; NetcraftSurveyAgent/1.0; +info@netcraft.com)
1875
1917
  bot:
1876
1918
  name: Netcraft Survey Bot
@@ -1879,7 +1921,7 @@
1879
1921
  producer:
1880
1922
  name: Netcraft
1881
1923
  url: http://www.netcraft.com
1882
- -
1924
+ -
1883
1925
  user_agent: 'Netcraft SSL Server Survey - contact info@netcraft.com'
1884
1926
  bot:
1885
1927
  name: Netcraft Survey Bot
@@ -1888,7 +1930,7 @@
1888
1930
  producer:
1889
1931
  name: Netcraft
1890
1932
  url: http://www.netcraft.com
1891
- -
1933
+ -
1892
1934
  user_agent: Netvibes (http://www.netvibes.com)
1893
1935
  bot:
1894
1936
  name: Netvibes
@@ -1897,7 +1939,7 @@
1897
1939
  producer:
1898
1940
  name: ""
1899
1941
  url: ""
1900
- -
1942
+ -
1901
1943
  user_agent: 'Netvibes (http://www.netvibes.com/; 8 subscribers; feedID: 2244192)'
1902
1944
  bot:
1903
1945
  name: Netvibes
@@ -1906,7 +1948,7 @@
1906
1948
  producer:
1907
1949
  name: ""
1908
1950
  url: ""
1909
- -
1951
+ -
1910
1952
  user_agent: 'NewsBlur Favicon Fetcher - 7 subscribers - http://www.newsblur.com/site/1948420/analytics-piwik (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)'
1911
1953
  bot:
1912
1954
  name: NewsBlur
@@ -1915,7 +1957,7 @@
1915
1957
  producer:
1916
1958
  name: ""
1917
1959
  url: ""
1918
- -
1960
+ -
1919
1961
  user_agent: 'NewsBlur Feed Fetcher - 7 subscribers - http://www.newsblur.com/site/1948420/analytics-piwik (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)'
1920
1962
  bot:
1921
1963
  name: NewsBlur
@@ -1924,7 +1966,7 @@
1924
1966
  producer:
1925
1967
  name: ""
1926
1968
  url: ""
1927
- -
1969
+ -
1928
1970
  user_agent: NewsBlur Feed Finder (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)
1929
1971
  bot:
1930
1972
  name: NewsBlur
@@ -1933,7 +1975,7 @@
1933
1975
  producer:
1934
1976
  name: ""
1935
1977
  url: ""
1936
- -
1978
+ -
1937
1979
  user_agent: 'NewsBlur Page Fetcher - 7 subscribers - http://www.newsblur.com/site/3966817/analytics-piwik (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)'
1938
1980
  bot:
1939
1981
  name: NewsBlur
@@ -1942,7 +1984,7 @@
1942
1984
  producer:
1943
1985
  name: ""
1944
1986
  url: ""
1945
- -
1987
+ -
1946
1988
  user_agent: NewsGatorOnline/2.0 (http://www.newsgator.com; 2 subscribers)
1947
1989
  bot:
1948
1990
  name: NewsGator
@@ -1951,7 +1993,7 @@
1951
1993
  producer:
1952
1994
  name: ""
1953
1995
  url: ""
1954
- -
1996
+ -
1955
1997
  user_agent: Mozilla/5.0 (compatible; Nmap Scripting Engine; https://nmap.org/book/nse.html)
1956
1998
  bot:
1957
1999
  name: Nmap
@@ -1960,7 +2002,7 @@
1960
2002
  producer:
1961
2003
  name: Nmap
1962
2004
  url: https://nmap.org/
1963
- -
2005
+ -
1964
2006
  user_agent: 5acd734a-1ed3-4a17-ad9d-0b09ae7bc2d2/Nutch-1.7
1965
2007
  bot:
1966
2008
  name: Nutch-based Bot
@@ -1968,8 +2010,8 @@
1968
2010
  url: https://nutch.apache.org
1969
2011
  producer:
1970
2012
  name: The Apache Software Foundation
1971
- url: http://www.apache.org/foundation/
1972
- -
2013
+ url: https://www.apache.org/foundation/
2014
+ -
1973
2015
  user_agent: CB/Nutch-1.7
1974
2016
  bot:
1975
2017
  name: Nutch-based Bot
@@ -1977,8 +2019,8 @@
1977
2019
  url: https://nutch.apache.org
1978
2020
  producer:
1979
2021
  name: The Apache Software Foundation
1980
- url: http://www.apache.org/foundation/
1981
- -
2022
+ url: https://www.apache.org/foundation/
2023
+ -
1982
2024
  user_agent: Mozilla/5.0 (compatible; summers;)/Nutch-1.7
1983
2025
  bot:
1984
2026
  name: Nutch-based Bot
@@ -1986,8 +2028,8 @@
1986
2028
  url: https://nutch.apache.org
1987
2029
  producer:
1988
2030
  name: The Apache Software Foundation
1989
- url: http://www.apache.org/foundation/
1990
- -
2031
+ url: https://www.apache.org/foundation/
2032
+ -
1991
2033
  user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1; zh-CN; rv:1.9.2.8) Firefox/3.6.8/Nutch-1.7
1992
2034
  bot:
1993
2035
  name: Nutch-based Bot
@@ -1995,8 +2037,8 @@
1995
2037
  url: https://nutch.apache.org
1996
2038
  producer:
1997
2039
  name: The Apache Software Foundation
1998
- url: http://www.apache.org/foundation/
1999
- -
2040
+ url: https://www.apache.org/foundation/
2041
+ -
2000
2042
  user_agent: My Nutch Spider/Nutch-1.6
2001
2043
  bot:
2002
2044
  name: Nutch-based Bot
@@ -2004,8 +2046,8 @@
2004
2046
  url: https://nutch.apache.org
2005
2047
  producer:
2006
2048
  name: The Apache Software Foundation
2007
- url: http://www.apache.org/foundation/
2008
- -
2049
+ url: https://www.apache.org/foundation/
2050
+ -
2009
2051
  user_agent: MySpider/Nutch-2.2
2010
2052
  bot:
2011
2053
  name: Nutch-based Bot
@@ -2013,8 +2055,8 @@
2013
2055
  url: https://nutch.apache.org
2014
2056
  producer:
2015
2057
  name: The Apache Software Foundation
2016
- url: http://www.apache.org/foundation/
2017
- -
2058
+ url: https://www.apache.org/foundation/
2059
+ -
2018
2060
  user_agent: Nutch12/Nutch-1.2
2019
2061
  bot:
2020
2062
  name: Nutch-based Bot
@@ -2022,8 +2064,8 @@
2022
2064
  url: https://nutch.apache.org
2023
2065
  producer:
2024
2066
  name: The Apache Software Foundation
2025
- url: http://www.apache.org/foundation/
2026
- -
2067
+ url: https://www.apache.org/foundation/
2068
+ -
2027
2069
  user_agent: NutchSpider/Nutch-1.4
2028
2070
  bot:
2029
2071
  name: Nutch-based Bot
@@ -2031,8 +2073,8 @@
2031
2073
  url: https://nutch.apache.org
2032
2074
  producer:
2033
2075
  name: The Apache Software Foundation
2034
- url: http://www.apache.org/foundation/
2035
- -
2076
+ url: https://www.apache.org/foundation/
2077
+ -
2036
2078
  user_agent: spider/Nutch-1.5.1 (spider; http://www.xxx.com)
2037
2079
  bot:
2038
2080
  name: Nutch-based Bot
@@ -2040,8 +2082,8 @@
2040
2082
  url: https://nutch.apache.org
2041
2083
  producer:
2042
2084
  name: The Apache Software Foundation
2043
- url: http://www.apache.org/foundation/
2044
- -
2085
+ url: https://www.apache.org/foundation/
2086
+ -
2045
2087
  user_agent: Spider/Nutch-2.3-SNAPSHOT (Webcrawler)
2046
2088
  bot:
2047
2089
  name: Nutch-based Bot
@@ -2049,8 +2091,8 @@
2049
2091
  url: https://nutch.apache.org
2050
2092
  producer:
2051
2093
  name: The Apache Software Foundation
2052
- url: http://www.apache.org/foundation/
2053
- -
2094
+ url: https://www.apache.org/foundation/
2095
+ -
2054
2096
  user_agent: testnutch/Nutch-1.8
2055
2097
  bot:
2056
2098
  name: Nutch-based Bot
@@ -2058,8 +2100,8 @@
2058
2100
  url: https://nutch.apache.org
2059
2101
  producer:
2060
2102
  name: The Apache Software Foundation
2061
- url: http://www.apache.org/foundation/
2062
- -
2103
+ url: https://www.apache.org/foundation/
2104
+ -
2063
2105
  user_agent: Your Nutch Spider/Nutch-2.2.1
2064
2106
  bot:
2065
2107
  name: Nutch-based Bot
@@ -2067,8 +2109,8 @@
2067
2109
  url: https://nutch.apache.org
2068
2110
  producer:
2069
2111
  name: The Apache Software Foundation
2070
- url: http://www.apache.org/foundation/
2071
- -
2112
+ url: https://www.apache.org/foundation/
2113
+ -
2072
2114
  user_agent: your sipder name/Nutch-1.7
2073
2115
  bot:
2074
2116
  name: Nutch-based Bot
@@ -2076,8 +2118,8 @@
2076
2118
  url: https://nutch.apache.org
2077
2119
  producer:
2078
2120
  name: The Apache Software Foundation
2079
- url: http://www.apache.org/foundation/
2080
- -
2121
+ url: https://www.apache.org/foundation/
2122
+ -
2081
2123
  user_agent: Nuzzel
2082
2124
  bot:
2083
2125
  name: Nuzzel
@@ -2085,11 +2127,11 @@
2085
2127
  producer:
2086
2128
  name: Nuzzel
2087
2129
  url: https://www.nuzzel.com/
2088
- -
2130
+ -
2089
2131
  user_agent: Octopus 1.0.2
2090
2132
  bot:
2091
2133
  name: Octopus
2092
- -
2134
+ -
2093
2135
  user_agent: omgili/0.5 +http://omgili.com
2094
2136
  bot:
2095
2137
  name: Omgili bot
@@ -2098,7 +2140,7 @@
2098
2140
  producer:
2099
2141
  name: Omgili
2100
2142
  url: http://www.omgili.com
2101
- -
2143
+ -
2102
2144
  user_agent: omgilibot/0.3 +http://www.omgili.com/Crawler.html
2103
2145
  bot:
2104
2146
  name: Omgili bot
@@ -2107,7 +2149,7 @@
2107
2149
  producer:
2108
2150
  name: Omgili
2109
2151
  url: http://www.omgili.com
2110
- -
2152
+ -
2111
2153
  user_agent: Mozilla/5.0 (compatible; spbot/4.0.9; +http://OpenLinkProfiler.org/bot )
2112
2154
  bot:
2113
2155
  name: OpenLinkProfiler
@@ -2116,7 +2158,7 @@
2116
2158
  producer:
2117
2159
  name: Axandra GmbH
2118
2160
  url: http://www.axandra.com
2119
- -
2161
+ -
2120
2162
  user_agent: OpenWebSpider v0.1.4 (http://www.openwebspider.org/)
2121
2163
  bot:
2122
2164
  name: OpenWebSpider
@@ -2125,7 +2167,7 @@
2125
2167
  producer:
2126
2168
  name: OpenWebSpider Lab
2127
2169
  url: http://lab.openwebspider.org
2128
- -
2170
+ -
2129
2171
  user_agent: Mozilla/5.0 (compatible; OpenindexSpider; +http://www.openindex.io/en/webmasters/spider.html)
2130
2172
  bot:
2131
2173
  name: Openindex Spider
@@ -2134,7 +2176,7 @@
2134
2176
  producer:
2135
2177
  name: Openindex B.V.
2136
2178
  url: http://www.openindex.io
2137
- -
2179
+ -
2138
2180
  user_agent: Mozilla/5.0 (compatible; OrangeBot-Collector/2.0; support.orangebot@orange.com)
2139
2181
  bot:
2140
2182
  name: Orange Bot
@@ -2143,7 +2185,7 @@
2143
2185
  producer:
2144
2186
  name: Orange
2145
2187
  url: http://www.orange.fr
2146
- -
2188
+ -
2147
2189
  user_agent: Mozilla/5.0 (compatible; OrangeBot/2.0; support.orangebot@orange.com)
2148
2190
  bot:
2149
2191
  name: Orange Bot
@@ -2152,7 +2194,7 @@
2152
2194
  producer:
2153
2195
  name: Orange
2154
2196
  url: http://www.orange.fr
2155
- -
2197
+ -
2156
2198
  user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1; fr; rv:1.8.1) VoilaBot BETA 1.2 (support.voilabot@orange-ftgroup.com)
2157
2199
  bot:
2158
2200
  name: Orange Bot
@@ -2161,7 +2203,7 @@
2161
2203
  producer:
2162
2204
  name: Orange
2163
2205
  url: http://www.orange.fr
2164
- -
2206
+ -
2165
2207
  user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1;fr;rv:1.8.1) VoilaBotCollector BETA 0.1 (http://www.voila.com/)
2166
2208
  bot:
2167
2209
  name: Orange Bot
@@ -2170,7 +2212,7 @@
2170
2212
  producer:
2171
2213
  name: Orange
2172
2214
  url: http://www.orange.fr
2173
- -
2215
+ -
2174
2216
  user_agent: Mozilla/5.0 (Java) outbrain
2175
2217
  bot:
2176
2218
  name: Outbrain
@@ -2179,7 +2221,7 @@
2179
2221
  producer:
2180
2222
  name: Outbrain
2181
2223
  url: http://www.outbrain.com/
2182
- -
2224
+ -
2183
2225
  user_agent: Mozilla/5.0 (compatible; phpservermon/3.1.1; +http://www.phpservermonitor.org)
2184
2226
  bot:
2185
2227
  name: PHP Server Monitor
@@ -2188,7 +2230,16 @@
2188
2230
  producer:
2189
2231
  name: PHP Server Monitor
2190
2232
  url: http://www.phpservermonitor.org/
2191
- -
2233
+ -
2234
+ user_agent: Mozilla/5.0 (compatible; PRTG Network Monitor (www.paessler.com); Windows)
2235
+ bot:
2236
+ name: PRTG Network Monitor
2237
+ category: Network Monitor
2238
+ url: https://www.paessler.com/prtg
2239
+ producer:
2240
+ name: Paessler AG
2241
+ url: https://www.paessler.com
2242
+ -
2192
2243
  user_agent: Mozilla/5.0 (compatible; PaperLiBot/2.1; http://support.paper.li/entries/20023257-what-is-paper-li)
2193
2244
  bot:
2194
2245
  name: PaperLiBot
@@ -2197,13 +2248,19 @@
2197
2248
  producer:
2198
2249
  name: Smallrivers SA
2199
2250
  url: http://www.paper.li
2200
- -
2251
+ -
2252
+ user_agent: Mozilla/5.0 (Linux; Android 7.0;) AppleWebKit/537.36 (KHTML, like Gecko) Mobile Safari/537.36 (compatible; PetalBot;+https://aspiegel.com/petalbot)
2253
+ bot:
2254
+ name: Petal Bot
2255
+ category: Crawler
2256
+ url: https://aspiegel.com/petalbot
2257
+ -
2201
2258
  user_agent: phantomas/1.11.0 (PhantomJS/1.9.8; linux x64)
2202
2259
  bot:
2203
2260
  name: Phantomas
2204
2261
  category: Site Monitor
2205
2262
  url: https://github.com/macbre/phantomas
2206
- -
2263
+ -
2207
2264
  user_agent: psbot-page (+http://www.picsearch.com/bot.html)
2208
2265
  bot:
2209
2266
  name: Picsearch bot
@@ -2212,7 +2269,7 @@
2212
2269
  producer:
2213
2270
  name: Picsearch
2214
2271
  url: http://www.picsearch.com
2215
- -
2272
+ -
2216
2273
  user_agent: psbot/0.1 (+http://www.picsearch.com/bot.html)
2217
2274
  bot:
2218
2275
  name: Picsearch bot
@@ -2221,7 +2278,7 @@
2221
2278
  producer:
2222
2279
  name: Picsearch
2223
2280
  url: http://www.picsearch.com
2224
- -
2281
+ -
2225
2282
  user_agent: Pingdom.com_bot_version_1.4_(http://www.pingdom.com/)
2226
2283
  bot:
2227
2284
  name: Pingdom Bot
@@ -2230,25 +2287,34 @@
2230
2287
  producer:
2231
2288
  name: Pingdom AB
2232
2289
  url: https://www.pingdom.com
2233
- -
2290
+ -
2234
2291
  user_agent: Mozilla/5.0 (compatible; Pinterestbot/1.0; http://www.pinterest.com/bot.html)
2235
2292
  bot:
2236
2293
  name: Pinterest
2237
- url: http://www.pinterest.com/bot.html
2294
+ url: https://help.pinterest.com/en/business/article/pinterest-crawler
2238
2295
  category: Crawler
2239
2296
  producer:
2240
2297
  name: Pinterest
2241
- url: http://www.pinterest.com/
2242
- -
2298
+ url: https://www.pinterest.com/
2299
+ -
2243
2300
  user_agent: Pinterest/0.2 (+http://www.pinterest.com/)
2244
2301
  bot:
2245
2302
  name: Pinterest
2246
- url: http://www.pinterest.com/bot.html
2303
+ url: https://help.pinterest.com/en/business/article/pinterest-crawler
2304
+ category: Crawler
2305
+ producer:
2306
+ name: Pinterest
2307
+ url: https://www.pinterest.com/
2308
+ -
2309
+ user_agent: Mozilla/5.0 (Linux; Android 6.0.1; Nexus 5X Build/MMB29P) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/41.0.2272.96 Mobile Safari/537.36 (compatible; Pinterestbot/1.0; https://www.pinterest.com/bot.html)
2310
+ bot:
2311
+ name: Pinterest
2312
+ url: https://help.pinterest.com/en/business/article/pinterest-crawler
2247
2313
  category: Crawler
2248
2314
  producer:
2249
2315
  name: Pinterest
2250
- url: http://www.pinterest.com/
2251
- -
2316
+ url: https://www.pinterest.com/
2317
+ -
2252
2318
  user_agent: PocketParser/2.0 (+https://getpocket.com/pocketparser_ua)
2253
2319
  bot:
2254
2320
  name: PocketParser
@@ -2257,7 +2323,7 @@
2257
2323
  producer:
2258
2324
  name: Pocket
2259
2325
  url: https://getpocket.com/
2260
- -
2326
+ -
2261
2327
  user_agent: PritTorrent/1.0
2262
2328
  bot:
2263
2329
  name: PritTorrent
@@ -2266,7 +2332,7 @@
2266
2332
  producer:
2267
2333
  name: Bitlove
2268
2334
  url: http://bitlove.org/
2269
- -
2335
+ -
2270
2336
  user_agent: QuerySeekerSpider ( http://queryseeker.com/bot.html )
2271
2337
  bot:
2272
2338
  name: QuerySeekerSpider
@@ -2275,7 +2341,7 @@
2275
2341
  producer:
2276
2342
  name: QueryEye Inc.
2277
2343
  url: http://queryeye.com
2278
- -
2344
+ -
2279
2345
  user_agent: Quora Link Preview/1.0 (http://www.quora.com)
2280
2346
  bot:
2281
2347
  name: Quora Link Preview
@@ -2284,7 +2350,7 @@
2284
2350
  producer:
2285
2351
  name: Quora
2286
2352
  url: http://www.quora.com
2287
- -
2353
+ -
2288
2354
  user_agent: 'Mozilla/5.0 (compatible; Qwantify/2.2w; +https://www.qwant.com/)/*'
2289
2355
  bot:
2290
2356
  name: Qwantify
@@ -2293,7 +2359,7 @@
2293
2359
  producer:
2294
2360
  name: Qwant Corporation
2295
2361
  url: https://www.qwant.com/
2296
- -
2362
+ -
2297
2363
  user_agent: ROI Hunter; https://api-dev.roihunter.com
2298
2364
  bot:
2299
2365
  name: ROI Hunter
@@ -2302,17 +2368,17 @@
2302
2368
  producer:
2303
2369
  name: Roihunter a.s.
2304
2370
  url: http://roihunter.com/
2305
- -
2371
+ -
2306
2372
  user_agent: RSSRadio (Push Notification Scanner;support@dorada.co.uk)
2307
2373
  bot:
2308
2374
  name: RSSRadio Bot
2309
- -
2375
+ -
2310
2376
  user_agent: Rainmeter WebParser plugin
2311
2377
  bot:
2312
2378
  name: Rainmeter
2313
2379
  category: Crawler
2314
2380
  url: https://www.rainmeter.net
2315
- -
2381
+ -
2316
2382
  user_agent: RamblerMail/6.0 (incompatible; ImageProxy/6.0)
2317
2383
  bot:
2318
2384
  name: RamblerMail Image Proxy
@@ -2321,7 +2387,7 @@
2321
2387
  producer:
2322
2388
  name: 'Rambler&Co'
2323
2389
  url: https://rambler-co.ru/
2324
- -
2390
+ -
2325
2391
  user_agent: Mozilla/5.0 (compatible; redditbot/1.0; +http://www.reddit.com/feedback)
2326
2392
  bot:
2327
2393
  name: Reddit Bot
@@ -2330,7 +2396,12 @@
2330
2396
  producer:
2331
2397
  name: reddit inc.
2332
2398
  url: http://www.reddit.com
2333
- -
2399
+ -
2400
+ user_agent: Robozilla/1.0
2401
+ bot:
2402
+ name: Robozilla
2403
+ category: Crawler
2404
+ -
2334
2405
  user_agent: Mozilla/5.0 (compatible; rogerBot/1.0; UrlCrawler; http://www.seomoz.org/dp/rogerbot)
2335
2406
  bot:
2336
2407
  name: Rogerbot
@@ -2339,7 +2410,7 @@
2339
2410
  producer:
2340
2411
  name: SEOmoz, Inc.
2341
2412
  url: http://moz.com/
2342
- -
2413
+ -
2343
2414
  user_agent: rogerbot/1.0 (http://moz.com/help/pro/what-is-rogerbot-, rogerbot-crawler+shiny@moz.com)
2344
2415
  bot:
2345
2416
  name: Rogerbot
@@ -2348,7 +2419,7 @@
2348
2419
  producer:
2349
2420
  name: SEOmoz, Inc.
2350
2421
  url: http://moz.com/
2351
- -
2422
+ -
2352
2423
  user_agent: rogerbot/1.0 (http://www.moz.com/dp/rogerbot, rogerbot-crawler@moz.com)
2353
2424
  bot:
2354
2425
  name: Rogerbot
@@ -2357,7 +2428,7 @@
2357
2428
  producer:
2358
2429
  name: SEOmoz, Inc.
2359
2430
  url: http://moz.com/
2360
- -
2431
+ -
2361
2432
  user_agent: SEOENGWorldBot/1.0 (+http://www.seoengine.com/seoengbot.htm)
2362
2433
  bot:
2363
2434
  name: SEOENGBot
@@ -2366,7 +2437,7 @@
2366
2437
  producer:
2367
2438
  name: SEO Engine
2368
2439
  url: http://www.seoengine.com
2369
- -
2440
+ -
2370
2441
  user_agent: Mozilla/5.0 (compatible; SEOkicks-Robot; +http://www.seokicks.de/robot.html)
2371
2442
  bot:
2372
2443
  name: SEOkicks-Robot
@@ -2375,7 +2446,7 @@
2375
2446
  producer:
2376
2447
  name: SEOkicks
2377
2448
  url: https://www.seokicks.de/
2378
- -
2449
+ -
2379
2450
  user_agent: Mozilla/5.0 (compatible; SISTRIX Crawler; http://crawler.sistrix.net/)
2380
2451
  bot:
2381
2452
  name: SISTRIX Crawler
@@ -2402,7 +2473,7 @@
2402
2473
  producer:
2403
2474
  name: SISTRIX GmbH
2404
2475
  url: http://www.sistrix.de
2405
- -
2476
+ -
2406
2477
  user_agent: Mozilla/5.0 (compatible; SISTRIX Optimizer; Uptime; +https://www.sistrix.com/faq/uptime)
2407
2478
  bot:
2408
2479
  name: SISTRIX Optimizer
@@ -2411,7 +2482,7 @@
2411
2482
  producer:
2412
2483
  name: SISTRIX GmbH
2413
2484
  url: http://www.sistrix.de
2414
- -
2485
+ -
2415
2486
  user_agent: Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/68.0.3440.75 Safari/537.36 (compatible; SMTBot/1.0; +http://www.similartech.com/smtbot)
2416
2487
  bot:
2417
2488
  name: SMTBot
@@ -2420,7 +2491,7 @@
2420
2491
  producer:
2421
2492
  name: SimilarTech Ltd.
2422
2493
  url: https://www.similartech.com/
2423
- -
2494
+ -
2424
2495
  user_agent: SSL Labs (https://www.ssllabs.com/about/assessment.html)
2425
2496
  bot:
2426
2497
  name: SSL Labs
@@ -2429,7 +2500,7 @@
2429
2500
  producer:
2430
2501
  name: SSL Labs
2431
2502
  url: https://www.ssllabs.com/about/assessment.html
2432
- -
2503
+ -
2433
2504
  user_agent: SafeDNSBot (https://www.safedns.com/searchbot)
2434
2505
  bot:
2435
2506
  name: SafeDNSBot
@@ -2438,13 +2509,13 @@
2438
2509
  producer:
2439
2510
  name: SafeDNS, Inc.
2440
2511
  url: https://www.safedns.com/
2441
- -
2512
+ -
2442
2513
  user_agent: Scrapy/1.0.3.post6+g2d688cd (+http://scrapy.org)
2443
2514
  bot:
2444
2515
  name: Scrapy
2445
2516
  category: Crawler
2446
2517
  url: http://scrapy.org
2447
- -
2518
+ -
2448
2519
  user_agent: Screaming Frog SEO Spider/2.22
2449
2520
  bot:
2450
2521
  name: Screaming Frog SEO Spider
@@ -2453,7 +2524,7 @@
2453
2524
  producer:
2454
2525
  name: Screaming Frog Ltd
2455
2526
  url: http://www.screamingfrog.co.uk
2456
- -
2527
+ -
2457
2528
  user_agent: ScreenerBot Crawler Beta 2.0 (+http://www.ScreenerBot.com)
2458
2529
  bot:
2459
2530
  name: ScreenerBot
@@ -2462,7 +2533,13 @@
2462
2533
  producer:
2463
2534
  name: ""
2464
2535
  url: ""
2465
- -
2536
+ -
2537
+ user_agent: Mozilla/5.0 (compatible) SemanticScholarBot (+https://www.semanticscholar.org/crawler)
2538
+ bot:
2539
+ name: Semantic Scholar Bot
2540
+ category: Crawler
2541
+ url: https://www.semanticscholar.org/crawler
2542
+ -
2466
2543
  user_agent: Mozilla/5.0 (compatible; SemrushBot/0.97; +http://www.semrush.com/bot.html)
2467
2544
  bot:
2468
2545
  name: Semrush Bot
@@ -2471,7 +2548,7 @@
2471
2548
  producer:
2472
2549
  name: SEMrush
2473
2550
  url: http://www.semrush.com
2474
- -
2551
+ -
2475
2552
  user_agent: SensikaBot/x.33 (+http://sensika.com)
2476
2553
  bot:
2477
2554
  name: Sensika Bot
@@ -2480,24 +2557,36 @@
2480
2557
  producer:
2481
2558
  name: Sensika
2482
2559
  url: http://sensika.com
2483
- -
2560
+ -
2484
2561
  user_agent: sentry/8.6.0 (https://getsentry.com)
2485
2562
  bot:
2486
2563
  name: Sentry Bot
2487
2564
  producer:
2488
2565
  name: Sentry
2489
2566
  url: https://sentry.io
2490
- -
2567
+ -
2568
+ user_agent: Seobility
2569
+ bot:
2570
+ name: Seobility
2571
+ category: Crawler
2572
+ url: 'https://www.seobility.net/en/faq/?category=crawling#!aboutourbot'
2573
+ -
2491
2574
  user_agent: Mozilla/5.0 (compatible; seoscanners.net/1; +spider@seoscanners.net)
2492
2575
  bot:
2493
2576
  name: Seoscanners.net
2494
2577
  category: Crawler
2495
2578
  url: ""
2496
- -
2579
+ -
2580
+ user_agent: SerendeputyBot/0.8.6 (http://serendeputy.com/about/serendeputy-bot)
2581
+ bot:
2582
+ name: Serendeputy Bot
2583
+ category: Crawler
2584
+ url: https://serendeputy.com/about/serendeputy-bot
2585
+ -
2497
2586
  user_agent: Server Density Service Monitoring v2
2498
2587
  bot:
2499
2588
  name: Server Density
2500
- -
2589
+ -
2501
2590
  user_agent: Mozilla/5.0 (compatible; SeznamBot/3.1-test1; +http://fulltext.sblog.cz/)
2502
2591
  bot:
2503
2592
  name: Seznam Bot
@@ -2506,7 +2595,7 @@
2506
2595
  producer:
2507
2596
  name: Seznam.cz, a.s.
2508
2597
  url: http://www.seznam.cz/
2509
- -
2598
+ -
2510
2599
  user_agent: Mozilla/5.0 (compatible; SeznamBot/3.2-test1; +http://fulltext.sblog.cz/)
2511
2600
  bot:
2512
2601
  name: Seznam Bot
@@ -2515,7 +2604,7 @@
2515
2604
  producer:
2516
2605
  name: Seznam.cz, a.s.
2517
2606
  url: http://www.seznam.cz/
2518
- -
2607
+ -
2519
2608
  user_agent: Mozilla/5.0 (compatible; SeznamBot/3.2; +http://fulltext.sblog.cz/)
2520
2609
  bot:
2521
2610
  name: Seznam Bot
@@ -2524,7 +2613,7 @@
2524
2613
  producer:
2525
2614
  name: Seznam.cz, a.s.
2526
2615
  url: http://www.seznam.cz/
2527
- -
2616
+ -
2528
2617
  user_agent: SeznamBot/3.0 (+http://fulltext.sblog.cz/)
2529
2618
  bot:
2530
2619
  name: Seznam Bot
@@ -2533,7 +2622,7 @@
2533
2622
  producer:
2534
2623
  name: Seznam.cz, a.s.
2535
2624
  url: http://www.seznam.cz/
2536
- -
2625
+ -
2537
2626
  user_agent: Mozilla/5.0 SeznamEmailProxy/2.0.174
2538
2627
  bot:
2539
2628
  name: Seznam Email Proxy
@@ -2542,7 +2631,7 @@
2542
2631
  producer:
2543
2632
  name: Seznam.cz, a.s.
2544
2633
  url: http://www.seznam.cz/
2545
- -
2634
+ -
2546
2635
  user_agent: Seznam-Zbozi-robot/3.0
2547
2636
  bot:
2548
2637
  name: Seznam Zbozi.cz
@@ -2551,7 +2640,7 @@
2551
2640
  producer:
2552
2641
  name: Seznam.cz, a.s.
2553
2642
  url: https://www.zbozi.cz/
2554
- -
2643
+ -
2555
2644
  user_agent: Mozilla/5.0 (ShopAlike; LadenZeile) FeedBot
2556
2645
  bot:
2557
2646
  name: ShopAlike
@@ -2560,7 +2649,7 @@
2560
2649
  producer:
2561
2650
  name: Visual Meta
2562
2651
  url: https://www.shopalike.cz/
2563
- -
2652
+ -
2564
2653
  user_agent: ShopWiki/1.0 ( +http://www.shopwiki.com/wiki/Help:Bot)
2565
2654
  bot:
2566
2655
  name: ShopWiki
@@ -2569,7 +2658,7 @@
2569
2658
  producer:
2570
2659
  name: ShopWiki Corp.
2571
2660
  url: http://www.shopwiki.com
2572
- -
2661
+ -
2573
2662
  user_agent: shopify-partner-homepage-scraper
2574
2663
  bot:
2575
2664
  name: Shopify Partner
@@ -2578,7 +2667,7 @@
2578
2667
  producer:
2579
2668
  name: Shopify
2580
2669
  url: https://www.shopify.com/
2581
- -
2670
+ -
2582
2671
  user_agent: SilverReader/1.0; http://silverreader.com
2583
2672
  bot:
2584
2673
  name: SilverReader
@@ -2587,7 +2676,7 @@
2587
2676
  producer:
2588
2677
  name: ""
2589
2678
  url: ""
2590
- -
2679
+ -
2591
2680
  user_agent: SimplePie/1.2.1-dev (Feed Parser; http://simplepie.org; Allow like Gecko) Build/20130514092120
2592
2681
  bot:
2593
2682
  name: SimplePie
@@ -2596,7 +2685,7 @@
2596
2685
  producer:
2597
2686
  name: ""
2598
2687
  url: ""
2599
- -
2688
+ -
2600
2689
  user_agent: SimplePie/1.3.1 (Feed Parser; http://simplepie.org; Allow like Gecko) Build/20121030175911
2601
2690
  bot:
2602
2691
  name: SimplePie
@@ -2605,7 +2694,7 @@
2605
2694
  producer:
2606
2695
  name: ""
2607
2696
  url: ""
2608
- -
2697
+ -
2609
2698
  user_agent: Site24x7
2610
2699
  bot:
2611
2700
  name: Site24x7 Website Monitoring
@@ -2614,13 +2703,13 @@
2614
2703
  producer:
2615
2704
  name: Site24x7
2616
2705
  url: https://www.site24x7.com
2617
- -
2706
+ -
2618
2707
  user_agent: SiteSucker for macOS/2.10.5
2619
2708
  bot:
2620
2709
  name: SiteSucker
2621
2710
  category: Crawler
2622
2711
  url: http://ricks-apps.com/osx/sitesucker/
2623
- -
2712
+ -
2624
2713
  user_agent: Mozilla/4.0 (compatible; MSIE 7.0; Windows NT 5.0) Match by Siteimprove.com
2625
2714
  bot:
2626
2715
  name: Siteimprove
@@ -2629,7 +2718,7 @@
2629
2718
  producer:
2630
2719
  name: Siteimprove GmbH
2631
2720
  url: https://siteimprove.com/
2632
- -
2721
+ -
2633
2722
  user_agent: Mozilla/5.0 (compatible; MSIE 10.0; Windows NT 6.1; Trident/6.0) LinkCheck by Siteimprove.com
2634
2723
  bot:
2635
2724
  name: Siteimprove
@@ -2638,7 +2727,7 @@
2638
2727
  producer:
2639
2728
  name: Siteimprove GmbH
2640
2729
  url: https://siteimprove.com/
2641
- -
2730
+ -
2642
2731
  user_agent: sixy.ch/1.0
2643
2732
  bot:
2644
2733
  name: Sixy.ch
@@ -2647,7 +2736,7 @@
2647
2736
  producer:
2648
2737
  name: Manuel Kasper
2649
2738
  url: https://neon1.net/
2650
- -
2739
+ -
2651
2740
  user_agent: Mozilla/5.0 (Windows NT 6.1; WOW64) SkypeUriPreview Preview/0.5
2652
2741
  bot:
2653
2742
  name: Skype URI Preview
@@ -2656,7 +2745,7 @@
2656
2745
  producer:
2657
2746
  name: Skype Communications S.à.r.l.
2658
2747
  url: https://www.skype.com
2659
- -
2748
+ -
2660
2749
  user_agent: Slackbot-LinkExpanding 1.0 (+https://api.slack.com/robots)
2661
2750
  bot:
2662
2751
  name: Slackbot
@@ -2665,7 +2754,7 @@
2665
2754
  producer:
2666
2755
  name: Slack Technologies
2667
2756
  url: http://slack.com
2668
- -
2757
+ -
2669
2758
  user_agent: 'AppEngine-Google; (+http://code.google.com/appengine; appid: s~snapchat-proxy)'
2670
2759
  bot:
2671
2760
  name: Snapchat Proxy
@@ -2674,7 +2763,7 @@
2674
2763
  producer:
2675
2764
  name: Snapchat Inc.
2676
2765
  url: https://www.snapchat.com
2677
- -
2766
+ -
2678
2767
  user_agent: New-Sogou-Spider/1.0 (compatible; MSIE 5.5; Windows 98)
2679
2768
  bot:
2680
2769
  name: Sogou Spider
@@ -2683,7 +2772,7 @@
2683
2772
  producer:
2684
2773
  name: Sohu, Inc.
2685
2774
  url: http://www.sogou.com
2686
- -
2775
+ -
2687
2776
  user_agent: Sogou inst spider/4.0(+http://www.sogou.com/docs/help/webmasters.htm
2688
2777
  bot:
2689
2778
  name: Sogou Spider
@@ -2692,7 +2781,7 @@
2692
2781
  producer:
2693
2782
  name: Sohu, Inc.
2694
2783
  url: http://www.sogou.com
2695
- -
2784
+ -
2696
2785
  user_agent: Sogou Pic Spider/3.0(+http://www.sogou.com/docs/help/webmasters.htm
2697
2786
  bot:
2698
2787
  name: Sogou Spider
@@ -2701,7 +2790,7 @@
2701
2790
  producer:
2702
2791
  name: Sohu, Inc.
2703
2792
  url: http://www.sogou.com
2704
- -
2793
+ -
2705
2794
  user_agent: Sogou web spider/4.0(+http://www.sogou.com/docs/help/webmasters.htm
2706
2795
  bot:
2707
2796
  name: Sogou Spider
@@ -2710,7 +2799,7 @@
2710
2799
  producer:
2711
2800
  name: Sohu, Inc.
2712
2801
  url: http://www.sogou.com
2713
- -
2802
+ -
2714
2803
  user_agent: Sosospider+(+http://help.soso.com/webspider.htm)
2715
2804
  bot:
2716
2805
  name: Soso Spider
@@ -2719,13 +2808,13 @@
2719
2808
  producer:
2720
2809
  name: Tencent Holdings
2721
2810
  url: http://www.soso.com
2722
- -
2811
+ -
2723
2812
  user_agent: Mozilla/5.0 (Macintosh; Intel Mac OS X 10_11_6) AppleWebKit/537.36 (KHTML, like Gecko) Sparkler/0.2.0-SNAPSHOT
2724
2813
  bot:
2725
2814
  name: Sparkler
2726
2815
  category: Crawler
2727
2816
  url: https://github.com/USCDataScience/sparkler
2728
- -
2817
+ -
2729
2818
  user_agent: Mozilla/5.0 (X11; U; Linux x86_64; en-US; rv:1.9.0.19; aggregator:Spinn3r (Spinn3r 3.1); http://spinn3r.com/robot) Gecko/2010040121 Firefox/3.0.19
2730
2819
  bot:
2731
2820
  name: Spinn3r
@@ -2734,32 +2823,26 @@
2734
2823
  producer:
2735
2824
  name: Tailrank Inc
2736
2825
  url: http://spinn3r.com
2737
- -
2826
+ -
2738
2827
  user_agent: Spotify/1.0
2739
2828
  bot:
2740
2829
  name: Spotify
2741
2830
  producer:
2742
2831
  name: Spotify
2743
2832
  url: https://www.spotify.com
2744
- -
2833
+ -
2745
2834
  user_agent: Mozilla/5.0 (compatible; SputnikBot/2.2)
2746
2835
  bot:
2747
2836
  name: Sputnik Bot
2748
- category: ""
2837
+ category: "Crawler"
2749
2838
  url: ""
2750
- producer:
2751
- name: ""
2752
- url: ""
2753
- -
2839
+ -
2754
2840
  user_agent: Mozilla/5.0 (compatible; SputnikImageBot/2.2)
2755
2841
  bot:
2756
- name: Sputnik Bot
2757
- category: ""
2842
+ name: Sputnik Image Bot
2843
+ category: "Crawler"
2758
2844
  url: ""
2759
- producer:
2760
- name: ""
2761
- url: ""
2762
- -
2845
+ -
2763
2846
  user_agent: Mozilla/5.0 (Macintosh; Intel Mac OS X 10_8_5) AppleWebKit/536.30.1 (KHTML, like Gecko) (compatible; Startpagina-Linkchecker/1.0; +https://www.startpagina.nl/linkchecker)
2764
2847
  bot:
2765
2848
  name: Startpagina Linkchecker
@@ -2768,7 +2851,7 @@
2768
2851
  producer:
2769
2852
  name: Startpagina B.V.
2770
2853
  url: https://www.startpagina.nl/
2771
- -
2854
+ -
2772
2855
  user_agent: Mozilla/5.0 (Windows NT 6.2; WOW64) AppleWebKit/537.4 (KHTML, like Gecko) Chrome/98 Safari/537.4 (StatusCake)
2773
2856
  bot:
2774
2857
  name: StatusCake
@@ -2777,7 +2860,7 @@
2777
2860
  producer:
2778
2861
  name: StatusCake
2779
2862
  url: https://www.statuscake.com
2780
- -
2863
+ -
2781
2864
  user_agent: 'Superfeedr bot/2.0 http://superfeedr.com - Make your feeds realtime: get in touch!'
2782
2865
  bot:
2783
2866
  name: Superfeedr Bot
@@ -2786,7 +2869,7 @@
2786
2869
  producer:
2787
2870
  name: Superfeedr
2788
2871
  url: https://superfeedr.com/
2789
- -
2872
+ -
2790
2873
  user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1; en; rv:1.9.0.13) Gecko/2009073022 Firefox/3.5.2 (.NET CLR 3.5.30729) SurveyBot/2.3 (DomainTools)
2791
2874
  bot:
2792
2875
  name: Survey Bot
@@ -2795,7 +2878,7 @@
2795
2878
  producer:
2796
2879
  name: Domain Tools
2797
2880
  url: http://www.domaintools.com
2798
- -
2881
+ -
2799
2882
  user_agent: TLSProbe/1.0 (+https://scan.trustnet.venafi.com/)
2800
2883
  bot:
2801
2884
  name: TLSProbe
@@ -2804,23 +2887,23 @@
2804
2887
  producer:
2805
2888
  name: Venafi TrustNet
2806
2889
  url: https://www.venafi.com
2807
- -
2890
+ -
2808
2891
  user_agent: Tarmot Gezgin/1.0 (compatible; TarmotGezgin/1.1; +http://www.tarmot.com/gezgin)
2809
2892
  bot:
2810
2893
  name: Tarmot Gezgin
2811
2894
  url: http://www.tarmot.com/gezgin/
2812
2895
  category: Search bot
2813
- -
2896
+ -
2814
2897
  user_agent: TelegramBot (like TwitterBot)
2815
2898
  bot:
2816
2899
  name: TelegramBot
2817
2900
  url: https://telegram.org/blog/bot-revolution
2818
- -
2901
+ -
2819
2902
  user_agent: The Knowledge AI
2820
2903
  bot:
2821
2904
  name: The Knowledge AI
2822
2905
  category: Crawler
2823
- -
2906
+ -
2824
2907
  user_agent: TinEye-bot/0.02 (see http://www.tineye.com/crawler.html)
2825
2908
  bot:
2826
2909
  name: TinEye Crawler
@@ -2829,7 +2912,7 @@
2829
2912
  producer:
2830
2913
  name: Idée Inc.
2831
2914
  url: http://ideeinc.com
2832
- -
2915
+ -
2833
2916
  user_agent: Tiny Tiny RSS/1.10 (http://tt-rss.org/)
2834
2917
  bot:
2835
2918
  name: Tiny Tiny RSS
@@ -2838,7 +2921,7 @@
2838
2921
  producer:
2839
2922
  name: ""
2840
2923
  url: ""
2841
- -
2924
+ -
2842
2925
  user_agent: Tiny Tiny RSS/1.11.4c63934 (http://tt-rss.org/)
2843
2926
  bot:
2844
2927
  name: Tiny Tiny RSS
@@ -2847,7 +2930,7 @@
2847
2930
  producer:
2848
2931
  name: ""
2849
2932
  url: ""
2850
- -
2933
+ -
2851
2934
  user_agent: Mozilla/5.0 (compatible; tracemyfile/1.0)
2852
2935
  bot:
2853
2936
  name: TraceMyFile
@@ -2856,7 +2939,7 @@
2856
2939
  producer:
2857
2940
  name: Idee Inc.
2858
2941
  url: http://ideeinc.com/
2859
- -
2942
+ -
2860
2943
  user_agent: Mozilla/5.0 (Windows; U; Windows NT 6.0; en-GB; rv:1.0; trendictionbot0.5.0; trendiction search; http://www.trendiction.de/bot; please let us know of any problems; web at trendiction.com) Gecko/20071127 Firefox/3.0.0.11
2861
2944
  bot:
2862
2945
  name: Trendiction Bot
@@ -2865,7 +2948,7 @@
2865
2948
  producer:
2866
2949
  name: Talkwalker Inc.
2867
2950
  url: http://www.talkwalker.com
2868
- -
2951
+ -
2869
2952
  user_agent: TurnitinBot/3.0 (http://www.turnitin.com/robot/crawlerinfo.html)
2870
2953
  bot:
2871
2954
  name: TurnitinBot
@@ -2874,7 +2957,7 @@
2874
2957
  producer:
2875
2958
  name: iParadigms, LLC.
2876
2959
  url: http://www.turnitin.com
2877
- -
2960
+ -
2878
2961
  user_agent: Mozilla/5.0 (compatible; TweetedTimes Bot/1.0; +http://tweetedtimes.com)
2879
2962
  bot:
2880
2963
  name: TweetedTimes Bot
@@ -2883,7 +2966,7 @@
2883
2966
  producer:
2884
2967
  name: TweetedTimes
2885
2968
  url: http://tweetedtimes.com/
2886
- -
2969
+ -
2887
2970
  user_agent: TweetedTimes Bot/1.0 (Mozilla/5.0 Compatible, +http://tweetedtimes.com)
2888
2971
  bot:
2889
2972
  name: TweetedTimes Bot
@@ -2892,7 +2975,7 @@
2892
2975
  producer:
2893
2976
  name: TweetedTimes
2894
2977
  url: http://tweetedtimes.com/
2895
- -
2978
+ -
2896
2979
  user_agent: Mozilla/5.0 (compatible; TweetmemeBot/3.0; +http://tweetmeme.com/)
2897
2980
  bot:
2898
2981
  name: Tweetmeme Bot
@@ -2901,7 +2984,7 @@
2901
2984
  producer:
2902
2985
  name: Mediasift
2903
2986
  url: ""
2904
- -
2987
+ -
2905
2988
  user_agent: Mozilla/5.0 (compatible; Twingly Recon; twingly.com)
2906
2989
  bot:
2907
2990
  name: Twingly Recon
@@ -2909,7 +2992,7 @@
2909
2992
  producer:
2910
2993
  name: Twingly
2911
2994
  url: https://www.twingly.com
2912
- -
2995
+ -
2913
2996
  user_agent: Twitterbot/1.0
2914
2997
  bot:
2915
2998
  name: Twitterbot
@@ -2918,7 +3001,7 @@
2918
3001
  producer:
2919
3002
  name: Twitter
2920
3003
  url: http://www.twitter.com
2921
- -
3004
+ -
2922
3005
  user_agent: Mozilla/5.0 (compatible; URLAppendBot/1.0; +http://www.profound.net/urlappendbot.html)
2923
3006
  bot:
2924
3007
  name: URLAppendBot
@@ -2927,7 +3010,7 @@
2927
3010
  producer:
2928
3011
  name: Profound Networks
2929
3012
  url: http://www.profound.net
2930
- -
3013
+ -
2931
3014
  user_agent: 'Mozilla/5.0 (Windows NT 10.0) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/55.0.2883.87 Safari/537.36 (via secureurl.fwdcdn.com - mail.ukr.net proxy)'
2932
3015
  bot:
2933
3016
  name: UkrNet Mail Proxy
@@ -2936,7 +3019,7 @@
2936
3019
  producer:
2937
3020
  name: UkrNet Ltd
2938
3021
  url: https://www.ukr.net/
2939
- -
3022
+ -
2940
3023
  user_agent: UniversalFeedParser/5.2.1 +https://code.google.com/p/feedparser/
2941
3024
  bot:
2942
3025
  name: UniversalFeedParser
@@ -2945,7 +3028,7 @@
2945
3028
  producer:
2946
3029
  name: Kurt McKee
2947
3030
  url: https://github.com/kurtmckee
2948
- -
3031
+ -
2949
3032
  user_agent: Mozilla/5.0+(compatible; UptimeRobot/2.0; http://www.uptimerobot.com/)
2950
3033
  bot:
2951
3034
  name: Uptime Robot
@@ -2954,7 +3037,7 @@
2954
3037
  producer:
2955
3038
  name: Uptime Robot
2956
3039
  url: http://uptimerobot.com
2957
- -
3040
+ -
2958
3041
  user_agent: Mozilla/5.0 (compatible; Uptimebot/1.0; +http://www.uptime.com/uptimebot)
2959
3042
  bot:
2960
3043
  name: Uptimebot
@@ -2963,7 +3046,7 @@
2963
3046
  producer:
2964
3047
  name: Uptime
2965
3048
  url: https://uptime.com
2966
- -
3049
+ -
2967
3050
  user_agent: Mozilla/5.0 (compatible; vkShare; +http://vk.com/dev/Share)
2968
3051
  bot:
2969
3052
  name: VK Share Button
@@ -2972,7 +3055,7 @@
2972
3055
  producer:
2973
3056
  name: VK
2974
3057
  url: http://vk.com/
2975
- -
3058
+ -
2976
3059
  user_agent: 'Mozilla/4.0 (compatible; Vagabondo/4.0; http://webagent.wise-guys.nl/; http://www.wise-guys.nl/)'
2977
3060
  bot:
2978
3061
  name: Vagabondo
@@ -2981,7 +3064,19 @@
2981
3064
  producer:
2982
3065
  name: WiseGuys
2983
3066
  url: http://www.wise-guys.nl/
2984
- -
3067
+ -
3068
+ user_agent: Mozilla/5.0 (compatible; VelenPublicWebCrawler/1.0; +https://velen.io)
3069
+ bot:
3070
+ name: Velen Public Web Crawler
3071
+ category: Crawler
3072
+ url: https://hunter.io/robot
3073
+ -
3074
+ user_agent: Vercelbot (+https://vercel.com)
3075
+ bot:
3076
+ name: Vercel Bot
3077
+ category: Service bot
3078
+ url: https://vercel.com
3079
+ -
2985
3080
  user_agent: Mozilla/5.0 (compatible; VSMCrawler; http://www.visualsitemapper.com/crawler/)
2986
3081
  bot:
2987
3082
  name: Visual Site Mapper Crawler
@@ -2990,7 +3085,7 @@
2990
3085
  producer:
2991
3086
  name: Alentum Software Ltd.
2992
3087
  url: http://www.alentum.com
2993
- -
3088
+ -
2994
3089
  user_agent: 'Jigsaw/2.3.0 W3C_CSS_Validator_JFouffa/2.0 (See <http://validator.w3.org/services>)'
2995
3090
  bot:
2996
3091
  name: W3C CSS Validator
@@ -2999,7 +3094,7 @@
2999
3094
  producer:
3000
3095
  name: W3C
3001
3096
  url: http://www.w3.org
3002
- -
3097
+ -
3003
3098
  user_agent: W3C_I18n-Checker/1.0 (http://validator.w3.org/services)
3004
3099
  bot:
3005
3100
  name: W3C I18N Checker
@@ -3008,7 +3103,7 @@
3008
3103
  producer:
3009
3104
  name: W3C
3010
3105
  url: http://www.w3.org
3011
- -
3106
+ -
3012
3107
  user_agent: 'W3C-checklink/4.0 [4.4] libwww-perl/5.803'
3013
3108
  bot:
3014
3109
  name: W3C Link Checker
@@ -3017,7 +3112,7 @@
3017
3112
  producer:
3018
3113
  name: W3C
3019
3114
  url: http://www.w3.org
3020
- -
3115
+ -
3021
3116
  user_agent: W3C-checklink/4.81 libwww-perl/5.836
3022
3117
  bot:
3023
3118
  name: W3C Link Checker
@@ -3026,7 +3121,7 @@
3026
3121
  producer:
3027
3122
  name: W3C
3028
3123
  url: http://www.w3.org
3029
- -
3124
+ -
3030
3125
  user_agent: Validator.nu/LV http://validator.w3.org/services
3031
3126
  bot:
3032
3127
  name: W3C Markup Validation Service
@@ -3035,7 +3130,7 @@
3035
3130
  producer:
3036
3131
  name: W3C
3037
3132
  url: http://www.w3.org
3038
- -
3133
+ -
3039
3134
  user_agent: W3C_Validator/1.3 http://validator.w3.org/services
3040
3135
  bot:
3041
3136
  name: W3C Markup Validation Service
@@ -3044,7 +3139,7 @@
3044
3139
  producer:
3045
3140
  name: W3C
3046
3141
  url: http://www.w3.org
3047
- -
3142
+ -
3048
3143
  user_agent: W3C_Validator/1.767
3049
3144
  bot:
3050
3145
  name: W3C Markup Validation Service
@@ -3053,7 +3148,7 @@
3053
3148
  producer:
3054
3149
  name: W3C
3055
3150
  url: http://www.w3.org
3056
- -
3151
+ -
3057
3152
  user_agent: W3C-mobileOK/DDC-1.0 (see http://www.w3.org/2006/07/mobileok-ddc)
3058
3153
  bot:
3059
3154
  name: W3C MobileOK Checker
@@ -3062,7 +3157,7 @@
3062
3157
  producer:
3063
3158
  name: W3C
3064
3159
  url: http://www.w3.org
3065
- -
3160
+ -
3066
3161
  user_agent: W3C_Unicorn/1.0 (http://validator.w3.org/services)
3067
3162
  bot:
3068
3163
  name: W3C Unified Validator
@@ -3071,7 +3166,7 @@
3071
3166
  producer:
3072
3167
  name: W3C
3073
3168
  url: http://www.w3.org
3074
- -
3169
+ -
3075
3170
  user_agent: Mozilla/5.0 (compatible; Wappalyzer; +https://github.com/AliasIO/Wappalyzer)
3076
3171
  bot:
3077
3172
  name: Wappalyzer
@@ -3079,7 +3174,7 @@
3079
3174
  producer:
3080
3175
  name: AliasIO
3081
3176
  url: https://github.com/AliasIO
3082
- -
3177
+ -
3083
3178
  user_agent: WeSEE:Search/0.1 (Alpha, http://www.wesee.com/en/support/bot/)
3084
3179
  bot:
3085
3180
  name: WeSEE:Search
@@ -3088,13 +3183,13 @@
3088
3183
  producer:
3089
3184
  name: WeSEE Ltd
3090
3185
  url: http://www.wesee.com
3091
- -
3186
+ -
3092
3187
  user_agent: Mozilla/5.0 (Linux; Android 6.0.1; Moto G (4) Build/MPJ24.139-64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/65.0.3325.146 Mobile Safari/537.36 PTST/180829.190838
3093
3188
  bot:
3094
3189
  name: WebPageTest
3095
3190
  category: Site Monitor
3096
3191
  url: https://www.webpagetest.org
3097
- -
3192
+ -
3098
3193
  user_agent: websitepulse checker/1.1 (compatible; MSIE 5.5; Netscape 4.75; Linux)
3099
3194
  bot:
3100
3195
  name: WebSitePulse
@@ -3103,7 +3198,7 @@
3103
3198
  producer:
3104
3199
  name: WebSitePulse
3105
3200
  url: http://www.websitepulse.com/
3106
- -
3201
+ -
3107
3202
  user_agent: WebbCrawler 1.0 ( http://badcheese.com/crawler.html )
3108
3203
  bot:
3109
3204
  name: WebbCrawler
@@ -3112,7 +3207,7 @@
3112
3207
  producer:
3113
3208
  name: Steve Webb
3114
3209
  url: http://badcheese.com
3115
- -
3210
+ -
3116
3211
  user_agent: weborama-fetcher (+http://www.weborama.com)
3117
3212
  bot:
3118
3213
  name: Weborama
@@ -3121,7 +3216,7 @@
3121
3216
  producer:
3122
3217
  name: Weborama SA
3123
3218
  url: https://weborama.com/
3124
- -
3219
+ -
3125
3220
  user_agent: WikiDo/1.1 (http://wikido.com; crawler@wikido.com)
3126
3221
  bot:
3127
3222
  name: WikiDo
@@ -3130,7 +3225,7 @@
3130
3225
  producer:
3131
3226
  name: Fotolitografie Fiorentine di Becchi Antonio s.n.c.
3132
3227
  url: https://www.wikido.com/
3133
- -
3228
+ -
3134
3229
  user_agent: Mozilla/5.0 (compatible; woorankreview/2.0; +https://www.woorank.com/)
3135
3230
  bot:
3136
3231
  name: WooRank
@@ -3139,7 +3234,7 @@
3139
3234
  producer:
3140
3235
  name: WooRank sprl
3141
3236
  url: https://www.woorank.com/
3142
- -
3237
+ -
3143
3238
  user_agent: Mozilla/5.0 (iPhone; CPU iPhone OS 11_0 like Mac OS X) AppleWebKit/604.1.38 (KHTML, like Gecko) Version/11.0 Mobile/15A372 Safari/604.1 (compatible; woorankreview/2.0; +https://www.woorank.com/)
3144
3239
  bot:
3145
3240
  name: WooRank
@@ -3148,7 +3243,7 @@
3148
3243
  producer:
3149
3244
  name: WooRank sprl
3150
3245
  url: https://www.woorank.com/
3151
- -
3246
+ -
3152
3247
  user_agent: WordPress/4.7.2; https://example.com
3153
3248
  bot:
3154
3249
  name: WordPress
@@ -3157,7 +3252,7 @@
3157
3252
  producer:
3158
3253
  name: Wordpress.org
3159
3254
  url: https://wordpress.org/
3160
- -
3255
+ -
3161
3256
  user_agent: Wotbox/2.01 (+http://www.wotbox.com/bot/)
3162
3257
  bot:
3163
3258
  name: Wotbox
@@ -3166,7 +3261,7 @@
3166
3261
  producer:
3167
3262
  name: Wotbox
3168
3263
  url: http://www.wotbox.com
3169
- -
3264
+ -
3170
3265
  user_agent: XenForo/2.x (https://www.example.com)
3171
3266
  bot:
3172
3267
  name: XenForo
@@ -3175,7 +3270,7 @@
3175
3270
  producer:
3176
3271
  name: XenForo Ltd.
3177
3272
  url: https://xenforo.com/
3178
- -
3273
+ -
3179
3274
  user_agent: yacybot (freeworld/global; amd64 Linux 3.2.0-4-amd64; java 1.7.0_25; Europe/en) http://yacy.net/bot.html
3180
3275
  bot:
3181
3276
  name: YaCy
@@ -3184,7 +3279,7 @@
3184
3279
  producer:
3185
3280
  name: YaCy
3186
3281
  url: http://yacy.net
3187
- -
3282
+ -
3188
3283
  user_agent: yacybot (freeworld/global; x86 Windows XP 5.1; java 1.7.0_21; GMT+04:00/ru) http://yacy.net/bot.html
3189
3284
  bot:
3190
3285
  name: YaCy
@@ -3193,7 +3288,7 @@
3193
3288
  producer:
3194
3289
  name: YaCy
3195
3290
  url: http://yacy.net
3196
- -
3291
+ -
3197
3292
  user_agent: Mozilla/5.0 (compatible; Yahoo Ad monitoring; https://help.yahoo.com/kb/yahoo-ad-monitoring-SLN24857.html)
3198
3293
  bot:
3199
3294
  name: Yahoo Gemini
@@ -3202,7 +3297,7 @@
3202
3297
  producer:
3203
3298
  name: Yahoo! Inc.
3204
3299
  url: http://www.yahoo.com
3205
- -
3300
+ -
3206
3301
  user_agent: Y!J-BRW/1.0 (https://www.yahoo-help.jp/app/answers/detail/p/595/a_id/42716)
3207
3302
  bot:
3208
3303
  name: Yahoo! Japan BRW
@@ -3211,7 +3306,7 @@
3211
3306
  producer:
3212
3307
  name: Yahoo! Japan Corp.
3213
3308
  url: https://www.yahoo.co.jp/
3214
- -
3309
+ -
3215
3310
  user_agent: Mozilla/5.0 (compatible; Yahoo Link Preview; https://help.yahoo.com/kb/mail/yahoo-link-preview-SLN23615.html)
3216
3311
  bot:
3217
3312
  name: Yahoo! Link Preview
@@ -3220,7 +3315,7 @@
3220
3315
  producer:
3221
3316
  name: Yahoo! Inc.
3222
3317
  url: http://www.yahoo.com
3223
- -
3318
+ -
3224
3319
  user_agent: Yahoo:LinkExpander:Slingstone
3225
3320
  bot:
3226
3321
  name: Yahoo! Link Preview
@@ -3229,7 +3324,7 @@
3229
3324
  producer:
3230
3325
  name: Yahoo! Inc.
3231
3326
  url: http://www.yahoo.com
3232
- -
3327
+ -
3233
3328
  user_agent: Mozilla/5.0 (compatible; Yahoo! Slurp/3.0; http://help.yahoo.com/help/us/ysearch/slurp) NOT Firefox/3.5
3234
3329
  bot:
3235
3330
  name: Yahoo! Slurp
@@ -3238,7 +3333,7 @@
3238
3333
  producer:
3239
3334
  name: Yahoo! Inc.
3240
3335
  url: http://www.yahoo.com
3241
- -
3336
+ -
3242
3337
  user_agent: Mozilla/5.0 (compatible; Yahoo! Slurp; http://help.yahoo.com/help/us/ysearch/slurp)
3243
3338
  bot:
3244
3339
  name: Yahoo! Slurp
@@ -3247,7 +3342,7 @@
3247
3342
  producer:
3248
3343
  name: Yahoo! Inc.
3249
3344
  url: http://www.yahoo.com
3250
- -
3345
+ -
3251
3346
  user_agent: Mozilla/5.0 (compatible; Linux i686; Yandex.Gazeta Bot/1.0; +http://gazeta.yandex.ru)
3252
3347
  bot:
3253
3348
  name: Yandex Bot
@@ -3256,7 +3351,7 @@
3256
3351
  producer:
3257
3352
  name: Yandex LLC
3258
3353
  url: http://company.yandex.com
3259
- -
3354
+ -
3260
3355
  user_agent: Mozilla/5.0 (compatible; YaDirectFetcher/1.0; +http://yandex.com/bots)
3261
3356
  bot:
3262
3357
  name: Yandex Bot
@@ -3265,7 +3360,7 @@
3265
3360
  producer:
3266
3361
  name: Yandex LLC
3267
3362
  url: http://company.yandex.com
3268
- -
3363
+ -
3269
3364
  user_agent: Mozilla/5.0 (compatible; YandexAntivirus/2.0; +http://yandex.com/bots)
3270
3365
  bot:
3271
3366
  name: Yandex Bot
@@ -3274,7 +3369,7 @@
3274
3369
  producer:
3275
3370
  name: Yandex LLC
3276
3371
  url: http://company.yandex.com
3277
- -
3372
+ -
3278
3373
  user_agent: Mozilla/5.0 (compatible; YandexAntivirus/2.0; +http://yandex.com/bots)
3279
3374
  bot:
3280
3375
  name: Yandex Bot
@@ -3283,7 +3378,7 @@
3283
3378
  producer:
3284
3379
  name: Yandex LLC
3285
3380
  url: http://company.yandex.com
3286
- -
3381
+ -
3287
3382
  user_agent: Mozilla/5.0 (compatible; YandexBlogs/0.99; robot; B; +http://yandex.com/bots)
3288
3383
  bot:
3289
3384
  name: Yandex Bot
@@ -3292,7 +3387,7 @@
3292
3387
  producer:
3293
3388
  name: Yandex LLC
3294
3389
  url: http://company.yandex.com
3295
- -
3390
+ -
3296
3391
  user_agent: Mozilla/5.0 (compatible; YandexBlogs/0.99; robot; B; +http://yandex.com/bots)
3297
3392
  bot:
3298
3393
  name: Yandex Bot
@@ -3301,7 +3396,7 @@
3301
3396
  producer:
3302
3397
  name: Yandex LLC
3303
3398
  url: http://company.yandex.com
3304
- -
3399
+ -
3305
3400
  user_agent: Mozilla/5.0 (compatible; YandexBot/3.0; +http://yandex.com/bots)
3306
3401
  bot:
3307
3402
  name: Yandex Bot
@@ -3310,7 +3405,7 @@
3310
3405
  producer:
3311
3406
  name: Yandex LLC
3312
3407
  url: http://company.yandex.com
3313
- -
3408
+ -
3314
3409
  user_agent: Mozilla/5.0 (compatible; YandexDirect/3.0; +http://yandex.com/bots)
3315
3410
  bot:
3316
3411
  name: Yandex Bot
@@ -3319,7 +3414,7 @@
3319
3414
  producer:
3320
3415
  name: Yandex LLC
3321
3416
  url: http://company.yandex.com
3322
- -
3417
+ -
3323
3418
  user_agent: Mozilla/5.0 (compatible; YandexFavicons/1.0; +http://yandex.com/bots)
3324
3419
  bot:
3325
3420
  name: Yandex Bot
@@ -3328,7 +3423,7 @@
3328
3423
  producer:
3329
3424
  name: Yandex LLC
3330
3425
  url: http://company.yandex.com
3331
- -
3426
+ -
3332
3427
  user_agent: Mozilla/5.0 (compatible; YandexImageResizer/2.0; +http://yandex.com/bots)
3333
3428
  bot:
3334
3429
  name: Yandex Bot
@@ -3337,7 +3432,7 @@
3337
3432
  producer:
3338
3433
  name: Yandex LLC
3339
3434
  url: http://company.yandex.com
3340
- -
3435
+ -
3341
3436
  user_agent: Mozilla/5.0 (compatible; YandexImages/3.0; +http://yandex.com/bots)
3342
3437
  bot:
3343
3438
  name: Yandex Bot
@@ -3346,7 +3441,7 @@
3346
3441
  producer:
3347
3442
  name: Yandex LLC
3348
3443
  url: http://company.yandex.com
3349
- -
3444
+ -
3350
3445
  user_agent: Mozilla/5.0 (compatible; YandexMetrika/2.0; +http://yandex.com/bots)
3351
3446
  bot:
3352
3447
  name: Yandex Bot
@@ -3355,7 +3450,7 @@
3355
3450
  producer:
3356
3451
  name: Yandex LLC
3357
3452
  url: http://company.yandex.com
3358
- -
3453
+ -
3359
3454
  user_agent: Mozilla/5.0 (compatible; YandexMobileScreenShotBot/1.0; +http://yandex.com/bots)
3360
3455
  bot:
3361
3456
  name: Yandex Bot
@@ -3364,7 +3459,7 @@
3364
3459
  producer:
3365
3460
  name: Yandex LLC
3366
3461
  url: http://company.yandex.com
3367
- -
3462
+ -
3368
3463
  user_agent: Mozilla/5.0 (compatible; YandexNews/3.0; +http://yandex.com/bots)
3369
3464
  bot:
3370
3465
  name: Yandex Bot
@@ -3373,7 +3468,7 @@
3373
3468
  producer:
3374
3469
  name: Yandex LLC
3375
3470
  url: http://company.yandex.com
3376
- -
3471
+ -
3377
3472
  user_agent: Mozilla/5.0 (compatible; YandexNewslinks; +http://yandex.com/bots)
3378
3473
  bot:
3379
3474
  name: Yandex Bot
@@ -3382,7 +3477,7 @@
3382
3477
  producer:
3383
3478
  name: Yandex LLC
3384
3479
  url: http://company.yandex.com
3385
- -
3480
+ -
3386
3481
  user_agent: Mozilla/5.0 (compatible; YandexOntoDB/1.0; +http://yandex.com/bots)
3387
3482
  bot:
3388
3483
  name: Yandex Bot
@@ -3391,7 +3486,7 @@
3391
3486
  producer:
3392
3487
  name: Yandex LLC
3393
3488
  url: http://company.yandex.com
3394
- -
3489
+ -
3395
3490
  user_agent: Mozilla/5.0 (compatible; YandexOntoDBAPI/1.0; +http://yandex.com/bots)
3396
3491
  bot:
3397
3492
  name: Yandex Bot
@@ -3400,7 +3495,7 @@
3400
3495
  producer:
3401
3496
  name: Yandex LLC
3402
3497
  url: http://company.yandex.com
3403
- -
3498
+ -
3404
3499
  user_agent: Mozilla/5.0 (compatible; YandexPartner/3.0; +http://yandex.com/bots)
3405
3500
  bot:
3406
3501
  name: Yandex Bot
@@ -3409,7 +3504,7 @@
3409
3504
  producer:
3410
3505
  name: Yandex LLC
3411
3506
  url: http://company.yandex.com
3412
- -
3507
+ -
3413
3508
  user_agent: Mozilla/5.0 (compatible; YandexRCA/1.0; +http://yandex.com/bots)
3414
3509
  bot:
3415
3510
  name: Yandex Bot
@@ -3418,7 +3513,7 @@
3418
3513
  producer:
3419
3514
  name: Yandex LLC
3420
3515
  url: http://company.yandex.com
3421
- -
3516
+ -
3422
3517
  user_agent: Mozilla/5.0 (compatible; YandexSearchShop/1.0; +http://yandex.com/bots)
3423
3518
  bot:
3424
3519
  name: Yandex Bot
@@ -3427,7 +3522,7 @@
3427
3522
  producer:
3428
3523
  name: Yandex LLC
3429
3524
  url: http://company.yandex.com
3430
- -
3525
+ -
3431
3526
  user_agent: Mozilla/5.0 (compatible; YandexTracker/1.0; +http://yandex.com/bots)
3432
3527
  bot:
3433
3528
  name: Yandex Bot
@@ -3436,7 +3531,7 @@
3436
3531
  producer:
3437
3532
  name: Yandex LLC
3438
3533
  url: http://company.yandex.com
3439
- -
3534
+ -
3440
3535
  user_agent: Mozilla/5.0 (compatible; YandexTurbo/1.0; +http://yandex.com/bots)
3441
3536
  bot:
3442
3537
  name: Yandex Bot
@@ -3445,7 +3540,7 @@
3445
3540
  producer:
3446
3541
  name: Yandex LLC
3447
3542
  url: http://company.yandex.com
3448
- -
3543
+ -
3449
3544
  user_agent: Mozilla/5.0 (compatible; YandexVerticals/1.0; http://yandex.com/bots)
3450
3545
  bot:
3451
3546
  name: Yandex Bot
@@ -3454,7 +3549,7 @@
3454
3549
  producer:
3455
3550
  name: Yandex LLC
3456
3551
  url: http://company.yandex.com
3457
- -
3552
+ -
3458
3553
  user_agent: Mozilla/5.0 (compatible; NaverJapan/1.0; +http://corp.naver.jp/)
3459
3554
  bot:
3460
3555
  name: Yeti/Naverbot
@@ -3463,7 +3558,7 @@
3463
3558
  producer:
3464
3559
  name: Naver
3465
3560
  url: http://www.naver.com
3466
- -
3561
+ -
3467
3562
  user_agent: Yeti/1.1 (Naver Corp.; http://help.naver.com/robots/)
3468
3563
  bot:
3469
3564
  name: Yeti/Naverbot
@@ -3472,7 +3567,7 @@
3472
3567
  producer:
3473
3568
  name: Naver
3474
3569
  url: http://www.naver.com
3475
- -
3570
+ -
3476
3571
  user_agent: Mozilla/5.0 (compatible; YoudaoBot/1.0; http://www.youdao.com/help/webmaster/spider/; )
3477
3572
  bot:
3478
3573
  name: Youdao Bot
@@ -3481,13 +3576,13 @@
3481
3576
  producer:
3482
3577
  name: NetEase, Inc.
3483
3578
  url: http://corp.163.com
3484
- -
3579
+ -
3485
3580
  user_agent: YOURLS v1.5.1 +http://yourls.org/ (running on http://fhort.com)
3486
3581
  bot:
3487
3582
  name: Yourls
3488
3583
  category: Crawler
3489
3584
  url: http://yourls.org
3490
- -
3585
+ -
3491
3586
  user_agent: Mozilla/5.0 (compatible; YRSpider; +http://www.yunrang.com/yrspider.html)
3492
3587
  bot:
3493
3588
  name: Yunyun Bot
@@ -3496,7 +3591,7 @@
3496
3591
  producer:
3497
3592
  name: YunYun
3498
3593
  url: http://www.yunyun.com
3499
- -
3594
+ -
3500
3595
  user_agent: Mozilla/5.0 (compatible; YRSpider; +http://www.yunyun.com/SiteInfo.php?r=about)
3501
3596
  bot:
3502
3597
  name: Yunyun Bot
@@ -3505,7 +3600,7 @@
3505
3600
  producer:
3506
3601
  name: YunYun
3507
3602
  url: http://www.yunyun.com
3508
- -
3603
+ -
3509
3604
  user_agent: Mozilla/5.0 (compatible; YYSpider; +http://www.yunyun.com/spider.html)
3510
3605
  bot:
3511
3606
  name: Yunyun Bot
@@ -3514,21 +3609,21 @@
3514
3609
  producer:
3515
3610
  name: YunYun
3516
3611
  url: http://www.yunyun.com
3517
- -
3612
+ -
3518
3613
  user_agent: Zao/0.1 (http://www.kototol.org/zao)
3519
3614
  bot:
3520
3615
  name: Zao
3521
3616
  category: Crawler
3522
- -
3617
+ -
3523
3618
  user_agent: zelist.ro feed parser (+http://www.zelist.ro)
3524
3619
  bot:
3525
3620
  name: Ze List
3526
- category: Feed Fetcher
3527
3621
  url: https://www.zelist.ro/
3622
+ category: Feed Fetcher
3528
3623
  producer:
3529
3624
  name: Treeworks SRL
3530
3625
  url: https://www.tree.ro/
3531
- -
3626
+ -
3532
3627
  user_agent: Zookabot/2.5;++http://zookabot.com
3533
3628
  bot:
3534
3629
  name: Zookabot
@@ -3537,7 +3632,7 @@
3537
3632
  producer:
3538
3633
  name: Hwacha ApS
3539
3634
  url: http://hwacha.dk
3540
- -
3635
+ -
3541
3636
  user_agent: Mozilla/5.0 (compatible; ZumBot/1.0; http://help.zum.com/inquiry)
3542
3637
  bot:
3543
3638
  name: ZumBot
@@ -3546,7 +3641,7 @@
3546
3641
  producer:
3547
3642
  name: ZUM internet
3548
3643
  url: http://www.zuminternet.com/
3549
- -
3644
+ -
3550
3645
  user_agent: ZumBot/1.0 (ZUM Search; http://help.zum.com/inquiry)
3551
3646
  bot:
3552
3647
  name: ZumBot
@@ -3555,106 +3650,106 @@
3555
3650
  producer:
3556
3651
  name: ZUM internet
3557
3652
  url: http://www.zuminternet.com/
3558
- -
3653
+ -
3559
3654
  user_agent: AhrefsBot.Feeds v0.1; http://ahrefs.com/
3560
3655
  bot:
3561
3656
  name: aHrefs Bot
3562
3657
  category: Crawler
3563
- url: http://ahrefs.com/robot
3658
+ url: https://ahrefs.com/robot
3564
3659
  producer:
3565
3660
  name: Ahrefs Pte Ltd
3566
- url: http://ahrefs.com/robot
3567
- -
3661
+ url: https://ahrefs.com/robot
3662
+ -
3568
3663
  user_agent: Mozilla/5.0 (compatible; AhrefsBot/3.1; +http://ahrefs.com/robot/
3569
3664
  bot:
3570
3665
  name: aHrefs Bot
3571
3666
  category: Crawler
3572
- url: http://ahrefs.com/robot
3667
+ url: https://ahrefs.com/robot
3573
3668
  producer:
3574
3669
  name: Ahrefs Pte Ltd
3575
- url: http://ahrefs.com/robot
3576
- -
3670
+ url: https://ahrefs.com/robot
3671
+ -
3577
3672
  user_agent: Mozilla/5.0 (compatible; AhrefsBot/5.0; +http://ahrefs.com/robot/)
3578
3673
  bot:
3579
3674
  name: aHrefs Bot
3580
3675
  category: Crawler
3581
- url: http://ahrefs.com/robot
3676
+ url: https://ahrefs.com/robot
3582
3677
  producer:
3583
3678
  name: Ahrefs Pte Ltd
3584
- url: http://ahrefs.com/robot
3585
- -
3679
+ url: https://ahrefs.com/robot
3680
+ -
3586
3681
  user_agent: 'Mozilla/5.0 (compatible; AhrefsBot/5.0; +http://ahrefs.com/robot/) AppEngine-Google; (+http://code.google.com/appengine; appid: s~proxyfile1-hrd)'
3587
3682
  bot:
3588
3683
  name: aHrefs Bot
3589
3684
  category: Crawler
3590
- url: http://ahrefs.com/robot
3685
+ url: https://ahrefs.com/robot
3591
3686
  producer:
3592
3687
  name: Ahrefs Pte Ltd
3593
- url: http://ahrefs.com/robot
3594
- -
3688
+ url: https://ahrefs.com/robot
3689
+ -
3595
3690
  user_agent: Mozilla/5.0 (compatible; archive.org_bot +http://www.archive.org/details/archive.org_bot)
3596
3691
  bot:
3597
3692
  name: archive.org bot
3598
3693
  category: Crawler
3599
- url: http://www.archive.org/details/archive.org_bot
3694
+ url: https://archive.org/details/archive.org_bot
3600
3695
  producer:
3601
3696
  name: The Internet Archive
3602
- url: http://www.archive.org
3603
- -
3697
+ url: https://archive.org
3698
+ -
3604
3699
  user_agent: Mozilla/5.0 (compatible; archive.org_bot/3.3.0 +http://pandora.nla.gov.au/crawl.html)
3605
3700
  bot:
3606
3701
  name: archive.org bot
3607
3702
  category: Crawler
3608
- url: http://www.archive.org/details/archive.org_bot
3703
+ url: https://archive.org/details/archive.org_bot
3609
3704
  producer:
3610
3705
  name: The Internet Archive
3611
- url: http://www.archive.org
3612
- -
3706
+ url: https://archive.org
3707
+ -
3613
3708
  user_agent: Mozilla/5.0 (compatible; archive.org_bot; Archive-It; +http://archive-it.org/files/site-owners.html)
3614
3709
  bot:
3615
3710
  name: archive.org bot
3616
3711
  category: Crawler
3617
- url: http://www.archive.org/details/archive.org_bot
3712
+ url: https://archive.org/details/archive.org_bot
3618
3713
  producer:
3619
3714
  name: The Internet Archive
3620
- url: http://www.archive.org
3621
- -
3715
+ url: https://archive.org
3716
+ -
3622
3717
  user_agent: Mozilla/5.0 (compatible; archive.org_bot; Wayback Machine Live Record; +http://archive.org/details/archive.org_bot)
3623
3718
  bot:
3624
3719
  name: archive.org bot
3625
3720
  category: Crawler
3626
- url: http://www.archive.org/details/archive.org_bot
3721
+ url: https://archive.org/details/archive.org_bot
3627
3722
  producer:
3628
3723
  name: The Internet Archive
3629
- url: http://www.archive.org
3630
- -
3724
+ url: https://archive.org
3725
+ -
3631
3726
  user_agent: Mozilla/5.0 (compatible; heritrix/3.1.2-SNAPSHOT-20131029-0036 +http://archive.org/details/archive.org_bot)
3632
3727
  bot:
3633
3728
  name: archive.org bot
3634
3729
  category: Crawler
3635
- url: http://www.archive.org/details/archive.org_bot
3730
+ url: https://archive.org/details/archive.org_bot
3636
3731
  producer:
3637
3732
  name: The Internet Archive
3638
- url: http://www.archive.org
3639
- -
3733
+ url: https://archive.org
3734
+ -
3640
3735
  user_agent: Mozilla/5.0 (compatible; special_archiver/3.1.1 +http://www.archive.org/details/archive.org_bot)
3641
3736
  bot:
3642
3737
  name: archive.org bot
3643
3738
  category: Crawler
3644
- url: http://www.archive.org/details/archive.org_bot
3739
+ url: https://archive.org/details/archive.org_bot
3645
3740
  producer:
3646
3741
  name: The Internet Archive
3647
- url: http://www.archive.org
3648
- -
3742
+ url: https://archive.org
3743
+ -
3649
3744
  user_agent: Mozilla/5.0 (compatible; special_archiver/3.2.0 +http://www.loc.gov/webarchiving/notice_to_webmasters.html)
3650
3745
  bot:
3651
3746
  name: archive.org bot
3652
3747
  category: Crawler
3653
- url: http://www.archive.org/details/archive.org_bot
3748
+ url: https://archive.org/details/archive.org_bot
3654
3749
  producer:
3655
3750
  name: The Internet Archive
3656
- url: http://www.archive.org
3657
- -
3751
+ url: https://archive.org
3752
+ -
3658
3753
  user_agent: CCBot/2.0 (http://commoncrawl.org/faq/)
3659
3754
  bot:
3660
3755
  name: ccBot crawler
@@ -3663,7 +3758,7 @@
3663
3758
  producer:
3664
3759
  name: reddit inc.
3665
3760
  url: http://www.reddit.com
3666
- -
3761
+ -
3667
3762
  user_agent: Mozilla/5.0 eCairn-Grabber/1.0 (+http://ecairn.com/grabber)
3668
3763
  bot:
3669
3764
  name: eCairn-Grabber
@@ -3671,7 +3766,7 @@
3671
3766
  producer:
3672
3767
  name: eCairn
3673
3768
  url: https://ecairn.com
3674
- -
3769
+ -
3675
3770
  user_agent: eZ Publish Link Validator
3676
3771
  bot:
3677
3772
  name: eZ Publish Link Validator
@@ -3680,7 +3775,7 @@
3680
3775
  producer:
3681
3776
  name: eZ Systems AS
3682
3777
  url: https://ez.no/
3683
- -
3778
+ -
3684
3779
  user_agent: Mozilla/5.0 (compatible; evc-batch/2.0)
3685
3780
  bot:
3686
3781
  name: evc-batch
@@ -3689,13 +3784,13 @@
3689
3784
  producer:
3690
3785
  name: eVenture Capital Partners II, LLC
3691
3786
  url: http://www.eventures.vc/
3692
- -
3787
+ -
3693
3788
  user_agent: Mozilla/5.0 (compatible; inoreader.com; 2 subscribers)
3694
3789
  bot:
3695
3790
  name: inoreader
3696
3791
  category: Feed Reader
3697
3792
  url: https://www.inoreader.com
3698
- -
3793
+ -
3699
3794
  user_agent: masscan/1.0 (https://github.com/robertdavidgraham/masscan)
3700
3795
  bot:
3701
3796
  name: masscan
@@ -3704,21 +3799,21 @@
3704
3799
  producer:
3705
3800
  name: Robert Graham
3706
3801
  url: https://github.com/robertdavidgraham
3707
- -
3802
+ -
3708
3803
  user_agent: 'Mozilla/5.0/Firefox/42.0 - nbertaupete95(at)gmail.com'
3709
3804
  bot:
3710
3805
  name: nbertaupete95
3711
3806
  category: Crawler
3712
- -
3807
+ -
3713
3808
  user_agent: Mozilla/5.0 (compatible; oBot/2.3.1; http://www.xforce-security.com/crawler/)
3714
3809
  bot:
3715
3810
  name: oBot
3716
3811
  category: Search bot
3717
- url: http://www.xforce-security.com/crawler/
3812
+ url: https://www.xforce-security.com/crawler/
3718
3813
  producer:
3719
3814
  name: 'IBM Germany Research & Development GmbH'
3720
3815
  url: https://exchange.xforce.ibmcloud.com/
3721
- -
3816
+ -
3722
3817
  user_agent: 'sqlmap/1.1.8.2#dev (http://sqlmap.org)'
3723
3818
  bot:
3724
3819
  name: sqlmap
@@ -3727,87 +3822,613 @@
3727
3822
  producer:
3728
3823
  name: sqlmap
3729
3824
  url: http://sqlmap.org/
3730
- -
3825
+ -
3731
3826
  user_agent: Mozilla/5.0 (compatible; theoldreader.com; 1 subscribers; feed-id=aaa)
3732
3827
  bot:
3733
3828
  name: theoldreader
3734
3829
  category: Feed Reader
3735
3830
  url: https://theoldreader.com
3736
-
3737
3831
  -
3738
- user_agent: Seobility
3832
+ user_agent: Sprinklr 2.0
3739
3833
  bot:
3740
- name: Seobility
3834
+ name: Sprinklr
3741
3835
  category: Crawler
3742
- url: 'https://www.seobility.net/en/faq/?category=crawling#!aboutourbot'
3743
-
3836
+ url: ""
3837
+ producer:
3838
+ name: Sprinklr, Inc.
3839
+ url: https://www.sprinklr.com/
3744
3840
  -
3745
- user_agent: Vercelbot (+https://vercel.com)
3841
+ user_agent: Mozilla/5.0 (X11; Linux x86_64)AppleWebKit/537.36 (KHTML, like Gecko; Google-Ads-Qualify)Chrome/85.0.4183.140 Safari/537.36
3746
3842
  bot:
3747
- name: Vercel Bot
3748
- category: Service bot
3749
- url: https://vercel.com
3750
-
3843
+ name: Googlebot
3844
+ category: Search bot
3845
+ url: http://www.google.com/bot.html
3846
+ producer:
3847
+ name: Google Inc.
3848
+ url: http://www.google.com
3751
3849
  -
3752
- user_agent: Grammarly/1.0 (http://www.grammarly.com)
3850
+ user_agent: Mozilla/5.0 (Windows NT 10.0; Win64; x64; BDCbot/1.0; +http://bigweb.bigdatacorp.com.br/faq.aspx) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/69.0.3497.100 Safari/537.36
3753
3851
  bot:
3754
- name: Grammarly
3755
- category: Service bot
3756
- url: http://www.grammarly.com
3757
-
3852
+ name: BDCbot
3853
+ category: Crawler
3854
+ url: https://bigweb.bigdatacorp.com.br/pages/faq.aspx
3855
+ producer:
3856
+ name: BIG Data Solucoes Em Tecnologia de Informatica LTDA
3857
+ url: https://bigdatacorp.com.br/
3758
3858
  -
3759
- user_agent: Robozilla/1.0
3859
+ user_agent: Mozilla/5.0 (Macintosh; Intel Mac OS X 10_13_6) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/67.0.3396.99 Safari/537.36 CloudflareDiagnostics/1.0
3760
3860
  bot:
3761
- name: Robozilla
3861
+ name: Cloudflare Diagnostics
3862
+ category: Site Monitor
3863
+ url: https://www.cloudflare.com/
3864
+ producer:
3865
+ name: Cloudflare
3866
+ url: https://www.cloudflare.com
3867
+ -
3868
+ user_agent: Mozilla/5.0 (iPhone; CPU iPhone OS 12_0 like Mac OS X) adbeat.com/policy AppleWebKit/605.1.15 (KHTML, like Gecko) CriOS/69.0.3497.105 Mobile/15E148 Safari/605.1
3869
+ bot:
3870
+ name: Adbeat
3762
3871
  category: Crawler
3763
-
3872
+ url: https://www.adbeat.com/operation_policy
3873
+ producer:
3874
+ name: PPC Labs LLC
3875
+ url: https://www.adbeat.com/
3764
3876
  -
3765
- user_agent: Mozilla/5.0 (compatible; Domains Project/1.1.0; +https://domainsproject.org)
3877
+ user_agent: Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko; compatible; BW/1.1; bit.ly/2W6Px8S) Chrome/84.0.4147.105 Safari/537.36
3766
3878
  bot:
3767
- name: Domains Project
3879
+ name: BuiltWith
3768
3880
  category: Crawler
3769
- url: https://domainsproject.org
3770
-
3881
+ url: https://builtwith.com/biup
3882
+ producer:
3883
+ name: BuiltWith Pty Ltd
3884
+ url: https://builtwith.com/
3771
3885
  -
3772
- user_agent: Mozilla/5.0 (Linux; Android 7.0;) AppleWebKit/537.36 (KHTML, like Gecko) Mobile Safari/537.36 (compatible; PetalBot;+https://aspiegel.com/petalbot)
3886
+ user_agent: Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/60.0.3112.113 Safari/537.36 (+https://whatis.contentkingapp.com)
3773
3887
  bot:
3774
- name: Petal Bot
3888
+ name: ContentKing
3889
+ category: Site Monitor
3890
+ url: https://whatis.contentkingapp.com/
3891
+ producer:
3892
+ name: ContentKing BV
3893
+ url: https://www.contentkingapp.com/
3894
+ -
3895
+ user_agent: Mozilla/5.0 (Windows NT 6.1; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/84.0.4147.89 Safari/537.36 MicroAdBot/1.1 (https://www.microad.co.jp/contact/)
3896
+ bot:
3897
+ name: MicroAdBot
3775
3898
  category: Crawler
3776
- url: https://aspiegel.com/petalbot
3777
-
3899
+ url: https://www.microad.co.jp/
3900
+ producer:
3901
+ name: MicroAd, Inc.
3902
+ url: https://www.microad.co.jp/
3778
3903
  -
3779
- user_agent: SerendeputyBot/0.8.6 (http://serendeputy.com/about/serendeputy-bot)
3904
+ user_agent: Mozilla/5.0 (compatible; PingAdmin.Ru/1.2; +http://pingadmin.ru/free_test/)
3780
3905
  bot:
3781
- name: Serendeputy Bot
3906
+ name: PingAdmin.Ru
3907
+ category: Site Monitor
3908
+ url: https://ping-admin.ru/
3909
+ -
3910
+ user_agent: Mozilla/5.0 (compatible; WebDataStats/1.0 ; +https://webdatastats.com/policy.html)
3911
+ bot:
3912
+ name: WebDataStats
3782
3913
  category: Crawler
3783
- url: http://serendeputy.com/about/serendeputy-bot
3784
-
3914
+ url: https://webdatastats.com/policy.html
3915
+ producer:
3916
+ name: WebTehRazrabotka LLC
3917
+ url: https://webdatastats.com/
3785
3918
  -
3786
- user_agent: ias-va/3.1 (+https://www.admantx.com/service-fetcher.html)
3919
+ user_agent: Mozilla/5.0 (compatible; parse.ly scraper/0.14; +http://parsely.com)
3787
3920
  bot:
3788
- name: ADmantX Service Fetcher
3789
- category: Service bot
3790
- url: https://www.admantx.com/service-fetcher.html
3791
-
3921
+ name: parse.ly
3922
+ category: Crawler
3923
+ url: https://www.parse.ly/help/integration/crawler
3924
+ producer:
3925
+ name: Parsely, Inc.
3926
+ url: https://www.parse.ly/
3792
3927
  -
3793
- user_agent: Mozilla/5.0 (compatible) SemanticScholarBot (+https://www.semanticscholar.org/crawler)
3928
+ user_agent: Mozilla/5.0 (compatible; Nimbostratus-Bot/v1.3.2; http://cloudsystemnetworks.com)
3794
3929
  bot:
3795
- name: Semantic Scholar Bot
3930
+ name: Nimbostratus Bot
3931
+ category: Site Monitor
3932
+ url: http://cloudsystemnetworks.com
3933
+ -
3934
+ user_agent: Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.9.2.17) Gecko/20110515 HeartRails_Capture/1.0.4 (+http://capture.heartrails.com/) Namoroka/3.6.17
3935
+ bot:
3936
+ name: Heart Rails Capture
3937
+ category: Service Agent
3938
+ url: http://capture.heartrails.com
3939
+ -
3940
+ user_agent: Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/43.0.2357.134 Safari/537.36 http://notifyninja.com/monitoring
3941
+ bot:
3942
+ name: Notify Ninja
3943
+ category: Site Monitor
3944
+ url: http://notifyninja.com
3945
+ -
3946
+ user_agent: Mozilla/5.0 (Macintosh; Intel Mac OS X 10_14_6) Project-Resonance (http://project-resonance.com/) (KHTML, like Gecko) Chrome/83.0.4103.61 Safari/537.36
3947
+ bot:
3948
+ name: Project Resonance
3796
3949
  category: Crawler
3797
- url: https://www.semanticscholar.org/crawler
3798
-
3950
+ url: http://project-resonance.com
3799
3951
  -
3800
- user_agent: Mozilla/5.0 (compatible; VelenPublicWebCrawler/1.0; +https://velen.io)
3952
+ user_agent: Mozilla/5.0 (compatible; DataXu/1.0; +http://dataxu.com)
3801
3953
  bot:
3802
- name: Velen Public Web Crawler
3954
+ name: DataXu
3955
+ category: Service Agent
3956
+ url: https://advertising.roku.com/dataxu
3957
+ producer:
3958
+ name: Roku, Inc.
3959
+ url: https://roku.com
3960
+ -
3961
+ user_agent: Mozilla/5.0 (Unknown; Linux x86_64) AppleWebKit/534.34 (KHTML, like Gecko) PingdomTMS/0.8.5 Safari/534.34
3962
+ bot:
3963
+ name: Pingdom Bot
3964
+ category: Site Monitor
3965
+ url: ""
3966
+ producer:
3967
+ name: Pingdom AB
3968
+ url: https://www.pingdom.com
3969
+ -
3970
+ user_agent: Mozilla/5.0 (compatible; Cocolyzebot/1.0; https://cocolyze.com/bot)
3971
+ bot:
3972
+ name: Cocolyzebot
3803
3973
  category: Crawler
3804
- url: https://hunter.io/robot
3805
-
3974
+ url: https://cocolyze.com/en/cocolyzebot
3975
+ producer:
3976
+ name: VSI INNOVATION SAS
3977
+ url: https://vsi-innovation.com/
3806
3978
  -
3807
- user_agent: Barkrowler/0.9 (+http://www.exensa.com/crawl)
3979
+ user_agent: veryhip (http://veryhip.com/)
3808
3980
  bot:
3809
- name: Barkrowler
3981
+ name: VeryHip
3810
3982
  category: Crawler
3811
- url: http://www.exensa.com/crawl
3812
-
3813
-
3983
+ url: https://veryhip.com/
3984
+ producer:
3985
+ name: VeryHip
3986
+ url: https://veryhip.com/
3987
+ -
3988
+ user_agent: Mozilla/5.0 (compatible; LinkpadBot/2.3; +http://linkpad.org/robot/)
3989
+ bot:
3990
+ name: LinkpadBot
3991
+ category: Crawler
3992
+ url: https://www.linkpad.org/
3993
+ producer:
3994
+ name: Solomono LLC
3995
+ url: https://www.linkpad.org/
3996
+ -
3997
+ user_agent: Mozilla/4.0 (compatible; MuscatFerret/1.7; http://www.webtop.com/)
3998
+ bot:
3999
+ name: MuscatFerret
4000
+ category: Crawler
4001
+ url: http://www.webtop.com/
4002
+ -
4003
+ user_agent: Quora-Bot/1.0 (http://www.quora.com)
4004
+ bot:
4005
+ name: Quora Bot
4006
+ category: Crawler
4007
+ url: ""
4008
+ producer:
4009
+ name: Quora
4010
+ url: https://www.quora.com/
4011
+ -
4012
+ user_agent: PageThing.com
4013
+ bot:
4014
+ name: PageThing
4015
+ category: Crawler
4016
+ url: https://www.pagething.com/
4017
+ producer:
4018
+ name: SPECIALNOISE LTD
4019
+ url: https://www.specialnoise.com/
4020
+ -
4021
+ user_agent: ArchiveBox/0.5.3 (+https://github.com/ArchiveBox/ArchiveBox/)
4022
+ bot:
4023
+ name: ArchiveBox
4024
+ url: https://archivebox.io/
4025
+ category: Crawler
4026
+ producer:
4027
+ name: ""
4028
+ url: ""
4029
+ -
4030
+ user_agent: Choosito/1.0 +http://www.choosito.com/
4031
+ bot:
4032
+ name: Choosito
4033
+ url: https://www.choosito.com/
4034
+ category: Crawler
4035
+ producer:
4036
+ name: Choosito! Inc.
4037
+ url: https://www.choosito.com/
4038
+ -
4039
+ user_agent: datagnionbot (+http://www.datagnion.com/bot.html)
4040
+ bot:
4041
+ name: datagnionbot
4042
+ url: https://www.datagnion.com/bot.html
4043
+ category: Crawler
4044
+ producer:
4045
+ name: DATAGNION GMBH
4046
+ url: https://www.datagnion.com/
4047
+ -
4048
+ user_agent: InterNaetBoten/0.99 (http://www.xn--internt-bxa.nu)
4049
+ bot:
4050
+ name: Generic Bot
4051
+ -
4052
+ user_agent: EasyBib AutoCite (http://autocite-info.citation-api.com/)
4053
+ bot:
4054
+ name: Generic Bot
4055
+ -
4056
+ user_agent: Bidtellect/0.0.643.0
4057
+ bot:
4058
+ name: Generic Bot
4059
+ -
4060
+ user_agent: Mozilla/5.0 (compatible; meg/0.2; +https://github.com/tomnomnom/meg)
4061
+ bot:
4062
+ name: Generic Bot
4063
+ -
4064
+ user_agent: Mozilla/5.0 (X11; Ubuntu; Linux x86_64; rv:66.0) WhatCMS/1.0
4065
+ bot:
4066
+ name: WhatCMS
4067
+ url: https://whatcms.org/
4068
+ category: Crawler
4069
+ producer:
4070
+ name: "Nineteen Ten LLC"
4071
+ url: "https://whatcms.org/"
4072
+ -
4073
+ user_agent: httpx - Open-source project (github.com/projectdiscovery/httpx)
4074
+ bot:
4075
+ name: httpx
4076
+ url: https://github.com/projectdiscovery/httpx
4077
+ category: Crawler
4078
+ producer:
4079
+ name: ""
4080
+ url: ""
4081
+ -
4082
+ user_agent: 'Expanse indexes the network perimeters of our customers. If you have any questions or concerns, please reach out to: scaninfo@expanseinc.com'
4083
+ bot:
4084
+ name: Expanse
4085
+ category: Security Checker
4086
+ url: https://expanse.co/
4087
+ producer:
4088
+ name: Expanse Inc.
4089
+ url: https://expanse.co/
4090
+ -
4091
+ user_agent: 'HuaweiWebCatBot/6.0) (To acquire the allowed html pages as reliable information of URL categorization in the automatic process for Huawei Web Categorization.; https://isecurity.huawei.com/; sec at huawei dot com)'
4092
+ bot:
4093
+ name: HuaweiWebCatBot
4094
+ category: Crawler
4095
+ url: https://isecurity.huawei.com
4096
+ producer:
4097
+ name: Huawei Technologies Co., Ltd.
4098
+ url: https://huawei.com
4099
+ -
4100
+ user_agent: Mozilla/5.0 (compatible; SputnikFaviconBot/1.2; +http://corp.sputnik.ru/webmaster)
4101
+ bot:
4102
+ name: Sputnik Favicon Bot
4103
+ url: ""
4104
+ category: Crawler
4105
+ -
4106
+ user_agent: Hatena-Favicon2 (http://www.hatena.ne.jp/faq/)
4107
+ bot:
4108
+ name: Hatena Favicon
4109
+ category: Crawler
4110
+ url: https://www.hatena.ne.jp/faq/
4111
+ producer:
4112
+ name: Hatena Co., Ltd.
4113
+ url: https://www.hatena.ne.jp
4114
+ -
4115
+ user_agent: Mozilla/5.0 (compatible; RyowlEngine/1.0; +https://ryowl.org)
4116
+ bot:
4117
+ name: Ryowl
4118
+ category: Crawler
4119
+ url: https://ryowl.org
4120
+ -
4121
+ user_agent: Mozilla/5.0 (compatible; OdklBot/1.0 like Linux; klass@odnoklassniki.ru)
4122
+ bot:
4123
+ name: Odnoklassniki Bot
4124
+ category: Crawler
4125
+ url: https://odnoklassniki.ru
4126
+ -
4127
+ user_agent: Mediatoolkitbot (complaints@mediatoolkit.com)
4128
+ bot:
4129
+ name: Mediatoolkit Bot
4130
+ category: Crawler
4131
+ url: https://mediatoolkit.com
4132
+ -
4133
+ user_agent: ZoominfoBot (zoominfobot at zoominfo dot com)
4134
+ bot:
4135
+ name: ZoominfoBot
4136
+ category: Crawler
4137
+ url: https://www.zoominfo.com
4138
+ -
4139
+ user_agent: Mozilla/5.0 (compatible; WeViKaBot/1.0; +http://www.wevika.de/)
4140
+ bot:
4141
+ name: WeViKaBot
4142
+ category: Crawler
4143
+ url: http://www.wevika.de
4144
+ -
4145
+ user_agent: Mozilla/5.0 (compatible; SEOkicks; +https://www.seokicks.de/robot.html)
4146
+ bot:
4147
+ name: SEOkicks
4148
+ category: Crawler
4149
+ url: https://www.seokicks.de/robot.html
4150
+ -
4151
+ user_agent: Mozilla/5.0 (compatible; Plukkie/1.6; http://www.botje.com/plukkie.htm)
4152
+ bot:
4153
+ name: Plukkie
4154
+ category: Crawler
4155
+ url: http://www.botje.com/plukkie.htm
4156
+ -
4157
+ user_agent: Mozilla/5.0 (compatible; proximic; https://www.comscore.com/Web-Crawler)
4158
+ bot:
4159
+ name: Comscore
4160
+ category: Crawler
4161
+ url: https://www.comscore.com/Web-Crawler
4162
+ -
4163
+ user_agent: Mozilla/5.0 (compatible; SurdotlyBot/1.0; +http://sur.ly/bot.html)
4164
+ bot:
4165
+ name: SurdotlyBot
4166
+ category: Crawler
4167
+ url: http://sur.ly/bot.html
4168
+ -
4169
+ user_agent: Mozilla/5.0 (compatible; Gowikibot/1.0; +http://www.gowikibot.com)
4170
+ bot:
4171
+ name: Gowikibot
4172
+ category: Crawler
4173
+ url: http:/www.gowikibot.com
4174
+ -
4175
+ user_agent: Mozilla/5.0 (compatible; SabsimBot/3.0; +https://sabsim.com)
4176
+ bot:
4177
+ name: SabsimBot
4178
+ category: Crawler
4179
+ url: https://sabsim.com
4180
+ -
4181
+ user_agent: Mozilla/5.0 (compatible; LumtelBot/1.0; +http://lumtel.com)
4182
+ bot:
4183
+ name: LumtelBot
4184
+ category: Crawler
4185
+ url: https://umtel.com
4186
+ -
4187
+ user_agent: Mozilla/5.0+(compatible;+PiplBot;+http://www.pipl.com/bot/)
4188
+ bot:
4189
+ name: PiplBot
4190
+ category: Crawler
4191
+ url: http://www.pipl.com/bot
4192
+ -
4193
+ user_agent: Mozilla/5.0 (compatible; woobot/2.0; +https://www.woorank.com/bot)
4194
+ bot:
4195
+ name: WooRank
4196
+ category: Crawler
4197
+ url: https://www.woorank.com/bot
4198
+ -
4199
+ user_agent: YahooMailProxy; https://help.yahoo.com/kb/yahoo-mail-proxy-SLN28749.html
4200
+ bot:
4201
+ name: Yahoo! Mail Proxy
4202
+ category: Service Agent
4203
+ url: https://help.yahoo.com/kb/yahoo-mail-proxy-SLN28749.html
4204
+ producer:
4205
+ name: Yahoo! Inc.
4206
+ url: http://www.yahoo.com
4207
+ -
4208
+ user_agent: 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko; compatible; Cookiebot/1.0; http://cookiebot.com/) Chrome/79.0.3945.117 Safari/537.36'
4209
+ bot:
4210
+ name: Cookiebot
4211
+ category: Crawler
4212
+ url: https://support.cookiebot.com/hc/en-us/articles/360014264140-Scanner-User-Agent
4213
+ producer:
4214
+ name: Cybot A/S
4215
+ url: https://www.cybot.com/
4216
+ -
4217
+ user_agent: NetSystemsResearch studies the availability of various services across the internet. Our website is netsystemsresearch.com
4218
+ bot:
4219
+ name: NetSystemsResearch
4220
+ category: Security Checker
4221
+ url: https://www.netsystemsresearch.com/
4222
+ producer:
4223
+ name: NET SYSTEMS RESEARCH LLC
4224
+ url: https://www.netsystemsresearch.com/
4225
+ -
4226
+ user_agent: 'Mozilla/5.0 (compatible; CensysInspect/1.1; https://about.censys.io/)'
4227
+ bot:
4228
+ name: CensysInspect
4229
+ category: Security Checker
4230
+ url: https://about.censys.io/
4231
+ producer:
4232
+ name: Censys, Inc.
4233
+ url: https://censys.io/
4234
+ -
4235
+ user_agent: https://gdnplus.com:Gather Analyze Provide.
4236
+ bot:
4237
+ name: GDNP
4238
+ category: Crawler
4239
+ url: https://gdnplus.com/
4240
+ producer:
4241
+ name: Global Digital Network Plus, LLC
4242
+ url: https://gdnplus.com/
4243
+ -
4244
+ user_agent: WellKnownBot/0.1 (https://well-known.dev)
4245
+ bot:
4246
+ name: WellKnownBot
4247
+ category: Crawler
4248
+ url: https://well-known.dev
4249
+ -
4250
+ user_agent: Mozilla/5.0 (compatible; Adsbot/3.1; https://seostar.co/robot/)
4251
+ bot:
4252
+ name: Adsbot
4253
+ category: Crawler
4254
+ url: https://seostar.co/robot/
4255
+ -
4256
+ user_agent: MTRobot/0.2 (Metrics Tools Analytics Crawler; https://metrics-tools.de/robot.html; crawler@metrics-tools.de)
4257
+ bot:
4258
+ name: MTRobot
4259
+ category: Crawler
4260
+ url: https://metrics-tools.de/robot.html
4261
+ producer:
4262
+ name: Metrics Tools
4263
+ url: https://metrics-tools.de/
4264
+ -
4265
+ user_agent: My User Agent 1.0
4266
+ bot:
4267
+ name: Generic Bot
4268
+ -
4269
+ user_agent: serpstatbot/1.0 (advanced backlink tracking bot; curl/7.58.0; http://serpstatbot.com/; abuse@serpstatbot.com)
4270
+ bot:
4271
+ name: serpstatbot
4272
+ category: Crawler
4273
+ url: http://serpstatbot.com/
4274
+ producer:
4275
+ name: Netpeak Ltd
4276
+ url: https://netpeak.net/
4277
+ -
4278
+ user_agent: colly - https://github.com/gocolly/colly/v2
4279
+ bot:
4280
+ name: colly
4281
+ category: Crawler
4282
+ url: https://github.com/gocolly/colly/
4283
+ -
4284
+ user_agent: l9tcpid/v1.0.0
4285
+ bot:
4286
+ name: l9tcpid
4287
+ category: Security Checker
4288
+ url: https://github.com/LeakIX/l9tcpid
4289
+ -
4290
+ user_agent: Mozilla/5.0 (compatible; MegaIndex.ru/2.0; +http://megaindex.com/crawler)
4291
+ bot:
4292
+ name: MegaIndex
4293
+ category: Crawler
4294
+ url: https://megaindex.com/crawler
4295
+ -
4296
+ user_agent: Mozilla/5.0 (compatible; Seekport Crawler; http://seekport.com/)
4297
+ bot:
4298
+ name: Seekport
4299
+ category: Crawler
4300
+ url: http://www.seekport.com/
4301
+ producer:
4302
+ name: SISTRIX GmbH
4303
+ url: https://www.sistrix.de/
4304
+ -
4305
+ user_agent: Mozilla/5.0 (compatible; seolyt/1.1; +https://seolyt.com)
4306
+ bot:
4307
+ name: seolyt
4308
+ category: Crawler
4309
+ url: https://seolyt.com/
4310
+ -
4311
+ user_agent: Mozilla/5.0 (compatible; YaK/1.0; http://linkfluence.com/; bot@linkfluence.com)
4312
+ bot:
4313
+ name: YaK
4314
+ category: Crawler
4315
+ url: https://www.linkfluence.com/
4316
+ producer:
4317
+ name: Linkfluence SAS
4318
+ url: https://www.linkfluence.com/
4319
+ -
4320
+ user_agent: Mozilla/5.0 (Windows NT 6.1; Win64; x64; +http://www.komodia.com/newwiki/index.php/URL_server_crawler) KomodiaBot/1.0
4321
+ bot:
4322
+ name: KomodiaBot
4323
+ category: Crawler
4324
+ url: http://www.komodia.com/newwiki/index.php/URL_server_crawler
4325
+ producer:
4326
+ name: Komodia Inc.
4327
+ url: https://www.komodia.com/
4328
+ -
4329
+ user_agent: Mozilla/5.0 (Windows NT 6.3; WOW64; Trident/7.0; rv:11.0; Catchpoint) like Gecko
4330
+ bot:
4331
+ name: Catchpoint
4332
+ category: Site Monitor
4333
+ url: https://www.catchpoint.com/
4334
+ producer:
4335
+ name: Catchpoint Systems
4336
+ url: https://www.catchpoint.com/
4337
+ -
4338
+ user_agent: Better Uptime Bot Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/74.0.3729.169 Safari/537.36
4339
+ bot:
4340
+ name: Better Uptime Bot
4341
+ category: Site Monitor
4342
+ url: https://betteruptime.com/faq
4343
+ producer:
4344
+ name: Better Uptime
4345
+ url: https://betteruptime.com/
4346
+ -
4347
+ user_agent: gobuster/3.1.0
4348
+ bot:
4349
+ name: Gobuster
4350
+ url: https://github.com/OJ/gobuster
4351
+ -
4352
+ user_agent: k6/0.31.1 (https://k6.io/)
4353
+ bot:
4354
+ name: K6
4355
+ url: https://k6.io/
4356
+ -
4357
+ user_agent: Mozilla/5.0 (compatible; Neevabot/1.0; https://neeva.com/neevabot)
4358
+ bot:
4359
+ name: Neevabot
4360
+ category: Search bot
4361
+ url: https://neeva.com/neevabot
4362
+ producer:
4363
+ name: Neeva Inc.
4364
+ url: https://neeva.com/
4365
+ -
4366
+ user_agent: LinkPreview/1.5 (http://linkpreview.net)
4367
+ bot:
4368
+ name: LinkPreview
4369
+ category: Service Agent
4370
+ url: https://www.linkpreview.net/
4371
+ -
4372
+ user_agent: Mozilla/5.0 (compatible; JungleKeyThumbnail/1.1; +http://www.junglekey.fr/)
4373
+ bot:
4374
+ name: JungleKeyThumbnail
4375
+ category: Crawler
4376
+ url: https://junglekey.com/
4377
+ -
4378
+ user_agent: rocketmonitor 1.0
4379
+ bot:
4380
+ name: RocketMonitorBot
4381
+ category: Site Monitor
4382
+ url: https://www.radiomast.io/docs/stream-monitoring/technical_details.html
4383
+ producer:
4384
+ name: Radio Mast, Inc.
4385
+ url: https://www.radiomast.io/
4386
+ -
4387
+ user_agent: RocketMonitorBot/1.0 ( https://www.radiomast.io)
4388
+ bot:
4389
+ name: RocketMonitorBot
4390
+ category: Site Monitor
4391
+ url: https://www.radiomast.io/docs/stream-monitoring/technical_details.html
4392
+ producer:
4393
+ name: Radio Mast, Inc.
4394
+ url: https://www.radiomast.io/
4395
+ -
4396
+ user_agent: SitemapParser-VIPnytt/1.1 ( https://github.com/VIPnytt/SitemapParser/blob/master/README.md)
4397
+ bot:
4398
+ name: SitemapParser-VIPnytt
4399
+ category: Crawler
4400
+ url: https://github.com/VIPnytt/SitemapParser/
4401
+ -
4402
+ user_agent: Turnitin (https://bit.ly/2UvnfoQ)
4403
+ bot:
4404
+ name: Turnitin
4405
+ category: Crawler
4406
+ url: https://turnitin.com/robot/crawlerinfo.html
4407
+ -
4408
+ user_agent: Mozilla/5.0 (Linux; Android 8.0; Pixel 2 Build/OPD3.170816.012; Storebot-Google/1.0) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/81.0.4044.138 Mobile Safari/537.36
4409
+ bot:
4410
+ name: Google StoreBot
4411
+ category: Crawler
4412
+ -
4413
+ user_agent: Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/77.0.3865.56 Safari/537.36 DMBrowser/2.1 (UV)
4414
+ bot:
4415
+ name: Dotcom Monitor
4416
+ category: Site Monitor
4417
+ url: https://www.dotcom-monitor.com
4418
+ -
4419
+ user_agent: Mozilla/5.0 (Windows NT 6.2; WOW64; rv:29.0) Gecko/20100101 /29.0 DMBrowser-BV
4420
+ bot:
4421
+ name: Dotcom Monitor
4422
+ category: Site Monitor
4423
+ url: https://www.dotcom-monitor.com
4424
+ -
4425
+ user_agent: Mozilla/5.0 (compatible; ThinkChaos/0.3.0; +In_the_test_phase,_if_the_ThinkChaos_brings_you_trouble,_please_add_disallow_to_the_robots.txt._Thank_you.)
4426
+ bot:
4427
+ name: ThinkChaos
4428
+ category: Crawler
4429
+ -
4430
+ user_agent: Mozilla/5.0 (compatible; DataForSeoBot/1.0; +https://dataforseo.com/dataforseo-bot)
4431
+ bot:
4432
+ name: DataForSeoBot
4433
+ category: Crawler
4434
+ url: https://dataforseo.com/dataforseo-bot