device_detector 1.0.3 → 1.0.7

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (94) hide show
  1. checksums.yaml +5 -5
  2. data/CHANGELOG.md +15 -0
  3. data/README.md +8 -7
  4. data/lib/device_detector/bot.rb +2 -2
  5. data/lib/device_detector/browser.rb +364 -0
  6. data/lib/device_detector/client.rb +11 -2
  7. data/lib/device_detector/device.rb +1247 -22
  8. data/lib/device_detector/memory_cache.rb +5 -5
  9. data/lib/device_detector/metadata_extractor.rb +7 -8
  10. data/lib/device_detector/model_extractor.rb +3 -3
  11. data/lib/device_detector/name_extractor.rb +2 -2
  12. data/lib/device_detector/os.rb +150 -116
  13. data/lib/device_detector/parser.rb +23 -10
  14. data/lib/device_detector/version.rb +1 -1
  15. data/lib/device_detector/version_extractor.rb +29 -2
  16. data/lib/device_detector.rb +73 -40
  17. data/regexes/bots.yml +868 -62
  18. data/regexes/client/browser_engine.yml +11 -2
  19. data/regexes/client/browsers.yml +1132 -112
  20. data/regexes/client/feed_readers.yml +5 -11
  21. data/regexes/client/libraries.yml +86 -2
  22. data/regexes/client/mediaplayers.yml +39 -3
  23. data/regexes/client/mobile_apps.yml +940 -66
  24. data/regexes/client/pim.yml +66 -3
  25. data/regexes/device/cameras.yml +6 -6
  26. data/regexes/device/car_browsers.yml +23 -3
  27. data/regexes/device/consoles.yml +15 -3
  28. data/regexes/device/mobiles.yml +18351 -3566
  29. data/regexes/device/notebooks.yml +114 -0
  30. data/regexes/device/portable_media_player.yml +36 -9
  31. data/regexes/device/shell_tv.yml +117 -0
  32. data/regexes/device/televisions.yml +440 -35
  33. data/regexes/oss.yml +635 -284
  34. data/regexes/vendorfragments.yml +5 -1
  35. metadata +21 -118
  36. data/.gitignore +0 -14
  37. data/.travis.yml +0 -14
  38. data/Gemfile +0 -8
  39. data/Rakefile +0 -96
  40. data/device_detector.gemspec +0 -26
  41. data/spec/device_detector/bot_fixtures_spec.rb +0 -30
  42. data/spec/device_detector/client_fixtures_spec.rb +0 -31
  43. data/spec/device_detector/concrete_user_agent_spec.rb +0 -135
  44. data/spec/device_detector/detector_fixtures_spec.rb +0 -100
  45. data/spec/device_detector/device_fixtures_spec.rb +0 -36
  46. data/spec/device_detector/device_spec.rb +0 -151
  47. data/spec/device_detector/memory_cache_spec.rb +0 -148
  48. data/spec/device_detector/model_extractor_spec.rb +0 -63
  49. data/spec/device_detector/os_fixtures_spec.rb +0 -26
  50. data/spec/device_detector/version_extractor_spec.rb +0 -79
  51. data/spec/device_detector_spec.rb +0 -189
  52. data/spec/fixtures/client/browser.yml +0 -2206
  53. data/spec/fixtures/client/feed_reader.yml +0 -199
  54. data/spec/fixtures/client/library.yml +0 -175
  55. data/spec/fixtures/client/mediaplayer.yml +0 -163
  56. data/spec/fixtures/client/mobile_app.yml +0 -193
  57. data/spec/fixtures/client/pim.yml +0 -115
  58. data/spec/fixtures/detector/bots.yml +0 -3260
  59. data/spec/fixtures/detector/camera.yml +0 -121
  60. data/spec/fixtures/detector/car_browser.yml +0 -21
  61. data/spec/fixtures/detector/console.yml +0 -281
  62. data/spec/fixtures/detector/desktop.yml +0 -5361
  63. data/spec/fixtures/detector/feature_phone.yml +0 -891
  64. data/spec/fixtures/detector/feed_reader.yml +0 -551
  65. data/spec/fixtures/detector/mediaplayer.yml +0 -210
  66. data/spec/fixtures/detector/mobile_apps.yml +0 -456
  67. data/spec/fixtures/detector/phablet.yml +0 -3785
  68. data/spec/fixtures/detector/portable_media_player.yml +0 -178
  69. data/spec/fixtures/detector/smart_display.yml +0 -61
  70. data/spec/fixtures/detector/smartphone-1.yml +0 -9953
  71. data/spec/fixtures/detector/smartphone-10.yml +0 -9924
  72. data/spec/fixtures/detector/smartphone-11.yml +0 -9889
  73. data/spec/fixtures/detector/smartphone-12.yml +0 -8655
  74. data/spec/fixtures/detector/smartphone-2.yml +0 -9967
  75. data/spec/fixtures/detector/smartphone-3.yml +0 -9887
  76. data/spec/fixtures/detector/smartphone-4.yml +0 -9911
  77. data/spec/fixtures/detector/smartphone-5.yml +0 -9933
  78. data/spec/fixtures/detector/smartphone-6.yml +0 -9923
  79. data/spec/fixtures/detector/smartphone-7.yml +0 -9892
  80. data/spec/fixtures/detector/smartphone-8.yml +0 -9896
  81. data/spec/fixtures/detector/smartphone-9.yml +0 -9928
  82. data/spec/fixtures/detector/smartphone.yml +0 -9984
  83. data/spec/fixtures/detector/tablet-1.yml +0 -10023
  84. data/spec/fixtures/detector/tablet-2.yml +0 -9968
  85. data/spec/fixtures/detector/tablet-3.yml +0 -7787
  86. data/spec/fixtures/detector/tablet.yml +0 -9951
  87. data/spec/fixtures/detector/tv.yml +0 -3333
  88. data/spec/fixtures/detector/unknown.yml +0 -3283
  89. data/spec/fixtures/device/camera.yml +0 -19
  90. data/spec/fixtures/device/car_browser.yml +0 -7
  91. data/spec/fixtures/device/console.yml +0 -79
  92. data/spec/fixtures/parser/oss.yml +0 -1047
  93. data/spec/fixtures/parser/vendorfragments.yml +0 -162
  94. data/spec/spec_helper.rb +0 -9
@@ -1,3260 +0,0 @@
1
- ---
2
- -
3
- user_agent: 360spider-image
4
- bot:
5
- name: 360Spider
6
- category: Search bot
7
- url: http://www.so.com/help/help_3_2.html
8
- producer:
9
- name: Online Media Group, Inc.
10
- url: ""
11
- -
12
- user_agent: Mozilla/4.0 (compatible; MSIE 8.0; Windows NT 6.1; Trident/4.0; SLCC2; .NET CLR 2.0.50727; .NET CLR 3.5.30729; .NET CLR 3.0.30729; Media Center PC 6.0; MDDR; .NET4.0C; .NET4.0E; .NET CLR 1.1.4322; Tablet PC 2.0); 360Spider
13
- bot:
14
- name: 360Spider
15
- category: Search bot
16
- url: http://www.so.com/help/help_3_2.html
17
- producer:
18
- name: Online Media Group, Inc.
19
- url: ""
20
- -
21
- user_agent: Mozilla/5.0 (compatible; MSIE 9.0; Windows NT 6.1; Trident/5.0); 360Spider
22
- bot:
23
- name: 360Spider
24
- category: Search bot
25
- url: http://www.so.com/help/help_3_2.html
26
- producer:
27
- name: Online Media Group, Inc.
28
- url: ""
29
- -
30
- user_agent: Mozilla/5.0 (Windows NT 6.1) AppleWebKit/537.1 (KHTML, like Gecko) Chrome/21.0.1180.89 Safari/537.1; 360Spider
31
- bot:
32
- name: 360Spider
33
- category: Search bot
34
- url: http://www.so.com/help/help_3_2.html
35
- producer:
36
- name: Online Media Group, Inc.
37
- url: ""
38
- -
39
- user_agent: 'ADmantX Platform Semantic Analyzer - ADmantX Inc. - www.admantx.com - support@admantx.com'
40
- bot:
41
- name: ADMantX
42
- -
43
- user_agent: Aboundex/0.3 (http://www.aboundex.com/crawler/)
44
- bot:
45
- name: Aboundexbot
46
- category: Search bot
47
- url: http://www.aboundex.com/crawler/
48
- producer:
49
- name: Aboundex.com
50
- url: http://www.aboundex.com
51
- -
52
- user_agent: Mozilla/5.0 (compatible; AcoonBot/4.11.1; +http://www.acoon.de/robot.asp)
53
- bot:
54
- name: Acoon
55
- category: Search bot
56
- url: http://www.acoon.de/robot.asp
57
- producer:
58
- name: Acoon GmbH
59
- url: http://www.acoon.de
60
- -
61
- user_agent: AddThis.com robot tech.support@clearspring.com
62
- bot:
63
- name: AddThis.com
64
- category: Social Media Agent
65
- url: ""
66
- producer:
67
- name: Clearspring Technologies, Inc.
68
- url: http://www.clearspring.com
69
- -
70
- user_agent: ia_archiver (+http://www.alexa.com/site/help/webmasters; crawler@alexa.com)
71
- bot:
72
- name: Alexa Crawler
73
- category: Search bot
74
- url: https://alexa.zendesk.com/hc/en-us/sections/200100794-Crawlers
75
- producer:
76
- name: Alexa Internet
77
- url: http://www.alexa.com
78
- -
79
- user_agent: Mozilla/5.0 (compatible; alexa site audit/1.0; http://www.alexa.com/help/webmasters; )
80
- bot:
81
- name: Alexa Site Audit
82
- category: Site Monitor
83
- url: http://www.alexa.com/help/webmasters
84
- producer:
85
- name: Alexa Internet
86
- url: http://www.alexa.com
87
- -
88
- user_agent: Amazon Route 53 Health Check Service; ref:xxxxxxxx-xxxx-xxxxxxxxx-xxxxxxxxxxxx; report http://amzn.to/xxxxxxx
89
- bot:
90
- name: Amazon Route53 Health Check
91
- category: Service Agent
92
- producer:
93
- name: Amazon Web Services
94
- url: https://aws.amazon.com/
95
- -
96
- user_agent: Amazon-Route53-Health-Check-Service (ref b0eb04d5-cb5e-40e7-839b-558e52fc3f0d; report http://amzn.to/1vsZADi)
97
- bot:
98
- name: Amazon Route53 Health Check
99
- category: Service Agent
100
- producer:
101
- name: Amazon Web Services
102
- url: https://aws.amazon.com/
103
- -
104
- user_agent: AmorankSpider/0.1; +http://amorank.com/webcrawler.html
105
- bot:
106
- name: Amorank Spider
107
- category: Crawler
108
- url: http://amorank.com/webcrawler.html
109
- producer:
110
- name: Amorank
111
- url: http://www.amorank.com
112
- -
113
- user_agent: 'Curious George - www.analyticsseo.com/crawler'
114
- bot:
115
- name: Analytics SEO Crawler
116
- category: Crawler
117
- url: http://www.analyticsseo.com/crawler
118
- producer:
119
- name: Analytics SEO
120
- url: http://www.analyticsseo.com
121
- -
122
- user_agent: ApacheBench/2.3
123
- bot:
124
- name: ApacheBench
125
- category: Benchmark
126
- url: https://httpd.apache.org/docs/2.4/programs/ab.html
127
- producer:
128
- name: The Apache Software Foundation
129
- url: http://www.apache.org/foundation/
130
- -
131
- user_agent: Mozilla/5.0 (Macintosh; Intel Mac OS X 10_10 _1) AppleWebKit/600.2.5 (KHTML, like Gecko) Version/8.0.2 Safari/600.2.5 (Applebot/0.1; +http://www.apple.com/go/applebot)
132
- bot:
133
- name: Applebot
134
- category: Crawler
135
- url: http://www.apple.com/go/applebot
136
- producer:
137
- name: Apple Inc
138
- url: http://www.apple.com
139
- -
140
- user_agent: Mozilla/5.0 (Macintosh; Intel Mac OS X 10_10_1) AppleWebKit/600.2.5 (KHTML, like Gecko) Version/8.0.2 Safari/600.2.5 (Applebot/0.1)
141
- bot:
142
- name: Applebot
143
- category: Crawler
144
- url: http://www.apple.com/go/applebot
145
- producer:
146
- name: Apple Inc
147
- url: http://www.apple.com
148
- -
149
- user_agent: Arachni/v1.5.1
150
- bot:
151
- name: Arachni
152
- category: Security Checker
153
- url: http://www.arachni-scanner.com
154
- producer:
155
- name: Sarosys LLC
156
- url: http://www.sarosys.com/
157
- -
158
- user_agent: Mozilla/2.0 (compatible; Ask Jeeves/Teoma)
159
- bot:
160
- name: Ask Jeeves
161
- category: Search bot
162
- url: ""
163
- producer:
164
- name: Ask Jeeves Inc.
165
- url: http://www.ask.com
166
- -
167
- user_agent: Mozilla/5.0 (compatible; BLEXBot/1.0; +http://webmeup-crawler.com/)
168
- bot:
169
- name: BLEXBot Crawler
170
- category: Crawler
171
- url: http://webmeup-crawler.com
172
- producer:
173
- name: WebMeUp
174
- url: http://webmeup.com
175
- -
176
- user_agent: BUbiNG (+http://law.di.unimi.it/BUbiNG.html)
177
- bot:
178
- name: BUbiNG
179
- category: Crawler
180
- url: http://law.di.unimi.it/BUbiNG.html
181
- producer:
182
- name: The Laboratory for Web Algorithmics (LAW)
183
- url: 'http://law.di.unimi.it/software.php#buging'
184
- -
185
- user_agent: Backlink-Check.de (+http://www.backlink-check.de/bot.html)
186
- bot:
187
- name: Backlink-Check.de
188
- category: Crawler
189
- url: http://www.backlink-check.de/bot.html
190
- producer:
191
- name: Mediagreen Medienservice
192
- url: http://www.backlink-check.de
193
- -
194
- user_agent: BacklinkCrawler (http://www.backlinktest.com/crawler.html)
195
- bot:
196
- name: BacklinkCrawler
197
- category: Crawler
198
- url: http://www.backlinktest.com/crawler.html
199
- producer:
200
- name: 2.0Promotion GbR
201
- url: http://www.backlinktest.com
202
- -
203
- user_agent: Baiduspider+(+http://www.baidu.com/search/spider.htm)
204
- bot:
205
- name: Baidu Spider
206
- category: Search bot
207
- url: http://www.baidu.com/search/spider.htm
208
- producer:
209
- name: Baidu
210
- url: http://www.baidu.com
211
- -
212
- user_agent: Baiduspider-image+(+http://www.baidu.com/search/spider.htm)
213
- bot:
214
- name: Baidu Spider
215
- category: Search bot
216
- url: http://www.baidu.com/search/spider.htm
217
- producer:
218
- name: Baidu
219
- url: http://www.baidu.com
220
- -
221
- user_agent: Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.0; baidu Transcoder;)
222
- bot:
223
- name: Baidu Spider
224
- category: Search bot
225
- url: http://www.baidu.com/search/spider.htm
226
- producer:
227
- name: Baidu
228
- url: http://www.baidu.com
229
- -
230
- user_agent: Mozilla/5.0 (compatible; Baiduspider/2.0; +http://www.baidu.com/search
231
- bot:
232
- name: Baidu Spider
233
- category: Search bot
234
- url: http://www.baidu.com/search/spider.htm
235
- producer:
236
- name: Baidu
237
- url: http://www.baidu.com
238
- -
239
- user_agent: Mozilla/5.0 (compatible; Baiduspider/2.0; +http://www.baidu.com/search/spider.html)
240
- bot:
241
- name: Baidu Spider
242
- category: Search bot
243
- url: http://www.baidu.com/search/spider.htm
244
- producer:
245
- name: Baidu
246
- url: http://www.baidu.com
247
- -
248
- user_agent: Mozilla/5.0 (Linux;u;Android 2.3.7;zh-cn;) AppleWebKit/533.1 (KHTML,like Gecko) Version/4.0 Mobile Safari/533.1 (compatible; +http://www.baidu.com/search/spider.html)
249
- bot:
250
- name: Baidu Spider
251
- category: Search bot
252
- url: http://www.baidu.com/search/spider.htm
253
- producer:
254
- name: Baidu
255
- url: http://www.baidu.com
256
- -
257
- user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1; zh-CN; rv:1.9.2.8;baidu Transcoder) Gecko/20100722 Firefox/3.6.8 ( .NET CLR 3.5.30729)
258
- bot:
259
- name: Baidu Spider
260
- category: Search bot
261
- url: http://www.baidu.com/search/spider.htm
262
- producer:
263
- name: Baidu
264
- url: http://www.baidu.com
265
- -
266
- user_agent: Mozilla/5.0 (compatible; BazQux/2.4; +https://bazqux.com/fetcher; 2 subscribers)
267
- bot:
268
- name: BazQux Reader
269
- url: https://bazqux.com/fetcher
270
- category: Feed Fetcher
271
- producer:
272
- name: ""
273
- url: ""
274
- -
275
- user_agent: Mozilla/5.0 (compatible; bingbot/2.0; +http://www.bing.com/bingbot.htm)
276
- bot:
277
- name: BingBot
278
- category: Search bot
279
- url: http://search.msn.com/msnbot.htmn
280
- producer:
281
- name: Microsoft Corporation
282
- url: http://www.microsoft.com
283
- -
284
- user_agent: Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/534+ (KHTML, like Gecko) BingPreview/1.0b
285
- bot:
286
- name: BingBot
287
- category: Search bot
288
- url: http://search.msn.com/msnbot.htmn
289
- producer:
290
- name: Microsoft Corporation
291
- url: http://www.microsoft.com
292
- -
293
- user_agent: msnbot-media/1.1 (+http://search.msn.com/msnbot.htm)
294
- bot:
295
- name: BingBot
296
- category: Search bot
297
- url: http://search.msn.com/msnbot.htmn
298
- producer:
299
- name: Microsoft Corporation
300
- url: http://www.microsoft.com
301
- -
302
- user_agent: msnbot-NewsBlogs/2.0b (+http://search.msn.com/msnbot.htm)
303
- bot:
304
- name: BingBot
305
- category: Search bot
306
- url: http://search.msn.com/msnbot.htmn
307
- producer:
308
- name: Microsoft Corporation
309
- url: http://www.microsoft.com
310
- -
311
- user_agent: msnbot/1.1 (+http://search.msn.com/msnbot.htm)
312
- bot:
313
- name: BingBot
314
- category: Search bot
315
- url: http://search.msn.com/msnbot.htmn
316
- producer:
317
- name: Microsoft Corporation
318
- url: http://www.microsoft.com
319
- -
320
- user_agent: msnbot/2.0b (+http://search.msn.com/msnbot.htm)
321
- bot:
322
- name: BingBot
323
- category: Search bot
324
- url: http://search.msn.com/msnbot.htmn
325
- producer:
326
- name: Microsoft Corporation
327
- url: http://www.microsoft.com
328
- -
329
- user_agent: msnbot/2.0b v1394720947.6703
330
- bot:
331
- name: BingBot
332
- category: Search bot
333
- url: http://search.msn.com/msnbot.htmn
334
- producer:
335
- name: Microsoft Corporation
336
- url: http://www.microsoft.com
337
- -
338
- user_agent: MSNBot/Nutch-1.5.1
339
- bot:
340
- name: BingBot
341
- category: Search bot
342
- url: http://search.msn.com/msnbot.htmn
343
- producer:
344
- name: Microsoft Corporation
345
- url: http://www.microsoft.com
346
- -
347
- user_agent: bitlybot/3.0
348
- bot:
349
- name: BitlyBot
350
- category: Crawler
351
- url: https://bitly.com
352
- producer:
353
- name: Bitly, Inc.
354
- url: https://bitly.com
355
- -
356
- user_agent: Mozilla/5.0 (compatible; Blekkobot; ScoutJet; +http://blekko.com/about/blekkobot)
357
- bot:
358
- name: Blekkobot
359
- category: Search bot
360
- url: http://blekko.com/about/blekkobot
361
- producer:
362
- name: Blekko
363
- url: http://blekko.com
364
- -
365
- user_agent: Bloglovin/1.0 (http://www.bloglovin.com; 1 subscribers)
366
- bot:
367
- name: Bloglovin
368
- url: http://www.bloglovin.com
369
- category: Feed Fetcher
370
- producer:
371
- name: ""
372
- url: ""
373
- -
374
- user_agent: Blogtrottr/2.0
375
- bot:
376
- name: Blogtrottr
377
- url: ""
378
- category: Feed Fetcher
379
- producer:
380
- name: Blogtrottr Ltd
381
- url: https://blogtrottr.com/
382
- -
383
- user_agent: Mozilla/5.0 (compatible; BountiiBot/1.1; +http://bountii.com/contact.php)
384
- bot:
385
- name: Bountii Bot
386
- category: Search bot
387
- url: http://bountii.com/contact.php
388
- producer:
389
- name: Bountii Inc.
390
- url: http://bountii.com
391
- -
392
- user_agent: Browsershots
393
- bot:
394
- name: Browsershots
395
- category: Service Agent
396
- url: http://browsershots.org/faq
397
- producer:
398
- name: Browsershots.org
399
- url: http://browsershots.org
400
- -
401
- user_agent: Mozilla/5.0 (compatible; Butterfly/1.0; +http://labs.topsy.com/butterfly/) Gecko/2009032608 Firefox/3.0.8
402
- bot:
403
- name: Butterfly Robot
404
- category: Search bot
405
- url: http://labs.topsy.com/butterfly
406
- producer:
407
- name: Topsy Labs
408
- url: http://labs.topsy.com
409
- -
410
- user_agent: Mozilla/5.0 (Macintosh; Butterfly/1.0; +http://labs.topsy.com/butterfly/) Gecko/2009032608 Firefox/3.0.8
411
- bot:
412
- name: Butterfly Robot
413
- category: Search bot
414
- url: http://labs.topsy.com/butterfly
415
- producer:
416
- name: Topsy Labs
417
- url: http://labs.topsy.com
418
- -
419
- user_agent: Mozilla/5.0 (compatible; CareerBot/1.1; +http://www.career-x.de/bot.html)
420
- bot:
421
- name: CareerBot
422
- category: Crawler
423
- url: http://www.career-x.de/bot.html
424
- producer:
425
- name: career-x GmbH
426
- url: http://www.career-x.de
427
- -
428
- user_agent: Castro 2, Episode Duration Lookup
429
- bot:
430
- name: Castro 2
431
- category: Service Agent
432
- url: http://supertop.co/castro/
433
- producer:
434
- name: Supertop
435
- url: http://supertop.co
436
- -
437
- user_agent: Cliqzbot/0.1 (+http://cliqz.com/company/cliqzbot)
438
- bot:
439
- name: Cliqzbot
440
- category: Crawler
441
- url: http://cliqz.com/company/cliqzbot
442
- producer:
443
- name: 10betterpages GmbH
444
- url: http://cliqz.com
445
- -
446
- user_agent: Mozilla/5.0 (compatible; Cloudflare-AMP/1.0; +https://amp.cloudflare.com/doc/fetcher.html) AppleWebKit/534.34
447
- bot:
448
- name: CloudFlare AMP Fetcher
449
- category: Crawler
450
- url: https://amp.cloudflare.com/doc/fetcher.html
451
- producer:
452
- name: CloudFlare
453
- url: http://www.cloudflare.com
454
- -
455
- user_agent: Mozilla/5.0 (compatible; CloudFlare-AlwaysOnline/1.0; +http://www.cloudflare.com/always-online) AppleWebKit/534.34
456
- bot:
457
- name: CloudFlare Always Online
458
- category: Site Monitor
459
- url: http://www.cloudflare.com/always-online
460
- producer:
461
- name: CloudFlare
462
- url: http://www.cloudflare.com
463
- -
464
- user_agent: collectd/5.5.1
465
- bot:
466
- name: Collectd
467
- url: https://collectd.org/
468
- category: Site Monitor
469
- producer:
470
- name: Collectd
471
- url: https://collectd.org/
472
- -
473
- user_agent: CommaFeed/1.0 (http://www.commafeed.com)
474
- bot:
475
- name: CommaFeed
476
- url: http://www.commafeed.com
477
- category: Feed Fetcher
478
- producer:
479
- name: ""
480
- url: ""
481
- -
482
- user_agent: Mozilla/5.0 (compatible; coccoc/1.0; +http://help.coccoc.com/)
483
- bot:
484
- name: Cốc Cốc Bot
485
- url: http://help.coccoc.com/
486
- category: Search bot
487
- producer:
488
- name: Cốc Cốc
489
- url: http://coccoc.com/
490
- -
491
- user_agent: Datadog Agent/5.10.1
492
- bot:
493
- name: Datadog Agent
494
- url: https://github.com/DataDog/dd-agent
495
- category: Site Monitor
496
- producer:
497
- name: Datadog
498
- url: https://www.datadoghq.com/
499
- -
500
- user_agent: Mozilla/5.0 (X11; Datanyze; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/65.0.3325.181 Safari/537.36
501
- bot:
502
- name: Datanyze
503
- url: ""
504
- category: Crawler
505
- producer:
506
- name: Datanyze
507
- url: https://www.datanyze.com
508
- -
509
- user_agent: Mozilla/5.0 (compatible; Dataprovider/6.92; +https://www.dataprovider.com/)
510
- bot:
511
- name: Dataprovider
512
- category: Crawler
513
- url: ""
514
- producer:
515
- name: Dataprovider B.V.
516
- url: https://www.dataprovider.com/
517
- -
518
- user_agent: Mozilla/5.0 (compatible; MSIE or Firefox mutant; not on Windows server;) Daumoa/4.0;
519
- bot:
520
- name: Daum
521
- category: Search bot
522
- url: http://tab.search.daum.net/aboutWebSearch_en.html
523
- producer:
524
- name: Daum Communications Corp.
525
- url: http://www.kakaocorp.com/main
526
- -
527
- user_agent: Mozilla/5.0 (compatible; MSIE or Firefox mutant;) Daum 4.1
528
- bot:
529
- name: Daum
530
- category: Search bot
531
- url: http://tab.search.daum.net/aboutWebSearch_en.html
532
- producer:
533
- name: Daum Communications Corp.
534
- url: http://www.kakaocorp.com/main
535
- -
536
- user_agent: Mozilla/5.0 (compatible; Dazoobot/0.1; +http://dazoo.fr)
537
- bot:
538
- name: Dazoobot
539
- category: Search bot
540
- url: ""
541
- producer:
542
- name: DAZOO.FR
543
- url: http://dazoo.fr
544
- -
545
- user_agent: Mozilla/5.0 (compatible; discobot/1.0; +http://discoveryengine.com/discobot.html)
546
- bot:
547
- name: Discobot
548
- category: Search bot
549
- url: http://discoveryengine.com/discobot.html
550
- producer:
551
- name: Discovery Engine
552
- url: http://discoveryengine.com
553
- -
554
- user_agent: 'Domain Re-Animator Bot (http://domainreanimator.com) - support@domainreanimator.com'
555
- bot:
556
- name: Domain Re-Animator Bot
557
- category: Crawler
558
- url: ""
559
- producer:
560
- name: Domain Re-Animator, LLC
561
- url: http://domainreanimator.com
562
- -
563
- user_agent: support@domainreanimator.com
564
- bot:
565
- name: Domain Re-Animator Bot
566
- category: Crawler
567
- url: ""
568
- producer:
569
- name: Domain Re-Animator, LLC
570
- url: http://domainreanimator.com
571
- -
572
- user_agent: dotbot
573
- bot:
574
- name: DotBot
575
- category: Crawler
576
- url: http://www.opensiteexplorer.org/dotbot
577
- producer:
578
- name: SEOmoz, Inc.
579
- url: http://moz.com/
580
- -
581
- user_agent: DuckDuckBot/1.0; (+http://duckduckgo.com/duckduckbot.html)
582
- bot:
583
- name: DuckDuckGo Bot
584
- category: Search bot
585
- url: https://duckduckgo.com/duckduckbot
586
- producer:
587
- name: DuckDuckGo
588
- url: https://duckduckgo.com/
589
- -
590
- user_agent: Mozilla/5.0 (compatible; DuckDuckGo-Favicons-Bot/1.0; +http://duckduckgo.com)
591
- bot:
592
- name: DuckDuckGo Bot
593
- category: Search bot
594
- url: https://duckduckgo.com/duckduckbot
595
- producer:
596
- name: DuckDuckGo
597
- url: https://duckduckgo.com/
598
- -
599
- user_agent: EMail Exractor
600
- bot:
601
- name: EMail Exractor
602
- category: Crawler
603
- url: ""
604
- producer:
605
- name: ""
606
- url: ""
607
- -
608
- user_agent: Mozilla/5.0 (compatible; EasouSpider; +http://www.easou.com/search/spider.html)
609
- bot:
610
- name: Easou Spider
611
- category: Search bot
612
- url: http://www.easou.com/search/spider.html
613
- producer:
614
- name: easou ICP
615
- url: http://www.easou.com
616
- -
617
- user_agent: Mozilla/5.0 (iPhone; U; CPU iPhone OS 3_0 like Mac OS X; en-us; EasouSpider; +http://www.easou.com/search/spider.html)
618
- bot:
619
- name: Easou Spider
620
- category: Search bot
621
- url: http://www.easou.com/search/spider.html
622
- producer:
623
- name: easou ICP
624
- url: http://www.easou.com
625
- -
626
- user_agent: Mozilla/5.0 (compatible; Exabot/3.0 (BiggerBetter); +http://www.exabot.com/go/robot)
627
- bot:
628
- name: ExaBot
629
- category: Crawler
630
- url: http://www.exabot.com/go/robot
631
- producer:
632
- name: Dassault Systèmes
633
- url: http://www.3ds.com
634
- -
635
- user_agent: Mozilla/5.0 (compatible; Exabot/3.0; +http://www.exabot.com/go/robot)
636
- bot:
637
- name: ExaBot
638
- category: Crawler
639
- url: http://www.exabot.com/go/robot
640
- producer:
641
- name: Dassault Systèmes
642
- url: http://www.3ds.com
643
- -
644
- user_agent: Mozilla/5.0 (compatible; Konqueror/3.5; Linux) KHTML/3.5.5 (like Gecko) (Exabot-Thumbnails)
645
- bot:
646
- name: ExaBot
647
- category: Crawler
648
- url: http://www.exabot.com/go/robot
649
- producer:
650
- name: Dassault Systèmes
651
- url: http://www.3ds.com
652
- -
653
- user_agent: ExactSeek Crawler (nutch 1.4)/Nutch-1.4 (ExactSeek Crawler; http://www.exactseek.com)
654
- bot:
655
- name: ExactSeek Crawler
656
- category: Search bot
657
- url: http://www.exactseek.com
658
- producer:
659
- name: Jayde Online, Inc.
660
- url: http://www.jaydeonlineinc.com
661
- -
662
- user_agent: Mozilla/5.0 (compatible; Ezooms/1.0; help@moz.com)
663
- bot:
664
- name: Ezooms
665
- category: Crawler
666
- url: ""
667
- producer:
668
- name: SEOmoz, Inc.
669
- url: http://moz.com/
670
- -
671
- user_agent: facebookexternalhit/1.1 (+http://www.facebook.com/externalhit_uatext.php)
672
- bot:
673
- name: Facebook External Hit
674
- category: Social Media Agent
675
- url: https://www.facebook.com/externalhit_uatext.php
676
- producer:
677
- name: Facebook
678
- url: http://www.facebook.com
679
- -
680
- user_agent: facebookplatform/1.0 (+http://developers.facebook.com)
681
- bot:
682
- name: Facebook External Hit
683
- category: Social Media Agent
684
- url: https://www.facebook.com/externalhit_uatext.php
685
- producer:
686
- name: Facebook
687
- url: http://www.facebook.com
688
- -
689
- user_agent: Feed Wrangler/1.0 (3 subscribers; feed-id=248559; http://feedwrangler.net; Allow like Gecko)
690
- bot:
691
- name: Feed Wrangler
692
- url: https://feedwrangler.net/
693
- category: Feed Fetcher
694
- producer:
695
- name: 'David Smith & Developing Perspective, LLC'
696
- url: https://david-smith.org
697
- -
698
- user_agent: FeedBurner/1.0 (http://www.FeedBurner.com)
699
- bot:
700
- name: FeedBurner
701
- url: http://www.feedburner.com
702
- category: Feed Fetcher
703
- producer:
704
- name: ""
705
- url: ""
706
- -
707
- user_agent: 'Feedbin - 9 subscribers'
708
- bot:
709
- name: Feedbin
710
- url: http://feedbin.com/
711
- category: Feed Fetcher
712
- producer:
713
- name: ""
714
- url: ""
715
- -
716
- user_agent: Feedly/1.0 (+http://www.feedly.com/fetcher.html; like FeedFetcher-Google)
717
- bot:
718
- name: Feedly
719
- url: http://www.feedly.com
720
- category: Feed Fetcher
721
- producer:
722
- name: ""
723
- url: ""
724
- -
725
- user_agent: FeedlyApp/1.0 (http://www.feedly.com)
726
- bot:
727
- name: Feedly
728
- url: http://www.feedly.com
729
- category: Feed Fetcher
730
- producer:
731
- name: ""
732
- url: ""
733
- -
734
- user_agent: FeedlyBot/1.0 (http://feedly.com)
735
- bot:
736
- name: Feedly
737
- url: http://www.feedly.com
738
- category: Feed Fetcher
739
- producer:
740
- name: ""
741
- url: ""
742
- -
743
- user_agent: MetaFeedly/1.0 (http://www.feedly.com)
744
- bot:
745
- name: Feedly
746
- url: http://www.feedly.com
747
- category: Feed Fetcher
748
- producer:
749
- name: ""
750
- url: ""
751
- -
752
- user_agent: Feedspot http://www.feedspot.com
753
- bot:
754
- name: Feedspot
755
- url: http://www.feedspot.com
756
- category: Feed Fetcher
757
- producer:
758
- name: ""
759
- url: ""
760
- -
761
- user_agent: Fever/1.38 (Feed Parser; http://feedafever.com; Allow like Gecko)
762
- bot:
763
- name: Fever
764
- url: http://feedafever.com/
765
- category: Feed Fetcher
766
- producer:
767
- name: ""
768
- url: ""
769
- -
770
- user_agent: Mozilla/5.0 (compatible; Findxbot/1.0; +http://www.findxbot.com)
771
- bot:
772
- name: Findxbot
773
- category: Crawler
774
- url: http://www.findxbot.com
775
- -
776
- user_agent: Mozilla/5.0 (compatible; FlipboardProxy/1.2; +http://flipboard.com/browserproxy)
777
- bot:
778
- name: Flipboard
779
- url: http://flipboard.com/browserproxy
780
- category: Feed Fetcher
781
- producer:
782
- name: Flipboard
783
- url: http://flipboard.com/
784
- -
785
- user_agent: Mozilla/5.0 (compatible; FlipboardRSS/1.2; +http://flipboard.com/browserproxy)
786
- bot:
787
- name: Flipboard
788
- url: http://flipboard.com/browserproxy
789
- category: Feed Fetcher
790
- producer:
791
- name: Flipboard
792
- url: http://flipboard.com/
793
- -
794
- user_agent: freshrss/0.8-dev (Linux; http://freshrss.org) SimplePie/1.4-dev-FreshRSS
795
- bot:
796
- name: FreshRSS
797
- category: Feed Fetcher
798
- url: https://freshrss.org/
799
- -
800
- user_agent: FreshRSS/1.12.0 (Linux; https://freshrss.org)
801
- bot:
802
- name: FreshRSS
803
- category: Feed Fetcher
804
- url: https://freshrss.org/
805
- -
806
- user_agent: COMODO SSL Checker
807
- bot:
808
- name: Generic Bot
809
- -
810
- user_agent: help@dataminr.com
811
- bot:
812
- name: Generic Bot
813
- -
814
- user_agent: 'HybridBot (hybrid.ru/about. If our bot caused problems please contact us. Contact email: m.lyashkov@targetix.net)'
815
- bot:
816
- name: Generic Bot
817
- -
818
- user_agent: Mozilla/5.0 (compatible; +http://tweetedtimes.com)
819
- bot:
820
- name: Generic Bot
821
- -
822
- user_agent: Mozilla/5.0 (compatible; Shareaholicbot/2.0; +http://www.shareaholic.com/bot)
823
- bot:
824
- name: Generic Bot
825
- -
826
- user_agent: Mozilla/5.0 (compatible; TrendsmapResolver/0.1)
827
- bot:
828
- name: Generic Bot
829
- -
830
- user_agent: niki-bot
831
- bot:
832
- name: Generic Bot
833
- -
834
- user_agent: PHPCrawl
835
- bot:
836
- name: Generic Bot
837
- -
838
- user_agent: Mozilla/5.0 (compatible; Genieo/1.0 http://www.genieo.com/webfilter.html)
839
- bot:
840
- name: Genieo Web filter
841
- category: ""
842
- url: http://www.genieo.com/webfilter.html
843
- producer:
844
- name: Genieo
845
- url: http://www.genieo.com
846
- -
847
- user_agent: GigablastOpenSource/1.0
848
- bot:
849
- name: Gigablast
850
- category: Search bot
851
- url: https://github.com/gigablast/open-source-search-engine
852
- producer:
853
- name: Matt Wells
854
- url: http://www.gigablast.com/faq.html
855
- -
856
- user_agent: Mozilla/5.0 (compatible; Gluten Free Crawler/1.0; +http://glutenfreepleasure.com/)
857
- bot:
858
- name: Gluten Free Crawler
859
- category: Crawler
860
- url: http://glutenfreepleasure.com/
861
- producer:
862
- name: ""
863
- url: ""
864
- -
865
- user_agent: Mozilla/5.0 (Windows NT 5.1; rv:11.0) Gecko Firefox/11.0 (via ggpht.com GoogleImageProxy)
866
- bot:
867
- name: Gmail Image Proxy
868
- category: Crawler
869
- url: ""
870
- producer:
871
- name: Google Inc.
872
- url: http://www.google.com
873
- -
874
- user_agent: Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/49.0.2623.75 Safari/537.36 Google Favicon
875
- bot:
876
- name: Google Favicon
877
- category: Crawler
878
- -
879
- user_agent: DoCoMo/2.0 P900i(c100;TB;W24H11) (compatible; ichiro/mobile goo; +http://search.goo.ne.jp/option/use/sub4/sub4-1/)
880
- bot:
881
- name: Goo
882
- category: Search bot
883
- url: http://search.goo.ne.jp/option/use/sub4/sub4-1
884
- producer:
885
- name: NTT Resonant
886
- url: http://goo.ne.jp
887
- -
888
- user_agent: Mozilla/5.0 (iPhone; U; CPU iPhone OS 4_0_1 like Mac OS X; en-us) AppleWebKit/537.4 (KHTML, like Gecko; Google Page Speed Insights) Version/4.0.5 Mobile/8A306 Safari/6531.22.7
889
- bot:
890
- name: Google PageSpeed Insights
891
- category: Site Monitor
892
- url: http://developers.google.com/speed/pagespeed/insights/
893
- producer:
894
- name: Google Inc.
895
- url: http://www.google.com
896
- -
897
- user_agent: Mozilla/5.0 (Windows NT 5.1) AppleWebKit/535.1 (KHTML, like Gecko) Chrome/14.0.835.202 Safari/535.1 google_partner_monitoring FWSzVTDDBz14547302713138T
898
- bot:
899
- name: Google Partner Monitoring
900
- category: Site Monitor
901
- url: ""
902
- producer:
903
- name: Google Inc.
904
- url: http://www.google.com
905
- -
906
- user_agent: Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko; Google Search Console) Chrome/41.0.2272.118 Safari/537.36
907
- bot:
908
- name: Google Search Console
909
- category: Crawler
910
- url: https://search.google.com/search-console/about
911
- producer:
912
- name: Google Inc.
913
- url: http://www.google.com
914
- -
915
- user_agent: Google-Structured-Data-Testing-Tool +https://search.google.com/structured-data/testing-tool)
916
- bot:
917
- name: Google Structured Data Testing Tool
918
- category: Validator
919
- url: https://search.google.com/structured-data/testing-tool
920
- producer:
921
- name: Google Inc.
922
- url: http://www.google.com
923
- -
924
- user_agent: AdsBot-Google (+http://www.google.com/adsbot.html)
925
- bot:
926
- name: Googlebot
927
- category: Search bot
928
- url: http://www.google.com/bot.html
929
- producer:
930
- name: Google Inc.
931
- url: http://www.google.com
932
- -
933
- user_agent: AdsBot-Google-Mobile (+http://www.google.com/mobile/adsbot.html) Mozilla (iPhone; U; CPU iPhone OS 3 0 like Mac OS X) AppleWebKit (KHTML, like Gecko) Mobile Safari
934
- bot:
935
- name: Googlebot
936
- category: Search bot
937
- url: http://www.google.com/bot.html
938
- producer:
939
- name: Google Inc.
940
- url: http://www.google.com
941
- -
942
- user_agent: APIs-Google (+https://developers.google.com/webmasters/APIs-Google.html)
943
- bot:
944
- name: Googlebot
945
- category: Search bot
946
- url: http://www.google.com/bot.html
947
- producer:
948
- name: Google Inc.
949
- url: http://www.google.com
950
- -
951
- user_agent: DoCoMo/2.0 N905i(c100;TB;W24H16) (compatible; Googlebot-Mobile/2.1; +http://www.google.com/bot.html)
952
- bot:
953
- name: Googlebot
954
- category: Search bot
955
- url: http://www.google.com/bot.html
956
- producer:
957
- name: Google Inc.
958
- url: http://www.google.com
959
- -
960
- user_agent: Feedfetcher-Google; (+http://www.google.com/feedfetcher.html; 19 subscribers; feed-id=13965549748850348809)
961
- bot:
962
- name: Googlebot
963
- category: Search bot
964
- url: http://www.google.com/bot.html
965
- producer:
966
- name: Google Inc.
967
- url: http://www.google.com
968
- -
969
- user_agent: Feedfetcher-Google; (+http://www.google.com/feedfetcher.html; 2 subscribers; feed-id=17860707833818568603)
970
- bot:
971
- name: Googlebot
972
- category: Search bot
973
- url: http://www.google.com/bot.html
974
- producer:
975
- name: Google Inc.
976
- url: http://www.google.com
977
- -
978
- user_agent: Feedfetcher-Google; (+http://www.google.com/feedfetcher.html; 375 subscribers; feed-id=15381863289700640853)
979
- bot:
980
- name: Googlebot
981
- category: Search bot
982
- url: http://www.google.com/bot.html
983
- producer:
984
- name: Google Inc.
985
- url: http://www.google.com
986
- -
987
- user_agent: Google-AdWords-Express
988
- bot:
989
- name: Googlebot
990
- category: Search bot
991
- url: http://www.google.com/bot.html
992
- producer:
993
- name: Google Inc.
994
- url: http://www.google.com
995
- -
996
- user_agent: Google-Adwords-Instant (+http://www.google.com/adsbot.html)
997
- bot:
998
- name: Googlebot
999
- category: Search bot
1000
- url: http://www.google.com/bot.html
1001
- producer:
1002
- name: Google Inc.
1003
- url: http://www.google.com
1004
- -
1005
- user_agent: Google-speakr
1006
- bot:
1007
- name: Googlebot
1008
- category: Search bot
1009
- url: http://www.google.com/bot.html
1010
- producer:
1011
- name: Google Inc.
1012
- url: http://www.google.com
1013
- -
1014
- user_agent: Googlebot (gocrawl v0.4)
1015
- bot:
1016
- name: Googlebot
1017
- category: Search bot
1018
- url: http://www.google.com/bot.html
1019
- producer:
1020
- name: Google Inc.
1021
- url: http://www.google.com
1022
- -
1023
- user_agent: Googlebot-Image/1.0
1024
- bot:
1025
- name: Googlebot
1026
- category: Search bot
1027
- url: http://www.google.com/bot.html
1028
- producer:
1029
- name: Google Inc.
1030
- url: http://www.google.com
1031
- -
1032
- user_agent: Googlebot-News (2.3.3, ruby 1.9.3 (2013-11-22))
1033
- bot:
1034
- name: Googlebot
1035
- category: Search bot
1036
- url: http://www.google.com/bot.html
1037
- producer:
1038
- name: Google Inc.
1039
- url: http://www.google.com
1040
- -
1041
- user_agent: Googlebot-Video/1.0
1042
- bot:
1043
- name: Googlebot
1044
- category: Search bot
1045
- url: http://www.google.com/bot.html
1046
- producer:
1047
- name: Google Inc.
1048
- url: http://www.google.com
1049
- -
1050
- user_agent: Googlebot/2.1 (http://www.googlebot.com/bot.html)
1051
- bot:
1052
- name: Googlebot
1053
- category: Search bot
1054
- url: http://www.google.com/bot.html
1055
- producer:
1056
- name: Google Inc.
1057
- url: http://www.google.com
1058
- -
1059
- user_agent: Googlebot/Nutch-1.7
1060
- bot:
1061
- name: Googlebot
1062
- category: Search bot
1063
- url: http://www.google.com/bot.html
1064
- producer:
1065
- name: Google Inc.
1066
- url: http://www.google.com
1067
- -
1068
- user_agent: GoogleProducer; (+http://goo.gl/7y4SX)
1069
- bot:
1070
- name: Googlebot
1071
- category: Search bot
1072
- url: http://www.google.com/bot.html
1073
- producer:
1074
- name: Google Inc.
1075
- url: http://www.google.com
1076
- -
1077
- user_agent: Mediapartners-Google
1078
- bot:
1079
- name: Googlebot
1080
- category: Search bot
1081
- url: http://www.google.com/bot.html
1082
- producer:
1083
- name: Google Inc.
1084
- url: http://www.google.com
1085
- -
1086
- user_agent: Mozilla/5.0 (compatible) Feedfetcher-Google;(+http://www.google.com/feedfetcher.html)
1087
- bot:
1088
- name: Googlebot
1089
- category: Search bot
1090
- url: http://www.google.com/bot.html
1091
- producer:
1092
- name: Google Inc.
1093
- url: http://www.google.com
1094
- -
1095
- user_agent: Mozilla/5.0 (compatible; Googlebot/2.1; +http://www.google.com/bot.html)
1096
- bot:
1097
- name: Googlebot
1098
- category: Search bot
1099
- url: http://www.google.com/bot.html
1100
- producer:
1101
- name: Google Inc.
1102
- url: http://www.google.com
1103
- -
1104
- user_agent: Mozilla/5.0 (en-US) AppleWebKit/537.36 (KHTML, like Gecko; Google-Assess) Chrome/34.0.1847.116 Safari/537.36
1105
- bot:
1106
- name: Googlebot
1107
- category: Search bot
1108
- url: http://www.google.com/bot.html
1109
- producer:
1110
- name: Google Inc.
1111
- url: http://www.google.com
1112
- -
1113
- user_agent: Mozilla/5.0 (en-us) AppleWebKit/537.36(KHTML, like Gecko; Google-Adwords-DisplayAds-WebRender;) Chrome/41.0.2272.118Safari/537.36
1114
- bot:
1115
- name: Googlebot
1116
- category: Search bot
1117
- url: http://www.google.com/bot.html
1118
- producer:
1119
- name: Google Inc.
1120
- url: http://www.google.com
1121
- -
1122
- user_agent: Mozilla/5.0 (iPhone; CPU iPhone OS 6_0 like Mac OS X) AppleWebKit/536.26 (KHTML, like Gecko) Version/6.0 Mobile/10A5376e Safari/8536.25 (compatible; Googlebot-Mobile/2.1; +http://www.google.com/bot.html)
1123
- bot:
1124
- name: Googlebot
1125
- category: Search bot
1126
- url: http://www.google.com/bot.html
1127
- producer:
1128
- name: Google Inc.
1129
- url: http://www.google.com
1130
- -
1131
- user_agent: Mozilla/5.0 (Linux; Android 4.0.4; Galaxy Nexus Build/IMM76B) AppleWebKit/537.36 (KHTML, like Gecko; Google-Publisher-Plugin) Chrome/27.0.1453 Mobile Safari/537.36
1132
- bot:
1133
- name: Googlebot
1134
- category: Search bot
1135
- url: http://www.google.com/bot.html
1136
- producer:
1137
- name: Google Inc.
1138
- url: http://www.google.com
1139
- -
1140
- user_agent: Mozilla/5.0 (Linux; Android 6.0.1; Nexus 5X Build/MMB29P) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/41.0.2272.96 Mobile Safari/537.36 (compatible; Google-Read-Aloud; +https://support.google.com/webmasters/answer/1061943)
1141
- bot:
1142
- name: Googlebot
1143
- category: Search bot
1144
- url: http://www.google.com/bot.html
1145
- producer:
1146
- name: Google Inc.
1147
- url: http://www.google.com
1148
- -
1149
- user_agent: Mozilla/5.0 (Windows NT 6.1; rv:6.0) Gecko/20110814 Firefox/6.0 Google (+https://developers.google.com/+/web/snippet/)
1150
- bot:
1151
- name: Googlebot
1152
- category: Search bot
1153
- url: http://www.google.com/bot.html
1154
- producer:
1155
- name: Google Inc.
1156
- url: http://www.google.com
1157
- -
1158
- user_agent: Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko; Google Web Preview) Chrome/27.0.1453 Safari/537.36
1159
- bot:
1160
- name: Googlebot
1161
- category: Search bot
1162
- url: http://www.google.com/bot.html
1163
- producer:
1164
- name: Google Inc.
1165
- url: http://www.google.com
1166
- -
1167
- user_agent: Mozilla/5.0 AppleWebKit/537.36 (KHTML, like Gecko) Chrome/41.0.2272.118 Safari/537.36 (compatible; Google-Shopping-Quality +http://www.google.com/merchants/tos/extend/DE/tos.html)
1168
- bot:
1169
- name: Googlebot
1170
- category: Search bot
1171
- url: http://www.google.com/bot.html
1172
- producer:
1173
- name: Google Inc.
1174
- url: http://www.google.com
1175
- -
1176
- user_agent: Mozilla/5.0 AppleWebKit/537.36 (KHTML, like Gecko; compatible; Googlebot/2.1; +http://www.google.com/bot.html) Safari/537.36
1177
- bot:
1178
- name: Googlebot
1179
- category: Search bot
1180
- url: http://www.google.com/bot.html
1181
- producer:
1182
- name: Google Inc.
1183
- url: http://www.google.com
1184
- -
1185
- user_agent: SAMSUNG-SGH-E250/1.0 Profile/MIDP-2.0 Configuration/CLDC-1.1 UP.Browser/6.2.3.3.c.1.101 (GUI) MMP/2.0 (compatible; Googlebot-Mobile/2.1; +http://www.google.com/bot.html)
1186
- bot:
1187
- name: Googlebot
1188
- category: Search bot
1189
- url: http://www.google.com/bot.html
1190
- producer:
1191
- name: Google Inc.
1192
- url: http://www.google.com
1193
- -
1194
- user_agent: Mozilla/5.0 (compatible; GrapeshotCrawler/2.0; +https://www.grapeshot.com/crawler/)
1195
- bot:
1196
- name: Grapeshot
1197
- category: Crawler
1198
- url: https://www.grapeshot.com/crawler
1199
- producer:
1200
- name: Grapeshot
1201
- url: https://www.grapeshot.com
1202
- -
1203
- user_agent: Mozilla/5.0 (iPhone; CPU iPhone OS 8_3 like Mac OS X) AppleWebKit/600.1.4 (KHTML, like Gecko) Version/8.0 Mobile/12F70 Safari/600.1. 4 (compatible; GrapeshotCrawler/2.0; +https://www.grapeshot.com/crawler/)
1204
- bot:
1205
- name: Grapeshot
1206
- category: Crawler
1207
- url: https://www.grapeshot.com/crawler
1208
- producer:
1209
- name: Grapeshot
1210
- url: https://www.grapeshot.com
1211
- -
1212
- user_agent: HTTPMon/1.0b (http://www.httpmon.com)
1213
- bot:
1214
- name: HTTPMon
1215
- category: Site Monitor
1216
- url: http://www.httpmon.com
1217
- producer:
1218
- name: towards GmbH
1219
- url: http://www.towards.ch/
1220
- -
1221
- user_agent: 'flieder - neofonie heritrix/1.14.3 (+http://spider.neofonie.de)'
1222
- bot:
1223
- name: Heritrix
1224
- category: Crawler
1225
- url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
1226
- producer:
1227
- name: The Internet Archive
1228
- url: http://www.archive.org
1229
- -
1230
- user_agent: Mozilla/5.0 (compatible; heritrix/1.14.4 +http://webarhive.nlc.gov.cn)
1231
- bot:
1232
- name: Heritrix
1233
- category: Crawler
1234
- url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
1235
- producer:
1236
- name: The Internet Archive
1237
- url: http://www.archive.org
1238
- -
1239
- user_agent: Mozilla/5.0 (compatible; heritrix/1.14.4 +http://www.dla-marbach.de)
1240
- bot:
1241
- name: Heritrix
1242
- category: Crawler
1243
- url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
1244
- producer:
1245
- name: The Internet Archive
1246
- url: http://www.archive.org
1247
- -
1248
- user_agent: mozilla/5.0 (compatible; heritrix/1.3.0 http://archive.crawler.org)
1249
- bot:
1250
- name: Heritrix
1251
- category: Crawler
1252
- url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
1253
- producer:
1254
- name: The Internet Archive
1255
- url: http://www.archive.org
1256
- -
1257
- user_agent: Mozilla/5.0 (compatible; heritrix/3.1.1 +http://www.baidu.com)
1258
- bot:
1259
- name: Heritrix
1260
- category: Crawler
1261
- url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
1262
- producer:
1263
- name: The Internet Archive
1264
- url: http://www.archive.org
1265
- -
1266
- user_agent: Mozilla/5.0 (compatible; heritrix/3.1.1 +http://www.run4dom.com)
1267
- bot:
1268
- name: Heritrix
1269
- category: Crawler
1270
- url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
1271
- producer:
1272
- name: The Internet Archive
1273
- url: http://www.archive.org
1274
- -
1275
- user_agent: Mozilla/5.0 (compatible; heritrix/3.1.2-SNAPSHOT-20130207.001528 +http://webarchiv.cz/kontakty/)
1276
- bot:
1277
- name: Heritrix
1278
- category: Crawler
1279
- url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
1280
- producer:
1281
- name: The Internet Archive
1282
- url: http://www.archive.org
1283
- -
1284
- user_agent: Mozilla/5.0 (compatible; worio bot heritrix/1.10.0 +http://worio.com)
1285
- bot:
1286
- name: Heritrix
1287
- category: Crawler
1288
- url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
1289
- producer:
1290
- name: The Internet Archive
1291
- url: http://www.archive.org
1292
- -
1293
- user_agent: Heurekabot-Feed/1.0 (+https://sluzby.heureka.cz/napoveda/heurekabot/)
1294
- bot:
1295
- name: Heureka Feed
1296
- category: Crawler
1297
- url: https://sluzby.heureka.cz/napoveda/heurekabot/
1298
- producer:
1299
- name: Heureka.cz, a.s.
1300
- url: https://www.heureka.cz/
1301
- -
1302
- user_agent: HubPages V0.2.2 (http://hubpages.com/help/crawlingpolicy)
1303
- bot:
1304
- name: HubPages
1305
- category: Crawler
1306
- url: http://hubpages.com/help/crawlingpolicy
1307
- producer:
1308
- name: HubPages
1309
- url: http://hubpages.com/
1310
- -
1311
- user_agent: HubSpot Website Grader (web-crawlers@hubspot.com)
1312
- bot:
1313
- name: HubSpot
1314
- category: Crawler
1315
- producer:
1316
- name: HubSpot Inc.
1317
- url: https://www.hubspot.com
1318
- -
1319
- user_agent: ICC-Crawler/2.0 (Mozilla-compatible; ; http://www.nict.go.jp/en/univ-com/plan/crawl.html)
1320
- bot:
1321
- name: ICC-Crawler
1322
- category: Crawler
1323
- url: http://www.nict.go.jp/en/univ-com/plan/crawl.html
1324
- producer:
1325
- name: ""
1326
- url: ""
1327
- -
1328
- user_agent: iisbot/1.0 (+http://www.iis.net/iisbot.html)
1329
- bot:
1330
- name: IIS Site Analysis
1331
- category: Crawler
1332
- url: http://www.iis.net/iisbot.html
1333
- producer:
1334
- name: Microsoft Corporation
1335
- url: http://www.microsoft.com
1336
- -
1337
- user_agent: IP-Guide.com Crawler/1.0 (https://ip-guide.com)
1338
- bot:
1339
- name: IP-Guide Crawler
1340
- category: Crawler
1341
- url: ""
1342
- producer:
1343
- name: ""
1344
- url: https://ip-guide.com
1345
- -
1346
- user_agent: Mozilla/5.0 (compatible; ips-agent)
1347
- bot:
1348
- name: IPS Agent
1349
- category: crawler
1350
- producer:
1351
- name: VeriSign, Inc
1352
- url: http://www.verisign.com/
1353
- -
1354
- user_agent: kouio.com RSS reader
1355
- bot:
1356
- name: Kouio
1357
- url: http://kouio.com/
1358
- category: Feed Fetcher
1359
- producer:
1360
- name: ""
1361
- url: ""
1362
- -
1363
- user_agent: 'kouio.com RSS reader - 6 subscribers'
1364
- bot:
1365
- name: Kouio
1366
- url: http://kouio.com/
1367
- category: Feed Fetcher
1368
- producer:
1369
- name: ""
1370
- url: ""
1371
- -
1372
- user_agent: 'ltx71 - (http://ltx71.com/)'
1373
- bot:
1374
- name: LTX71
1375
- url: http://ltx71.com/
1376
- producer:
1377
- name: ""
1378
- url: ""
1379
- -
1380
- user_agent: larbin_2.6.3 larbin2.6.3@unspecified.mail
1381
- bot:
1382
- name: Larbin web crawler
1383
- category: Crawler
1384
- url: http://larbin.sourceforge.net
1385
- producer:
1386
- name: ""
1387
- url: ""
1388
- -
1389
- user_agent: "Mozilla/5.0 (compatible; Let's Encrypt validation server; +https://www.letsencrypt.org)"
1390
- bot:
1391
- name: "Let's Encrypt Validation"
1392
- category: Service Agent
1393
- url: https://letsencrypt.org/how-it-works/
1394
- producer:
1395
- name: "Let's Encrypt"
1396
- url: https://letsencrypt.org
1397
- -
1398
- user_agent: Mozilla/5.0 (Linux; Android 6.0.1; Nexus 5 Build/MRA58N) AppleWebKit/537.36(KHTML, like Gecko) Chrome/61.0.3116.0 Mobile Safari/537.36 Chrome-Lighthouse
1399
- bot:
1400
- name: Lighthouse
1401
- category: Site Monitor
1402
- url: https://developers.google.com/web/tools/lighthouse
1403
- producer:
1404
- name: Lighthouse
1405
- url: https://developers.google.com/web/tools/lighthouse
1406
- -
1407
- user_agent: linkdex.com/v2.0 and linkdex.com/v2.1
1408
- bot:
1409
- name: Linkdex Bot
1410
- category: Search bot
1411
- url: http://www.linkdex.com/bots
1412
- producer:
1413
- name: Mojeek Ltd.
1414
- url: http://www.mojeek.com
1415
- -
1416
- user_agent: Mozilla/5.0 (compatible; linkdexbot/2.0; +http://www.linkdex.com/about/bots/)
1417
- bot:
1418
- name: Linkdex Bot
1419
- category: Search bot
1420
- url: http://www.linkdex.com/bots
1421
- producer:
1422
- name: Mojeek Ltd.
1423
- url: http://www.mojeek.com
1424
- -
1425
- user_agent: Mozilla/5.0 (iPhone; U; CPU iPhone OS 4_1 like Mac OS X; en-us) AppleWebKit/532.9 (KHTML, like Gecko) Version/4.0.5 Mobile/8B117 Safari/6531.22.7 (compatible; linkdexbot-mobile/2.1; +http://www.linkdex.com/about/bots/)
1426
- bot:
1427
- name: Linkdex Bot
1428
- category: Search bot
1429
- url: http://www.linkdex.com/bots
1430
- producer:
1431
- name: Mojeek Ltd.
1432
- url: http://www.mojeek.com
1433
- -
1434
- user_agent: LinkedInBot/1.0 (compatible; Mozilla/5.0; Jakarta Commons-HttpClient/3.1 +http://www.linkedin.com)
1435
- bot:
1436
- name: LinkedIn Bot
1437
- category: Social Media Agent
1438
- url: http://www.linkedin.com
1439
- producer:
1440
- name: LinkedIn
1441
- url: http://www.linkedin.com
1442
- -
1443
- user_agent: Mozilla/5.0 (compatible; MJ12bot/v1.4.4; http://www.majestic12.co.uk/bot.php?+)
1444
- bot:
1445
- name: MJ12 Bot
1446
- category: Search bot
1447
- url: http://majestic12.co.uk/bot.php
1448
- producer:
1449
- name: Majestic-12
1450
- url: http://majestic12.co.uk
1451
- -
1452
- user_agent: magpie-crawler/1.1 (U; Linux amd64; en-GB; +http://www.brandwatch.net)
1453
- bot:
1454
- name: Magpie-Crawler
1455
- category: Social Media Agent
1456
- url: http://www.brandwatch.com/magpie-crawler/
1457
- producer:
1458
- name: Brandwatch
1459
- url: http://www.brandwatch.com
1460
- -
1461
- user_agent: MagpieRSS/0.72 (+http://magpierss.sf.net)
1462
- bot:
1463
- name: MagpieRSS
1464
- url: http://magpierss.sourceforge.net/
1465
- category: Feed Parser
1466
- producer:
1467
- name: ""
1468
- url: ""
1469
- -
1470
- user_agent: Mozilla/5.0 (compatible; Linux x86_64; Mail.RU_Bot/2.0; +http://go.mail.ru/help/robots)
1471
- bot:
1472
- name: Mail.Ru Bot
1473
- category: Search bot
1474
- url: http://help.mail.ru/webmaster/indexing/robots/types_robots
1475
- producer:
1476
- name: Mail.Ru Group
1477
- url: http://corp.mail.ru
1478
- -
1479
- user_agent: Mozilla/5.0 (compatible; Linux x86_64; Mail.RU_Bot/Fast/2.0; +http://go.mail.ru/help/robots)
1480
- bot:
1481
- name: Mail.Ru Bot
1482
- category: Search bot
1483
- url: http://help.mail.ru/webmaster/indexing/robots/types_robots
1484
- producer:
1485
- name: Mail.Ru Group
1486
- url: http://corp.mail.ru
1487
- -
1488
- user_agent: http.rb/2.2.2 (Mastodon/1.6.1; +https://mathtod.online/)
1489
- bot:
1490
- name: Mastodon Bot
1491
- category: Social Media Agent
1492
- -
1493
- user_agent: http.rb/3.2.0 (Mastodon/2.4.3; +https://uwu.social/)
1494
- bot:
1495
- name: Mastodon Bot
1496
- category: Social Media Agent
1497
- -
1498
- user_agent: Mozilla/5.0 (compatible; meanpathbot/1.0; +http://www.meanpath.com/meanpathbot.html)
1499
- bot:
1500
- name: Meanpath Bot
1501
- category: Search bot
1502
- url: http://www.meanpath.com/meanpathbot.html
1503
- producer:
1504
- name: Meanpath
1505
- url: http://www.meanpath.com
1506
- -
1507
- user_agent: MetaInspector/5.4.0 (+https://github.com/jaimeiniesta/metainspector)
1508
- bot:
1509
- name: MetaInspector
1510
- category: Crawler
1511
- url: https://github.com/jaimeiniesta/metainspector
1512
- -
1513
- user_agent: Mozilla/5.0 (compatible; MetaJobBot; http://www.metajob.de/crawler)
1514
- bot:
1515
- name: MetaJobBot
1516
- category: Crawler
1517
- url: http://www.metajob.at/the/crawler
1518
- producer:
1519
- name: MetaJob
1520
- url: http://www.metajob.at
1521
- -
1522
- user_agent: Mozilla/5.0 (compatible; MixrankBot; crawler@mixrank.com)
1523
- bot:
1524
- name: Mixrank Bot
1525
- category: Crawler
1526
- url: http://mixrank.com
1527
- producer:
1528
- name: Online Media Group, Inc.
1529
- url: ""
1530
- -
1531
- user_agent: Mnogosearch-3.1.21
1532
- bot:
1533
- name: Mnogosearch
1534
- category: Search bot
1535
- url: http://www.mnogosearch.org/
1536
- producer:
1537
- name: Lavtech.Com Corp.
1538
- url: ""
1539
- -
1540
- user_agent: Mozilla/5.0 (compatible; MojeekBot/0.6; http://www.mojeek.com/bot.html)
1541
- bot:
1542
- name: MojeekBot
1543
- category: Search bot
1544
- url: http://www.mojeek.com/bot.html
1545
- producer:
1546
- name: Mojeek Ltd.
1547
- url: http://www.mojeek.com
1548
- -
1549
- user_agent: 'Mozilla/5.0 (compatible; www.monitor.us - free monitoring service; http://www.monitor.us)'
1550
- bot:
1551
- name: Monitor.Us
1552
- category: Site Monitor
1553
- url: http://www.monitor.us
1554
- producer:
1555
- name: Monitor.Us
1556
- url: http://www.monitor.us
1557
- -
1558
- user_agent: munin/2.0.30-1 (libwww-perl/6.15)
1559
- bot:
1560
- name: Munin
1561
- category: Site Monitor
1562
- url: http://munin-monitoring.org/
1563
- producer:
1564
- name: Munin
1565
- url: http://munin-monitoring.org/
1566
- -
1567
- user_agent: munin/http_loadtime
1568
- bot:
1569
- name: Munin
1570
- category: Site Monitor
1571
- url: http://munin-monitoring.org/
1572
- producer:
1573
- name: Munin
1574
- url: http://munin-monitoring.org/
1575
- -
1576
- user_agent: nlcrawler/1.0 (+http://northernlight.com/)
1577
- bot:
1578
- name: NLCrawler
1579
- category: Crawler
1580
- url: ""
1581
- producer:
1582
- name: Northern Light
1583
- url: http://northernlight.com
1584
- -
1585
- user_agent: check_http/v1.5 (nagios-plugins 1.5)
1586
- bot:
1587
- name: Nagios check_http
1588
- category: Site Monitor
1589
- url: https://nagios.org
1590
- producer:
1591
- name: Nagios Plugins Development Team
1592
- url: https://nagios.org
1593
- -
1594
- user_agent: NalezenCzBot/1.0 (http://www.nalezen.cz/about-crawler)
1595
- bot:
1596
- name: NalezenCzBot
1597
- category: Crawler
1598
- url: http://www.nalezen.cz/about-crawler
1599
- producer:
1600
- name: Jaroslav Kuboš
1601
- url: ""
1602
- -
1603
- user_agent: NetLyzer FastProbe
1604
- bot:
1605
- name: NetLyzer FastProbe
1606
- -
1607
- user_agent: Mozilla/4.0 (compatible; Netcraft Web Server Survey)
1608
- bot:
1609
- name: Netcraft Survey Bot
1610
- category: Search bot
1611
- url: ""
1612
- producer:
1613
- name: Netcraft
1614
- url: http://www.netcraft.com
1615
- -
1616
- user_agent: Mozilla/5.0 (compatible; NetcraftSurveyAgent/1.0; +info@netcraft.com)
1617
- bot:
1618
- name: Netcraft Survey Bot
1619
- category: Search bot
1620
- url: ""
1621
- producer:
1622
- name: Netcraft
1623
- url: http://www.netcraft.com
1624
- -
1625
- user_agent: 'Netcraft SSL Server Survey - contact info@netcraft.com'
1626
- bot:
1627
- name: Netcraft Survey Bot
1628
- category: Search bot
1629
- url: ""
1630
- producer:
1631
- name: Netcraft
1632
- url: http://www.netcraft.com
1633
- -
1634
- user_agent: Netvibes (http://www.netvibes.com)
1635
- bot:
1636
- name: Netvibes
1637
- url: http://www.netvibes.com/
1638
- category: Feed Fetcher
1639
- producer:
1640
- name: ""
1641
- url: ""
1642
- -
1643
- user_agent: 'Netvibes (http://www.netvibes.com/; 8 subscribers; feedID: 2244192)'
1644
- bot:
1645
- name: Netvibes
1646
- url: http://www.netvibes.com/
1647
- category: Feed Fetcher
1648
- producer:
1649
- name: ""
1650
- url: ""
1651
- -
1652
- user_agent: 'NewsBlur Favicon Fetcher - 7 subscribers - http://www.newsblur.com/site/1948420/analytics-piwik (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)'
1653
- bot:
1654
- name: NewsBlur
1655
- url: http://www.newsblur.com
1656
- category: Feed Fetcher
1657
- producer:
1658
- name: ""
1659
- url: ""
1660
- -
1661
- user_agent: 'NewsBlur Feed Fetcher - 7 subscribers - http://www.newsblur.com/site/1948420/analytics-piwik (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)'
1662
- bot:
1663
- name: NewsBlur
1664
- url: http://www.newsblur.com
1665
- category: Feed Fetcher
1666
- producer:
1667
- name: ""
1668
- url: ""
1669
- -
1670
- user_agent: NewsBlur Feed Finder (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)
1671
- bot:
1672
- name: NewsBlur
1673
- url: http://www.newsblur.com
1674
- category: Feed Fetcher
1675
- producer:
1676
- name: ""
1677
- url: ""
1678
- -
1679
- user_agent: 'NewsBlur Page Fetcher - 7 subscribers - http://www.newsblur.com/site/3966817/analytics-piwik (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)'
1680
- bot:
1681
- name: NewsBlur
1682
- url: http://www.newsblur.com
1683
- category: Feed Fetcher
1684
- producer:
1685
- name: ""
1686
- url: ""
1687
- -
1688
- user_agent: NewsGatorOnline/2.0 (http://www.newsgator.com; 2 subscribers)
1689
- bot:
1690
- name: NewsGator
1691
- url: http://www.newsgator.com
1692
- category: Feed Fetcher
1693
- producer:
1694
- name: ""
1695
- url: ""
1696
- -
1697
- user_agent: Mozilla/5.0 (compatible; Nmap Scripting Engine; https://nmap.org/book/nse.html)
1698
- bot:
1699
- name: Nmap
1700
- category: Security Checker
1701
- url: https://nmap.org/book/nse.html
1702
- producer:
1703
- name: Nmap
1704
- url: https://nmap.org/
1705
- -
1706
- user_agent: 5acd734a-1ed3-4a17-ad9d-0b09ae7bc2d2/Nutch-1.7
1707
- bot:
1708
- name: Nutch-based Bot
1709
- category: Crawler
1710
- url: https://nutch.apache.org
1711
- producer:
1712
- name: The Apache Software Foundation
1713
- url: http://www.apache.org/foundation/
1714
- -
1715
- user_agent: CB/Nutch-1.7
1716
- bot:
1717
- name: Nutch-based Bot
1718
- category: Crawler
1719
- url: https://nutch.apache.org
1720
- producer:
1721
- name: The Apache Software Foundation
1722
- url: http://www.apache.org/foundation/
1723
- -
1724
- user_agent: Mozilla/5.0 (compatible; summers;)/Nutch-1.7
1725
- bot:
1726
- name: Nutch-based Bot
1727
- category: Crawler
1728
- url: https://nutch.apache.org
1729
- producer:
1730
- name: The Apache Software Foundation
1731
- url: http://www.apache.org/foundation/
1732
- -
1733
- user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1; zh-CN; rv:1.9.2.8) Firefox/3.6.8/Nutch-1.7
1734
- bot:
1735
- name: Nutch-based Bot
1736
- category: Crawler
1737
- url: https://nutch.apache.org
1738
- producer:
1739
- name: The Apache Software Foundation
1740
- url: http://www.apache.org/foundation/
1741
- -
1742
- user_agent: My Nutch Spider/Nutch-1.6
1743
- bot:
1744
- name: Nutch-based Bot
1745
- category: Crawler
1746
- url: https://nutch.apache.org
1747
- producer:
1748
- name: The Apache Software Foundation
1749
- url: http://www.apache.org/foundation/
1750
- -
1751
- user_agent: MySpider/Nutch-2.2
1752
- bot:
1753
- name: Nutch-based Bot
1754
- category: Crawler
1755
- url: https://nutch.apache.org
1756
- producer:
1757
- name: The Apache Software Foundation
1758
- url: http://www.apache.org/foundation/
1759
- -
1760
- user_agent: Nutch12/Nutch-1.2
1761
- bot:
1762
- name: Nutch-based Bot
1763
- category: Crawler
1764
- url: https://nutch.apache.org
1765
- producer:
1766
- name: The Apache Software Foundation
1767
- url: http://www.apache.org/foundation/
1768
- -
1769
- user_agent: NutchSpider/Nutch-1.4
1770
- bot:
1771
- name: Nutch-based Bot
1772
- category: Crawler
1773
- url: https://nutch.apache.org
1774
- producer:
1775
- name: The Apache Software Foundation
1776
- url: http://www.apache.org/foundation/
1777
- -
1778
- user_agent: spider/Nutch-1.5.1 (spider; http://www.xxx.com)
1779
- bot:
1780
- name: Nutch-based Bot
1781
- category: Crawler
1782
- url: https://nutch.apache.org
1783
- producer:
1784
- name: The Apache Software Foundation
1785
- url: http://www.apache.org/foundation/
1786
- -
1787
- user_agent: Spider/Nutch-2.3-SNAPSHOT (Webcrawler)
1788
- bot:
1789
- name: Nutch-based Bot
1790
- category: Crawler
1791
- url: https://nutch.apache.org
1792
- producer:
1793
- name: The Apache Software Foundation
1794
- url: http://www.apache.org/foundation/
1795
- -
1796
- user_agent: testnutch/Nutch-1.8
1797
- bot:
1798
- name: Nutch-based Bot
1799
- category: Crawler
1800
- url: https://nutch.apache.org
1801
- producer:
1802
- name: The Apache Software Foundation
1803
- url: http://www.apache.org/foundation/
1804
- -
1805
- user_agent: Your Nutch Spider/Nutch-2.2.1
1806
- bot:
1807
- name: Nutch-based Bot
1808
- category: Crawler
1809
- url: https://nutch.apache.org
1810
- producer:
1811
- name: The Apache Software Foundation
1812
- url: http://www.apache.org/foundation/
1813
- -
1814
- user_agent: your sipder name/Nutch-1.7
1815
- bot:
1816
- name: Nutch-based Bot
1817
- category: Crawler
1818
- url: https://nutch.apache.org
1819
- producer:
1820
- name: The Apache Software Foundation
1821
- url: http://www.apache.org/foundation/
1822
- -
1823
- user_agent: Octopus 1.0.2
1824
- bot:
1825
- name: Octopus
1826
- -
1827
- user_agent: omgili/0.5 +http://omgili.com
1828
- bot:
1829
- name: Omgili bot
1830
- category: Search bot
1831
- url: http://www.omgili.com/Crawler.html
1832
- producer:
1833
- name: Omgili
1834
- url: http://www.omgili.com
1835
- -
1836
- user_agent: omgilibot/0.3 +http://www.omgili.com/Crawler.html
1837
- bot:
1838
- name: Omgili bot
1839
- category: Search bot
1840
- url: http://www.omgili.com/Crawler.html
1841
- producer:
1842
- name: Omgili
1843
- url: http://www.omgili.com
1844
- -
1845
- user_agent: Mozilla/5.0 (compatible; spbot/4.0.9; +http://OpenLinkProfiler.org/bot )
1846
- bot:
1847
- name: OpenLinkProfiler
1848
- category: Crawler
1849
- url: http://openlinkprofiler.org/bot
1850
- producer:
1851
- name: Axandra GmbH
1852
- url: http://www.axandra.com
1853
- -
1854
- user_agent: OpenWebSpider v0.1.4 (http://www.openwebspider.org/)
1855
- bot:
1856
- name: OpenWebSpider
1857
- category: Crawler
1858
- url: http://www.openwebspider.org
1859
- producer:
1860
- name: OpenWebSpider Lab
1861
- url: http://lab.openwebspider.org
1862
- -
1863
- user_agent: Mozilla/5.0 (compatible; OpenindexSpider; +http://www.openindex.io/en/webmasters/spider.html)
1864
- bot:
1865
- name: Openindex Spider
1866
- category: Search bot
1867
- url: http://www.openindex.io/en/webmasters/spider.html
1868
- producer:
1869
- name: Openindex B.V.
1870
- url: http://www.openindex.io
1871
- -
1872
- user_agent: Mozilla/5.0 (compatible; OrangeBot-Collector/2.0; support.orangebot@orange.com)
1873
- bot:
1874
- name: Orange Bot
1875
- category: Search bot
1876
- url: http://lemoteur.orange.fr
1877
- producer:
1878
- name: Orange
1879
- url: http://www.orange.fr
1880
- -
1881
- user_agent: Mozilla/5.0 (compatible; OrangeBot/2.0; support.orangebot@orange.com)
1882
- bot:
1883
- name: Orange Bot
1884
- category: Search bot
1885
- url: http://lemoteur.orange.fr
1886
- producer:
1887
- name: Orange
1888
- url: http://www.orange.fr
1889
- -
1890
- user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1; fr; rv:1.8.1) VoilaBot BETA 1.2 (support.voilabot@orange-ftgroup.com)
1891
- bot:
1892
- name: Orange Bot
1893
- category: Search bot
1894
- url: http://lemoteur.orange.fr
1895
- producer:
1896
- name: Orange
1897
- url: http://www.orange.fr
1898
- -
1899
- user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1;fr;rv:1.8.1) VoilaBotCollector BETA 0.1 (http://www.voila.com/)
1900
- bot:
1901
- name: Orange Bot
1902
- category: Search bot
1903
- url: http://lemoteur.orange.fr
1904
- producer:
1905
- name: Orange
1906
- url: http://www.orange.fr
1907
- -
1908
- user_agent: Mozilla/5.0 (Java) outbrain
1909
- bot:
1910
- name: Outbrain
1911
- category: Crawler
1912
- url: ""
1913
- producer:
1914
- name: Outbrain
1915
- url: http://www.outbrain.com/
1916
- -
1917
- user_agent: Mozilla/5.0 (compatible; phpservermon/3.1.1; +http://www.phpservermonitor.org)
1918
- bot:
1919
- name: PHP Server Monitor
1920
- category: Site Monitor
1921
- url: https://github.com/phpservermon/phpservermon
1922
- producer:
1923
- name: PHP Server Monitor
1924
- url: http://www.phpservermonitor.org/
1925
- -
1926
- user_agent: Mozilla/5.0 (compatible; PaperLiBot/2.1; http://support.paper.li/entries/20023257-what-is-paper-li)
1927
- bot:
1928
- name: PaperLiBot
1929
- category: Search bot
1930
- url: http://support.paper.li/entries/20023257-what-is-paper-li
1931
- producer:
1932
- name: Smallrivers SA
1933
- url: http://www.paper.li
1934
- -
1935
- user_agent: phantomas/1.11.0 (PhantomJS/1.9.8; linux x64)
1936
- bot:
1937
- name: Phantomas
1938
- category: Site Monitor
1939
- url: https://github.com/macbre/phantomas
1940
- -
1941
- user_agent: psbot-page (+http://www.picsearch.com/bot.html)
1942
- bot:
1943
- name: Picsearch bot
1944
- category: Search bot
1945
- url: http://www.picsearch.com/bot.html
1946
- producer:
1947
- name: Picsearch
1948
- url: http://www.picsearch.com
1949
- -
1950
- user_agent: psbot/0.1 (+http://www.picsearch.com/bot.html)
1951
- bot:
1952
- name: Picsearch bot
1953
- category: Search bot
1954
- url: http://www.picsearch.com/bot.html
1955
- producer:
1956
- name: Picsearch
1957
- url: http://www.picsearch.com
1958
- -
1959
- user_agent: Pingdom.com_bot_version_1.4_(http://www.pingdom.com/)
1960
- bot:
1961
- name: Pingdom Bot
1962
- category: Site Monitor
1963
- url: ""
1964
- producer:
1965
- name: Pingdom AB
1966
- url: https://www.pingdom.com
1967
- -
1968
- user_agent: Pinterest/0.2 (+http://www.pinterest.com/)
1969
- bot:
1970
- name: Pinterest
1971
- url: ""
1972
- category: Crawler
1973
- producer:
1974
- name: Pinterest
1975
- url: http://www.pinterest.com/
1976
- -
1977
- user_agent: PocketParser/2.0 (+https://getpocket.com/pocketparser_ua)
1978
- bot:
1979
- name: PocketParser
1980
- category: Read-it-later Service
1981
- url: https://getpocket.com/pocketparser_ua
1982
- producer:
1983
- name: Pocket
1984
- url: https://getpocket.com/
1985
- -
1986
- user_agent: PritTorrent/1.0
1987
- bot:
1988
- name: PritTorrent
1989
- category: Crawler
1990
- url: https://github.com/astro/prittorrent
1991
- producer:
1992
- name: Bitlove
1993
- url: http://bitlove.org/
1994
- -
1995
- user_agent: QuerySeekerSpider ( http://queryseeker.com/bot.html )
1996
- bot:
1997
- name: QuerySeekerSpider
1998
- category: Crawler
1999
- url: http://queryseeker.com/bot.html
2000
- producer:
2001
- name: QueryEye Inc.
2002
- url: http://queryeye.com
2003
- -
2004
- user_agent: Quora Link Preview/1.0 (http://www.quora.com)
2005
- bot:
2006
- name: Quora Link Preview
2007
- category: Crawler
2008
- url: ""
2009
- producer:
2010
- name: Quora
2011
- url: http://www.quora.com
2012
- -
2013
- user_agent: 'Mozilla/5.0 (compatible; Qwantify/2.2w; +https://www.qwant.com/)/*'
2014
- bot:
2015
- name: Qwantify
2016
- category: Crawler
2017
- url: https://www.qwant.com/
2018
- producer:
2019
- name: Qwant Corporation
2020
- url: https://www.qwant.com/
2021
- -
2022
- user_agent: ROI Hunter; https://api-dev.roihunter.com
2023
- bot:
2024
- name: ROI Hunter
2025
- category: Crawler
2026
- url: ""
2027
- producer:
2028
- name: Roihunter a.s.
2029
- url: http://roihunter.com/
2030
- -
2031
- user_agent: RSSRadio (Push Notification Scanner;support@dorada.co.uk)
2032
- bot:
2033
- name: RSSRadio Bot
2034
- -
2035
- user_agent: Rainmeter WebParser plugin
2036
- bot:
2037
- name: Rainmeter
2038
- category: Crawler
2039
- url: https://www.rainmeter.net
2040
- -
2041
- user_agent: RamblerMail/6.0 (incompatible; ImageProxy/6.0)
2042
- bot:
2043
- name: RamblerMail Image Proxy
2044
- category: Crawler
2045
- url: ""
2046
- producer:
2047
- name: 'Rambler&Co'
2048
- url: https://rambler-co.ru/
2049
- -
2050
- user_agent: Mozilla/5.0 (compatible; redditbot/1.0; +http://www.reddit.com/feedback)
2051
- bot:
2052
- name: Reddit Bot
2053
- category: Social Media Agent
2054
- url: http://www.reddit.com/feedback
2055
- producer:
2056
- name: reddit inc.
2057
- url: http://www.reddit.com
2058
- -
2059
- user_agent: Mozilla/5.0 (compatible; rogerBot/1.0; UrlCrawler; http://www.seomoz.org/dp/rogerbot)
2060
- bot:
2061
- name: Rogerbot
2062
- category: Crawler
2063
- url: http://moz.com/help/pro/what-is-rogerbot-
2064
- producer:
2065
- name: SEOmoz, Inc.
2066
- url: http://moz.com/
2067
- -
2068
- user_agent: rogerbot/1.0 (http://moz.com/help/pro/what-is-rogerbot-, rogerbot-crawler+shiny@moz.com)
2069
- bot:
2070
- name: Rogerbot
2071
- category: Crawler
2072
- url: http://moz.com/help/pro/what-is-rogerbot-
2073
- producer:
2074
- name: SEOmoz, Inc.
2075
- url: http://moz.com/
2076
- -
2077
- user_agent: rogerbot/1.0 (http://www.moz.com/dp/rogerbot, rogerbot-crawler@moz.com)
2078
- bot:
2079
- name: Rogerbot
2080
- category: Crawler
2081
- url: http://moz.com/help/pro/what-is-rogerbot-
2082
- producer:
2083
- name: SEOmoz, Inc.
2084
- url: http://moz.com/
2085
- -
2086
- user_agent: SEOENGWorldBot/1.0 (+http://www.seoengine.com/seoengbot.htm)
2087
- bot:
2088
- name: SEOENGBot
2089
- category: Crawler
2090
- url: http://www.seoengine.com/seoengbot.htm
2091
- producer:
2092
- name: SEO Engine
2093
- url: http://www.seoengine.com
2094
- -
2095
- user_agent: Mozilla/5.0 (compatible; SEOkicks-Robot; +http://www.seokicks.de/robot.html)
2096
- bot:
2097
- name: SEOkicks-Robot
2098
- category: Crawler
2099
- url: http://www.seokicks.de/robot.html
2100
- producer:
2101
- name: SEOkicks
2102
- url: https://www.seokicks.de/
2103
- -
2104
- user_agent: Mozilla/5.0 (compatible; SISTRIX Crawler; http://crawler.sistrix.net/)
2105
- bot:
2106
- name: SISTRIX Crawler
2107
- category: Crawler
2108
- url: http://crawler.sistrix.net
2109
- producer:
2110
- name: SISTRIX GmbH
2111
- url: http://www.sistrix.de
2112
- -
2113
- user_agent: Mozilla/5.0 (compatible; SISTRIX Optimizer)
2114
- bot:
2115
- name: SISTRIX Optimizer
2116
- category: Crawler
2117
- url: https://optimizer.sistrix.com
2118
- producer:
2119
- name: SISTRIX GmbH
2120
- url: http://www.sistrix.de
2121
- -
2122
- user_agent: Mozilla/5.0 (compatible; SISTRIX Optimizer; Uptime; +https://www.sistrix.com/faq/uptime)
2123
- bot:
2124
- name: SISTRIX Optimizer
2125
- category: Crawler
2126
- url: https://optimizer.sistrix.com
2127
- producer:
2128
- name: SISTRIX GmbH
2129
- url: http://www.sistrix.de
2130
- -
2131
- user_agent: SSL Labs (https://www.ssllabs.com/about/assessment.html)
2132
- bot:
2133
- name: SSL Labs
2134
- category: Validator
2135
- url: https://www.ssllabs.com/about/assessment.html
2136
- producer:
2137
- name: SSL Labs
2138
- url: https://www.ssllabs.com/about/assessment.html
2139
- -
2140
- user_agent: SafeDNSBot (https://www.safedns.com/searchbot)
2141
- bot:
2142
- name: SafeDNSBot
2143
- category: Crawler
2144
- url: https://www.safedns.com/searchbot
2145
- producer:
2146
- name: SafeDNS, Inc.
2147
- url: https://www.safedns.com/
2148
- -
2149
- user_agent: Scrapy/1.0.3.post6+g2d688cd (+http://scrapy.org)
2150
- bot:
2151
- name: Scrapy
2152
- category: Crawler
2153
- url: http://scrapy.org
2154
- -
2155
- user_agent: Screaming Frog SEO Spider/2.22
2156
- bot:
2157
- name: Screaming Frog SEO Spider
2158
- category: Crawler
2159
- url: http://www.screamingfrog.co.uk/seo-spider
2160
- producer:
2161
- name: Screaming Frog Ltd
2162
- url: http://www.screamingfrog.co.uk
2163
- -
2164
- user_agent: ScreenerBot Crawler Beta 2.0 (+http://www.ScreenerBot.com)
2165
- bot:
2166
- name: ScreenerBot
2167
- category: Crawler
2168
- url: http://www.screenerbot.com
2169
- producer:
2170
- name: ""
2171
- url: ""
2172
- -
2173
- user_agent: Mozilla/5.0 (compatible; SemrushBot/0.97; +http://www.semrush.com/bot.html)
2174
- bot:
2175
- name: Semrush Bot
2176
- category: Crawler
2177
- url: http://www.semrush.com/bot.html
2178
- producer:
2179
- name: SEMrush
2180
- url: http://www.semrush.com
2181
- -
2182
- user_agent: SensikaBot/x.33 (+http://sensika.com)
2183
- bot:
2184
- name: Sensika Bot
2185
- category: ""
2186
- url: ""
2187
- producer:
2188
- name: Sensika
2189
- url: http://sensika.com
2190
- -
2191
- user_agent: sentry/8.6.0 (https://getsentry.com)
2192
- bot:
2193
- name: Sentry Bot
2194
- producer:
2195
- name: Sentry
2196
- url: https://sentry.io
2197
- -
2198
- user_agent: Mozilla/5.0 (compatible; seoscanners.net/1; +spider@seoscanners.net)
2199
- bot:
2200
- name: Seoscanners.net
2201
- category: Crawler
2202
- url: ""
2203
- -
2204
- user_agent: Server Density Service Monitoring v2
2205
- bot:
2206
- name: Server Density
2207
- -
2208
- user_agent: Mozilla/5.0 (compatible; SeznamBot/3.1-test1; +http://fulltext.sblog.cz/)
2209
- bot:
2210
- name: Seznam Bot
2211
- category: Search bot
2212
- url: http://www.mapy.cz/cz/seznambot.html
2213
- producer:
2214
- name: Seznam.cz, a.s.
2215
- url: http://www.seznam.cz/
2216
- -
2217
- user_agent: Mozilla/5.0 (compatible; SeznamBot/3.2-test1; +http://fulltext.sblog.cz/)
2218
- bot:
2219
- name: Seznam Bot
2220
- category: Search bot
2221
- url: http://www.mapy.cz/cz/seznambot.html
2222
- producer:
2223
- name: Seznam.cz, a.s.
2224
- url: http://www.seznam.cz/
2225
- -
2226
- user_agent: Mozilla/5.0 (compatible; SeznamBot/3.2; +http://fulltext.sblog.cz/)
2227
- bot:
2228
- name: Seznam Bot
2229
- category: Search bot
2230
- url: http://www.mapy.cz/cz/seznambot.html
2231
- producer:
2232
- name: Seznam.cz, a.s.
2233
- url: http://www.seznam.cz/
2234
- -
2235
- user_agent: SeznamBot/3.0 (+http://fulltext.sblog.cz/)
2236
- bot:
2237
- name: Seznam Bot
2238
- category: Search bot
2239
- url: http://www.mapy.cz/cz/seznambot.html
2240
- producer:
2241
- name: Seznam.cz, a.s.
2242
- url: http://www.seznam.cz/
2243
- -
2244
- user_agent: Mozilla/5.0 SeznamEmailProxy/2.0.174
2245
- bot:
2246
- name: Seznam Email Proxy
2247
- category: Crawler
2248
- url: ""
2249
- producer:
2250
- name: Seznam.cz, a.s.
2251
- url: http://www.seznam.cz/
2252
- -
2253
- user_agent: Seznam-Zbozi-robot/3.0
2254
- bot:
2255
- name: Seznam Zbozi.cz
2256
- category: Crawler
2257
- url: ""
2258
- producer:
2259
- name: Seznam.cz, a.s.
2260
- url: https://www.zbozi.cz/
2261
- -
2262
- user_agent: Mozilla/5.0 (ShopAlike; LadenZeile) FeedBot
2263
- bot:
2264
- name: ShopAlike
2265
- category: Crawler
2266
- url: ""
2267
- producer:
2268
- name: Visual Meta
2269
- url: https://www.shopalike.cz/
2270
- -
2271
- user_agent: ShopWiki/1.0 ( +http://www.shopwiki.com/wiki/Help:Bot)
2272
- bot:
2273
- name: ShopWiki
2274
- category: Search tools
2275
- url: http://www.shopwiki.com/wiki/Help:Bot
2276
- producer:
2277
- name: ShopWiki Corp.
2278
- url: http://www.shopwiki.com
2279
- -
2280
- user_agent: SilverReader/1.0; http://silverreader.com
2281
- bot:
2282
- name: SilverReader
2283
- url: http://silverreader.com
2284
- category: Feed Fetcher
2285
- producer:
2286
- name: ""
2287
- url: ""
2288
- -
2289
- user_agent: SimplePie/1.2.1-dev (Feed Parser; http://simplepie.org; Allow like Gecko) Build/20130514092120
2290
- bot:
2291
- name: SimplePie
2292
- url: http://www.simplepie.org
2293
- category: Feed Parser
2294
- producer:
2295
- name: ""
2296
- url: ""
2297
- -
2298
- user_agent: SimplePie/1.3.1 (Feed Parser; http://simplepie.org; Allow like Gecko) Build/20121030175911
2299
- bot:
2300
- name: SimplePie
2301
- url: http://www.simplepie.org
2302
- category: Feed Parser
2303
- producer:
2304
- name: ""
2305
- url: ""
2306
- -
2307
- user_agent: Site24x7
2308
- bot:
2309
- name: Site24x7 Website Monitoring
2310
- category: Site Monitor
2311
- url: https://www.site24x7.com/site24x7-faq.html
2312
- producer:
2313
- name: Site24x7
2314
- url: https://www.site24x7.com
2315
- -
2316
- user_agent: SiteSucker for macOS/2.10.5
2317
- bot:
2318
- name: SiteSucker
2319
- category: Crawler
2320
- url: http://ricks-apps.com/osx/sitesucker/
2321
- -
2322
- user_agent: sixy.ch/1.0
2323
- bot:
2324
- name: Sixy.ch
2325
- category: Site Monitor
2326
- url: http://sixy.ch
2327
- producer:
2328
- name: Manuel Kasper
2329
- url: https://neon1.net/
2330
- -
2331
- user_agent: Mozilla/5.0 (Windows NT 6.1; WOW64) SkypeUriPreview Preview/0.5
2332
- bot:
2333
- name: Skype URI Preview
2334
- category: Service Agent
2335
- url: ""
2336
- producer:
2337
- name: Skype Communications S.à.r.l.
2338
- url: https://www.skype.com
2339
- -
2340
- user_agent: Slackbot-LinkExpanding 1.0 (+https://api.slack.com/robots)
2341
- bot:
2342
- name: Slackbot
2343
- category: Crawler
2344
- url: https://api.slack.com/robots
2345
- producer:
2346
- name: Slack Technologies
2347
- url: http://slack.com
2348
- -
2349
- user_agent: 'AppEngine-Google; (+http://code.google.com/appengine; appid: s~snapchat-proxy)'
2350
- bot:
2351
- name: Snapchat Proxy
2352
- category: Crawler
2353
- url: https://www.snapchat.com
2354
- producer:
2355
- name: Snapchat Inc.
2356
- url: https://www.snapchat.com
2357
- -
2358
- user_agent: New-Sogou-Spider/1.0 (compatible; MSIE 5.5; Windows 98)
2359
- bot:
2360
- name: Sogou Spider
2361
- category: Search bot
2362
- url: http://www.sogou.com/docs/help/webmasters.htm
2363
- producer:
2364
- name: Sohu, Inc.
2365
- url: http://www.sogou.com
2366
- -
2367
- user_agent: Sogou inst spider/4.0(+http://www.sogou.com/docs/help/webmasters.htm
2368
- bot:
2369
- name: Sogou Spider
2370
- category: Search bot
2371
- url: http://www.sogou.com/docs/help/webmasters.htm
2372
- producer:
2373
- name: Sohu, Inc.
2374
- url: http://www.sogou.com
2375
- -
2376
- user_agent: Sogou Pic Spider/3.0(+http://www.sogou.com/docs/help/webmasters.htm
2377
- bot:
2378
- name: Sogou Spider
2379
- category: Search bot
2380
- url: http://www.sogou.com/docs/help/webmasters.htm
2381
- producer:
2382
- name: Sohu, Inc.
2383
- url: http://www.sogou.com
2384
- -
2385
- user_agent: Sogou web spider/4.0(+http://www.sogou.com/docs/help/webmasters.htm
2386
- bot:
2387
- name: Sogou Spider
2388
- category: Search bot
2389
- url: http://www.sogou.com/docs/help/webmasters.htm
2390
- producer:
2391
- name: Sohu, Inc.
2392
- url: http://www.sogou.com
2393
- -
2394
- user_agent: Sosospider+(+http://help.soso.com/webspider.htm)
2395
- bot:
2396
- name: Soso Spider
2397
- category: Search bot
2398
- url: http://help.soso.com/webspider.htm
2399
- producer:
2400
- name: Tencent Holdings
2401
- url: http://www.soso.com
2402
- -
2403
- user_agent: Mozilla/5.0 (Macintosh; Intel Mac OS X 10_11_6) AppleWebKit/537.36 (KHTML, like Gecko) Sparkler/0.2.0-SNAPSHOT
2404
- bot:
2405
- name: Sparkler
2406
- category: Crawler
2407
- url: https://github.com/USCDataScience/sparkler
2408
- -
2409
- user_agent: Mozilla/5.0 (X11; U; Linux x86_64; en-US; rv:1.9.0.19; aggregator:Spinn3r (Spinn3r 3.1); http://spinn3r.com/robot) Gecko/2010040121 Firefox/3.0.19
2410
- bot:
2411
- name: Spinn3r
2412
- category: Crawler
2413
- url: http://spinn3r.com/robot
2414
- producer:
2415
- name: Tailrank Inc
2416
- url: http://spinn3r.com
2417
- -
2418
- user_agent: Spotify/1.0
2419
- bot:
2420
- name: Spotify
2421
- producer:
2422
- name: Spotify
2423
- url: https://www.spotify.com
2424
- -
2425
- user_agent: Mozilla/5.0 (compatible; SputnikBot/2.2)
2426
- bot:
2427
- name: Sputnik Bot
2428
- category: ""
2429
- url: ""
2430
- producer:
2431
- name: ""
2432
- url: ""
2433
- -
2434
- user_agent: Mozilla/5.0 (compatible; SputnikImageBot/2.2)
2435
- bot:
2436
- name: Sputnik Bot
2437
- category: ""
2438
- url: ""
2439
- producer:
2440
- name: ""
2441
- url: ""
2442
- -
2443
- user_agent: Mozilla/5.0 (Windows NT 6.2; WOW64) AppleWebKit/537.4 (KHTML, like Gecko) Chrome/98 Safari/537.4 (StatusCake)
2444
- bot:
2445
- name: StatusCake
2446
- category: Site Monitor
2447
- url: https://www.statuscake.com
2448
- producer:
2449
- name: StatusCake
2450
- url: https://www.statuscake.com
2451
- -
2452
- user_agent: 'Superfeedr bot/2.0 http://superfeedr.com - Make your feeds realtime: get in touch!'
2453
- bot:
2454
- name: Superfeedr Bot
2455
- category: Feed Fetcher
2456
- url: ""
2457
- producer:
2458
- name: Superfeedr
2459
- url: https://superfeedr.com/
2460
- -
2461
- user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1; en; rv:1.9.0.13) Gecko/2009073022 Firefox/3.5.2 (.NET CLR 3.5.30729) SurveyBot/2.3 (DomainTools)
2462
- bot:
2463
- name: Survey Bot
2464
- category: Search bot
2465
- url: http://www.domaintools.com/webmasters/surveybot.php
2466
- producer:
2467
- name: Domain Tools
2468
- url: http://www.domaintools.com
2469
- -
2470
- user_agent: TLSProbe/1.0 (+https://scan.trustnet.venafi.com/)
2471
- bot:
2472
- name: TLSProbe
2473
- url: https://scan.trustnet.venafi.com/
2474
- category: Security search bot
2475
- producer:
2476
- name: Venafi TrustNet
2477
- url: https://www.venafi.com
2478
- -
2479
- user_agent: Tarmot Gezgin/1.0 (compatible; TarmotGezgin/1.1; +http://www.tarmot.com/gezgin)
2480
- bot:
2481
- name: Tarmot Gezgin
2482
- url: http://www.tarmot.com/gezgin/
2483
- category: Search bot
2484
- -
2485
- user_agent: TelegramBot (like TwitterBot)
2486
- bot:
2487
- name: TelegramBot
2488
- url: https://telegram.org/blog/bot-revolution
2489
- -
2490
- user_agent: TinEye-bot/0.02 (see http://www.tineye.com/crawler.html)
2491
- bot:
2492
- name: TinEye Crawler
2493
- category: Search bot
2494
- url: http://www.tineye.com/crawler.html
2495
- producer:
2496
- name: Idée Inc.
2497
- url: http://ideeinc.com
2498
- -
2499
- user_agent: Tiny Tiny RSS/1.10 (http://tt-rss.org/)
2500
- bot:
2501
- name: Tiny Tiny RSS
2502
- url: http://tt-rss.org
2503
- category: Feed Fetcher
2504
- producer:
2505
- name: ""
2506
- url: ""
2507
- -
2508
- user_agent: Tiny Tiny RSS/1.11.4c63934 (http://tt-rss.org/)
2509
- bot:
2510
- name: Tiny Tiny RSS
2511
- url: http://tt-rss.org
2512
- category: Feed Fetcher
2513
- producer:
2514
- name: ""
2515
- url: ""
2516
- -
2517
- user_agent: Mozilla/5.0 (Windows; U; Windows NT 6.0; en-GB; rv:1.0; trendictionbot0.5.0; trendiction search; http://www.trendiction.de/bot; please let us know of any problems; web at trendiction.com) Gecko/20071127 Firefox/3.0.0.11
2518
- bot:
2519
- name: Trendiction Bot
2520
- category: Crawler
2521
- url: http://www.trendiction.de/bot
2522
- producer:
2523
- name: Talkwalker Inc.
2524
- url: http://www.talkwalker.com
2525
- -
2526
- user_agent: TurnitinBot/3.0 (http://www.turnitin.com/robot/crawlerinfo.html)
2527
- bot:
2528
- name: TurnitinBot
2529
- category: Crawler
2530
- url: http://www.turnitin.com/robot/crawlerinfo.html
2531
- producer:
2532
- name: iParadigms, LLC.
2533
- url: http://www.turnitin.com
2534
- -
2535
- user_agent: Mozilla/5.0 (compatible; TweetedTimes Bot/1.0; +http://tweetedtimes.com)
2536
- bot:
2537
- name: TweetedTimes Bot
2538
- category: Crawler
2539
- url: http://tweetedtimes.com
2540
- producer:
2541
- name: TweetedTimes
2542
- url: http://tweetedtimes.com/
2543
- -
2544
- user_agent: TweetedTimes Bot/1.0 (Mozilla/5.0 Compatible, +http://tweetedtimes.com)
2545
- bot:
2546
- name: TweetedTimes Bot
2547
- category: Crawler
2548
- url: http://tweetedtimes.com
2549
- producer:
2550
- name: TweetedTimes
2551
- url: http://tweetedtimes.com/
2552
- -
2553
- user_agent: Mozilla/5.0 (compatible; TweetmemeBot/3.0; +http://tweetmeme.com/)
2554
- bot:
2555
- name: Tweetmeme Bot
2556
- category: Crawler
2557
- url: http://tweetmeme.com/
2558
- producer:
2559
- name: Mediasift
2560
- url: ""
2561
- -
2562
- user_agent: Twitterbot/1.0
2563
- bot:
2564
- name: Twitterbot
2565
- category: Social Media Agent
2566
- url: https://dev.twitter.com/docs/cards/getting-started
2567
- producer:
2568
- name: Twitter
2569
- url: http://www.twitter.com
2570
- -
2571
- user_agent: Mozilla/5.0 (compatible; URLAppendBot/1.0; +http://www.profound.net/urlappendbot.html)
2572
- bot:
2573
- name: URLAppendBot
2574
- category: Crawler
2575
- url: http://www.profound.net/urlappendbot.html
2576
- producer:
2577
- name: Profound Networks
2578
- url: http://www.profound.net
2579
- -
2580
- user_agent: 'Mozilla/5.0 (Windows NT 10.0) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/55.0.2883.87 Safari/537.36 (via secureurl.fwdcdn.com - mail.ukr.net proxy)'
2581
- bot:
2582
- name: UkrNet Mail Proxy
2583
- category: Crawler
2584
- url: ""
2585
- producer:
2586
- name: UkrNet Ltd
2587
- url: https://www.ukr.net/
2588
- -
2589
- user_agent: UniversalFeedParser/5.2.1 +https://code.google.com/p/feedparser/
2590
- bot:
2591
- name: UniversalFeedParser
2592
- category: Feed Fetcher
2593
- url: https://github.com/kurtmckee/feedparser
2594
- producer:
2595
- name: Kurt McKee
2596
- url: https://github.com/kurtmckee
2597
- -
2598
- user_agent: Mozilla/5.0+(compatible; UptimeRobot/2.0; http://www.uptimerobot.com/)
2599
- bot:
2600
- name: Uptime Robot
2601
- category: Site Monitor
2602
- url: ""
2603
- producer:
2604
- name: Uptime Robot
2605
- url: http://uptimerobot.com
2606
- -
2607
- user_agent: Mozilla/5.0 (compatible; Uptimebot/1.0; +http://www.uptime.com/uptimebot)
2608
- bot:
2609
- name: Uptimebot
2610
- category: Site Monitor
2611
- url: https://uptime.com/uptimebot
2612
- producer:
2613
- name: Uptime
2614
- url: https://uptime.com
2615
- -
2616
- user_agent: Mozilla/5.0 (compatible; vkShare; +http://vk.com/dev/Share)
2617
- bot:
2618
- name: VK Share Button
2619
- category: Crawler
2620
- url: http://vk.com/dev/Share
2621
- producer:
2622
- name: VK
2623
- url: http://vk.com/
2624
- -
2625
- user_agent: 'Mozilla/4.0 (compatible; Vagabondo/4.0; http://webagent.wise-guys.nl/; http://www.wise-guys.nl/)'
2626
- bot:
2627
- name: Vagabondo
2628
- category: Crawler
2629
- url: ""
2630
- producer:
2631
- name: WiseGuys
2632
- url: http://www.wise-guys.nl/
2633
- -
2634
- user_agent: Mozilla/5.0 (compatible; VSMCrawler; http://www.visualsitemapper.com/crawler/)
2635
- bot:
2636
- name: Visual Site Mapper Crawler
2637
- category: Crawler
2638
- url: http://www.visualsitemapper.com/crawler
2639
- producer:
2640
- name: Alentum Software Ltd.
2641
- url: http://www.alentum.com
2642
- -
2643
- user_agent: 'Jigsaw/2.3.0 W3C_CSS_Validator_JFouffa/2.0 (See <http://validator.w3.org/services>)'
2644
- bot:
2645
- name: W3C CSS Validator
2646
- category: Validator
2647
- url: http://jigsaw.w3.org/css-validator
2648
- producer:
2649
- name: W3C
2650
- url: http://www.w3.org
2651
- -
2652
- user_agent: W3C_I18n-Checker/1.0 (http://validator.w3.org/services)
2653
- bot:
2654
- name: W3C I18N Checker
2655
- category: Validator
2656
- url: http://validator.w3.org/i18n-checker
2657
- producer:
2658
- name: W3C
2659
- url: http://www.w3.org
2660
- -
2661
- user_agent: 'W3C-checklink/4.0 [4.4] libwww-perl/5.803'
2662
- bot:
2663
- name: W3C Link Checker
2664
- category: Validator
2665
- url: http://validator.w3.org/checklink
2666
- producer:
2667
- name: W3C
2668
- url: http://www.w3.org
2669
- -
2670
- user_agent: W3C-checklink/4.81 libwww-perl/5.836
2671
- bot:
2672
- name: W3C Link Checker
2673
- category: Validator
2674
- url: http://validator.w3.org/checklink
2675
- producer:
2676
- name: W3C
2677
- url: http://www.w3.org
2678
- -
2679
- user_agent: Validator.nu/LV http://validator.w3.org/services
2680
- bot:
2681
- name: W3C Markup Validation Service
2682
- category: Validator
2683
- url: http://validator.w3.org/services
2684
- producer:
2685
- name: W3C
2686
- url: http://www.w3.org
2687
- -
2688
- user_agent: W3C_Validator/1.3 http://validator.w3.org/services
2689
- bot:
2690
- name: W3C Markup Validation Service
2691
- category: Validator
2692
- url: http://validator.w3.org/services
2693
- producer:
2694
- name: W3C
2695
- url: http://www.w3.org
2696
- -
2697
- user_agent: W3C_Validator/1.767
2698
- bot:
2699
- name: W3C Markup Validation Service
2700
- category: Validator
2701
- url: http://validator.w3.org/services
2702
- producer:
2703
- name: W3C
2704
- url: http://www.w3.org
2705
- -
2706
- user_agent: W3C-mobileOK/DDC-1.0 (see http://www.w3.org/2006/07/mobileok-ddc)
2707
- bot:
2708
- name: W3C MobileOK Checker
2709
- category: Validator
2710
- url: http://validator.w3.org/mobile
2711
- producer:
2712
- name: W3C
2713
- url: http://www.w3.org
2714
- -
2715
- user_agent: W3C_Unicorn/1.0 (http://validator.w3.org/services)
2716
- bot:
2717
- name: W3C Unified Validator
2718
- category: Validator
2719
- url: http://validator.w3.org/unicorn
2720
- producer:
2721
- name: W3C
2722
- url: http://www.w3.org
2723
- -
2724
- user_agent: Mozilla/5.0 (compatible; Wappalyzer; +https://github.com/AliasIO/Wappalyzer)
2725
- bot:
2726
- name: Wappalyzer
2727
- url: https://github.com/AliasIO/Wappalyzer
2728
- producer:
2729
- name: AliasIO
2730
- url: https://github.com/AliasIO
2731
- -
2732
- user_agent: WeSEE:Search/0.1 (Alpha, http://www.wesee.com/en/support/bot/)
2733
- bot:
2734
- name: WeSEE:Search
2735
- category: Search bot
2736
- url: http://www.wesee.com/bot
2737
- producer:
2738
- name: WeSEE Ltd
2739
- url: http://www.wesee.com
2740
- -
2741
- user_agent: Mozilla/5.0 (Linux; Android 6.0.1; Moto G (4) Build/MPJ24.139-64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/65.0.3325.146 Mobile Safari/537.36 PTST/180829.190838
2742
- bot:
2743
- name: WebPageTest
2744
- category: Site Monitor
2745
- url: https://www.webpagetest.org
2746
- -
2747
- user_agent: websitepulse checker/1.1 (compatible; MSIE 5.5; Netscape 4.75; Linux)
2748
- bot:
2749
- name: WebSitePulse
2750
- category: Site Monitor
2751
- url: http://badcheese.com/crawler.html
2752
- producer:
2753
- name: WebSitePulse
2754
- url: http://www.websitepulse.com/
2755
- -
2756
- user_agent: WebbCrawler 1.0 ( http://badcheese.com/crawler.html )
2757
- bot:
2758
- name: WebbCrawler
2759
- category: Crawler
2760
- url: http://badcheese.com/crawler.html
2761
- producer:
2762
- name: Steve Webb
2763
- url: http://badcheese.com
2764
- -
2765
- user_agent: WordPress/4.7.2; https://example.com
2766
- bot:
2767
- name: WordPress
2768
- category: Service Agent
2769
- url: https://wordpress.org/
2770
- producer:
2771
- name: Wordpress.org
2772
- url: https://wordpress.org/
2773
- -
2774
- user_agent: Wotbox/2.01 (+http://www.wotbox.com/bot/)
2775
- bot:
2776
- name: Wotbox
2777
- category: Search bot
2778
- url: http://www.wotbox.com/bot/
2779
- producer:
2780
- name: Wotbox
2781
- url: http://www.wotbox.com
2782
- -
2783
- user_agent: yacybot (freeworld/global; amd64 Linux 3.2.0-4-amd64; java 1.7.0_25; Europe/en) http://yacy.net/bot.html
2784
- bot:
2785
- name: YaCy
2786
- category: Search bot
2787
- url: http://yacy.net/bot.html
2788
- producer:
2789
- name: YaCy
2790
- url: http://yacy.net
2791
- -
2792
- user_agent: yacybot (freeworld/global; x86 Windows XP 5.1; java 1.7.0_21; GMT+04:00/ru) http://yacy.net/bot.html
2793
- bot:
2794
- name: YaCy
2795
- category: Search bot
2796
- url: http://yacy.net/bot.html
2797
- producer:
2798
- name: YaCy
2799
- url: http://yacy.net
2800
- -
2801
- user_agent: Mozilla/5.0 (compatible; Yahoo Ad monitoring; https://help.yahoo.com/kb/yahoo-ad-monitoring-SLN24857.html)
2802
- bot:
2803
- name: Yahoo Gemini
2804
- category: Crawler
2805
- url: https://help.yahoo.com/kb/yahoo-ad-monitoring-SLN24857.html
2806
- producer:
2807
- name: Yahoo! Inc.
2808
- url: http://www.yahoo.com
2809
- -
2810
- user_agent: Mozilla/5.0 (compatible; Yahoo Link Preview; https://help.yahoo.com/kb/mail/yahoo-link-preview-SLN23615.html)
2811
- bot:
2812
- name: Yahoo! Link Preview
2813
- category: Crawler
2814
- url: https://help.yahoo.com/kb/mail/yahoo-link-preview-SLN23615.html
2815
- producer:
2816
- name: Yahoo! Inc.
2817
- url: http://www.yahoo.com
2818
- -
2819
- user_agent: Yahoo:LinkExpander:Slingstone
2820
- bot:
2821
- name: Yahoo! Link Preview
2822
- category: Crawler
2823
- url: https://help.yahoo.com/kb/mail/yahoo-link-preview-SLN23615.html
2824
- producer:
2825
- name: Yahoo! Inc.
2826
- url: http://www.yahoo.com
2827
- -
2828
- user_agent: Mozilla/5.0 (compatible; Yahoo! Slurp/3.0; http://help.yahoo.com/help/us/ysearch/slurp) NOT Firefox/3.5
2829
- bot:
2830
- name: Yahoo! Slurp
2831
- category: Search bot
2832
- url: http://help.yahoo.com/ysearch/slurp
2833
- producer:
2834
- name: Yahoo! Inc.
2835
- url: http://www.yahoo.com
2836
- -
2837
- user_agent: Mozilla/5.0 (compatible; Yahoo! Slurp; http://help.yahoo.com/help/us/ysearch/slurp)
2838
- bot:
2839
- name: Yahoo! Slurp
2840
- category: Search bot
2841
- url: http://help.yahoo.com/ysearch/slurp
2842
- producer:
2843
- name: Yahoo! Inc.
2844
- url: http://www.yahoo.com
2845
- -
2846
- user_agent: Mozilla/5.0 (compatible; Linux i686; Yandex.Gazeta Bot/1.0; +http://gazeta.yandex.ru)
2847
- bot:
2848
- name: Yandex Bot
2849
- category: Search bot
2850
- url: http://www.yandex.com/bots
2851
- producer:
2852
- name: Yandex LLC
2853
- url: http://company.yandex.com
2854
- -
2855
- user_agent: Mozilla/5.0 (compatible; YaDirectFetcher/1.0; +http://yandex.com/bots)
2856
- bot:
2857
- name: Yandex Bot
2858
- category: Search bot
2859
- url: http://www.yandex.com/bots
2860
- producer:
2861
- name: Yandex LLC
2862
- url: http://company.yandex.com
2863
- -
2864
- user_agent: Mozilla/5.0 (compatible; YandexAntivirus/2.0; +http://yandex.com/bots)
2865
- bot:
2866
- name: Yandex Bot
2867
- category: Search bot
2868
- url: http://www.yandex.com/bots
2869
- producer:
2870
- name: Yandex LLC
2871
- url: http://company.yandex.com
2872
- -
2873
- user_agent: Mozilla/5.0 (compatible; YandexAntivirus/2.0; +http://yandex.com/bots)
2874
- bot:
2875
- name: Yandex Bot
2876
- category: Search bot
2877
- url: http://www.yandex.com/bots
2878
- producer:
2879
- name: Yandex LLC
2880
- url: http://company.yandex.com
2881
- -
2882
- user_agent: Mozilla/5.0 (compatible; YandexBlogs/0.99; robot; B; +http://yandex.com/bots)
2883
- bot:
2884
- name: Yandex Bot
2885
- category: Search bot
2886
- url: http://www.yandex.com/bots
2887
- producer:
2888
- name: Yandex LLC
2889
- url: http://company.yandex.com
2890
- -
2891
- user_agent: Mozilla/5.0 (compatible; YandexBlogs/0.99; robot; B; +http://yandex.com/bots)
2892
- bot:
2893
- name: Yandex Bot
2894
- category: Search bot
2895
- url: http://www.yandex.com/bots
2896
- producer:
2897
- name: Yandex LLC
2898
- url: http://company.yandex.com
2899
- -
2900
- user_agent: Mozilla/5.0 (compatible; YandexBot/3.0; +http://yandex.com/bots)
2901
- bot:
2902
- name: Yandex Bot
2903
- category: Search bot
2904
- url: http://www.yandex.com/bots
2905
- producer:
2906
- name: Yandex LLC
2907
- url: http://company.yandex.com
2908
- -
2909
- user_agent: Mozilla/5.0 (compatible; YandexDirect/3.0; +http://yandex.com/bots)
2910
- bot:
2911
- name: Yandex Bot
2912
- category: Search bot
2913
- url: http://www.yandex.com/bots
2914
- producer:
2915
- name: Yandex LLC
2916
- url: http://company.yandex.com
2917
- -
2918
- user_agent: Mozilla/5.0 (compatible; YandexFavicons/1.0; +http://yandex.com/bots)
2919
- bot:
2920
- name: Yandex Bot
2921
- category: Search bot
2922
- url: http://www.yandex.com/bots
2923
- producer:
2924
- name: Yandex LLC
2925
- url: http://company.yandex.com
2926
- -
2927
- user_agent: Mozilla/5.0 (compatible; YandexImageResizer/2.0; +http://yandex.com/bots)
2928
- bot:
2929
- name: Yandex Bot
2930
- category: Search bot
2931
- url: http://www.yandex.com/bots
2932
- producer:
2933
- name: Yandex LLC
2934
- url: http://company.yandex.com
2935
- -
2936
- user_agent: Mozilla/5.0 (compatible; YandexImages/3.0; +http://yandex.com/bots)
2937
- bot:
2938
- name: Yandex Bot
2939
- category: Search bot
2940
- url: http://www.yandex.com/bots
2941
- producer:
2942
- name: Yandex LLC
2943
- url: http://company.yandex.com
2944
- -
2945
- user_agent: Mozilla/5.0 (compatible; YandexMetrika/2.0; +http://yandex.com/bots)
2946
- bot:
2947
- name: Yandex Bot
2948
- category: Search bot
2949
- url: http://www.yandex.com/bots
2950
- producer:
2951
- name: Yandex LLC
2952
- url: http://company.yandex.com
2953
- -
2954
- user_agent: Mozilla/5.0 (compatible; YandexNews/3.0; +http://yandex.com/bots)
2955
- bot:
2956
- name: Yandex Bot
2957
- category: Search bot
2958
- url: http://www.yandex.com/bots
2959
- producer:
2960
- name: Yandex LLC
2961
- url: http://company.yandex.com
2962
- -
2963
- user_agent: Mozilla/5.0 (compatible; YandexNewslinks; +http://yandex.com/bots)
2964
- bot:
2965
- name: Yandex Bot
2966
- category: Search bot
2967
- url: http://www.yandex.com/bots
2968
- producer:
2969
- name: Yandex LLC
2970
- url: http://company.yandex.com
2971
- -
2972
- user_agent: Mozilla/5.0 (compatible; YandexVerticals/1.0; http://yandex.com/bots)
2973
- bot:
2974
- name: Yandex Bot
2975
- category: Search bot
2976
- url: http://www.yandex.com/bots
2977
- producer:
2978
- name: Yandex LLC
2979
- url: http://company.yandex.com
2980
- -
2981
- user_agent: Yeti/1.1 (Naver Corp.; http://help.naver.com/robots/)
2982
- bot:
2983
- name: Yeti/Naverbot
2984
- category: Search bot
2985
- url: http://help.naver.com/robots/
2986
- producer:
2987
- name: Naver
2988
- url: http://www.naver.com
2989
- -
2990
- user_agent: Mozilla/5.0 (compatible; YoudaoBot/1.0; http://www.youdao.com/help/webmaster/spider/; )
2991
- bot:
2992
- name: Youdao Bot
2993
- category: Search bot
2994
- url: http://www.youdao.com/help/webmaster/spider
2995
- producer:
2996
- name: NetEase, Inc.
2997
- url: http://corp.163.com
2998
- -
2999
- user_agent: YOURLS v1.5.1 +http://yourls.org/ (running on http://fhort.com)
3000
- bot:
3001
- name: Yourls
3002
- category: Crawler
3003
- url: http://yourls.org
3004
- -
3005
- user_agent: Mozilla/5.0 (compatible; YRSpider; +http://www.yunrang.com/yrspider.html)
3006
- bot:
3007
- name: Yunyun Bot
3008
- category: Search bot
3009
- url: http://www.yunyun.com/SiteInfo.php?r=about
3010
- producer:
3011
- name: YunYun
3012
- url: http://www.yunyun.com
3013
- -
3014
- user_agent: Mozilla/5.0 (compatible; YRSpider; +http://www.yunyun.com/SiteInfo.php?r=about)
3015
- bot:
3016
- name: Yunyun Bot
3017
- category: Search bot
3018
- url: http://www.yunyun.com/SiteInfo.php?r=about
3019
- producer:
3020
- name: YunYun
3021
- url: http://www.yunyun.com
3022
- -
3023
- user_agent: Mozilla/5.0 (compatible; YYSpider; +http://www.yunyun.com/spider.html)
3024
- bot:
3025
- name: Yunyun Bot
3026
- category: Search bot
3027
- url: http://www.yunyun.com/SiteInfo.php?r=about
3028
- producer:
3029
- name: YunYun
3030
- url: http://www.yunyun.com
3031
- -
3032
- user_agent: Zao/0.1 (http://www.kototol.org/zao)
3033
- bot:
3034
- name: Zao
3035
- category: Crawler
3036
- -
3037
- user_agent: Zookabot/2.5;++http://zookabot.com
3038
- bot:
3039
- name: Zookabot
3040
- category: Crawler
3041
- url: http://zookabot.com
3042
- producer:
3043
- name: Hwacha ApS
3044
- url: http://hwacha.dk
3045
- -
3046
- user_agent: Mozilla/5.0 (compatible; ZumBot/1.0; http://help.zum.com/inquiry)
3047
- bot:
3048
- name: ZumBot
3049
- category: Search bot
3050
- url: http://help.zum.com/inquiry
3051
- producer:
3052
- name: ZUM internet
3053
- url: http://www.zuminternet.com/
3054
- -
3055
- user_agent: ZumBot/1.0 (ZUM Search; http://help.zum.com/inquiry)
3056
- bot:
3057
- name: ZumBot
3058
- category: Search bot
3059
- url: http://help.zum.com/inquiry
3060
- producer:
3061
- name: ZUM internet
3062
- url: http://www.zuminternet.com/
3063
- -
3064
- user_agent: AhrefsBot.Feeds v0.1; http://ahrefs.com/
3065
- bot:
3066
- name: aHrefs Bot
3067
- category: Crawler
3068
- url: http://ahrefs.com/robot
3069
- producer:
3070
- name: Ahrefs Pte Ltd
3071
- url: http://ahrefs.com/robot
3072
- -
3073
- user_agent: Mozilla/5.0 (compatible; AhrefsBot/3.1; +http://ahrefs.com/robot/
3074
- bot:
3075
- name: aHrefs Bot
3076
- category: Crawler
3077
- url: http://ahrefs.com/robot
3078
- producer:
3079
- name: Ahrefs Pte Ltd
3080
- url: http://ahrefs.com/robot
3081
- -
3082
- user_agent: Mozilla/5.0 (compatible; AhrefsBot/5.0; +http://ahrefs.com/robot/)
3083
- bot:
3084
- name: aHrefs Bot
3085
- category: Crawler
3086
- url: http://ahrefs.com/robot
3087
- producer:
3088
- name: Ahrefs Pte Ltd
3089
- url: http://ahrefs.com/robot
3090
- -
3091
- user_agent: 'Mozilla/5.0 (compatible; AhrefsBot/5.0; +http://ahrefs.com/robot/) AppEngine-Google; (+http://code.google.com/appengine; appid: s~proxyfile1-hrd)'
3092
- bot:
3093
- name: aHrefs Bot
3094
- category: Crawler
3095
- url: http://ahrefs.com/robot
3096
- producer:
3097
- name: Ahrefs Pte Ltd
3098
- url: http://ahrefs.com/robot
3099
- -
3100
- user_agent: Mozilla/5.0 (compatible; archive.org_bot +http://www.archive.org/details/archive.org_bot)
3101
- bot:
3102
- name: archive.org bot
3103
- category: Crawler
3104
- url: http://www.archive.org/details/archive.org_bot
3105
- producer:
3106
- name: The Internet Archive
3107
- url: http://www.archive.org
3108
- -
3109
- user_agent: Mozilla/5.0 (compatible; archive.org_bot/3.3.0 +http://pandora.nla.gov.au/crawl.html)
3110
- bot:
3111
- name: archive.org bot
3112
- category: Crawler
3113
- url: http://www.archive.org/details/archive.org_bot
3114
- producer:
3115
- name: The Internet Archive
3116
- url: http://www.archive.org
3117
- -
3118
- user_agent: Mozilla/5.0 (compatible; archive.org_bot; Archive-It; +http://archive-it.org/files/site-owners.html)
3119
- bot:
3120
- name: archive.org bot
3121
- category: Crawler
3122
- url: http://www.archive.org/details/archive.org_bot
3123
- producer:
3124
- name: The Internet Archive
3125
- url: http://www.archive.org
3126
- -
3127
- user_agent: Mozilla/5.0 (compatible; archive.org_bot; Wayback Machine Live Record; +http://archive.org/details/archive.org_bot)
3128
- bot:
3129
- name: archive.org bot
3130
- category: Crawler
3131
- url: http://www.archive.org/details/archive.org_bot
3132
- producer:
3133
- name: The Internet Archive
3134
- url: http://www.archive.org
3135
- -
3136
- user_agent: Mozilla/5.0 (compatible; heritrix/3.1.2-SNAPSHOT-20131029-0036 +http://archive.org/details/archive.org_bot)
3137
- bot:
3138
- name: archive.org bot
3139
- category: Crawler
3140
- url: http://www.archive.org/details/archive.org_bot
3141
- producer:
3142
- name: The Internet Archive
3143
- url: http://www.archive.org
3144
- -
3145
- user_agent: Mozilla/5.0 (compatible; special_archiver/3.1.1 +http://www.archive.org/details/archive.org_bot)
3146
- bot:
3147
- name: archive.org bot
3148
- category: Crawler
3149
- url: http://www.archive.org/details/archive.org_bot
3150
- producer:
3151
- name: The Internet Archive
3152
- url: http://www.archive.org
3153
- -
3154
- user_agent: Mozilla/5.0 (compatible; special_archiver/3.2.0 +http://www.loc.gov/webarchiving/notice_to_webmasters.html)
3155
- bot:
3156
- name: archive.org bot
3157
- category: Crawler
3158
- url: http://www.archive.org/details/archive.org_bot
3159
- producer:
3160
- name: The Internet Archive
3161
- url: http://www.archive.org
3162
- -
3163
- user_agent: CCBot/2.0 (http://commoncrawl.org/faq/)
3164
- bot:
3165
- name: ccBot crawler
3166
- category: Crawler
3167
- url: http://commoncrawl.org/faq/
3168
- producer:
3169
- name: reddit inc.
3170
- url: http://www.reddit.com
3171
- -
3172
- user_agent: Mozilla/5.0 (compatible; evc-batch/2.0)
3173
- bot:
3174
- name: evc-batch
3175
- category: Crawler
3176
- url: ""
3177
- producer:
3178
- name: eVenture Capital Partners II, LLC
3179
- url: http://www.eventures.vc/
3180
- -
3181
- user_agent: masscan/1.0 (https://github.com/robertdavidgraham/masscan)
3182
- bot:
3183
- name: masscan
3184
- url: https://github.com/robertdavidgraham/masscan
3185
- category: Crawler
3186
- producer:
3187
- name: Robert Graham
3188
- url: https://github.com/robertdavidgraham
3189
- -
3190
- user_agent: 'sqlmap/1.1.8.2#dev (http://sqlmap.org)'
3191
- bot:
3192
- name: sqlmap
3193
- category: Security Checker
3194
- url: http://sqlmap.org/
3195
- producer:
3196
- name: sqlmap
3197
- url: http://sqlmap.org/
3198
- -
3199
- user_agent: 'BoardReader Blog Indexer(http://boardreader.com)'
3200
- bot:
3201
- name: BoardReader Blog Indexer
3202
- category: Crawler
3203
- producer:
3204
- name: BoardReader
3205
- url: http://boardreader.com/
3206
- -
3207
- user_agent: 'Nuzzel'
3208
- bot:
3209
- name: Nuzzel
3210
- category: Crawler
3211
- producer:
3212
- name: Nuzzel
3213
- url: https://www.nuzzel.com/
3214
- -
3215
- user_agent: 'Mozilla/5.0 eCairn-Grabber/1.0 (+http://ecairn.com/grabber)'
3216
- bot:
3217
- name: eCairn-Grabber
3218
- category: Crawler
3219
- producer:
3220
- name: eCairn
3221
- url: https://ecairn.com
3222
- -
3223
- user_agent: 'Mozilla/5.0/Firefox/42.0 - nbertaupete95(at)gmail.com'
3224
- bot:
3225
- name: nbertaupete95
3226
- category: Crawler
3227
- -
3228
- user_agent: 'Mozilla/5.0 (compatible; Twingly Recon; twingly.com)'
3229
- bot:
3230
- name: Twingly Recon
3231
- category: Crawler
3232
- producer:
3233
- name: Twingly
3234
- url: https://www.twingly.com
3235
- -
3236
- user_agent: 'Mozilla/5.0 (compatible; inoreader.com; 2 subscribers)'
3237
- bot:
3238
- name: inoreader
3239
- category: Feed Reader
3240
- url: https://www.inoreader.com
3241
- -
3242
- user_agent: 'Mozilla/5.0 (compatible; theoldreader.com; 1 subscribers; feed-id=aaa)'
3243
- bot:
3244
- name: theoldreader
3245
- category: Feed Reader
3246
- url: https://theoldreader.com
3247
- -
3248
- user_agent: 'The Knowledge AI'
3249
- bot:
3250
- name: The Knowledge AI
3251
- category: Crawler
3252
- -
3253
- user_agent: shopify-partner-homepage-scraper
3254
- bot:
3255
- name: Shopify Partner
3256
- category: Crawler
3257
- url: https://www.shopify.com/partners
3258
- producer:
3259
- name: Shopify
3260
- url: https://www.shopify.com/