device_detector 0.7.0 → 0.8.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (72) hide show
  1. checksums.yaml +4 -4
  2. data/Gemfile +4 -0
  3. data/Rakefile +12 -6
  4. data/device_detector.gemspec +1 -1
  5. data/lib/device_detector.rb +65 -4
  6. data/lib/device_detector/client.rb +6 -6
  7. data/lib/device_detector/device.rb +62 -31
  8. data/lib/device_detector/memory_cache.rb +1 -1
  9. data/lib/device_detector/metadata_extractor.rb +4 -13
  10. data/lib/device_detector/model_extractor.rb +10 -1
  11. data/lib/device_detector/name_extractor.rb +1 -1
  12. data/lib/device_detector/os.rb +141 -5
  13. data/lib/device_detector/parser.rb +23 -12
  14. data/lib/device_detector/version.rb +1 -1
  15. data/lib/device_detector/version_extractor.rb +1 -1
  16. data/regexes/bots.yml +36 -1
  17. data/regexes/{browser_engines.yml → client/browser_engine.yml} +4 -1
  18. data/regexes/{browsers.yml → client/browsers.yml} +31 -27
  19. data/regexes/{feed_readers.yml → client/feed_readers.yml} +0 -1
  20. data/regexes/{libraries.yml → client/libraries.yml} +1 -1
  21. data/regexes/{mediaplayers.yml → client/mediaplayers.yml} +1 -1
  22. data/regexes/{mobile_apps.yml → client/mobile_apps.yml} +0 -1
  23. data/regexes/{pim.yml → client/pim.yml} +1 -1
  24. data/regexes/{devices → device}/cameras.yml +1 -1
  25. data/regexes/{devices → device}/car_browsers.yml +0 -1
  26. data/regexes/{devices → device}/consoles.yml +0 -1
  27. data/regexes/{devices → device}/mobiles.yml +193 -49
  28. data/regexes/{devices/portable_media_players.yml → device/portable_media_player.yml} +0 -1
  29. data/regexes/{devices → device}/televisions.yml +0 -3
  30. data/regexes/oss.yml +105 -102
  31. data/regexes/vendorfragments.yml +70 -0
  32. data/spec/device_detector/bot_fixtures_spec.rb +30 -0
  33. data/spec/device_detector/client_fixtures_spec.rb +31 -0
  34. data/spec/device_detector/concrete_user_agent_spec.rb +41 -1
  35. data/spec/device_detector/detector_fixtures_spec.rb +56 -0
  36. data/spec/device_detector/device_fixtures_spec.rb +36 -0
  37. data/spec/device_detector/device_spec.rb +3 -3
  38. data/spec/device_detector/memory_cache_spec.rb +1 -1
  39. data/spec/device_detector/model_extractor_spec.rb +7 -7
  40. data/spec/device_detector/os_fixtures_spec.rb +26 -0
  41. data/spec/device_detector/version_extractor_spec.rb +10 -10
  42. data/spec/device_detector_spec.rb +1 -1
  43. data/spec/fixtures/client/browser.yml +986 -0
  44. data/spec/fixtures/client/feed_reader.yml +180 -0
  45. data/spec/fixtures/client/library.yml +78 -0
  46. data/spec/fixtures/client/mediaplayer.yml +144 -0
  47. data/spec/fixtures/client/mobile_app.yml +24 -0
  48. data/spec/fixtures/client/pim.yml +90 -0
  49. data/spec/fixtures/detector/bots.yml +716 -0
  50. data/spec/fixtures/detector/camera.yml +91 -0
  51. data/spec/fixtures/detector/car_browser.yml +19 -0
  52. data/spec/fixtures/detector/console.yml +253 -0
  53. data/spec/fixtures/detector/desktop.yml +4568 -0
  54. data/spec/fixtures/detector/feature_phone.yml +719 -0
  55. data/spec/fixtures/detector/feed_reader.yml +462 -0
  56. data/spec/fixtures/detector/mediaplayer.yml +141 -0
  57. data/spec/fixtures/detector/mobile_apps.yml +32 -0
  58. data/spec/fixtures/detector/phablet.yml +1095 -0
  59. data/spec/fixtures/detector/portable_media_player.yml +145 -0
  60. data/spec/fixtures/detector/smart_display.yml +19 -0
  61. data/spec/fixtures/detector/smartphone.yml +28673 -0
  62. data/spec/fixtures/detector/tablet.yml +13201 -0
  63. data/spec/fixtures/detector/tv.yml +1380 -0
  64. data/spec/fixtures/detector/unknown.yml +3536 -0
  65. data/spec/fixtures/device/camera.yml +18 -0
  66. data/spec/fixtures/device/car_browser.yml +6 -0
  67. data/spec/fixtures/device/console.yml +72 -0
  68. data/spec/fixtures/parser/bots.yml +2055 -0
  69. data/spec/fixtures/parser/oss.yml +607 -0
  70. data/spec/fixtures/parser/vendorfragments.yml +156 -0
  71. data/spec/spec_helper.rb +6 -2
  72. metadata +84 -17
@@ -0,0 +1,716 @@
1
+ -
2
+ user_agent: Mozilla/5.0 (compatible; MSIE 9.0; Windows NT 6.1; Trident/5.0); 360Spider
3
+ name: '360Spider'
4
+ -
5
+ user_agent: Mozilla/5.0 (Windows NT 6.1) AppleWebKit/537.1 (KHTML, like Gecko) Chrome/21.0.1180.89 Safari/537.1; 360Spider
6
+ name: '360Spider'
7
+ -
8
+ user_agent: Mozilla/4.0 (compatible; MSIE 8.0; Windows NT 6.1; Trident/4.0; SLCC2; .NET CLR 2.0.50727; .NET CLR 3.5.30729; .NET CLR 3.0.30729; Media Center PC 6.0; MDDR; .NET4.0C; .NET4.0E; .NET CLR 1.1.4322; Tablet PC 2.0); 360Spider
9
+ name: '360Spider'
10
+ -
11
+ user_agent: 360spider-image
12
+ name: '360Spider'
13
+ -
14
+ user_agent: Aboundex/0.3 (http://www.aboundex.com/crawler/)
15
+ name: 'Aboundexbot'
16
+ -
17
+ user_agent: Mozilla/5.0 (compatible; AcoonBot/4.11.1; +http://www.acoon.de/robot.asp)
18
+ name: 'Acoon'
19
+ -
20
+ user_agent: AddThis.com robot tech.support@clearspring.com
21
+ name: 'AddThis.com'
22
+ -
23
+ user_agent: Mozilla/5.0 (compatible; AhrefsBot/3.1; +http://ahrefs.com/robot/
24
+ name: 'aHrefs Bot'
25
+ -
26
+ user_agent: Mozilla/5.0 (compatible; AhrefsBot/5.0; +http://ahrefs.com/robot/)
27
+ name: 'aHrefs Bot'
28
+ -
29
+ user_agent: 'Mozilla/5.0 (compatible; AhrefsBot/5.0; +http://ahrefs.com/robot/) AppEngine-Google; (+http://code.google.com/appengine; appid: s~proxyfile1-hrd)'
30
+ name: 'aHrefs Bot'
31
+ -
32
+ user_agent: AhrefsBot.Feeds v0.1; http://ahrefs.com/
33
+ name: 'aHrefs Bot'
34
+ -
35
+ user_agent: ia_archiver (+http://www.alexa.com/site/help/webmasters; crawler@alexa.com)
36
+ name: 'Alexa Crawler'
37
+ -
38
+ user_agent: AmorankSpider/0.1; +http://amorank.com/webcrawler.html
39
+ name: 'Amorank Spider'
40
+ -
41
+ user_agent: Curious George - www.analyticsseo.com/crawler
42
+ name: 'Analytics SEO Crawler'
43
+ -
44
+ user_agent: Mozilla/5.0 (compatible; special_archiver/3.1.1 +http://www.archive.org/details/archive.org_bot)
45
+ name: 'archive.org bot'
46
+ -
47
+ user_agent: Mozilla/5.0 (compatible; special_archiver/3.2.0 +http://www.loc.gov/webarchiving/notice_to_webmasters.html)
48
+ name: 'archive.org bot'
49
+ -
50
+ user_agent: Mozilla/5.0 (compatible; archive.org_bot; Wayback Machine Live Record; +http://archive.org/details/archive.org_bot)
51
+ name: 'archive.org bot'
52
+ -
53
+ user_agent: Mozilla/5.0 (compatible; archive.org_bot/3.3.0 +http://pandora.nla.gov.au/crawl.html)
54
+ name: 'archive.org bot'
55
+ -
56
+ user_agent: Mozilla/5.0 (compatible; archive.org_bot; Archive-It; +http://archive-it.org/files/site-owners.html)
57
+ name: 'archive.org bot'
58
+ -
59
+ user_agent: Mozilla/5.0 (compatible; archive.org_bot +http://www.archive.org/details/archive.org_bot)
60
+ name: 'archive.org bot'
61
+ -
62
+ user_agent: Mozilla/5.0 (compatible; heritrix/3.1.2-SNAPSHOT-20131029-0036 +http://archive.org/details/archive.org_bot)
63
+ name: 'archive.org bot'
64
+ -
65
+ user_agent: Mozilla/2.0 (compatible; Ask Jeeves/Teoma)
66
+ name: 'Ask Jeeves'
67
+ -
68
+ user_agent: Backlink-Ceck.de (+http://www.backlink-check.de/bot.html)
69
+ name: 'Backlink-Ceck.de'
70
+ -
71
+ user_agent: BacklinkCrawler (http://www.backlinktest.com/crawler.html)
72
+ name: 'BacklinkCrawler'
73
+ -
74
+ user_agent: Mozilla/5.0 (compatible; Baiduspider/2.0; +http://www.baidu.com/search
75
+ name: 'Baidu Spider'
76
+ -
77
+ user_agent: Mozilla/5.0 (Linux;u;Android 2.3.7;zh-cn;) AppleWebKit/533.1 (KHTML,like Gecko) Version/4.0 Mobile Safari/533.1 (compatible; +http://www.baidu.com/search/spider.html)
78
+ name: 'Baidu Spider'
79
+ -
80
+ user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1; zh-CN; rv:1.9.2.8;baidu Transcoder) Gecko/20100722 Firefox/3.6.8 ( .NET CLR 3.5.30729)
81
+ name: 'Baidu Spider'
82
+ -
83
+ user_agent: Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.0; baidu Transcoder;)
84
+ name: 'Baidu Spider'
85
+ -
86
+ user_agent: Baiduspider-image+(+http://www.baidu.com/search/spider.htm)
87
+ name: 'Baidu Spider'
88
+ -
89
+ user_agent: Baiduspider+(+http://www.baidu.com/search/spider.htm)
90
+ name: 'Baidu Spider'
91
+ -
92
+ user_agent: Mozilla/5.0 (compatible; Baiduspider/2.0; +http://www.baidu.com/search/spider.html)
93
+ name: 'Baidu Spider'
94
+ -
95
+ user_agent: Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/534+ (KHTML, like Gecko) BingPreview/1.0b
96
+ name: 'BingBot'
97
+ -
98
+ user_agent: Mozilla/5.0 (compatible; bingbot/2.0; +http://www.bing.com/bingbot.htm)
99
+ name: 'BingBot'
100
+ -
101
+ user_agent: msnbot-media/1.1 (+http://search.msn.com/msnbot.htm)
102
+ name: 'BingBot'
103
+ -
104
+ user_agent: MSNBot/Nutch-1.5.1
105
+ name: 'BingBot'
106
+ -
107
+ user_agent: msnbot/2.0b v1394720947.6703
108
+ name: 'BingBot'
109
+ -
110
+ user_agent: msnbot/1.1 (+http://search.msn.com/msnbot.htm)
111
+ name: 'BingBot'
112
+ -
113
+ user_agent: msnbot/2.0b (+http://search.msn.com/msnbot.htm)
114
+ name: 'BingBot'
115
+ -
116
+ user_agent: msnbot-NewsBlogs/2.0b (+http://search.msn.com/msnbot.htm)
117
+ name: 'BingBot'
118
+ -
119
+ user_agent: Mozilla/5.0 (compatible; Blekkobot; ScoutJet; +http://blekko.com/about/blekkobot)
120
+ name: 'Blekkobot'
121
+ -
122
+ user_agent: Mozilla/5.0 (compatible; BLEXBot/1.0; +http://webmeup-crawler.com/)
123
+ name: 'BLEXBot Crawler'
124
+ -
125
+ user_agent: Mozilla/5.0 (compatible; BountiiBot/1.1; +http://bountii.com/contact.php)
126
+ name: 'Bountii Bot'
127
+ -
128
+ user_agent: Mozilla/5.0 (Macintosh; Butterfly/1.0; +http://labs.topsy.com/butterfly/) Gecko/2009032608 Firefox/3.0.8
129
+ name: 'Butterfly Robot'
130
+ -
131
+ user_agent: Mozilla/5.0 (compatible; Butterfly/1.0; +http://labs.topsy.com/butterfly/) Gecko/2009032608 Firefox/3.0.8
132
+ name: 'Butterfly Robot'
133
+ -
134
+ user_agent: Browsershots
135
+ name: 'Browsershots'
136
+ -
137
+ user_agent: Mozilla/5.0 (compatible; CareerBot/1.1; +http://www.career-x.de/bot.html)
138
+ name: 'CareerBot'
139
+ -
140
+ user_agent: CCBot/2.0 (http://commoncrawl.org/faq/)
141
+ name: 'ccBot crawler'
142
+ -
143
+ user_agent: Cliqzbot/0.1 (+http://cliqz.com/company/cliqzbot)
144
+ name: 'Cliqzbot'
145
+ -
146
+ user_agent: Mozilla/5.0 (compatible; CloudFlare-AlwaysOnline/1.0; +http://www.cloudflare.com/always-online) AppleWebKit/534.34
147
+ name: 'CloudFlare Always Online'
148
+ -
149
+ user_agent: Mozilla/5.0 (compatible; Dazoobot/0.1; +http://dazoo.fr)
150
+ name: 'Dazoobot'
151
+ -
152
+ user_agent: Mozilla/5.0 (compatible; discobot/1.0; +http://discoveryengine.com/discobot.html)
153
+ name: 'Discobot'
154
+ -
155
+ user_agent: dotbot
156
+ name: 'DotBot'
157
+ -
158
+ user_agent: Mozilla/5.0 (compatible; EasouSpider; +http://www.easou.com/search/spider.html)
159
+ name: 'Easou Spider'
160
+ -
161
+ user_agent: Mozilla/5.0 (iPhone; U; CPU iPhone OS 3_0 like Mac OS X; en-us; EasouSpider; +http://www.easou.com/search/spider.html)
162
+ name: 'Easou Spider'
163
+ -
164
+ user_agent: EMail Exractor
165
+ name: 'EMail Exractor'
166
+ -
167
+ user_agent: Mozilla/5.0 (compatible; Exabot/3.0; +http://www.exabot.com/go/robot)
168
+ name: 'ExaBot'
169
+ -
170
+ user_agent: Mozilla/5.0 (compatible; Exabot/3.0 (BiggerBetter); +http://www.exabot.com/go/robot)
171
+ name: 'ExaBot'
172
+ -
173
+ user_agent: Mozilla/5.0 (compatible; Konqueror/3.5; Linux) KHTML/3.5.5 (like Gecko) (Exabot-Thumbnails)
174
+ name: 'ExaBot'
175
+ -
176
+ user_agent: ExactSeek Crawler (nutch 1.4)/Nutch-1.4 (ExactSeek Crawler; http://www.exactseek.com)
177
+ name: 'ExactSeek Crawler'
178
+ -
179
+ user_agent: Mozilla/5.0 (compatible; Ezooms/1.0; help@moz.com)
180
+ name: 'Ezooms'
181
+ -
182
+ user_agent: facebookexternalhit/1.1 (+http://www.facebook.com/externalhit_uatext.php)
183
+ name: 'Facebook External Hit'
184
+ -
185
+ user_agent: facebookplatform/1.0 (+http://developers.facebook.com)
186
+ name: 'Facebook External Hit'
187
+ -
188
+ user_agent: Mozilla/5.0 (compatible; Genieo/1.0 http://www.genieo.com/webfilter.html)
189
+ name: 'Genieo Web filter'
190
+ -
191
+ user_agent: DoCoMo/2.0 P900i(c100;TB;W24H11) (compatible; ichiro/mobile goo; +http://search.goo.ne.jp/option/use/sub4/sub4-1/)
192
+ name: 'Goo'
193
+ -
194
+ user_agent: Mozilla/5.0 (iPhone; U; CPU iPhone OS 4_0_1 like Mac OS X; en-us) AppleWebKit/537.4 (KHTML, like Gecko; Google Page Speed Insights) Version/4.0.5 Mobile/8A306 Safari/6531.22.7
195
+ name: 'Google PageSpeed Insights'
196
+ -
197
+ user_agent: Googlebot/2.1 (http://www.googlebot.com/bot.html)
198
+ name: 'Googlebot'
199
+ -
200
+ user_agent: Googlebot/Nutch-1.7
201
+ name: 'Googlebot'
202
+ -
203
+ user_agent: Mozilla/5.0 AppleWebKit/537.36 (KHTML, like Gecko; compatible; Googlebot/2.1; +http://www.google.com/bot.html) Safari/537.36
204
+ name: 'Googlebot'
205
+ -
206
+ user_agent: Mozilla/5.0 (compatible; Googlebot/2.1; +http://www.google.com/bot.html)
207
+ name: 'Googlebot'
208
+ -
209
+ user_agent: Mozilla/5.0 (iPhone; CPU iPhone OS 6_0 like Mac OS X) AppleWebKit/536.26 (KHTML, like Gecko) Version/6.0 Mobile/10A5376e Safari/8536.25 (compatible; Googlebot-Mobile/2.1; +http://www.google.com/bot.html)
210
+ name: 'Googlebot'
211
+ -
212
+ user_agent: Googlebot-Image/1.0
213
+ name: 'Googlebot'
214
+ -
215
+ user_agent: Googlebot-Video/1.0
216
+ name: 'Googlebot'
217
+ -
218
+ user_agent: Googlebot (gocrawl v0.4)
219
+ name: 'Googlebot'
220
+ -
221
+ user_agent: Googlebot-News (2.3.3, ruby 1.9.3 (2013-11-22))
222
+ name: 'Googlebot'
223
+ -
224
+ user_agent: DoCoMo/2.0 N905i(c100;TB;W24H16) (compatible; Googlebot-Mobile/2.1; +http://www.google.com/bot.html)
225
+ name: 'Googlebot'
226
+ -
227
+ user_agent: SAMSUNG-SGH-E250/1.0 Profile/MIDP-2.0 Configuration/CLDC-1.1 UP.Browser/6.2.3.3.c.1.101 (GUI) MMP/2.0 (compatible; Googlebot-Mobile/2.1; +http://www.google.com/bot.html)
228
+ name: 'Googlebot'
229
+ -
230
+ user_agent: Mozilla/5.0 (compatible) Feedfetcher-Google;(+http://www.google.com/feedfetcher.html)
231
+ name: 'Googlebot'
232
+ -
233
+ user_agent: Feedfetcher-Google; (+http://www.google.com/feedfetcher.html; 2 subscribers; feed-id=17860707833818568603)
234
+ name: 'Googlebot'
235
+ -
236
+ user_agent: Feedfetcher-Google; (+http://www.google.com/feedfetcher.html; 19 subscribers; feed-id=13965549748850348809)
237
+ name: 'Googlebot'
238
+ -
239
+ user_agent: Feedfetcher-Google; (+http://www.google.com/feedfetcher.html; 375 subscribers; feed-id=15381863289700640853)
240
+ name: 'Googlebot'
241
+ -
242
+ user_agent: Mozilla/5.0 (Windows NT 6.1; rv:6.0) Gecko/20110814 Firefox/6.0 Google (+https://developers.google.com/+/web/snippet/)
243
+ name: 'Googlebot'
244
+ -
245
+ user_agent: GoogleProducer; (+http://goo.gl/7y4SX)
246
+ name: 'Googlebot'
247
+ -
248
+ user_agent: Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko; Google Web Preview) Chrome/27.0.1453 Safari/537.36
249
+ name: 'Googlebot'
250
+ -
251
+ user_agent: AdsBot-Google-Mobile (+http://www.google.com/mobile/adsbot.html) Mozilla (iPhone; U; CPU iPhone OS 3 0 like Mac OS X) AppleWebKit (KHTML, like Gecko) Mobile Safari
252
+ name: 'Googlebot'
253
+ -
254
+ user_agent: AdsBot-Google (+http://www.google.com/adsbot.html)
255
+ name: 'Googlebot'
256
+ -
257
+ user_agent: Mediapartners-Google
258
+ name: 'Googlebot'
259
+ -
260
+ user_agent: Mozilla/5.0 (compatible; heritrix/1.14.4 +http://www.dla-marbach.de)
261
+ name: 'Heritrix'
262
+ -
263
+ user_agent: Mozilla/5.0 (compatible; worio bot heritrix/1.10.0 +http://worio.com)
264
+ name: 'Heritrix'
265
+ -
266
+ user_agent: Mozilla/5.0 (compatible; heritrix/3.1.1 +http://www.baidu.com)
267
+ name: 'Heritrix'
268
+ -
269
+ user_agent: flieder - neofonie heritrix/1.14.3 (+http://spider.neofonie.de)
270
+ name: 'Heritrix'
271
+ -
272
+ user_agent: mozilla/5.0 (compatible; heritrix/1.3.0 http://archive.crawler.org)
273
+ name: 'Heritrix'
274
+ -
275
+ user_agent: Mozilla/5.0 (compatible; heritrix/3.1.2-SNAPSHOT-20130207.001528 +http://webarchiv.cz/kontakty/)
276
+ name: 'Heritrix'
277
+ -
278
+ user_agent: Mozilla/5.0 (compatible; heritrix/1.14.4 +http://webarhive.nlc.gov.cn)
279
+ name: 'Heritrix'
280
+ -
281
+ user_agent: Mozilla/5.0 (compatible; heritrix/3.1.1 +http://www.run4dom.com)
282
+ name: 'Heritrix'
283
+ -
284
+ user_agent: HTTPMon/1.0b (http://www.httpmon.com)
285
+ name: 'HTTPMon'
286
+ -
287
+ user_agent: iisbot/1.0 (+http://www.iis.net/iisbot.html)
288
+ name: 'IIS Site Analysis'
289
+ -
290
+ user_agent: Mozilla/5.0 (iPhone; U; CPU iPhone OS 4_1 like Mac OS X; en-us) AppleWebKit/532.9 (KHTML, like Gecko) Version/4.0.5 Mobile/8B117 Safari/6531.22.7 (compatible; linkdexbot-mobile/2.1; +http://www.linkdex.com/about/bots/)
291
+ name: 'Linkdex Bot'
292
+ -
293
+ user_agent: Mozilla/5.0 (compatible; linkdexbot/2.0; +http://www.linkdex.com/about/bots/)
294
+ name: 'Linkdex Bot'
295
+ -
296
+ user_agent: linkdex.com/v2.0 and linkdex.com/v2.1
297
+ name: 'Linkdex Bot'
298
+ -
299
+ user_agent: LinkedInBot/1.0 (compatible; Mozilla/5.0; Jakarta Commons-HttpClient/3.1 +http://www.linkedin.com)
300
+ name: 'LinkedIn Bot'
301
+ -
302
+ user_agent: Mozilla/5.0 (compatible; Linux x86_64; Mail.RU_Bot/2.0; +http://go.mail.ru/help/robots)
303
+ name: 'Mail.Ru Bot'
304
+ -
305
+ user_agent: Mozilla/5.0 (compatible; Linux x86_64; Mail.RU_Bot/Fast/2.0; +http://go.mail.ru/help/robots)
306
+ name: 'Mail.Ru Bot'
307
+ -
308
+ user_agent: magpie-crawler/1.1 (U; Linux amd64; en-GB; +http://www.brandwatch.net)
309
+ name: 'Magpie-Crawler'
310
+ -
311
+ user_agent: Mozilla/5.0 (compatible; meanpathbot/1.0; +http://www.meanpath.com/meanpathbot.html)
312
+ name: 'Meanpath Bot'
313
+ -
314
+ user_agent: Mozilla/5.0 (compatible; MixrankBot; crawler@mixrank.com)
315
+ name: 'Mixrank Bot'
316
+ -
317
+ user_agent: Mozilla/5.0 (compatible; MJ12bot/v1.4.4; http://www.majestic12.co.uk/bot.php?+)
318
+ name: 'MJ12 Bot'
319
+ -
320
+ user_agent: Mozilla/5.0 (compatible; MojeekBot/0.6; http://www.mojeek.com/bot.html)
321
+ name: 'MojeekBot'
322
+ -
323
+ user_agent: NalezenCzBot/1.0 (http://www.nalezen.cz/about-crawler)
324
+ name: 'NalezenCzBot'
325
+ -
326
+ user_agent: Mozilla/4.0 (compatible; Netcraft Web Server Survey)
327
+ name: 'Netcraft Survey Bot'
328
+ -
329
+ user_agent: nlcrawler/1.0 (+http://northernlight.com/)
330
+ name: 'NLCrawler'
331
+ -
332
+ user_agent: omgilibot/0.3 +http://www.omgili.com/Crawler.html
333
+ name: 'Omgili bot'
334
+ -
335
+ user_agent: Mozilla/5.0 (compatible; OpenindexSpider; +http://www.openindex.io/en/webmasters/spider.html)
336
+ name: 'Openindex Spider'
337
+ -
338
+ user_agent: Mozilla/5.0 (compatible; spbot/4.0.9; +http://OpenLinkProfiler.org/bot )
339
+ name: 'OpenLinkProfiler'
340
+ -
341
+ user_agent: OpenWebSpider v0.1.4 (http://www.openwebspider.org/)
342
+ name: 'OpenWebSpider'
343
+ -
344
+ user_agent: Mozilla/5.0 (compatible; PaperLiBot/2.1; http://support.paper.li/entries/20023257-what-is-paper-li)
345
+ name: 'PaperLiBot'
346
+ -
347
+ user_agent: psbot/0.1 (+http://www.picsearch.com/bot.html)
348
+ name: 'Picsearch bot'
349
+ -
350
+ user_agent: psbot-page (+http://www.picsearch.com/bot.html)
351
+ name: 'Picsearch bot'
352
+ -
353
+ user_agent: Pingdom.com_bot_version_1.4_(http://www.pingdom.com/)
354
+ name: 'Pingdom Bot'
355
+ -
356
+ user_agent: QuerySeekerSpider ( http://queryseeker.com/bot.html )
357
+ name: 'QuerySeekerSpider'
358
+ -
359
+ user_agent: Mozilla/5.0 (compatible; redditbot/1.0; +http://www.reddit.com/feedback)
360
+ name: 'Reddit Bot'
361
+ -
362
+ user_agent: Mozilla/5.0 (compatible; rogerBot/1.0; UrlCrawler; http://www.seomoz.org/dp/rogerbot)
363
+ name: 'Rogerbot'
364
+ -
365
+ user_agent: rogerbot/1.0 (http://moz.com/help/pro/what-is-rogerbot-, rogerbot-crawler+shiny@moz.com)
366
+ name: 'Rogerbot'
367
+ -
368
+ user_agent: rogerbot/1.0 (http://www.moz.com/dp/rogerbot, rogerbot-crawler@moz.com)
369
+ name: 'Rogerbot'
370
+ -
371
+ user_agent: Screaming Frog SEO Spider/2.22
372
+ name: 'Screaming Frog SEO Spider'
373
+ -
374
+ user_agent: ScreenerBot Crawler Beta 2.0 (+http://www.ScreenerBot.com)
375
+ name: 'ScreenerBot'
376
+ -
377
+ user_agent: Mozilla/5.0 (compatible; SemrushBot/0.97; +http://www.semrush.com/bot.html)
378
+ name: 'Semrush Bot'
379
+ -
380
+ user_agent: SensikaBot/x.33 (+http://sensika.com)
381
+ name: 'Sensika Bot'
382
+ -
383
+ user_agent: SEOENGWorldBot/1.0 (+http://www.seoengine.com/seoengbot.htm)
384
+ name: 'SEOENGBot'
385
+ -
386
+ user_agent: Mozilla/5.0 (compatible; SeznamBot/3.1-test1; +http://fulltext.sblog.cz/)
387
+ name: 'Seznam Bot'
388
+ -
389
+ user_agent: Mozilla/5.0 (compatible; SeznamBot/3.2-test1; +http://fulltext.sblog.cz/)
390
+ name: 'Seznam Bot'
391
+ -
392
+ user_agent: SeznamBot/3.0 (+http://fulltext.sblog.cz/)
393
+ name: 'Seznam Bot'
394
+ -
395
+ user_agent: Mozilla/5.0 (compatible; SeznamBot/3.2; +http://fulltext.sblog.cz/)
396
+ name: 'Seznam Bot'
397
+ -
398
+ user_agent: ShopWiki/1.0 ( +http://www.shopwiki.com/wiki/Help:Bot)
399
+ name: 'ShopWiki'
400
+ -
401
+ user_agent: Mozilla/5.0 (compatible; SISTRIX Crawler; http://crawler.sistrix.net/)
402
+ name: 'SISTRIX Crawler'
403
+ -
404
+ user_agent: Sogou web spider/4.0(+http://www.sogou.com/docs/help/webmasters.htm#07)
405
+ name: 'Sogou Spider'
406
+ -
407
+ user_agent: Sogou inst spider/4.0(+http://www.sogou.com/docs/help/webmasters.htm#07)
408
+ name: 'Sogou Spider'
409
+ -
410
+ user_agent: Sogou Pic Spider/3.0(+http://www.sogou.com/docs/help/webmasters.htm#07)
411
+ name: 'Sogou Spider'
412
+ -
413
+ user_agent: New-Sogou-Spider/1.0 (compatible; MSIE 5.5; Windows 98)
414
+ name: 'Sogou Spider'
415
+ -
416
+ user_agent: Sosospider+(+http://help.soso.com/webspider.htm)
417
+ name: 'Soso Spider'
418
+ -
419
+ user_agent: 'Superfeedr bot/2.0 http://superfeedr.com - Make your feeds realtime: get in touch!'
420
+ name: 'Superfeedr Bot'
421
+ -
422
+ user_agent: Mozilla/5.0 (X11; U; Linux x86_64; en-US; rv:1.9.0.19; aggregator:Spinn3r (Spinn3r 3.1); http://spinn3r.com/robot) Gecko/2010040121 Firefox/3.0.19
423
+ name: 'Spinn3r'
424
+ -
425
+ user_agent: Mozilla/5.0 (compatible; SputnikBot/2.2)
426
+ name: 'Sputnik Bot'
427
+ -
428
+ user_agent: Mozilla/5.0 (compatible; SputnikImageBot/2.2)
429
+ name: 'Sputnik Bot'
430
+ -
431
+ user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1; en; rv:1.9.0.13) Gecko/2009073022 Firefox/3.5.2 (.NET CLR 3.5.30729) SurveyBot/2.3 (DomainTools)
432
+ name: 'Survey Bot'
433
+ -
434
+ user_agent: TinEye-bot/0.02 (see http://www.tineye.com/crawler.html)
435
+ name: 'TinEye Crawler'
436
+ -
437
+ user_agent: TurnitinBot/3.0 (http://www.turnitin.com/robot/crawlerinfo.html)
438
+ name: 'TurnitinBot'
439
+ -
440
+ user_agent: TweetedTimes Bot/1.0 (Mozilla/5.0 Compatible, +http://tweetedtimes.com)
441
+ name: 'TweetedTimes Bot'
442
+ -
443
+ user_agent: Mozilla/5.0 (compatible; TweetedTimes Bot/1.0; +http://tweetedtimes.com)
444
+ name: 'TweetedTimes Bot'
445
+ -
446
+ user_agent: Mozilla/5.0 (compatible; TweetmemeBot/3.0; +http://tweetmeme.com/)
447
+ name: 'Tweetmeme Bot'
448
+ -
449
+ user_agent: Twitterbot/1.0
450
+ name: 'Twitterbot'
451
+ -
452
+ user_agent: Mozilla/5.0+(compatible; UptimeRobot/2.0; http://www.uptimerobot.com/)
453
+ name: 'Uptime Robot'
454
+ -
455
+ user_agent: Mozilla/5.0 (compatible; URLAppendBot/1.0; +http://www.profound.net/urlappendbot.html)
456
+ name: 'URLAppendBot'
457
+ -
458
+ user_agent: Mozilla/5.0 (compatible; VSMCrawler; http://www.visualsitemapper.com/crawler/)
459
+ name: 'Visual Site Mapper Crawler'
460
+ -
461
+ user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1;fr;rv:1.8.1) VoilaBotCollector BETA 0.1 (http://www.voila.com/)
462
+ name: 'Voila Bot'
463
+ -
464
+ user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1; fr; rv:1.8.1) VoilaBot BETA 1.2 (support.voilabot@orange-ftgroup.com)
465
+ name: 'Voila Bot'
466
+ -
467
+ user_agent: Jigsaw/2.3.0 W3C_CSS_Validator_JFouffa/2.0 (See <http://validator.w3.org/services>)
468
+ name: 'W3C CSS Validator'
469
+ -
470
+ user_agent: W3C_I18n-Checker/1.0 (http://validator.w3.org/services)
471
+ name: 'W3C I18N Checker'
472
+ -
473
+ user_agent: W3C-checklink/4.0 [4.4] libwww-perl/5.803
474
+ name: 'W3C Link Checker'
475
+ -
476
+ user_agent: W3C-checklink/4.81 libwww-perl/5.836
477
+ name: 'W3C Link Checker'
478
+ -
479
+ user_agent: W3C_Validator/1.3 http://validator.w3.org/services
480
+ name: 'W3C Markup Validation Service'
481
+ -
482
+ user_agent: W3C_Validator/1.767
483
+ name: 'W3C Markup Validation Service'
484
+ -
485
+ user_agent: W3C-mobileOK/DDC-1.0 (see http://www.w3.org/2006/07/mobileok-ddc)
486
+ name: 'W3C MobileOK Checker'
487
+ -
488
+ user_agent: W3C_Unicorn/1.0 (http://validator.w3.org/services)
489
+ name: 'W3C Unified Validator'
490
+ -
491
+ user_agent: WebbCrawler 1.0 ( http://badcheese.com/crawler.html )
492
+ name: 'WebbCrawler'
493
+ -
494
+ user_agent: WeSEE:Search/0.1 (Alpha, http://www.wesee.com/en/support/bot/)
495
+ name: 'WeSEE:Search'
496
+ -
497
+ user_agent: Wotbox/2.01 (+http://www.wotbox.com/bot/)
498
+ name: 'Wotbox'
499
+ -
500
+ user_agent: yacybot (freeworld/global; x86 Windows XP 5.1; java 1.7.0_21; GMT+04:00/ru) http://yacy.net/bot.html
501
+ name: 'YaCy'
502
+ -
503
+ user_agent: yacybot (freeworld/global; amd64 Linux 3.2.0-4-amd64; java 1.7.0_25; Europe/en) http://yacy.net/bot.html
504
+ name: 'YaCy'
505
+ -
506
+ user_agent: Mozilla/5.0 (compatible; Yahoo! Slurp/3.0; http://help.yahoo.com/help/us/ysearch/slurp) NOT Firefox/3.5
507
+ name: 'Yahoo! Slurp'
508
+ -
509
+ user_agent: Mozilla/5.0 (compatible; Yahoo! Slurp; http://help.yahoo.com/help/us/ysearch/slurp)
510
+ name: 'Yahoo! Slurp'
511
+ -
512
+ user_agent: Mozilla/5.0 (compatible; YandexImages/3.0; +http://yandex.com/bots)
513
+ name: 'Yandex Bot'
514
+ -
515
+ user_agent: Mozilla/5.0 (compatible; YandexAntivirus/2.0; +http://yandex.com/bots)
516
+ name: 'Yandex Bot'
517
+ -
518
+ user_agent: Mozilla/5.0 (compatible; YandexDirect/3.0; +http://yandex.com/bots)
519
+ name: 'Yandex Bot'
520
+ -
521
+ user_agent: Mozilla/5.0 (compatible; YandexBot/3.0; +http://yandex.com/bots)
522
+ name: 'Yandex Bot'
523
+ -
524
+ user_agent: Mozilla/5.0 (compatible; YandexBlogs/0.99; robot; B; +http://yandex.com/bots)
525
+ name: 'Yandex Bot'
526
+ -
527
+ user_agent: Mozilla/5.0 (compatible; YandexMetrika/2.0; +http://yandex.com/bots)
528
+ name: 'Yandex Bot'
529
+ -
530
+ user_agent: Mozilla/5.0 (compatible; YandexImageResizer/2.0; +http://yandex.com/bots)
531
+ name: 'Yandex Bot'
532
+ -
533
+ user_agent: Mozilla/5.0 (compatible; YandexAntivirus/2.0; +http://yandex.com/bots)
534
+ name: 'Yandex Bot'
535
+ -
536
+ user_agent: Mozilla/5.0 (compatible; YandexBlogs/0.99; robot; B; +http://yandex.com/bots)
537
+ name: 'Yandex Bot'
538
+ -
539
+ user_agent: Mozilla/5.0 (compatible; YandexFavicons/1.0; +http://yandex.com/bots)
540
+ name: 'Yandex Bot'
541
+ -
542
+ user_agent: Mozilla/5.0 (compatible; YandexNewslinks; +http://yandex.com/bots)
543
+ name: 'Yandex Bot'
544
+ -
545
+ user_agent: Mozilla/5.0 (compatible; YandexNews/3.0; +http://yandex.com/bots)
546
+ name: 'Yandex Bot'
547
+ -
548
+ user_agent: Mozilla/5.0 (compatible; Linux i686; Yandex.Gazeta Bot/1.0; +http://gazeta.yandex.ru)
549
+ name: 'Yandex Bot'
550
+ -
551
+ user_agent: Yeti/1.1 (Naver Corp.; http://help.naver.com/robots/)
552
+ name: 'Yeti/Naverbot'
553
+ -
554
+ user_agent: Mozilla/5.0 (compatible; YoudaoBot/1.0; http://www.youdao.com/help/webmaster/spider/; )
555
+ name: 'Youdao Bot'
556
+ -
557
+ user_agent: Mozilla/5.0 (compatible; YRSpider; +http://www.yunyun.com/SiteInfo.php?r=about)
558
+ name: 'Yunyun Bot'
559
+ -
560
+ user_agent: Mozilla/5.0 (compatible; YRSpider; +http://www.yunrang.com/yrspider.html)
561
+ name: 'Yunyun Bot'
562
+ -
563
+ user_agent: Mozilla/5.0 (compatible; YYSpider; +http://www.yunyun.com/spider.html)
564
+ name: 'Yunyun Bot'
565
+ -
566
+ user_agent: Zookabot/2.5;++http://zookabot.com
567
+ name: 'Zookabot'
568
+ -
569
+ user_agent: Mozilla/5.0 (compatible; ZumBot/1.0; http://help.zum.com/inquiry)
570
+ name: 'ZumBot'
571
+ -
572
+ user_agent: ZumBot/1.0 (ZUM Search; http://help.zum.com/inquiry)
573
+ name: 'ZumBot'
574
+ -
575
+ user_agent: Your Nutch Spider/Nutch-2.2.1
576
+ name: 'Nutch-based Bot'
577
+ -
578
+ user_agent: Nutch12/Nutch-1.2
579
+ name: 'Nutch-based Bot'
580
+ -
581
+ user_agent: spider/Nutch-1.5.1 (spider; http://www.xxx.com)
582
+ name: 'Nutch-based Bot'
583
+ -
584
+ user_agent: MySpider/Nutch-2.2
585
+ name: 'Nutch-based Bot'
586
+ -
587
+ user_agent: My Nutch Spider/Nutch-1.6
588
+ name: 'Nutch-based Bot'
589
+ -
590
+ user_agent: NutchSpider/Nutch-1.4
591
+ name: 'Nutch-based Bot'
592
+ -
593
+ user_agent: testnutch/Nutch-1.8
594
+ name: 'Nutch-based Bot'
595
+ -
596
+ user_agent: Spider/Nutch-2.3-SNAPSHOT (Webcrawler)
597
+ name: 'Nutch-based Bot'
598
+ -
599
+ user_agent: your sipder name/Nutch-1.7
600
+ name: 'Nutch-based Bot'
601
+ -
602
+ user_agent: 5acd734a-1ed3-4a17-ad9d-0b09ae7bc2d2/Nutch-1.7
603
+ name: 'Nutch-based Bot'
604
+ -
605
+ user_agent: Mozilla/5.0 (compatible; summers;)/Nutch-1.7
606
+ name: 'Nutch-based Bot'
607
+ -
608
+ user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1; zh-CN; rv:1.9.2.8) Firefox/3.6.8/Nutch-1.7
609
+ name: 'Nutch-based Bot'
610
+ -
611
+ user_agent: CB/Nutch-1.7
612
+ name: 'Nutch-based Bot'
613
+ -
614
+ user_agent: StatusCake Error Detector Crawler V0.01
615
+ name: 'Generic Bot'
616
+ -
617
+ user_agent: niki-bot
618
+ name: 'Generic Bot'
619
+
620
+
621
+ -
622
+ user_agent: Bloglovin/1.0 (http://www.bloglovin.com; 1 subscribers)
623
+ name: 'Bloglovin'
624
+ -
625
+ user_agent: CommaFeed/1.0 (http://www.commafeed.com)
626
+ name: 'CommaFeed'
627
+ -
628
+ user_agent: FeedBurner/1.0 (http://www.FeedBurner.com)
629
+ name: 'FeedBurner'
630
+ -
631
+ user_agent: Feedbin - 9 subscribers
632
+ name: 'Feedbin'
633
+ -
634
+ user_agent: Feedly/1.0 (+http://www.feedly.com/fetcher.html; like FeedFetcher-Google)
635
+ name: 'Feedly'
636
+ -
637
+ user_agent: FeedlyBot/1.0 (http://feedly.com)
638
+ name: 'Feedly'
639
+ -
640
+ user_agent: FeedlyApp/1.0 (http://www.feedly.com)
641
+ name: 'Feedly'
642
+ -
643
+ user_agent: MetaFeedly/1.0 (http://www.feedly.com)
644
+ name: 'Feedly'
645
+ -
646
+ user_agent: Feedspot http://www.feedspot.com
647
+ name: 'Feedspot'
648
+ -
649
+ user_agent: Fever/1.38 (Feed Parser; http://feedafever.com; Allow like Gecko)
650
+ name: 'Fever'
651
+ -
652
+ user_agent: kouio.com RSS reader
653
+ name: 'Kouio'
654
+ -
655
+ user_agent: kouio.com RSS reader - 6 subscribers
656
+ name: 'Kouio'
657
+ -
658
+ user_agent: MagpieRSS/0.72 (+http://magpierss.sf.net)
659
+ name: 'MagpieRSS'
660
+ -
661
+ user_agent: Netvibes (http://www.netvibes.com)
662
+ name: 'Netvibes'
663
+ -
664
+ user_agent: 'Netvibes (http://www.netvibes.com/; 8 subscribers; feedID: 2244192)'
665
+ name: 'Netvibes'
666
+ -
667
+ user_agent: NewsBlur Feed Fetcher - 7 subscribers - http://www.newsblur.com/site/1948420/analytics-piwik (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)
668
+ name: 'NewsBlur'
669
+ -
670
+ user_agent: NewsBlur Feed Finder (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)
671
+ name: 'NewsBlur'
672
+ -
673
+ user_agent: NewsBlur Page Fetcher - 7 subscribers - http://www.newsblur.com/site/3966817/analytics-piwik (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)
674
+ name: 'NewsBlur'
675
+ -
676
+ user_agent: NewsBlur Favicon Fetcher - 7 subscribers - http://www.newsblur.com/site/1948420/analytics-piwik (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)
677
+ name: 'NewsBlur'
678
+ -
679
+ user_agent: NewsGatorOnline/2.0 (http://www.newsgator.com; 2 subscribers)
680
+ name: 'NewsGator'
681
+ -
682
+ user_agent: SilverReader/1.0; http://silverreader.com
683
+ name: 'SilverReader'
684
+ -
685
+ user_agent: SimplePie/1.3.1 (Feed Parser; http://simplepie.org; Allow like Gecko) Build/20121030175911
686
+ name: 'SimplePie'
687
+ -
688
+ user_agent: freshrss/0.8-dev (Linux; http://freshrss.org) SimplePie/1.4-dev-FreshRSS
689
+ name: 'SimplePie'
690
+ -
691
+ user_agent: SimplePie/1.2.1-dev (Feed Parser; http://simplepie.org; Allow like Gecko) Build/20130514092120
692
+ name: 'SimplePie'
693
+ -
694
+ user_agent: 'Tiny Tiny RSS/1.10 (http://tt-rss.org/)'
695
+ name: 'Tiny Tiny RSS'
696
+ -
697
+ user_agent: 'Tiny Tiny RSS/1.11.4c63934 (http://tt-rss.org/)'
698
+ name: 'Tiny Tiny RSS'
699
+ -
700
+ user_agent: 'Mozilla/5.0 (compatible; Yahoo Ad monitoring; https://help.yahoo.com/kb/yahoo-ad-monitoring-SLN24857.html)'
701
+ name: 'Yahoo Gemini'
702
+ -
703
+ user_agent: 'Mozilla/5.0 (Java) outbrain'
704
+ name: 'Outbrain'
705
+ -
706
+ user_agent: 'HubPages V0.2.2 (http://hubpages.com/help/crawlingpolicy)'
707
+ name: 'HubPages'
708
+ -
709
+ user_agent: 'ADmantX Platform Semantic Analyzer - ADmantX Inc. - www.admantx.com - support@admantx.com'
710
+ name: 'ADMantX'
711
+ -
712
+ user_agent: 'Pinterest/0.2 (+http://www.pinterest.com/)'
713
+ name: 'Pinterest'
714
+ -
715
+ user_agent: 'Server Density Service Monitoring v2'
716
+ name: 'Server Density'