device_detector 0.8.2 → 0.9.0

Sign up to get free protection for your applications and to get access to all the features.
Files changed (58) hide show
  1. checksums.yaml +4 -4
  2. data/.travis.yml +11 -3
  3. data/CHANGELOG.md +10 -5
  4. data/README.md +4 -4
  5. data/Rakefile +24 -19
  6. data/device_detector.gemspec +1 -1
  7. data/lib/device_detector.rb +25 -3
  8. data/lib/device_detector/device.rb +1 -1
  9. data/lib/device_detector/model_extractor.rb +4 -0
  10. data/lib/device_detector/os.rb +8 -3
  11. data/lib/device_detector/parser.rb +1 -1
  12. data/lib/device_detector/version.rb +1 -1
  13. data/regexes/bots.yml +211 -27
  14. data/regexes/client/browsers.yml +192 -58
  15. data/regexes/client/feed_readers.yml +6 -0
  16. data/regexes/client/libraries.yml +4 -0
  17. data/regexes/client/mediaplayers.yml +8 -4
  18. data/regexes/client/mobile_apps.yml +39 -4
  19. data/regexes/client/pim.yml +4 -0
  20. data/regexes/device/mobiles.yml +1803 -242
  21. data/regexes/device/televisions.yml +53 -11
  22. data/regexes/oss.yml +180 -12
  23. data/regexes/vendorfragments.yml +1 -0
  24. data/spec/device_detector/concrete_user_agent_spec.rb +36 -0
  25. data/spec/device_detector/detector_fixtures_spec.rb +1 -1
  26. data/spec/fixtures/client/browser.yml +313 -2
  27. data/spec/fixtures/client/feed_reader.yml +8 -1
  28. data/spec/fixtures/client/library.yml +7 -1
  29. data/spec/fixtures/client/mediaplayer.yml +6 -1
  30. data/spec/fixtures/client/mobile_app.yml +6 -0
  31. data/spec/fixtures/client/pim.yml +6 -0
  32. data/spec/fixtures/detector/bots.yml +2307 -612
  33. data/spec/fixtures/detector/camera.yml +6 -0
  34. data/spec/fixtures/detector/car_browser.yml +1 -0
  35. data/spec/fixtures/detector/console.yml +14 -0
  36. data/spec/fixtures/detector/desktop.yml +308 -48
  37. data/spec/fixtures/detector/feature_phone.yml +63 -0
  38. data/spec/fixtures/detector/feed_reader.yml +50 -26
  39. data/spec/fixtures/detector/mediaplayer.yml +28 -6
  40. data/spec/fixtures/detector/mobile_apps.yml +117 -0
  41. data/spec/fixtures/detector/phablet.yml +1066 -183
  42. data/spec/fixtures/detector/portable_media_player.yml +8 -0
  43. data/spec/fixtures/detector/smart_display.yml +39 -0
  44. data/spec/fixtures/detector/smartphone-1.yml +9469 -0
  45. data/spec/fixtures/detector/smartphone-2.yml +9414 -0
  46. data/spec/fixtures/detector/smartphone-3.yml +9396 -0
  47. data/spec/fixtures/detector/smartphone-4.yml +5742 -0
  48. data/spec/fixtures/detector/smartphone.yml +3446 -23680
  49. data/spec/fixtures/detector/tablet-1.yml +9495 -0
  50. data/spec/fixtures/detector/tablet-2.yml +248 -0
  51. data/spec/fixtures/detector/tablet.yml +2786 -7961
  52. data/spec/fixtures/detector/tv.yml +1376 -210
  53. data/spec/fixtures/detector/unknown.yml +205 -509
  54. data/spec/fixtures/device/console.yml +6 -0
  55. data/spec/fixtures/parser/oss.yml +194 -1
  56. data/spec/fixtures/parser/vendorfragments.yml +6 -0
  57. metadata +16 -6
  58. data/spec/fixtures/parser/bots.yml +0 -2055
@@ -25,6 +25,12 @@
25
25
  -
26
26
  useragent: Mozilla/4.0 (compatible; MSIE 7.0; Windows NT 5.1; Trident/4.0; .NET CLR 1.1.4322; .NET CLR 2.0.50727; .NET CLR 3.0.4506.2152; .NET CLR 3.5.30729; CMNTDF; InfoPath.2; .NET4.0C; .NET4.0E)
27
27
  vendor: CQ
28
+ -
29
+ user_agent: Mozilla/4.0 (compatible; MSIE 7.0; Windows NT 6.2; WOW64; Trident/6.0; .NET4.0E; .NET4.0C; .NET CLR 3.5.30729; .NET CLR 2.0.50727; .NET CLR 3.0.30729; CMDTDFJS; Tablet PC 2.0)
30
+ vendor: CQ
31
+ -
32
+ user_agent: Mozilla/4.0 (compatible; MSIE 7.0; Windows NT 6.1; Trident/5.0; SLCC2; .NET CLR 2.0.50727; .NET CLR 3.5.30729; .NET CLR 3.0.30729; Media Center PC 6.0; .NET4.0C; .NET4.0E; CMDTDF; InfoPath.3)
33
+ vendor: CQ
28
34
  -
29
35
  useragent: Mozilla/4.0 (compatible; MSIE 7.0; Windows NT 6.1; Win64; x64; Trident/4.0; .NET CLR 2.0.50727; SLCC2; .NET CLR 3.5.30729; .NET CLR 3.0.30729; Media Center PC 6.0; MDDC; .NET4.0C; .NET4.0E)
30
36
  vendor: DL
metadata CHANGED
@@ -1,7 +1,7 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: device_detector
3
3
  version: !ruby/object:Gem::Version
4
- version: 0.8.2
4
+ version: 0.9.0
5
5
  platform: ruby
6
6
  authors:
7
7
  - Mati Sójka
@@ -9,7 +9,7 @@ authors:
9
9
  autorequire:
10
10
  bindir: bin
11
11
  cert_chain: []
12
- date: 2015-10-20 00:00:00.000000000 Z
12
+ date: 2016-07-28 00:00:00.000000000 Z
13
13
  dependencies:
14
14
  - !ruby/object:Gem::Dependency
15
15
  name: minitest
@@ -126,20 +126,25 @@ files:
126
126
  - spec/fixtures/detector/phablet.yml
127
127
  - spec/fixtures/detector/portable_media_player.yml
128
128
  - spec/fixtures/detector/smart_display.yml
129
+ - spec/fixtures/detector/smartphone-1.yml
130
+ - spec/fixtures/detector/smartphone-2.yml
131
+ - spec/fixtures/detector/smartphone-3.yml
132
+ - spec/fixtures/detector/smartphone-4.yml
129
133
  - spec/fixtures/detector/smartphone.yml
134
+ - spec/fixtures/detector/tablet-1.yml
135
+ - spec/fixtures/detector/tablet-2.yml
130
136
  - spec/fixtures/detector/tablet.yml
131
137
  - spec/fixtures/detector/tv.yml
132
138
  - spec/fixtures/detector/unknown.yml
133
139
  - spec/fixtures/device/camera.yml
134
140
  - spec/fixtures/device/car_browser.yml
135
141
  - spec/fixtures/device/console.yml
136
- - spec/fixtures/parser/bots.yml
137
142
  - spec/fixtures/parser/oss.yml
138
143
  - spec/fixtures/parser/vendorfragments.yml
139
144
  - spec/spec_helper.rb
140
145
  homepage: http://podigee.github.io/device_detector
141
146
  licenses:
142
- - LGPLv3
147
+ - LGPL-3.0
143
148
  metadata: {}
144
149
  post_install_message:
145
150
  rdoc_options: []
@@ -157,7 +162,7 @@ required_rubygems_version: !ruby/object:Gem::Requirement
157
162
  version: '0'
158
163
  requirements: []
159
164
  rubyforge_project:
160
- rubygems_version: 2.4.5
165
+ rubygems_version: 2.5.1
161
166
  signing_key:
162
167
  specification_version: 4
163
168
  summary: Precise and fast user agent parser and device detector
@@ -191,14 +196,19 @@ test_files:
191
196
  - spec/fixtures/detector/phablet.yml
192
197
  - spec/fixtures/detector/portable_media_player.yml
193
198
  - spec/fixtures/detector/smart_display.yml
199
+ - spec/fixtures/detector/smartphone-1.yml
200
+ - spec/fixtures/detector/smartphone-2.yml
201
+ - spec/fixtures/detector/smartphone-3.yml
202
+ - spec/fixtures/detector/smartphone-4.yml
194
203
  - spec/fixtures/detector/smartphone.yml
204
+ - spec/fixtures/detector/tablet-1.yml
205
+ - spec/fixtures/detector/tablet-2.yml
195
206
  - spec/fixtures/detector/tablet.yml
196
207
  - spec/fixtures/detector/tv.yml
197
208
  - spec/fixtures/detector/unknown.yml
198
209
  - spec/fixtures/device/camera.yml
199
210
  - spec/fixtures/device/car_browser.yml
200
211
  - spec/fixtures/device/console.yml
201
- - spec/fixtures/parser/bots.yml
202
212
  - spec/fixtures/parser/oss.yml
203
213
  - spec/fixtures/parser/vendorfragments.yml
204
214
  - spec/spec_helper.rb
@@ -1,2055 +0,0 @@
1
- -
2
- user_agent: Mozilla/5.0 (compatible; MSIE 9.0; Windows NT 6.1; Trident/5.0); 360Spider
3
- bot:
4
- name: '360Spider'
5
- category: 'Search bot'
6
- url: 'http://www.so.com/help/help_3_2.html'
7
- producer:
8
- name: 'Online Media Group, Inc.'
9
- url: ''
10
- -
11
- user_agent: Mozilla/5.0 (Windows NT 6.1) AppleWebKit/537.1 (KHTML, like Gecko) Chrome/21.0.1180.89 Safari/537.1; 360Spider
12
- bot:
13
- name: '360Spider'
14
- category: 'Search bot'
15
- url: 'http://www.so.com/help/help_3_2.html'
16
- producer:
17
- name: 'Online Media Group, Inc.'
18
- url: ''
19
- -
20
- user_agent: Mozilla/4.0 (compatible; MSIE 8.0; Windows NT 6.1; Trident/4.0; SLCC2; .NET CLR 2.0.50727; .NET CLR 3.5.30729; .NET CLR 3.0.30729; Media Center PC 6.0; MDDR; .NET4.0C; .NET4.0E; .NET CLR 1.1.4322; Tablet PC 2.0); 360Spider
21
- bot:
22
- name: '360Spider'
23
- category: 'Search bot'
24
- url: 'http://www.so.com/help/help_3_2.html'
25
- producer:
26
- name: 'Online Media Group, Inc.'
27
- url: ''
28
- -
29
- user_agent: 360spider-image
30
- bot:
31
- name: '360Spider'
32
- category: 'Search bot'
33
- url: 'http://www.so.com/help/help_3_2.html'
34
- producer:
35
- name: 'Online Media Group, Inc.'
36
- url: ''
37
- -
38
- user_agent: Aboundex/0.3 (http://www.aboundex.com/crawler/)
39
- bot:
40
- name: 'Aboundexbot'
41
- category: 'Search bot'
42
- url: 'http://www.aboundex.com/crawler/'
43
- producer:
44
- name: 'Aboundex.com'
45
- url: 'http://www.aboundex.com'
46
- -
47
- user_agent: Mozilla/5.0 (compatible; AcoonBot/4.11.1; +http://www.acoon.de/robot.asp)
48
- bot:
49
- name: 'Acoon'
50
- category: 'Search bot'
51
- url: 'http://www.acoon.de/robot.asp'
52
- producer:
53
- name: 'Acoon GmbH'
54
- url: 'http://www.acoon.de'
55
- -
56
- user_agent: AddThis.com robot tech.support@clearspring.com
57
- bot:
58
- name: 'AddThis.com'
59
- category: 'Social Media Agent'
60
- url: ''
61
- producer:
62
- name: 'Clearspring Technologies, Inc.'
63
- url: 'http://www.clearspring.com'
64
- -
65
- user_agent: Mozilla/5.0 (compatible; AhrefsBot/3.1; +http://ahrefs.com/robot/
66
- bot:
67
- name: 'aHrefs Bot'
68
- category: 'Crawler'
69
- url: 'http://ahrefs.com/robot'
70
- producer:
71
- name: 'Ahrefs Pte Ltd'
72
- url: 'http://ahrefs.com/robot'
73
- -
74
- user_agent: Mozilla/5.0 (compatible; AhrefsBot/5.0; +http://ahrefs.com/robot/)
75
- bot:
76
- name: 'aHrefs Bot'
77
- category: 'Crawler'
78
- url: 'http://ahrefs.com/robot'
79
- producer:
80
- name: 'Ahrefs Pte Ltd'
81
- url: 'http://ahrefs.com/robot'
82
- -
83
- user_agent: 'Mozilla/5.0 (compatible; AhrefsBot/5.0; +http://ahrefs.com/robot/) AppEngine-Google; (+http://code.google.com/appengine; appid: s~proxyfile1-hrd)'
84
- bot:
85
- name: 'aHrefs Bot'
86
- category: 'Crawler'
87
- url: 'http://ahrefs.com/robot'
88
- producer:
89
- name: 'Ahrefs Pte Ltd'
90
- url: 'http://ahrefs.com/robot'
91
- -
92
- user_agent: AhrefsBot.Feeds v0.1; http://ahrefs.com/
93
- bot:
94
- name: 'aHrefs Bot'
95
- category: 'Crawler'
96
- url: 'http://ahrefs.com/robot'
97
- producer:
98
- name: 'Ahrefs Pte Ltd'
99
- url: 'http://ahrefs.com/robot'
100
- -
101
- user_agent: ia_archiver (+http://www.alexa.com/site/help/webmasters; crawler@alexa.com)
102
- bot:
103
- name: 'Alexa Crawler'
104
- category: 'Search bot'
105
- url: 'https://alexa.zendesk.com/hc/en-us/sections/200100794-Crawlers'
106
- producer:
107
- name: 'Alexa Internet'
108
- url: 'http://www.alexa.com'
109
- -
110
- user_agent: AmorankSpider/0.1; +http://amorank.com/webcrawler.html
111
- bot:
112
- name: 'Amorank Spider'
113
- category: 'Crawler'
114
- url: 'http://amorank.com/webcrawler.html'
115
- producer:
116
- name: 'Amorank'
117
- url: 'http://www.amorank.com'
118
- -
119
- user_agent: Curious George - www.analyticsseo.com/crawler
120
- bot:
121
- name: 'Analytics SEO Crawler'
122
- category: 'Crawler'
123
- url: 'http://www.analyticsseo.com/crawler'
124
- producer:
125
- name: 'Analytics SEO'
126
- url: 'http://www.analyticsseo.com'
127
- -
128
- user_agent: Mozilla/5.0 (compatible; special_archiver/3.1.1 +http://www.archive.org/details/archive.org_bot)
129
- bot:
130
- name: 'archive.org bot'
131
- category: 'Crawler'
132
- url: 'http://www.archive.org/details/archive.org_bot'
133
- producer:
134
- name: 'The Internet Archive'
135
- url: 'http://www.archive.org'
136
- -
137
- user_agent: Mozilla/5.0 (compatible; special_archiver/3.2.0 +http://www.loc.gov/webarchiving/notice_to_webmasters.html)
138
- bot:
139
- name: 'archive.org bot'
140
- category: 'Crawler'
141
- url: 'http://www.archive.org/details/archive.org_bot'
142
- producer:
143
- name: 'The Internet Archive'
144
- url: 'http://www.archive.org'
145
- -
146
- user_agent: Mozilla/5.0 (compatible; archive.org_bot; Wayback Machine Live Record; +http://archive.org/details/archive.org_bot)
147
- bot:
148
- name: 'archive.org bot'
149
- category: 'Crawler'
150
- url: 'http://www.archive.org/details/archive.org_bot'
151
- producer:
152
- name: 'The Internet Archive'
153
- url: 'http://www.archive.org'
154
- -
155
- user_agent: Mozilla/5.0 (compatible; archive.org_bot/3.3.0 +http://pandora.nla.gov.au/crawl.html)
156
- bot:
157
- name: 'archive.org bot'
158
- category: 'Crawler'
159
- url: 'http://www.archive.org/details/archive.org_bot'
160
- producer:
161
- name: 'The Internet Archive'
162
- url: 'http://www.archive.org'
163
- -
164
- user_agent: Mozilla/5.0 (compatible; archive.org_bot; Archive-It; +http://archive-it.org/files/site-owners.html)
165
- bot:
166
- name: 'archive.org bot'
167
- category: 'Crawler'
168
- url: 'http://www.archive.org/details/archive.org_bot'
169
- producer:
170
- name: 'The Internet Archive'
171
- url: 'http://www.archive.org'
172
- -
173
- user_agent: Mozilla/5.0 (compatible; archive.org_bot +http://www.archive.org/details/archive.org_bot)
174
- bot:
175
- name: 'archive.org bot'
176
- category: 'Crawler'
177
- url: 'http://www.archive.org/details/archive.org_bot'
178
- producer:
179
- name: 'The Internet Archive'
180
- url: 'http://www.archive.org'
181
- -
182
- user_agent: Mozilla/5.0 (compatible; heritrix/3.1.2-SNAPSHOT-20131029-0036 +http://archive.org/details/archive.org_bot)
183
- bot:
184
- name: 'archive.org bot'
185
- category: 'Crawler'
186
- url: 'http://www.archive.org/details/archive.org_bot'
187
- producer:
188
- name: 'The Internet Archive'
189
- url: 'http://www.archive.org'
190
- -
191
- user_agent: Mozilla/2.0 (compatible; Ask Jeeves/Teoma)
192
- bot:
193
- name: 'Ask Jeeves'
194
- category: 'Search bot'
195
- url: ''
196
- producer:
197
- name: 'Ask Jeeves Inc.'
198
- url: 'http://www.ask.com'
199
- -
200
- user_agent: Backlink-Ceck.de (+http://www.backlink-check.de/bot.html)
201
- bot:
202
- name: 'Backlink-Ceck.de'
203
- category: 'Crawler'
204
- url: 'http://www.backlink-check.de/bot.html'
205
- producer:
206
- name: 'Mediagreen Medienservice'
207
- url: 'http://www.backlink-check.de'
208
- -
209
- user_agent: BacklinkCrawler (http://www.backlinktest.com/crawler.html)
210
- bot:
211
- name: 'BacklinkCrawler'
212
- category: 'Crawler'
213
- url: 'http://www.backlinktest.com/crawler.html'
214
- producer:
215
- name: '2.0Promotion GbR'
216
- url: 'http://www.backlinktest.com'
217
- -
218
- user_agent: Mozilla/5.0 (compatible; Baiduspider/2.0; +http://www.baidu.com/search
219
- bot:
220
- name: 'Baidu Spider'
221
- category: 'Search bot'
222
- url: 'http://www.baidu.com/search/spider.htm'
223
- producer:
224
- name: 'Baidu'
225
- url: 'http://www.baidu.com'
226
- -
227
- user_agent: Mozilla/5.0 (Linux;u;Android 2.3.7;zh-cn;) AppleWebKit/533.1 (KHTML,like Gecko) Version/4.0 Mobile Safari/533.1 (compatible; +http://www.baidu.com/search/spider.html)
228
- bot:
229
- name: 'Baidu Spider'
230
- category: 'Search bot'
231
- url: 'http://www.baidu.com/search/spider.htm'
232
- producer:
233
- name: 'Baidu'
234
- url: 'http://www.baidu.com'
235
- -
236
- user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1; zh-CN; rv:1.9.2.8;baidu Transcoder) Gecko/20100722 Firefox/3.6.8 ( .NET CLR 3.5.30729)
237
- bot:
238
- name: 'Baidu Spider'
239
- category: 'Search bot'
240
- url: 'http://www.baidu.com/search/spider.htm'
241
- producer:
242
- name: 'Baidu'
243
- url: 'http://www.baidu.com'
244
- -
245
- user_agent: Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.0; baidu Transcoder;)
246
- bot:
247
- name: 'Baidu Spider'
248
- category: 'Search bot'
249
- url: 'http://www.baidu.com/search/spider.htm'
250
- producer:
251
- name: 'Baidu'
252
- url: 'http://www.baidu.com'
253
- -
254
- user_agent: Baiduspider-image+(+http://www.baidu.com/search/spider.htm)
255
- bot:
256
- name: 'Baidu Spider'
257
- category: 'Search bot'
258
- url: 'http://www.baidu.com/search/spider.htm'
259
- producer:
260
- name: 'Baidu'
261
- url: 'http://www.baidu.com'
262
- -
263
- user_agent: Baiduspider+(+http://www.baidu.com/search/spider.htm)
264
- bot:
265
- name: 'Baidu Spider'
266
- category: 'Search bot'
267
- url: 'http://www.baidu.com/search/spider.htm'
268
- producer:
269
- name: 'Baidu'
270
- url: 'http://www.baidu.com'
271
- -
272
- user_agent: Mozilla/5.0 (compatible; Baiduspider/2.0; +http://www.baidu.com/search/spider.html)
273
- bot:
274
- name: 'Baidu Spider'
275
- category: 'Search bot'
276
- url: 'http://www.baidu.com/search/spider.htm'
277
- producer:
278
- name: 'Baidu'
279
- url: 'http://www.baidu.com'
280
- -
281
- user_agent: Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/534+ (KHTML, like Gecko) BingPreview/1.0b
282
- bot:
283
- name: 'BingBot'
284
- category: 'Search bot'
285
- url: 'http://search.msn.com/msnbot.htmn'
286
- producer:
287
- name: 'Microsoft Corporation'
288
- url: 'http://www.microsoft.com'
289
- -
290
- user_agent: Mozilla/5.0 (compatible; bingbot/2.0; +http://www.bing.com/bingbot.htm)
291
- bot:
292
- name: 'BingBot'
293
- category: 'Search bot'
294
- url: 'http://search.msn.com/msnbot.htmn'
295
- producer:
296
- name: 'Microsoft Corporation'
297
- url: 'http://www.microsoft.com'
298
- -
299
- user_agent: msnbot-media/1.1 (+http://search.msn.com/msnbot.htm)
300
- bot:
301
- name: 'BingBot'
302
- category: 'Search bot'
303
- url: 'http://search.msn.com/msnbot.htmn'
304
- producer:
305
- name: 'Microsoft Corporation'
306
- url: 'http://www.microsoft.com'
307
- -
308
- user_agent: MSNBot/Nutch-1.5.1
309
- bot:
310
- name: 'BingBot'
311
- category: 'Search bot'
312
- url: 'http://search.msn.com/msnbot.htmn'
313
- producer:
314
- name: 'Microsoft Corporation'
315
- url: 'http://www.microsoft.com'
316
- -
317
- user_agent: msnbot/2.0b v1394720947.6703
318
- bot:
319
- name: 'BingBot'
320
- category: 'Search bot'
321
- url: 'http://search.msn.com/msnbot.htmn'
322
- producer:
323
- name: 'Microsoft Corporation'
324
- url: 'http://www.microsoft.com'
325
- -
326
- user_agent: msnbot/1.1 (+http://search.msn.com/msnbot.htm)
327
- bot:
328
- name: 'BingBot'
329
- category: 'Search bot'
330
- url: 'http://search.msn.com/msnbot.htmn'
331
- producer:
332
- name: 'Microsoft Corporation'
333
- url: 'http://www.microsoft.com'
334
- -
335
- user_agent: msnbot/2.0b (+http://search.msn.com/msnbot.htm)
336
- bot:
337
- name: 'BingBot'
338
- category: 'Search bot'
339
- url: 'http://search.msn.com/msnbot.htmn'
340
- producer:
341
- name: 'Microsoft Corporation'
342
- url: 'http://www.microsoft.com'
343
- -
344
- user_agent: msnbot-NewsBlogs/2.0b (+http://search.msn.com/msnbot.htm)
345
- bot:
346
- name: 'BingBot'
347
- category: 'Search bot'
348
- url: 'http://search.msn.com/msnbot.htmn'
349
- producer:
350
- name: 'Microsoft Corporation'
351
- url: 'http://www.microsoft.com'
352
- -
353
- user_agent: Mozilla/5.0 (compatible; Blekkobot; ScoutJet; +http://blekko.com/about/blekkobot)
354
- bot:
355
- name: 'Blekkobot'
356
- category: 'Search bot'
357
- url: 'http://blekko.com/about/blekkobot'
358
- producer:
359
- name: 'Blekko'
360
- url: 'http://blekko.com'
361
- -
362
- user_agent: Mozilla/5.0 (compatible; BLEXBot/1.0; +http://webmeup-crawler.com/)
363
- bot:
364
- name: 'BLEXBot Crawler'
365
- category: 'Crawler'
366
- url: 'http://webmeup-crawler.com'
367
- producer:
368
- name: 'WebMeUp'
369
- url: 'http://webmeup.com'
370
- -
371
- user_agent: Bloglovin/1.0 (http://www.bloglovin.com; 1 subscribers)
372
- bot:
373
- name: 'Bloglovin'
374
- url: 'http://www.bloglovin.com'
375
- category: 'Feed Fetcher'
376
- producer:
377
- name: ''
378
- url: ''
379
- -
380
- user_agent: Mozilla/5.0 (compatible; BountiiBot/1.1; +http://bountii.com/contact.php)
381
- bot:
382
- name: 'Bountii Bot'
383
- category: 'Search bot'
384
- url: 'http://bountii.com/contact.php'
385
- producer:
386
- name: 'Bountii Inc.'
387
- url: 'http://bountii.com'
388
- -
389
- user_agent: Mozilla/5.0 (Macintosh; Butterfly/1.0; +http://labs.topsy.com/butterfly/) Gecko/2009032608 Firefox/3.0.8
390
- bot:
391
- name: 'Butterfly Robot'
392
- category: 'Search bot'
393
- url: 'http://labs.topsy.com/butterfly'
394
- producer:
395
- name: 'Topsy Labs'
396
- url: 'http://labs.topsy.com'
397
- -
398
- user_agent: Mozilla/5.0 (compatible; Butterfly/1.0; +http://labs.topsy.com/butterfly/) Gecko/2009032608 Firefox/3.0.8
399
- bot:
400
- name: 'Butterfly Robot'
401
- category: 'Search bot'
402
- url: 'http://labs.topsy.com/butterfly'
403
- producer:
404
- name: 'Topsy Labs'
405
- url: 'http://labs.topsy.com'
406
- -
407
- user_agent: Browsershots
408
- bot:
409
- name: 'Browsershots'
410
- category: 'Service Agent'
411
- url: 'http://browsershots.org/faq'
412
- producer:
413
- name: 'Browsershots.org'
414
- url: 'http://browsershots.org'
415
- -
416
- user_agent: Mozilla/5.0 (compatible; CareerBot/1.1; +http://www.career-x.de/bot.html)
417
- bot:
418
- name: 'CareerBot'
419
- category: 'Crawler'
420
- url: 'http://www.career-x.de/bot.html'
421
- producer:
422
- name: 'career-x GmbH'
423
- url: 'http://www.career-x.de'
424
- -
425
- user_agent: CCBot/2.0 (http://commoncrawl.org/faq/)
426
- bot:
427
- name: 'ccBot crawler'
428
- category: 'Crawler'
429
- url: 'http://commoncrawl.org/faq/'
430
- producer:
431
- name: 'reddit inc.'
432
- url: 'http://www.reddit.com'
433
- -
434
- user_agent: Cliqzbot/0.1 (+http://cliqz.com/company/cliqzbot)
435
- bot:
436
- name: 'Cliqzbot'
437
- category: 'Crawler'
438
- url: 'http://cliqz.com/company/cliqzbot'
439
- producer:
440
- name: '10betterpages GmbH'
441
- url: 'http://cliqz.com'
442
- -
443
- user_agent: CommaFeed/1.0 (http://www.commafeed.com)
444
- bot:
445
- name: 'CommaFeed'
446
- url: 'http://www.commafeed.com'
447
- category: 'Feed Fetcher'
448
- producer:
449
- name: ''
450
- url: ''
451
- -
452
- user_agent: Mozilla/5.0 (compatible; Dazoobot/0.1; +http://dazoo.fr)
453
- bot:
454
- name: 'Dazoobot'
455
- category: 'Search bot'
456
- url: ''
457
- producer:
458
- name: 'DAZOO.FR'
459
- url: 'http://dazoo.fr'
460
- -
461
- user_agent: Mozilla/5.0 (compatible; discobot/1.0; +http://discoveryengine.com/discobot.html)
462
- bot:
463
- name: 'Discobot'
464
- category: 'Search bot'
465
- url: 'http://discoveryengine.com/discobot.html'
466
- producer:
467
- name: 'Discovery Engine'
468
- url: 'http://discoveryengine.com'
469
- -
470
- user_agent: dotbot
471
- bot:
472
- name: 'DotBot'
473
- category: 'Crawler'
474
- url: 'http://www.opensiteexplorer.org/dotbot'
475
- producer:
476
- name: 'SEOmoz, Inc.'
477
- url: 'http://moz.com/'
478
- -
479
- user_agent: Mozilla/5.0 (compatible; EasouSpider; +http://www.easou.com/search/spider.html)
480
- bot:
481
- name: 'Easou Spider'
482
- category: 'Search bot'
483
- url: 'http://www.easou.com/search/spider.html'
484
- producer:
485
- name: 'easou ICP'
486
- url: 'http://www.easou.com'
487
- -
488
- user_agent: Mozilla/5.0 (iPhone; U; CPU iPhone OS 3_0 like Mac OS X; en-us; EasouSpider; +http://www.easou.com/search/spider.html)
489
- bot:
490
- name: 'Easou Spider'
491
- category: 'Search bot'
492
- url: 'http://www.easou.com/search/spider.html'
493
- producer:
494
- name: 'easou ICP'
495
- url: 'http://www.easou.com'
496
- -
497
- user_agent: EMail Exractor
498
- bot:
499
- name: 'EMail Exractor'
500
- category: 'Crawler'
501
- url: ''
502
- producer:
503
- name: ''
504
- url: ''
505
- -
506
- user_agent: Mozilla/5.0 (compatible; Exabot/3.0; +http://www.exabot.com/go/robot)
507
- bot:
508
- name: 'ExaBot'
509
- category: 'Crawler'
510
- url: 'http://www.exabot.com/go/robot'
511
- producer:
512
- name: 'Dassault Systèmes'
513
- url: 'http://www.3ds.com'
514
- -
515
- user_agent: Mozilla/5.0 (compatible; Exabot/3.0 (BiggerBetter); +http://www.exabot.com/go/robot)
516
- bot:
517
- name: 'ExaBot'
518
- category: 'Crawler'
519
- url: 'http://www.exabot.com/go/robot'
520
- producer:
521
- name: 'Dassault Systèmes'
522
- url: 'http://www.3ds.com'
523
- -
524
- user_agent: Mozilla/5.0 (compatible; Konqueror/3.5; Linux) KHTML/3.5.5 (like Gecko) (Exabot-Thumbnails)
525
- bot:
526
- name: 'ExaBot'
527
- category: 'Crawler'
528
- url: 'http://www.exabot.com/go/robot'
529
- producer:
530
- name: 'Dassault Systèmes'
531
- url: 'http://www.3ds.com'
532
- -
533
- user_agent: ExactSeek Crawler (nutch 1.4)/Nutch-1.4 (ExactSeek Crawler; http://www.exactseek.com)
534
- bot:
535
- name: 'ExactSeek Crawler'
536
- category: 'Search bot'
537
- url: 'http://www.exactseek.com'
538
- producer:
539
- name: 'Jayde Online, Inc.'
540
- url: 'http://www.jaydeonlineinc.com'
541
- -
542
- user_agent: Mozilla/5.0 (compatible; Ezooms/1.0; help@moz.com)
543
- bot:
544
- name: 'Ezooms'
545
- category: 'Crawler'
546
- url: ''
547
- producer:
548
- name: 'SEOmoz, Inc.'
549
- url: 'http://moz.com/'
550
- -
551
- user_agent: facebookexternalhit/1.1 (+http://www.facebook.com/externalhit_uatext.php)
552
- bot:
553
- name: 'Facebook External Hit'
554
- category: 'Social Media Agent'
555
- url: 'https://www.facebook.com/externalhit_uatext.php'
556
- producer:
557
- name: 'Facebook'
558
- url: 'http://www.facebook.com'
559
- -
560
- user_agent: facebookplatform/1.0 (+http://developers.facebook.com)
561
- bot:
562
- name: 'Facebook External Hit'
563
- category: 'Social Media Agent'
564
- url: 'https://www.facebook.com/externalhit_uatext.php'
565
- producer:
566
- name: 'Facebook'
567
- url: 'http://www.facebook.com'
568
- -
569
- user_agent: Feedbin - 9 subscribers
570
- bot:
571
- name: 'Feedbin'
572
- url: 'http://feedbin.com/'
573
- category: 'Feed Fetcher'
574
- producer:
575
- name: ''
576
- url: ''
577
- -
578
- user_agent: FeedBurner/1.0 (http://www.FeedBurner.com)
579
- bot:
580
- name: 'FeedBurner'
581
- url: 'http://www.feedburner.com'
582
- category: 'Feed Fetcher'
583
- producer:
584
- name: ''
585
- url: ''
586
- -
587
- user_agent: Feedly/1.0 (+http://www.feedly.com/fetcher.html; like FeedFetcher-Google)
588
- bot:
589
- name: 'Feedly'
590
- url: 'http://www.feedly.com'
591
- category: 'Feed Fetcher'
592
- producer:
593
- name: ''
594
- url: ''
595
- -
596
- user_agent: FeedlyBot/1.0 (http://feedly.com)
597
- bot:
598
- name: 'Feedly'
599
- url: 'http://www.feedly.com'
600
- category: 'Feed Fetcher'
601
- producer:
602
- name: ''
603
- url: ''
604
- -
605
- user_agent: FeedlyApp/1.0 (http://www.feedly.com)
606
- bot:
607
- name: 'Feedly'
608
- url: 'http://www.feedly.com'
609
- category: 'Feed Fetcher'
610
- producer:
611
- name: ''
612
- url: ''
613
- -
614
- user_agent: MetaFeedly/1.0 (http://www.feedly.com)
615
- bot:
616
- name: 'Feedly'
617
- url: 'http://www.feedly.com'
618
- category: 'Feed Fetcher'
619
- producer:
620
- name: ''
621
- url: ''
622
- -
623
- user_agent: Feedspot http://www.feedspot.com
624
- bot:
625
- name: 'Feedspot'
626
- url: 'http://www.feedspot.com'
627
- category: 'Feed Fetcher'
628
- producer:
629
- name: ''
630
- url: ''
631
- -
632
- user_agent: Fever/1.38 (Feed Parser; http://feedafever.com; Allow like Gecko)
633
- bot:
634
- name: 'Fever'
635
- url: 'http://feedafever.com/'
636
- category: 'Feed Fetcher'
637
- producer:
638
- name: ''
639
- url: ''
640
- -
641
- user_agent: Mozilla/5.0 (compatible; Genieo/1.0 http://www.genieo.com/webfilter.html)
642
- bot:
643
- name: 'Genieo Web filter'
644
- category: ''
645
- url: 'http://www.genieo.com/webfilter.html'
646
- producer:
647
- name: 'Genieo'
648
- url: 'http://www.genieo.com'
649
- -
650
- user_agent: DoCoMo/2.0 P900i(c100;TB;W24H11) (compatible; ichiro/mobile goo; +http://search.goo.ne.jp/option/use/sub4/sub4-1/)
651
- bot:
652
- name: 'Goo'
653
- category: 'Search bot'
654
- url: 'http://search.goo.ne.jp/option/use/sub4/sub4-1'
655
- producer:
656
- name: 'NTT Resonant'
657
- url: 'http://goo.ne.jp'
658
- -
659
- user_agent: Googlebot/2.1 (http://www.googlebot.com/bot.html)
660
- bot:
661
- name: 'Googlebot'
662
- category: 'Search bot'
663
- url: 'http://www.google.com/bot.html'
664
- producer:
665
- name: 'Google Inc.'
666
- url: 'http://www.google.com'
667
- -
668
- user_agent: Googlebot/Nutch-1.7
669
- bot:
670
- name: 'Googlebot'
671
- category: 'Search bot'
672
- url: 'http://www.google.com/bot.html'
673
- producer:
674
- name: 'Google Inc.'
675
- url: 'http://www.google.com'
676
- -
677
- user_agent: Mozilla/5.0 AppleWebKit/537.36 (KHTML, like Gecko; compatible; Googlebot/2.1; +http://www.google.com/bot.html) Safari/537.36
678
- bot:
679
- name: 'Googlebot'
680
- category: 'Search bot'
681
- url: 'http://www.google.com/bot.html'
682
- producer:
683
- name: 'Google Inc.'
684
- url: 'http://www.google.com'
685
- -
686
- user_agent: Mozilla/5.0 (compatible; Googlebot/2.1; +http://www.google.com/bot.html)
687
- bot:
688
- name: 'Googlebot'
689
- category: 'Search bot'
690
- url: 'http://www.google.com/bot.html'
691
- producer:
692
- name: 'Google Inc.'
693
- url: 'http://www.google.com'
694
- -
695
- user_agent: Mozilla/5.0 (iPhone; CPU iPhone OS 6_0 like Mac OS X) AppleWebKit/536.26 (KHTML, like Gecko) Version/6.0 Mobile/10A5376e Safari/8536.25 (compatible; Googlebot-Mobile/2.1; +http://www.google.com/bot.html)
696
- bot:
697
- name: 'Googlebot'
698
- category: 'Search bot'
699
- url: 'http://www.google.com/bot.html'
700
- producer:
701
- name: 'Google Inc.'
702
- url: 'http://www.google.com'
703
- -
704
- user_agent: Googlebot-Image/1.0
705
- bot:
706
- name: 'Googlebot'
707
- category: 'Search bot'
708
- url: 'http://www.google.com/bot.html'
709
- producer:
710
- name: 'Google Inc.'
711
- url: 'http://www.google.com'
712
- -
713
- user_agent: Googlebot (gocrawl v0.4)
714
- bot:
715
- name: 'Googlebot'
716
- category: 'Search bot'
717
- url: 'http://www.google.com/bot.html'
718
- producer:
719
- name: 'Google Inc.'
720
- url: 'http://www.google.com'
721
- -
722
- user_agent: Googlebot-News (2.3.3, ruby 1.9.3 (2013-11-22))
723
- bot:
724
- name: 'Googlebot'
725
- category: 'Search bot'
726
- url: 'http://www.google.com/bot.html'
727
- producer:
728
- name: 'Google Inc.'
729
- url: 'http://www.google.com'
730
- -
731
- user_agent: DoCoMo/2.0 N905i(c100;TB;W24H16) (compatible; Googlebot-Mobile/2.1; +http://www.google.com/bot.html)
732
- bot:
733
- name: 'Googlebot'
734
- category: 'Search bot'
735
- url: 'http://www.google.com/bot.html'
736
- producer:
737
- name: 'Google Inc.'
738
- url: 'http://www.google.com'
739
- -
740
- user_agent: SAMSUNG-SGH-E250/1.0 Profile/MIDP-2.0 Configuration/CLDC-1.1 UP.Browser/6.2.3.3.c.1.101 (GUI) MMP/2.0 (compatible; Googlebot-Mobile/2.1; +http://www.google.com/bot.html)
741
- bot:
742
- name: 'Googlebot'
743
- category: 'Search bot'
744
- url: 'http://www.google.com/bot.html'
745
- producer:
746
- name: 'Google Inc.'
747
- url: 'http://www.google.com'
748
- -
749
- user_agent: Mozilla/5.0 (compatible) Feedfetcher-Google;(+http://www.google.com/feedfetcher.html)
750
- bot:
751
- name: 'Googlebot'
752
- category: 'Search bot'
753
- url: 'http://www.google.com/bot.html'
754
- producer:
755
- name: 'Google Inc.'
756
- url: 'http://www.google.com'
757
- -
758
- user_agent: Feedfetcher-Google; (+http://www.google.com/feedfetcher.html; 2 subscribers; feed-id=17860707833818568603)
759
- bot:
760
- name: 'Googlebot'
761
- category: 'Search bot'
762
- url: 'http://www.google.com/bot.html'
763
- producer:
764
- name: 'Google Inc.'
765
- url: 'http://www.google.com'
766
- -
767
- user_agent: Feedfetcher-Google; (+http://www.google.com/feedfetcher.html; 19 subscribers; feed-id=13965549748850348809)
768
- bot:
769
- name: 'Googlebot'
770
- category: 'Search bot'
771
- url: 'http://www.google.com/bot.html'
772
- producer:
773
- name: 'Google Inc.'
774
- url: 'http://www.google.com'
775
- -
776
- user_agent: Feedfetcher-Google; (+http://www.google.com/feedfetcher.html; 375 subscribers; feed-id=15381863289700640853)
777
- bot:
778
- name: 'Googlebot'
779
- category: 'Search bot'
780
- url: 'http://www.google.com/bot.html'
781
- producer:
782
- name: 'Google Inc.'
783
- url: 'http://www.google.com'
784
- -
785
- user_agent: Mozilla/5.0 (Windows NT 6.1; rv:6.0) Gecko/20110814 Firefox/6.0 Google (+https://developers.google.com/+/web/snippet/)
786
- bot:
787
- name: 'Googlebot'
788
- category: 'Search bot'
789
- url: 'http://www.google.com/bot.html'
790
- producer:
791
- name: 'Google Inc.'
792
- url: 'http://www.google.com'
793
- -
794
- user_agent: GoogleProducer; (+http://goo.gl/7y4SX)
795
- bot:
796
- name: 'Googlebot'
797
- category: 'Search bot'
798
- url: 'http://www.google.com/bot.html'
799
- producer:
800
- name: 'Google Inc.'
801
- url: 'http://www.google.com'
802
- -
803
- user_agent: Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko; Google Web Preview) Chrome/27.0.1453 Safari/537.36
804
- bot:
805
- name: 'Googlebot'
806
- category: 'Search bot'
807
- url: 'http://www.google.com/bot.html'
808
- producer:
809
- name: 'Google Inc.'
810
- url: 'http://www.google.com'
811
- -
812
- user_agent: AdsBot-Google-Mobile (+http://www.google.com/mobile/adsbot.html) Mozilla (iPhone; U; CPU iPhone OS 3 0 like Mac OS X) AppleWebKit (KHTML, like Gecko) Mobile Safari
813
- bot:
814
- name: 'Googlebot'
815
- category: 'Search bot'
816
- url: 'http://www.google.com/bot.html'
817
- producer:
818
- name: 'Google Inc.'
819
- url: 'http://www.google.com'
820
- -
821
- user_agent: AdsBot-Google (+http://www.google.com/adsbot.html)
822
- bot:
823
- name: 'Googlebot'
824
- category: 'Search bot'
825
- url: 'http://www.google.com/bot.html'
826
- producer:
827
- name: 'Google Inc.'
828
- url: 'http://www.google.com'
829
- -
830
- user_agent: Mediapartners-Google
831
- bot:
832
- name: 'Googlebot'
833
- category: 'Search bot'
834
- url: 'http://www.google.com/bot.html'
835
- producer:
836
- name: 'Google Inc.'
837
- url: 'http://www.google.com'
838
- -
839
- user_agent: Mozilla/5.0 (compatible; heritrix/1.14.4 +http://www.dla-marbach.de)
840
- bot:
841
- name: 'Heritrix'
842
- category: 'Crawler'
843
- url: 'https://webarchive.jira.com/wiki/display/Heritrix/Heritrix'
844
- producer:
845
- name: 'The Internet Archive'
846
- url: 'http://www.archive.org'
847
- -
848
- user_agent: Mozilla/5.0 (compatible; worio bot heritrix/1.10.0 +http://worio.com)
849
- bot:
850
- name: 'Heritrix'
851
- category: 'Crawler'
852
- url: 'https://webarchive.jira.com/wiki/display/Heritrix/Heritrix'
853
- producer:
854
- name: 'The Internet Archive'
855
- url: 'http://www.archive.org'
856
- -
857
- user_agent: Mozilla/5.0 (compatible; heritrix/3.1.1 +http://www.baidu.com)
858
- bot:
859
- name: 'Heritrix'
860
- category: 'Crawler'
861
- url: 'https://webarchive.jira.com/wiki/display/Heritrix/Heritrix'
862
- producer:
863
- name: 'The Internet Archive'
864
- url: 'http://www.archive.org'
865
- -
866
- user_agent: flieder - neofonie heritrix/1.14.3 (+http://spider.neofonie.de)
867
- bot:
868
- name: 'Heritrix'
869
- category: 'Crawler'
870
- url: 'https://webarchive.jira.com/wiki/display/Heritrix/Heritrix'
871
- producer:
872
- name: 'The Internet Archive'
873
- url: 'http://www.archive.org'
874
- -
875
- user_agent: mozilla/5.0 (compatible; heritrix/1.3.0 http://archive.crawler.org)
876
- bot:
877
- name: 'Heritrix'
878
- category: 'Crawler'
879
- url: 'https://webarchive.jira.com/wiki/display/Heritrix/Heritrix'
880
- producer:
881
- name: 'The Internet Archive'
882
- url: 'http://www.archive.org'
883
- -
884
- user_agent: Mozilla/5.0 (compatible; heritrix/3.1.2-SNAPSHOT-20130207.001528 +http://webarchiv.cz/kontakty/)
885
- bot:
886
- name: 'Heritrix'
887
- category: 'Crawler'
888
- url: 'https://webarchive.jira.com/wiki/display/Heritrix/Heritrix'
889
- producer:
890
- name: 'The Internet Archive'
891
- url: 'http://www.archive.org'
892
- -
893
- user_agent: Mozilla/5.0 (compatible; heritrix/1.14.4 +http://webarhive.nlc.gov.cn)
894
- bot:
895
- name: 'Heritrix'
896
- category: 'Crawler'
897
- url: 'https://webarchive.jira.com/wiki/display/Heritrix/Heritrix'
898
- producer:
899
- name: 'The Internet Archive'
900
- url: 'http://www.archive.org'
901
- -
902
- user_agent: Mozilla/5.0 (compatible; heritrix/3.1.1 +http://www.run4dom.com)
903
- bot:
904
- name: 'Heritrix'
905
- category: 'Crawler'
906
- url: 'https://webarchive.jira.com/wiki/display/Heritrix/Heritrix'
907
- producer:
908
- name: 'The Internet Archive'
909
- url: 'http://www.archive.org'
910
- -
911
- user_agent: HTTPMon/1.0b (http://www.httpmon.com)
912
- bot:
913
- name: 'HTTPMon'
914
- category: 'Site Monitor'
915
- url: 'http://www.httpmon.com'
916
- producer:
917
- name: 'towards GmbH'
918
- url: 'http://www.towards.ch/'
919
- -
920
- user_agent: iisbot/1.0 (+http://www.iis.net/iisbot.html)
921
- bot:
922
- name: 'IIS Site Analysis'
923
- category: 'crawler'
924
- url: 'http://www.iis.net/iisbot.html'
925
- producer:
926
- name: 'Microsoft Corporation'
927
- url: 'http://www.microsoft.com'
928
- -
929
- user_agent: kouio.com RSS reader
930
- bot:
931
- name: 'Kouio'
932
- url: 'http://kouio.com/'
933
- category: 'Feed Fetcher'
934
- producer:
935
- name: ''
936
- url: ''
937
- -
938
- user_agent: kouio.com RSS reader - 6 subscribers
939
- bot:
940
- name: 'Kouio'
941
- url: 'http://kouio.com/'
942
- category: 'Feed Fetcher'
943
- producer:
944
- name: ''
945
- url: ''
946
- -
947
- user_agent: Mozilla/5.0 (iPhone; U; CPU iPhone OS 4_1 like Mac OS X; en-us) AppleWebKit/532.9 (KHTML, like Gecko) Version/4.0.5 Mobile/8B117 Safari/6531.22.7 (compatible; linkdexbot-mobile/2.1; +http://www.linkdex.com/about/bots/)
948
- bot:
949
- name: 'Linkdex Bot'
950
- category: 'Search bot'
951
- url: 'http://www.linkdex.com/bots'
952
- producer:
953
- name: 'Mojeek Ltd.'
954
- url: 'http://www.mojeek.com'
955
- -
956
- user_agent: Mozilla/5.0 (compatible; linkdexbot/2.0; +http://www.linkdex.com/about/bots/)
957
- bot:
958
- name: 'Linkdex Bot'
959
- category: 'Search bot'
960
- url: 'http://www.linkdex.com/bots'
961
- producer:
962
- name: 'Mojeek Ltd.'
963
- url: 'http://www.mojeek.com'
964
- -
965
- user_agent: linkdex.com/v2.0 and linkdex.com/v2.1
966
- bot:
967
- name: 'Linkdex Bot'
968
- category: 'Search bot'
969
- url: 'http://www.linkdex.com/bots'
970
- producer:
971
- name: 'Mojeek Ltd.'
972
- url: 'http://www.mojeek.com'
973
- -
974
- user_agent: LinkedInBot/1.0 (compatible; Mozilla/5.0; Jakarta Commons-HttpClient/3.1 +http://www.linkedin.com)
975
- bot:
976
- name: 'LinkedIn Bot'
977
- category: 'Social Media Agent'
978
- url: 'http://www.linkedin.com'
979
- producer:
980
- name: 'LinkedIn'
981
- url: 'http://www.linkedin.com'
982
- -
983
- user_agent: Mozilla/5.0 (compatible; Linux x86_64; Mail.RU_Bot/2.0; +http://go.mail.ru/help/robots)
984
- bot:
985
- name: 'Mail.Ru Bot'
986
- category: 'Search bot'
987
- url: 'http://help.mail.ru/webmaster/indexing/robots/types_robots'
988
- producer:
989
- name: 'Mail.Ru Group'
990
- url: 'http://corp.mail.ru'
991
- -
992
- user_agent: Mozilla/5.0 (compatible; Linux x86_64; Mail.RU_Bot/Fast/2.0; +http://go.mail.ru/help/robots)
993
- bot:
994
- name: 'Mail.Ru Bot'
995
- category: 'Search bot'
996
- url: 'http://help.mail.ru/webmaster/indexing/robots/types_robots'
997
- producer:
998
- name: 'Mail.Ru Group'
999
- url: 'http://corp.mail.ru'
1000
- -
1001
- user_agent: magpie-crawler/1.1 (U; Linux amd64; en-GB; +http://www.brandwatch.net)
1002
- bot:
1003
- name: 'Magpie-Crawler'
1004
- category: 'Social Media Agent'
1005
- url: 'http://www.brandwatch.com/magpie-crawler/'
1006
- producer:
1007
- name: 'Brandwatch'
1008
- url: 'http://www.brandwatch.com'
1009
- -
1010
- user_agent: MagpieRSS/0.72 (+http://magpierss.sf.net)
1011
- bot:
1012
- name: 'MagpieRSS'
1013
- url: 'http://magpierss.sourceforge.net/'
1014
- category: 'Feed Parser'
1015
- producer:
1016
- name: ''
1017
- url: ''
1018
- -
1019
- user_agent: Mozilla/5.0 (compatible; meanpathbot/1.0; +http://www.meanpath.com/meanpathbot.html)
1020
- bot:
1021
- name: 'Meanpath Bot'
1022
- category: 'Search bot'
1023
- url: 'http://www.meanpath.com/meanpathbot.html'
1024
- producer:
1025
- name: 'Meanpath'
1026
- url: 'http://www.meanpath.com'
1027
- -
1028
- user_agent: Mozilla/5.0 (compatible; MixrankBot; crawler@mixrank.com)
1029
- bot:
1030
- name: 'Mixrank Bot'
1031
- category: 'Crawler'
1032
- url: 'http://mixrank.com'
1033
- producer:
1034
- name: 'Online Media Group, Inc.'
1035
- url: ''
1036
- -
1037
- user_agent: Mozilla/5.0 (compatible; MJ12bot/v1.4.4; http://www.majestic12.co.uk/bot.php?+)
1038
- bot:
1039
- name: 'MJ12 Bot'
1040
- category: 'Search bot'
1041
- url: 'http://majestic12.co.uk/bot.php'
1042
- producer:
1043
- name: 'Majestic-12'
1044
- url: 'http://majestic12.co.uk'
1045
- -
1046
- user_agent: Mozilla/5.0 (compatible; MojeekBot/0.6; http://www.mojeek.com/bot.html)
1047
- bot:
1048
- name: 'MojeekBot'
1049
- category: 'Search bot'
1050
- url: 'http://www.mojeek.com/bot.html'
1051
- producer:
1052
- name: 'Mojeek Ltd.'
1053
- url: 'http://www.mojeek.com'
1054
- -
1055
- user_agent: NalezenCzBot/1.0 (http://www.nalezen.cz/about-crawler)
1056
- bot:
1057
- name: 'NalezenCzBot'
1058
- category: 'Crawler'
1059
- url: 'http://www.nalezen.cz/about-crawler'
1060
- producer:
1061
- name: 'Jaroslav Kuboš'
1062
- url: ''
1063
- -
1064
- user_agent: Mozilla/4.0 (compatible; Netcraft Web Server Survey)
1065
- bot:
1066
- name: 'Netcraft Survey Bot'
1067
- category: 'Search bot'
1068
- url: ''
1069
- producer:
1070
- name: 'Netcraft'
1071
- url: 'http://www.netcraft.com'
1072
- -
1073
- user_agent: Netvibes (http://www.netvibes.com)
1074
- bot:
1075
- name: 'Netvibes'
1076
- url: 'http://www.netvibes.com/'
1077
- category: 'Feed Fetcher'
1078
- producer:
1079
- name: ''
1080
- url: ''
1081
- -
1082
- user_agent: 'Netvibes (http://www.netvibes.com/; 8 subscribers; feedID: 2244192)'
1083
- bot:
1084
- name: 'Netvibes'
1085
- url: 'http://www.netvibes.com/'
1086
- category: 'Feed Fetcher'
1087
- producer:
1088
- name: ''
1089
- url: ''
1090
- -
1091
- user_agent: NewsBlur Feed Fetcher - 7 subscribers - http://www.newsblur.com/site/1948420/analytics-piwik (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)
1092
- bot:
1093
- name: 'NewsBlur'
1094
- url: 'http://www.newsblur.com'
1095
- category: 'Feed Fetcher'
1096
- producer:
1097
- name: ''
1098
- url: ''
1099
- -
1100
- user_agent: NewsBlur Feed Finder (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)
1101
- bot:
1102
- name: 'NewsBlur'
1103
- url: 'http://www.newsblur.com'
1104
- category: 'Feed Fetcher'
1105
- producer:
1106
- name: ''
1107
- url: ''
1108
- -
1109
- user_agent: NewsBlur Page Fetcher - 7 subscribers - http://www.newsblur.com/site/3966817/analytics-piwik (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)
1110
- bot:
1111
- name: 'NewsBlur'
1112
- url: 'http://www.newsblur.com'
1113
- category: 'Feed Fetcher'
1114
- producer:
1115
- name: ''
1116
- url: ''
1117
- -
1118
- user_agent: NewsBlur Favicon Fetcher - 7 subscribers - http://www.newsblur.com/site/1948420/analytics-piwik (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)
1119
- bot:
1120
- name: 'NewsBlur'
1121
- url: 'http://www.newsblur.com'
1122
- category: 'Feed Fetcher'
1123
- producer:
1124
- name: ''
1125
- url: ''
1126
- -
1127
- user_agent: NewsGatorOnline/2.0 (http://www.newsgator.com; 2 subscribers)
1128
- bot:
1129
- name: NewsGator
1130
- url: 'http://www.newsgator.com'
1131
- category: 'Feed Fetcher'
1132
- producer:
1133
- name: ''
1134
- url: ''
1135
- -
1136
- user_agent: nlcrawler/1.0 (+http://northernlight.com/)
1137
- bot:
1138
- name: 'NLCrawler'
1139
- category: 'Crawler'
1140
- url: ''
1141
- producer:
1142
- name: 'Northern Light'
1143
- url: 'http://northernlight.com'
1144
- -
1145
- user_agent: omgilibot/0.3 +http://www.omgili.com/Crawler.html
1146
- bot:
1147
- name: 'Omgili bot'
1148
- category: 'Search bot'
1149
- url: 'http://www.omgili.com/Crawler.html'
1150
- producer:
1151
- name: 'Omgili'
1152
- url: 'http://www.omgili.com'
1153
- -
1154
- user_agent: Mozilla/5.0 (compatible; OpenindexSpider; +http://www.openindex.io/en/webmasters/spider.html)
1155
- bot:
1156
- name: 'Openindex Spider'
1157
- category: 'Search bot'
1158
- url: 'http://www.openindex.io/en/webmasters/spider.html'
1159
- producer:
1160
- name: 'Openindex B.V.'
1161
- url: 'http://www.openindex.io'
1162
- -
1163
- user_agent: Mozilla/5.0 (compatible; spbot/4.0.9; +http://OpenLinkProfiler.org/bot )
1164
- bot:
1165
- name: 'OpenLinkProfiler'
1166
- category: 'Crawler'
1167
- url: 'http://openlinkprofiler.org/bot'
1168
- producer:
1169
- name: 'Axandra GmbH'
1170
- url: 'http://www.axandra.com'
1171
- -
1172
- user_agent: OpenWebSpider v0.1.4 (http://www.openwebspider.org/)
1173
- bot:
1174
- name: 'OpenWebSpider'
1175
- category: 'Crawler'
1176
- url: 'http://www.openwebspider.org'
1177
- producer:
1178
- name: 'OpenWebSpider Lab'
1179
- url: 'http://lab.openwebspider.org'
1180
- -
1181
- user_agent: Mozilla/5.0 (compatible; PaperLiBot/2.1; http://support.paper.li/entries/20023257-what-is-paper-li)
1182
- bot:
1183
- name: 'PaperLiBot'
1184
- category: 'Search bot'
1185
- url: 'http://support.paper.li/entries/20023257-what-is-paper-li'
1186
- producer:
1187
- name: 'Smallrivers SA'
1188
- url: 'http://www.paper.li'
1189
- -
1190
- user_agent: psbot/0.1 (+http://www.picsearch.com/bot.html)
1191
- bot:
1192
- name: 'Picsearch bot'
1193
- category: 'Search bot'
1194
- url: 'http://www.picsearch.com/bot.html'
1195
- producer:
1196
- name: 'Picsearch'
1197
- url: 'http://www.picsearch.com'
1198
- -
1199
- user_agent: psbot-page (+http://www.picsearch.com/bot.html)
1200
- bot:
1201
- name: 'Picsearch bot'
1202
- category: 'Search bot'
1203
- url: 'http://www.picsearch.com/bot.html'
1204
- producer:
1205
- name: 'Picsearch'
1206
- url: 'http://www.picsearch.com'
1207
- -
1208
- user_agent: Pingdom.com_bot_version_1.4_(http://www.pingdom.com/)
1209
- bot:
1210
- name: 'Pingdom Bot'
1211
- category: 'Site Monitors'
1212
- url: ''
1213
- producer:
1214
- name: 'Pingdom AB'
1215
- url: 'https://www.pingdom.com'
1216
- -
1217
- user_agent: QuerySeekerSpider ( http://queryseeker.com/bot.html )
1218
- bot:
1219
- name: 'QuerySeekerSpider'
1220
- category: 'Crawler'
1221
- url: 'http://queryseeker.com/bot.html'
1222
- producer:
1223
- name: 'QueryEye Inc.'
1224
- url: 'http://queryeye.com'
1225
- -
1226
- user_agent: Mozilla/5.0 (compatible; redditbot/1.0; +http://www.reddit.com/feedback)
1227
- bot:
1228
- name: 'Reddit Bot'
1229
- category: 'Social Media Agent'
1230
- url: 'http://www.reddit.com/feedback'
1231
- producer:
1232
- name: 'reddit inc.'
1233
- url: 'http://www.reddit.com'
1234
- -
1235
- user_agent: Mozilla/5.0 (compatible; rogerBot/1.0; UrlCrawler; http://www.seomoz.org/dp/rogerbot)
1236
- bot:
1237
- name: 'Rogerbot'
1238
- category: 'Crawler'
1239
- url: 'http://moz.com/help/pro/what-is-rogerbot-'
1240
- producer:
1241
- name: 'SEOmoz, Inc.'
1242
- url: 'http://moz.com/'
1243
- -
1244
- user_agent: rogerbot/1.0 (http://moz.com/help/pro/what-is-rogerbot-, rogerbot-crawler+shiny@moz.com)
1245
- bot:
1246
- name: 'Rogerbot'
1247
- category: 'Crawler'
1248
- url: 'http://moz.com/help/pro/what-is-rogerbot-'
1249
- producer:
1250
- name: 'SEOmoz, Inc.'
1251
- url: 'http://moz.com/'
1252
- -
1253
- user_agent: rogerbot/1.0 (http://www.moz.com/dp/rogerbot, rogerbot-crawler@moz.com)
1254
- bot:
1255
- name: 'Rogerbot'
1256
- category: 'Crawler'
1257
- url: 'http://moz.com/help/pro/what-is-rogerbot-'
1258
- producer:
1259
- name: 'SEOmoz, Inc.'
1260
- url: 'http://moz.com/'
1261
- -
1262
- user_agent: Screaming Frog SEO Spider/2.22
1263
- bot:
1264
- name: 'Screaming Frog SEO Spider'
1265
- category: 'Crawler'
1266
- url: 'http://www.screamingfrog.co.uk/seo-spider'
1267
- producer:
1268
- name: 'Screaming Frog Ltd'
1269
- url: 'http://www.screamingfrog.co.uk'
1270
- -
1271
- user_agent: ScreenerBot Crawler Beta 2.0 (+http://www.ScreenerBot.com)
1272
- bot:
1273
- name: 'ScreenerBot'
1274
- category: 'Crawler'
1275
- url: 'http://www.screenerbot.com'
1276
- producer:
1277
- name: ''
1278
- url: ''
1279
- -
1280
- user_agent: Mozilla/5.0 (compatible; SemrushBot/0.97; +http://www.semrush.com/bot.html)
1281
- bot:
1282
- name: 'Semrush Bot'
1283
- category: 'Crawler'
1284
- url: 'http://www.semrush.com/bot.html'
1285
- producer:
1286
- name: 'SEMrush'
1287
- url: 'http://www.semrush.com'
1288
- -
1289
- user_agent: SensikaBot/x.33 (+http://sensika.com)
1290
- bot:
1291
- name: 'Sensika Bot'
1292
- category: ''
1293
- url: ''
1294
- producer:
1295
- name: 'Sensika'
1296
- url: 'http://sensika.com'
1297
- -
1298
- user_agent: SEOENGWorldBot/1.0 (+http://www.seoengine.com/seoengbot.htm)
1299
- bot:
1300
- name: 'SEOENGBot'
1301
- category: 'Crawler'
1302
- url: 'http://www.seoengine.com/seoengbot.htm'
1303
- producer:
1304
- name: 'SEO Engine'
1305
- url: 'http://www.seoengine.com'
1306
- -
1307
- user_agent: Mozilla/5.0 (compatible; SeznamBot/3.1-test1; +http://fulltext.sblog.cz/)
1308
- bot:
1309
- name: 'Seznam Bot'
1310
- category: 'Search bot'
1311
- url: 'http://www.mapy.cz/cz/seznambot.html'
1312
- producer:
1313
- name: 'Seznam.cz, a.s.'
1314
- url: 'http://www.seznam.cz/'
1315
- -
1316
- user_agent: Mozilla/5.0 (compatible; SeznamBot/3.2-test1; +http://fulltext.sblog.cz/)
1317
- bot:
1318
- name: 'Seznam Bot'
1319
- category: 'Search bot'
1320
- url: 'http://www.mapy.cz/cz/seznambot.html'
1321
- producer:
1322
- name: 'Seznam.cz, a.s.'
1323
- url: 'http://www.seznam.cz/'
1324
- -
1325
- user_agent: SeznamBot/3.0 (+http://fulltext.sblog.cz/)
1326
- bot:
1327
- name: 'Seznam Bot'
1328
- category: 'Search bot'
1329
- url: 'http://www.mapy.cz/cz/seznambot.html'
1330
- producer:
1331
- name: 'Seznam.cz, a.s.'
1332
- url: 'http://www.seznam.cz/'
1333
- -
1334
- user_agent: Mozilla/5.0 (compatible; SeznamBot/3.2; +http://fulltext.sblog.cz/)
1335
- bot:
1336
- name: 'Seznam Bot'
1337
- category: 'Search bot'
1338
- url: 'http://www.mapy.cz/cz/seznambot.html'
1339
- producer:
1340
- name: 'Seznam.cz, a.s.'
1341
- url: 'http://www.seznam.cz/'
1342
- -
1343
- user_agent: ShopWiki/1.0 ( +http://www.shopwiki.com/wiki/Help:Bot)
1344
- bot:
1345
- name: 'ShopWiki'
1346
- category: 'Search tools'
1347
- url: 'http://www.shopwiki.com/wiki/Help:Bot'
1348
- producer:
1349
- name: 'ShopWiki Corp.'
1350
- url: 'http://www.shopwiki.com'
1351
- -
1352
- user_agent: SilverReader/1.0; http://silverreader.com
1353
- bot:
1354
- name: 'SilverReader'
1355
- url: 'http://silverreader.com'
1356
- category: 'Feed Fetcher'
1357
- producer:
1358
- name: ''
1359
- url: ''
1360
- -
1361
- user_agent: SimplePie/1.3.1 (Feed Parser; http://simplepie.org; Allow like Gecko) Build/20121030175911
1362
- bot:
1363
- name: 'SimplePie'
1364
- url: 'http://www.simplepie.org'
1365
- category: 'Feed Parser'
1366
- producer:
1367
- name: ''
1368
- url: ''
1369
- -
1370
- user_agent: freshrss/0.8-dev (Linux; http://freshrss.org) SimplePie/1.4-dev-FreshRSS
1371
- bot:
1372
- name: 'SimplePie'
1373
- url: 'http://www.simplepie.org'
1374
- category: 'Feed Parser'
1375
- producer:
1376
- name: ''
1377
- url: ''
1378
- -
1379
- user_agent: SimplePie/1.2.1-dev (Feed Parser; http://simplepie.org; Allow like Gecko) Build/20130514092120
1380
- bot:
1381
- name: 'SimplePie'
1382
- url: 'http://www.simplepie.org'
1383
- category: 'Feed Parser'
1384
- producer:
1385
- name: ''
1386
- url: ''
1387
- -
1388
- user_agent: Mozilla/5.0 (compatible; SISTRIX Crawler; http://crawler.sistrix.net/)
1389
- bot:
1390
- name: 'SISTRIX Crawler'
1391
- category: 'Crawler'
1392
- url: 'http://crawler.sistrix.net'
1393
- producer:
1394
- name: 'SISTRIX GmbH'
1395
- url: 'http://www.sistrix.de'
1396
- -
1397
- user_agent: Sogou web spider/4.0(+http://www.sogou.com/docs/help/webmasters.htm#07)
1398
- bot:
1399
- name: 'Sogou Spider'
1400
- category: 'Search bot'
1401
- url: 'http://www.sogou.com/docs/help/webmasters.htm'
1402
- producer:
1403
- name: 'Sohu, Inc.'
1404
- url: 'http://www.sogou.com'
1405
- -
1406
- user_agent: Sogou inst spider/4.0(+http://www.sogou.com/docs/help/webmasters.htm#07)
1407
- bot:
1408
- name: 'Sogou Spider'
1409
- category: 'Search bot'
1410
- url: 'http://www.sogou.com/docs/help/webmasters.htm'
1411
- producer:
1412
- name: 'Sohu, Inc.'
1413
- url: 'http://www.sogou.com'
1414
- -
1415
- user_agent: Sogou Pic Spider/3.0(+http://www.sogou.com/docs/help/webmasters.htm#07)
1416
- bot:
1417
- name: 'Sogou Spider'
1418
- category: 'Search bot'
1419
- url: 'http://www.sogou.com/docs/help/webmasters.htm'
1420
- producer:
1421
- name: 'Sohu, Inc.'
1422
- url: 'http://www.sogou.com'
1423
- -
1424
- user_agent: New-Sogou-Spider/1.0 (compatible; MSIE 5.5; Windows 98)
1425
- bot:
1426
- name: 'Sogou Spider'
1427
- category: 'Search bot'
1428
- url: 'http://www.sogou.com/docs/help/webmasters.htm'
1429
- producer:
1430
- name: 'Sohu, Inc.'
1431
- url: 'http://www.sogou.com'
1432
- -
1433
- user_agent: Sosospider+(+http://help.soso.com/webspider.htm)
1434
- bot:
1435
- name: 'Soso Spider'
1436
- category: 'Search bot'
1437
- url: 'http://help.soso.com/webspider.htm'
1438
- producer:
1439
- name: 'Tencent Holdings'
1440
- url: 'http://www.soso.com'
1441
- -
1442
- user_agent: 'Superfeedr bot/2.0 http://superfeedr.com - Make your feeds realtime: get in touch!'
1443
- bot:
1444
- name: 'Superfeedr Bot'
1445
- category: 'Feed Fetcher'
1446
- url: ''
1447
- producer:
1448
- name: 'Superfeedr'
1449
- url: 'https://superfeedr.com/'
1450
- -
1451
- user_agent: Mozilla/5.0 (X11; U; Linux x86_64; en-US; rv:1.9.0.19; aggregator:Spinn3r (Spinn3r 3.1); http://spinn3r.com/robot) Gecko/2010040121 Firefox/3.0.19
1452
- bot:
1453
- name: 'Spinn3r'
1454
- category: 'Crawler'
1455
- url: 'http://spinn3r.com/robot'
1456
- producer:
1457
- name: 'Tailrank Inc'
1458
- url: 'http://spinn3r.com'
1459
- -
1460
- user_agent: Mozilla/5.0 (compatible; SputnikBot/2.2)
1461
- bot:
1462
- name: 'Sputnik Bot'
1463
- category: ''
1464
- url: ''
1465
- producer:
1466
- name: ''
1467
- url: ''
1468
- -
1469
- user_agent: Mozilla/5.0 (compatible; SputnikImageBot/2.2)
1470
- bot:
1471
- name: 'Sputnik Bot'
1472
- category: ''
1473
- url: ''
1474
- producer:
1475
- name: ''
1476
- url: ''
1477
- -
1478
- user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1; en; rv:1.9.0.13) Gecko/2009073022 Firefox/3.5.2 (.NET CLR 3.5.30729) SurveyBot/2.3 (DomainTools)
1479
- bot:
1480
- name: 'Survey Bot'
1481
- category: 'Search bot'
1482
- url: 'http://www.domaintools.com/webmasters/surveybot.php'
1483
- producer:
1484
- name: 'Domain Tools'
1485
- url: 'http://www.domaintools.com'
1486
- -
1487
- user_agent: TinEye-bot/0.02 (see http://www.tineye.com/crawler.html)
1488
- bot:
1489
- name: 'TinEye Crawler'
1490
- category: 'Search bot'
1491
- url: 'http://www.tineye.com/crawler.html'
1492
- producer:
1493
- name: 'Idée Inc.'
1494
- url: 'http://ideeinc.com'
1495
- -
1496
- user_agent: 'Tiny Tiny RSS/1.10 (http://tt-rss.org/)'
1497
- bot:
1498
- name: 'Tiny Tiny RSS'
1499
- url: 'http://tt-rss.org'
1500
- category: 'Feed Fetcher'
1501
- producer:
1502
- name: ''
1503
- url: ''
1504
- -
1505
- user_agent: 'Tiny Tiny RSS/1.11.4c63934 (http://tt-rss.org/)'
1506
- bot:
1507
- name: 'Tiny Tiny RSS'
1508
- url: 'http://tt-rss.org'
1509
- category: 'Feed Fetcher'
1510
- producer:
1511
- name: ''
1512
- url: ''
1513
- -
1514
- user_agent: TurnitinBot/3.0 (http://www.turnitin.com/robot/crawlerinfo.html)
1515
- bot:
1516
- name: 'TurnitinBot'
1517
- category: 'Crawler'
1518
- url: 'http://www.turnitin.com/robot/crawlerinfo.html'
1519
- producer:
1520
- name: 'iParadigms, LLC.'
1521
- url: 'http://www.turnitin.com'
1522
- -
1523
- user_agent: TweetedTimes Bot/1.0 (Mozilla/5.0 Compatible, +http://tweetedtimes.com)
1524
- bot:
1525
- name: 'TweetedTimes Bot'
1526
- category: 'Crawler'
1527
- url: 'http://tweetedtimes.com'
1528
- producer:
1529
- name: 'TweetedTimes'
1530
- url: 'http://tweetedtimes.com/'
1531
- -
1532
- user_agent: Mozilla/5.0 (compatible; TweetedTimes Bot/1.0; +http://tweetedtimes.com)
1533
- bot:
1534
- name: 'TweetedTimes Bot'
1535
- category: 'Crawler'
1536
- url: 'http://tweetedtimes.com'
1537
- producer:
1538
- name: 'TweetedTimes'
1539
- url: 'http://tweetedtimes.com/'
1540
- -
1541
- user_agent: Mozilla/5.0 (compatible; TweetmemeBot/3.0; +http://tweetmeme.com/)
1542
- bot:
1543
- name: 'Tweetmeme Bot'
1544
- category: 'Crawler'
1545
- url: 'http://tweetmeme.com/'
1546
- producer:
1547
- name: 'Mediasift'
1548
- url: ''
1549
- -
1550
- user_agent: Twitterbot/1.0
1551
- bot:
1552
- name: 'Twitterbot'
1553
- category: 'Social Media Agent'
1554
- url: 'https://dev.twitter.com/docs/cards/getting-started'
1555
- producer:
1556
- name: 'Twitter'
1557
- url: 'http://www.twitter.com'
1558
- -
1559
- user_agent: Mozilla/5.0+(compatible; UptimeRobot/2.0; http://www.uptimerobot.com/)
1560
- bot:
1561
- name: 'Uptime Robot'
1562
- category: 'Site Monitor'
1563
- url: ''
1564
- producer:
1565
- name: 'Uptime Robot'
1566
- url: 'http://uptimerobot.com'
1567
- -
1568
- user_agent: Mozilla/5.0 (compatible; URLAppendBot/1.0; +http://www.profound.net/urlappendbot.html)
1569
- bot:
1570
- name: 'URLAppendBot'
1571
- category: 'Crawler'
1572
- url: 'http://www.profound.net/urlappendbot.html'
1573
- producer:
1574
- name: 'Profound Networks'
1575
- url: 'http://www.profound.net'
1576
- -
1577
- user_agent: Mozilla/5.0 (compatible; VSMCrawler; http://www.visualsitemapper.com/crawler/)
1578
- bot:
1579
- name: 'Visual Site Mapper Crawler'
1580
- category: 'Crawler'
1581
- url: 'http://www.visualsitemapper.com/crawler'
1582
- producer:
1583
- name: 'Alentum Software Ltd.'
1584
- url: 'http://www.alentum.com'
1585
- -
1586
- user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1;fr;rv:1.8.1) VoilaBotCollector BETA 0.1 (http://www.voila.com/)
1587
- bot:
1588
- name: 'Voila Bot'
1589
- category: 'Search bot'
1590
- url: 'http://www.voila.fr'
1591
- producer:
1592
- name: ''
1593
- url: ''
1594
- -
1595
- user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1; fr; rv:1.8.1) VoilaBot BETA 1.2 (support.voilabot@orange-ftgroup.com)
1596
- bot:
1597
- name: 'Voila Bot'
1598
- category: 'Search bot'
1599
- url: 'http://www.voila.fr'
1600
- producer:
1601
- name: ''
1602
- url: ''
1603
- -
1604
- user_agent: Jigsaw/2.3.0 W3C_CSS_Validator_JFouffa/2.0 (See <http://validator.w3.org/services>)
1605
- bot:
1606
- name: 'W3C CSS Validator'
1607
- category: 'Validator'
1608
- url: 'http://jigsaw.w3.org/css-validator'
1609
- producer:
1610
- name: 'W3C'
1611
- url: 'http://www.w3.org'
1612
- -
1613
- user_agent: W3C_I18n-Checker/1.0 (http://validator.w3.org/services)
1614
- bot:
1615
- name: 'W3C I18N Checker'
1616
- category: 'Validator'
1617
- url: 'http://validator.w3.org/i18n-checker'
1618
- producer:
1619
- name: 'W3C'
1620
- url: 'http://www.w3.org'
1621
- -
1622
- user_agent: W3C-checklink/4.0 [4.4] libwww-perl/5.803
1623
- bot:
1624
- name: 'W3C Link Checker'
1625
- category: 'Validator'
1626
- url: 'http://validator.w3.org/checklink'
1627
- producer:
1628
- name: 'W3C'
1629
- url: 'http://www.w3.org'
1630
- -
1631
- user_agent: W3C-checklink/4.81 libwww-perl/5.836
1632
- bot:
1633
- name: 'W3C Link Checker'
1634
- category: 'Validator'
1635
- url: 'http://validator.w3.org/checklink'
1636
- producer:
1637
- name: 'W3C'
1638
- url: 'http://www.w3.org'
1639
- -
1640
- user_agent: W3C_Validator/1.3 http://validator.w3.org/services
1641
- bot:
1642
- name: 'W3C Markup Validation Service'
1643
- category: 'Validator'
1644
- url: 'http://validator.w3.org/services'
1645
- producer:
1646
- name: 'W3C'
1647
- url: 'http://www.w3.org'
1648
- -
1649
- user_agent: W3C_Validator/1.767
1650
- bot:
1651
- name: 'W3C Markup Validation Service'
1652
- category: 'Validator'
1653
- url: 'http://validator.w3.org/services'
1654
- producer:
1655
- name: 'W3C'
1656
- url: 'http://www.w3.org'
1657
- -
1658
- user_agent: W3C-mobileOK/DDC-1.0 (see http://www.w3.org/2006/07/mobileok-ddc)
1659
- bot:
1660
- name: 'W3C MobileOK Checker'
1661
- category: 'Validator'
1662
- url: 'http://validator.w3.org/mobile'
1663
- producer:
1664
- name: 'W3C'
1665
- url: 'http://www.w3.org'
1666
- -
1667
- user_agent: W3C_Unicorn/1.0 (http://validator.w3.org/services)
1668
- bot:
1669
- name: 'W3C Unified Validator'
1670
- category: 'Validator'
1671
- url: 'http://validator.w3.org/unicorn'
1672
- producer:
1673
- name: 'W3C'
1674
- url: 'http://www.w3.org'
1675
- -
1676
- user_agent: WebbCrawler 1.0 ( http://badcheese.com/crawler.html )
1677
- bot:
1678
- name: 'WebbCrawler'
1679
- category: 'Crawler'
1680
- url: 'http://badcheese.com/crawler.html'
1681
- producer:
1682
- name: 'Steve Webb'
1683
- url: 'http://badcheese.com'
1684
- -
1685
- user_agent: WeSEE:Search/0.1 (Alpha, http://www.wesee.com/en/support/bot/)
1686
- bot:
1687
- name: 'WeSEE:Search'
1688
- category: 'Search bot'
1689
- url: 'http://www.wesee.com/bot'
1690
- producer:
1691
- name: 'WeSEE Ltd'
1692
- url: 'http://www.wesee.com'
1693
- -
1694
- user_agent: Wotbox/2.01 (+http://www.wotbox.com/bot/)
1695
- bot:
1696
- name: 'Wotbox'
1697
- category: 'Search bot'
1698
- url: 'http://www.wotbox.com/bot/'
1699
- producer:
1700
- name: 'Wotbox'
1701
- url: 'http://www.wotbox.com'
1702
- -
1703
- user_agent: yacybot (freeworld/global; x86 Windows XP 5.1; java 1.7.0_21; GMT+04:00/ru) http://yacy.net/bot.html
1704
- bot:
1705
- name: 'YaCy'
1706
- category: 'Search bot'
1707
- url: 'http://yacy.net/bot.html'
1708
- producer:
1709
- name: 'YaCy'
1710
- url: 'http://yacy.net'
1711
- -
1712
- user_agent: yacybot (freeworld/global; amd64 Linux 3.2.0-4-amd64; java 1.7.0_25; Europe/en) http://yacy.net/bot.html
1713
- bot:
1714
- name: 'YaCy'
1715
- category: 'Search bot'
1716
- url: 'http://yacy.net/bot.html'
1717
- producer:
1718
- name: 'YaCy'
1719
- url: 'http://yacy.net'
1720
- -
1721
- user_agent: Mozilla/5.0 (compatible; Yahoo! Slurp/3.0; http://help.yahoo.com/help/us/ysearch/slurp) NOT Firefox/3.5
1722
- bot:
1723
- name: 'Yahoo! Slurp'
1724
- category: 'Search bot'
1725
- url: 'http://help.yahoo.com/ysearch/slurp'
1726
- producer:
1727
- name: 'Yahoo! Inc.'
1728
- url: 'http://www.yahoo.com'
1729
- -
1730
- user_agent: Mozilla/5.0 (compatible; Yahoo! Slurp; http://help.yahoo.com/help/us/ysearch/slurp)
1731
- bot:
1732
- name: 'Yahoo! Slurp'
1733
- category: 'Search bot'
1734
- url: 'http://help.yahoo.com/ysearch/slurp'
1735
- producer:
1736
- name: 'Yahoo! Inc.'
1737
- url: 'http://www.yahoo.com'
1738
- -
1739
- user_agent: Mozilla/5.0 (compatible; YandexImages/3.0; +http://yandex.com/bots)
1740
- bot:
1741
- name: 'Yandex Bot'
1742
- category: 'Search bot'
1743
- url: 'http://www.yandex.com/bots'
1744
- producer:
1745
- name: 'Yandex LLC'
1746
- url: 'http://company.yandex.com'
1747
- -
1748
- user_agent: Mozilla/5.0 (compatible; YandexAntivirus/2.0; +http://yandex.com/bots)
1749
- bot:
1750
- name: 'Yandex Bot'
1751
- category: 'Search bot'
1752
- url: 'http://www.yandex.com/bots'
1753
- producer:
1754
- name: 'Yandex LLC'
1755
- url: 'http://company.yandex.com'
1756
- -
1757
- user_agent: Mozilla/5.0 (compatible; YandexDirect/3.0; +http://yandex.com/bots)
1758
- bot:
1759
- name: 'Yandex Bot'
1760
- category: 'Search bot'
1761
- url: 'http://www.yandex.com/bots'
1762
- producer:
1763
- name: 'Yandex LLC'
1764
- url: 'http://company.yandex.com'
1765
- -
1766
- user_agent: Mozilla/5.0 (compatible; YandexBot/3.0; +http://yandex.com/bots)
1767
- bot:
1768
- name: 'Yandex Bot'
1769
- category: 'Search bot'
1770
- url: 'http://www.yandex.com/bots'
1771
- producer:
1772
- name: 'Yandex LLC'
1773
- url: 'http://company.yandex.com'
1774
- -
1775
- user_agent: Mozilla/5.0 (compatible; YandexBlogs/0.99; robot; B; +http://yandex.com/bots)
1776
- bot:
1777
- name: 'Yandex Bot'
1778
- category: 'Search bot'
1779
- url: 'http://www.yandex.com/bots'
1780
- producer:
1781
- name: 'Yandex LLC'
1782
- url: 'http://company.yandex.com'
1783
- -
1784
- user_agent: Mozilla/5.0 (compatible; YandexMetrika/2.0; +http://yandex.com/bots)
1785
- bot:
1786
- name: 'Yandex Bot'
1787
- category: 'Search bot'
1788
- url: 'http://www.yandex.com/bots'
1789
- producer:
1790
- name: 'Yandex LLC'
1791
- url: 'http://company.yandex.com'
1792
- -
1793
- user_agent: Mozilla/5.0 (compatible; YandexImageResizer/2.0; +http://yandex.com/bots)
1794
- bot:
1795
- name: 'Yandex Bot'
1796
- category: 'Search bot'
1797
- url: 'http://www.yandex.com/bots'
1798
- producer:
1799
- name: 'Yandex LLC'
1800
- url: 'http://company.yandex.com'
1801
- -
1802
- user_agent: Mozilla/5.0 (compatible; YandexAntivirus/2.0; +http://yandex.com/bots)
1803
- bot:
1804
- name: 'Yandex Bot'
1805
- category: 'Search bot'
1806
- url: 'http://www.yandex.com/bots'
1807
- producer:
1808
- name: 'Yandex LLC'
1809
- url: 'http://company.yandex.com'
1810
- -
1811
- user_agent: Mozilla/5.0 (compatible; YandexBlogs/0.99; robot; B; +http://yandex.com/bots)
1812
- bot:
1813
- name: 'Yandex Bot'
1814
- category: 'Search bot'
1815
- url: 'http://www.yandex.com/bots'
1816
- producer:
1817
- name: 'Yandex LLC'
1818
- url: 'http://company.yandex.com'
1819
- -
1820
- user_agent: Mozilla/5.0 (compatible; YandexFavicons/1.0; +http://yandex.com/bots)
1821
- bot:
1822
- name: 'Yandex Bot'
1823
- category: 'Search bot'
1824
- url: 'http://www.yandex.com/bots'
1825
- producer:
1826
- name: 'Yandex LLC'
1827
- url: 'http://company.yandex.com'
1828
- -
1829
- user_agent: Mozilla/5.0 (compatible; YandexNewslinks; +http://yandex.com/bots)
1830
- bot:
1831
- name: 'Yandex Bot'
1832
- category: 'Search bot'
1833
- url: 'http://www.yandex.com/bots'
1834
- producer:
1835
- name: 'Yandex LLC'
1836
- url: 'http://company.yandex.com'
1837
- -
1838
- user_agent: Mozilla/5.0 (compatible; YandexNews/3.0; +http://yandex.com/bots)
1839
- bot:
1840
- name: 'Yandex Bot'
1841
- category: 'Search bot'
1842
- url: 'http://www.yandex.com/bots'
1843
- producer:
1844
- name: 'Yandex LLC'
1845
- url: 'http://company.yandex.com'
1846
- -
1847
- user_agent: Mozilla/5.0 (compatible; Linux i686; Yandex.Gazeta Bot/1.0; +http://gazeta.yandex.ru)
1848
- bot:
1849
- name: 'Yandex Bot'
1850
- category: 'Search bot'
1851
- url: 'http://www.yandex.com/bots'
1852
- producer:
1853
- name: 'Yandex LLC'
1854
- url: 'http://company.yandex.com'
1855
- -
1856
- user_agent: Yeti/1.1 (Naver Corp.; http://help.naver.com/robots/)
1857
- bot:
1858
- name: 'Yeti/Naverbot'
1859
- category: 'Search bot'
1860
- url: 'http://help.naver.com/robots/'
1861
- producer:
1862
- name: 'Naver'
1863
- url: 'http://www.naver.com'
1864
- -
1865
- user_agent: Mozilla/5.0 (compatible; YoudaoBot/1.0; http://www.youdao.com/help/webmaster/spider/; )
1866
- bot:
1867
- name: 'Youdao Bot'
1868
- category: 'Search bot'
1869
- url: 'http://www.youdao.com/help/webmaster/spider'
1870
- producer:
1871
- name: 'NetEase, Inc.'
1872
- url: 'http://corp.163.com'
1873
- -
1874
- user_agent: Mozilla/5.0 (compatible; YRSpider; +http://www.yunyun.com/SiteInfo.php?r=about)
1875
- bot:
1876
- name: 'Yunyun Bot'
1877
- category: 'Search bot'
1878
- url: 'http://www.yunyun.com/SiteInfo.php?r=about'
1879
- producer:
1880
- name: 'YunYun'
1881
- url: 'http://www.yunyun.com'
1882
- -
1883
- user_agent: Mozilla/5.0 (compatible; YRSpider; +http://www.yunrang.com/yrspider.html)
1884
- bot:
1885
- name: 'Yunyun Bot'
1886
- category: 'Search bot'
1887
- url: 'http://www.yunyun.com/SiteInfo.php?r=about'
1888
- producer:
1889
- name: 'YunYun'
1890
- url: 'http://www.yunyun.com'
1891
- -
1892
- user_agent: Mozilla/5.0 (compatible; YYSpider; +http://www.yunyun.com/spider.html)
1893
- bot:
1894
- name: 'Yunyun Bot'
1895
- category: 'Search bot'
1896
- url: 'http://www.yunyun.com/SiteInfo.php?r=about'
1897
- producer:
1898
- name: 'YunYun'
1899
- url: 'http://www.yunyun.com'
1900
- -
1901
- user_agent: Zookabot/2.5;++http://zookabot.com
1902
- bot:
1903
- name: 'Zookabot'
1904
- category: 'Crawler'
1905
- url: 'http://zookabot.com'
1906
- producer:
1907
- name: 'Hwacha ApS'
1908
- url: 'http://hwacha.dk'
1909
- -
1910
- user_agent: Mozilla/5.0 (compatible; ZumBot/1.0; http://help.zum.com/inquiry)
1911
- bot:
1912
- name: 'ZumBot'
1913
- category: 'Search bot'
1914
- url: 'http://help.zum.com/inquiry'
1915
- producer:
1916
- name: 'ZUM internet'
1917
- url: 'http://www.zuminternet.com/'
1918
- -
1919
- user_agent: ZumBot/1.0 (ZUM Search; http://help.zum.com/inquiry)
1920
- bot:
1921
- name: 'ZumBot'
1922
- category: 'Search bot'
1923
- url: 'http://help.zum.com/inquiry'
1924
- producer:
1925
- name: 'ZUM internet'
1926
- url: 'http://www.zuminternet.com/'
1927
- -
1928
- user_agent: Your Nutch Spider/Nutch-2.2.1
1929
- bot:
1930
- name: 'Nutch-based Bot'
1931
- category: 'crawler'
1932
- url: 'https://nutch.apache.org'
1933
- producer:
1934
- name: 'The Apache Software Foundation'
1935
- url: 'http://www.apache.org/foundation/'
1936
- -
1937
- user_agent: Nutch12/Nutch-1.2
1938
- bot:
1939
- name: 'Nutch-based Bot'
1940
- category: 'crawler'
1941
- url: 'https://nutch.apache.org'
1942
- producer:
1943
- name: 'The Apache Software Foundation'
1944
- url: 'http://www.apache.org/foundation/'
1945
- -
1946
- user_agent: spider/Nutch-1.5.1 (spider; http://www.xxx.com)
1947
- bot:
1948
- name: 'Nutch-based Bot'
1949
- category: 'crawler'
1950
- url: 'https://nutch.apache.org'
1951
- producer:
1952
- name: 'The Apache Software Foundation'
1953
- url: 'http://www.apache.org/foundation/'
1954
- -
1955
- user_agent: MySpider/Nutch-2.2
1956
- bot:
1957
- name: 'Nutch-based Bot'
1958
- category: 'crawler'
1959
- url: 'https://nutch.apache.org'
1960
- producer:
1961
- name: 'The Apache Software Foundation'
1962
- url: 'http://www.apache.org/foundation/'
1963
- -
1964
- user_agent: My Nutch Spider/Nutch-1.6
1965
- bot:
1966
- name: 'Nutch-based Bot'
1967
- category: 'crawler'
1968
- url: 'https://nutch.apache.org'
1969
- producer:
1970
- name: 'The Apache Software Foundation'
1971
- url: 'http://www.apache.org/foundation/'
1972
- -
1973
- user_agent: NutchSpider/Nutch-1.4
1974
- bot:
1975
- name: 'Nutch-based Bot'
1976
- category: 'crawler'
1977
- url: 'https://nutch.apache.org'
1978
- producer:
1979
- name: 'The Apache Software Foundation'
1980
- url: 'http://www.apache.org/foundation/'
1981
- -
1982
- user_agent: testnutch/Nutch-1.8
1983
- bot:
1984
- name: 'Nutch-based Bot'
1985
- category: 'crawler'
1986
- url: 'https://nutch.apache.org'
1987
- producer:
1988
- name: 'The Apache Software Foundation'
1989
- url: 'http://www.apache.org/foundation/'
1990
- -
1991
- user_agent: Spider/Nutch-2.3-SNAPSHOT (Webcrawler)
1992
- bot:
1993
- name: 'Nutch-based Bot'
1994
- category: 'crawler'
1995
- url: 'https://nutch.apache.org'
1996
- producer:
1997
- name: 'The Apache Software Foundation'
1998
- url: 'http://www.apache.org/foundation/'
1999
- -
2000
- user_agent: your sipder name/Nutch-1.7
2001
- bot:
2002
- name: 'Nutch-based Bot'
2003
- category: 'crawler'
2004
- url: 'https://nutch.apache.org'
2005
- producer:
2006
- name: 'The Apache Software Foundation'
2007
- url: 'http://www.apache.org/foundation/'
2008
- -
2009
- user_agent: 5acd734a-1ed3-4a17-ad9d-0b09ae7bc2d2/Nutch-1.7
2010
- bot:
2011
- name: 'Nutch-based Bot'
2012
- category: 'crawler'
2013
- url: 'https://nutch.apache.org'
2014
- producer:
2015
- name: 'The Apache Software Foundation'
2016
- url: 'http://www.apache.org/foundation/'
2017
- -
2018
- user_agent: Mozilla/5.0 (compatible; summers;)/Nutch-1.7
2019
- bot:
2020
- name: 'Nutch-based Bot'
2021
- category: 'crawler'
2022
- url: 'https://nutch.apache.org'
2023
- producer:
2024
- name: 'The Apache Software Foundation'
2025
- url: 'http://www.apache.org/foundation/'
2026
- -
2027
- user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1; zh-CN; rv:1.9.2.8) Firefox/3.6.8/Nutch-1.7
2028
- bot:
2029
- name: 'Nutch-based Bot'
2030
- category: 'crawler'
2031
- url: 'https://nutch.apache.org'
2032
- producer:
2033
- name: 'The Apache Software Foundation'
2034
- url: 'http://www.apache.org/foundation/'
2035
- -
2036
- user_agent: CB/Nutch-1.7
2037
- bot:
2038
- name: 'Nutch-based Bot'
2039
- category: 'crawler'
2040
- url: 'https://nutch.apache.org'
2041
- producer:
2042
- name: 'The Apache Software Foundation'
2043
- url: 'http://www.apache.org/foundation/'
2044
- -
2045
- user_agent: NetLyzer FastProbe
2046
- bot:
2047
- name: 'NetLyzer FastProbe'
2048
- -
2049
- user_agent: StatusCake Error Detector Crawler V0.01
2050
- bot:
2051
- name: 'Generic Bot'
2052
- -
2053
- user_agent: niki-bot
2054
- bot:
2055
- name: 'Generic Bot'