device_detector 0.8.2 → 0.9.0

Sign up to get free protection for your applications and to get access to all the features.
Files changed (58) hide show
  1. checksums.yaml +4 -4
  2. data/.travis.yml +11 -3
  3. data/CHANGELOG.md +10 -5
  4. data/README.md +4 -4
  5. data/Rakefile +24 -19
  6. data/device_detector.gemspec +1 -1
  7. data/lib/device_detector.rb +25 -3
  8. data/lib/device_detector/device.rb +1 -1
  9. data/lib/device_detector/model_extractor.rb +4 -0
  10. data/lib/device_detector/os.rb +8 -3
  11. data/lib/device_detector/parser.rb +1 -1
  12. data/lib/device_detector/version.rb +1 -1
  13. data/regexes/bots.yml +211 -27
  14. data/regexes/client/browsers.yml +192 -58
  15. data/regexes/client/feed_readers.yml +6 -0
  16. data/regexes/client/libraries.yml +4 -0
  17. data/regexes/client/mediaplayers.yml +8 -4
  18. data/regexes/client/mobile_apps.yml +39 -4
  19. data/regexes/client/pim.yml +4 -0
  20. data/regexes/device/mobiles.yml +1803 -242
  21. data/regexes/device/televisions.yml +53 -11
  22. data/regexes/oss.yml +180 -12
  23. data/regexes/vendorfragments.yml +1 -0
  24. data/spec/device_detector/concrete_user_agent_spec.rb +36 -0
  25. data/spec/device_detector/detector_fixtures_spec.rb +1 -1
  26. data/spec/fixtures/client/browser.yml +313 -2
  27. data/spec/fixtures/client/feed_reader.yml +8 -1
  28. data/spec/fixtures/client/library.yml +7 -1
  29. data/spec/fixtures/client/mediaplayer.yml +6 -1
  30. data/spec/fixtures/client/mobile_app.yml +6 -0
  31. data/spec/fixtures/client/pim.yml +6 -0
  32. data/spec/fixtures/detector/bots.yml +2307 -612
  33. data/spec/fixtures/detector/camera.yml +6 -0
  34. data/spec/fixtures/detector/car_browser.yml +1 -0
  35. data/spec/fixtures/detector/console.yml +14 -0
  36. data/spec/fixtures/detector/desktop.yml +308 -48
  37. data/spec/fixtures/detector/feature_phone.yml +63 -0
  38. data/spec/fixtures/detector/feed_reader.yml +50 -26
  39. data/spec/fixtures/detector/mediaplayer.yml +28 -6
  40. data/spec/fixtures/detector/mobile_apps.yml +117 -0
  41. data/spec/fixtures/detector/phablet.yml +1066 -183
  42. data/spec/fixtures/detector/portable_media_player.yml +8 -0
  43. data/spec/fixtures/detector/smart_display.yml +39 -0
  44. data/spec/fixtures/detector/smartphone-1.yml +9469 -0
  45. data/spec/fixtures/detector/smartphone-2.yml +9414 -0
  46. data/spec/fixtures/detector/smartphone-3.yml +9396 -0
  47. data/spec/fixtures/detector/smartphone-4.yml +5742 -0
  48. data/spec/fixtures/detector/smartphone.yml +3446 -23680
  49. data/spec/fixtures/detector/tablet-1.yml +9495 -0
  50. data/spec/fixtures/detector/tablet-2.yml +248 -0
  51. data/spec/fixtures/detector/tablet.yml +2786 -7961
  52. data/spec/fixtures/detector/tv.yml +1376 -210
  53. data/spec/fixtures/detector/unknown.yml +205 -509
  54. data/spec/fixtures/device/console.yml +6 -0
  55. data/spec/fixtures/parser/oss.yml +194 -1
  56. data/spec/fixtures/parser/vendorfragments.yml +6 -0
  57. metadata +16 -6
  58. data/spec/fixtures/parser/bots.yml +0 -2055
@@ -177,4 +177,11 @@
177
177
  client:
178
178
  type: feed reader
179
179
  name: RSSOwl
180
- version: "2.2.1.201312301316"
180
+ version: "2.2.1.201312301316"
181
+
182
+ -
183
+ user_agent: Stringer (https://github.com/swanson/stringer)
184
+ client:
185
+ type: feed reader
186
+ name: Stringer
187
+ version: ""
@@ -75,4 +75,10 @@
75
75
  client:
76
76
  type: library
77
77
  name: Perl
78
- version: "1.0"
78
+ version: "1.0"
79
+ -
80
+ user_agent: Guzzle/3.9.3 curl/7.38.0 PHP/5.6.14-0+deb8u1
81
+ client:
82
+ type: library
83
+ name: Guzzle (PHP HTTP Client)
84
+ version: "3.9.3"
@@ -28,6 +28,12 @@
28
28
  type: mediaplayer
29
29
  name: VLC
30
30
  version: "2.1.0"
31
+ -
32
+ user_agent: LibVLC/2.2.3 (LIVE555 Streaming Media v2015.10.12)
33
+ client:
34
+ type: mediaplayer
35
+ name: VLC
36
+ version: "2.2.3"
31
37
  -
32
38
  user_agent: Mozilla/4.0 (compatible; MSIE 7.0; Windows NT 6.0; FunWebProducts; SLCC1; .NET CLR 2.0.50727; Media Center PC 5.0; .NET CLR 3.0.04506; Windows-Media-Player/10.00.00.3990)
33
39
  client:
@@ -160,4 +166,3 @@
160
166
  type: mediaplayer
161
167
  name: Instacast
162
168
  version: "4.1.2"
163
-
@@ -22,3 +22,9 @@
22
22
  type: mobile app
23
23
  name: FeedR
24
24
  version: "1.0"
25
+ -
26
+ user_agent: Pinterest/3.3.3 CFNetwork/609.1.4 Darwin/13.0.0
27
+ client:
28
+ type: mobile app
29
+ name: Pinterest
30
+ version: "3.3.3"
@@ -76,6 +76,12 @@
76
76
  type: pim
77
77
  name: Postbox
78
78
  version: "1.0"
79
+ -
80
+ user_agent: MailBar/1.3.2 (Mac OS X Version 10.11.1 (Build 15B42))
81
+ client:
82
+ type: pim
83
+ name: MailBar
84
+ version: 1.3.2
79
85
  -
80
86
  user_agent: The Bat! 4.0.0.22
81
87
  client:
@@ -1,723 +1,2418 @@
1
- -
1
+ ---
2
+ -
3
+ user_agent: 360spider-image
4
+ bot:
5
+ name: 360Spider
6
+ category: Search bot
7
+ url: http://www.so.com/help/help_3_2.html
8
+ producer:
9
+ name: Online Media Group, Inc.
10
+ url:
11
+ -
12
+ user_agent: Mozilla/4.0 (compatible; MSIE 8.0; Windows NT 6.1; Trident/4.0; SLCC2; .NET CLR 2.0.50727; .NET CLR 3.5.30729; .NET CLR 3.0.30729; Media Center PC 6.0; MDDR; .NET4.0C; .NET4.0E; .NET CLR 1.1.4322; Tablet PC 2.0); 360Spider
13
+ bot:
14
+ name: 360Spider
15
+ category: Search bot
16
+ url: http://www.so.com/help/help_3_2.html
17
+ producer:
18
+ name: Online Media Group, Inc.
19
+ url:
20
+ -
2
21
  user_agent: Mozilla/5.0 (compatible; MSIE 9.0; Windows NT 6.1; Trident/5.0); 360Spider
3
- name: '360Spider'
4
- -
22
+ bot:
23
+ name: 360Spider
24
+ category: Search bot
25
+ url: http://www.so.com/help/help_3_2.html
26
+ producer:
27
+ name: Online Media Group, Inc.
28
+ url:
29
+ -
5
30
  user_agent: Mozilla/5.0 (Windows NT 6.1) AppleWebKit/537.1 (KHTML, like Gecko) Chrome/21.0.1180.89 Safari/537.1; 360Spider
6
- name: '360Spider'
7
- -
8
- user_agent: Mozilla/4.0 (compatible; MSIE 8.0; Windows NT 6.1; Trident/4.0; SLCC2; .NET CLR 2.0.50727; .NET CLR 3.5.30729; .NET CLR 3.0.30729; Media Center PC 6.0; MDDR; .NET4.0C; .NET4.0E; .NET CLR 1.1.4322; Tablet PC 2.0); 360Spider
9
- name: '360Spider'
10
- -
11
- user_agent: 360spider-image
12
- name: '360Spider'
13
- -
31
+ bot:
32
+ name: 360Spider
33
+ category: Search bot
34
+ url: http://www.so.com/help/help_3_2.html
35
+ producer:
36
+ name: Online Media Group, Inc.
37
+ url:
38
+ -
39
+ user_agent: 'ADmantX Platform Semantic Analyzer - ADmantX Inc. - www.admantx.com - support@admantx.com'
40
+ bot:
41
+ name: ADMantX
42
+ -
14
43
  user_agent: Aboundex/0.3 (http://www.aboundex.com/crawler/)
15
- name: 'Aboundexbot'
16
- -
44
+ bot:
45
+ name: Aboundexbot
46
+ category: Search bot
47
+ url: http://www.aboundex.com/crawler/
48
+ producer:
49
+ name: Aboundex.com
50
+ url: http://www.aboundex.com
51
+ -
17
52
  user_agent: Mozilla/5.0 (compatible; AcoonBot/4.11.1; +http://www.acoon.de/robot.asp)
18
- name: 'Acoon'
19
- -
53
+ bot:
54
+ name: Acoon
55
+ category: Search bot
56
+ url: http://www.acoon.de/robot.asp
57
+ producer:
58
+ name: Acoon GmbH
59
+ url: http://www.acoon.de
60
+ -
20
61
  user_agent: AddThis.com robot tech.support@clearspring.com
21
- name: 'AddThis.com'
22
- -
23
- user_agent: Mozilla/5.0 (compatible; AhrefsBot/3.1; +http://ahrefs.com/robot/
24
- name: 'aHrefs Bot'
25
- -
26
- user_agent: Mozilla/5.0 (compatible; AhrefsBot/5.0; +http://ahrefs.com/robot/)
27
- name: 'aHrefs Bot'
28
- -
29
- user_agent: 'Mozilla/5.0 (compatible; AhrefsBot/5.0; +http://ahrefs.com/robot/) AppEngine-Google; (+http://code.google.com/appengine; appid: s~proxyfile1-hrd)'
30
- name: 'aHrefs Bot'
31
- -
32
- user_agent: AhrefsBot.Feeds v0.1; http://ahrefs.com/
33
- name: 'aHrefs Bot'
34
- -
62
+ bot:
63
+ name: AddThis.com
64
+ category: Social Media Agent
65
+ url:
66
+ producer:
67
+ name: Clearspring Technologies, Inc.
68
+ url: http://www.clearspring.com
69
+ -
35
70
  user_agent: ia_archiver (+http://www.alexa.com/site/help/webmasters; crawler@alexa.com)
36
- name: 'Alexa Crawler'
37
- -
71
+ bot:
72
+ name: Alexa Crawler
73
+ category: Search bot
74
+ url: https://alexa.zendesk.com/hc/en-us/sections/200100794-Crawlers
75
+ producer:
76
+ name: Alexa Internet
77
+ url: http://www.alexa.com
78
+ -
38
79
  user_agent: AmorankSpider/0.1; +http://amorank.com/webcrawler.html
39
- name: 'Amorank Spider'
40
- -
41
- user_agent: Curious George - www.analyticsseo.com/crawler
42
- name: 'Analytics SEO Crawler'
43
- -
44
- user_agent: Mozilla/5.0 (compatible; special_archiver/3.1.1 +http://www.archive.org/details/archive.org_bot)
45
- name: 'archive.org bot'
46
- -
47
- user_agent: Mozilla/5.0 (compatible; special_archiver/3.2.0 +http://www.loc.gov/webarchiving/notice_to_webmasters.html)
48
- name: 'archive.org bot'
49
- -
50
- user_agent: Mozilla/5.0 (compatible; archive.org_bot; Wayback Machine Live Record; +http://archive.org/details/archive.org_bot)
51
- name: 'archive.org bot'
52
- -
53
- user_agent: Mozilla/5.0 (compatible; archive.org_bot/3.3.0 +http://pandora.nla.gov.au/crawl.html)
54
- name: 'archive.org bot'
55
- -
56
- user_agent: Mozilla/5.0 (compatible; archive.org_bot; Archive-It; +http://archive-it.org/files/site-owners.html)
57
- name: 'archive.org bot'
58
- -
59
- user_agent: Mozilla/5.0 (compatible; archive.org_bot +http://www.archive.org/details/archive.org_bot)
60
- name: 'archive.org bot'
61
- -
62
- user_agent: Mozilla/5.0 (compatible; heritrix/3.1.2-SNAPSHOT-20131029-0036 +http://archive.org/details/archive.org_bot)
63
- name: 'archive.org bot'
64
- -
80
+ bot:
81
+ name: Amorank Spider
82
+ category: Crawler
83
+ url: http://amorank.com/webcrawler.html
84
+ producer:
85
+ name: Amorank
86
+ url: http://www.amorank.com
87
+ -
88
+ user_agent: 'Curious George - www.analyticsseo.com/crawler'
89
+ bot:
90
+ name: Analytics SEO Crawler
91
+ category: Crawler
92
+ url: http://www.analyticsseo.com/crawler
93
+ producer:
94
+ name: Analytics SEO
95
+ url: http://www.analyticsseo.com
96
+ -
97
+ user_agent: Mozilla/5.0 (Macintosh; Intel Mac OS X 10_10 _1) AppleWebKit/600.2.5 (KHTML, like Gecko) Version/8.0.2 Safari/600.2.5 (Applebot/0.1; +http://www.apple.com/go/applebot)
98
+ bot:
99
+ name: Applebot
100
+ category: Crawler
101
+ url: http://www.apple.com/go/applebot
102
+ producer:
103
+ name: Apple Inc
104
+ url: http://www.apple.com
105
+ -
106
+ user_agent: Mozilla/5.0 (Macintosh; Intel Mac OS X 10_10_1) AppleWebKit/600.2.5 (KHTML, like Gecko) Version/8.0.2 Safari/600.2.5 (Applebot/0.1)
107
+ bot:
108
+ name: Applebot
109
+ category: Crawler
110
+ url: http://www.apple.com/go/applebot
111
+ producer:
112
+ name: Apple Inc
113
+ url: http://www.apple.com
114
+ -
65
115
  user_agent: Mozilla/2.0 (compatible; Ask Jeeves/Teoma)
66
- name: 'Ask Jeeves'
67
- -
116
+ bot:
117
+ name: Ask Jeeves
118
+ category: Search bot
119
+ url:
120
+ producer:
121
+ name: Ask Jeeves Inc.
122
+ url: http://www.ask.com
123
+ -
124
+ user_agent: Mozilla/5.0 (compatible; BLEXBot/1.0; +http://webmeup-crawler.com/)
125
+ bot:
126
+ name: BLEXBot Crawler
127
+ category: Crawler
128
+ url: http://webmeup-crawler.com
129
+ producer:
130
+ name: WebMeUp
131
+ url: http://webmeup.com
132
+ -
133
+ user_agent: BUbiNG (+http://law.di.unimi.it/BUbiNG.html)
134
+ bot:
135
+ name: BUbiNG
136
+ category: Crawler
137
+ url: http://law.di.unimi.it/BUbiNG.html
138
+ producer:
139
+ name:
140
+ url:
141
+ -
68
142
  user_agent: Backlink-Ceck.de (+http://www.backlink-check.de/bot.html)
69
- name: 'Backlink-Ceck.de'
70
- -
143
+ bot:
144
+ name: Backlink-Ceck.de
145
+ category: Crawler
146
+ url: http://www.backlink-check.de/bot.html
147
+ producer:
148
+ name: Mediagreen Medienservice
149
+ url: http://www.backlink-check.de
150
+ -
71
151
  user_agent: BacklinkCrawler (http://www.backlinktest.com/crawler.html)
72
- name: 'BacklinkCrawler'
73
- -
152
+ bot:
153
+ name: BacklinkCrawler
154
+ category: Crawler
155
+ url: http://www.backlinktest.com/crawler.html
156
+ producer:
157
+ name: 2.0Promotion GbR
158
+ url: http://www.backlinktest.com
159
+ -
160
+ user_agent: Baiduspider+(+http://www.baidu.com/search/spider.htm)
161
+ bot:
162
+ name: Baidu Spider
163
+ category: Search bot
164
+ url: http://www.baidu.com/search/spider.htm
165
+ producer:
166
+ name: Baidu
167
+ url: http://www.baidu.com
168
+ -
169
+ user_agent: Baiduspider-image+(+http://www.baidu.com/search/spider.htm)
170
+ bot:
171
+ name: Baidu Spider
172
+ category: Search bot
173
+ url: http://www.baidu.com/search/spider.htm
174
+ producer:
175
+ name: Baidu
176
+ url: http://www.baidu.com
177
+ -
178
+ user_agent: Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.0; baidu Transcoder;)
179
+ bot:
180
+ name: Baidu Spider
181
+ category: Search bot
182
+ url: http://www.baidu.com/search/spider.htm
183
+ producer:
184
+ name: Baidu
185
+ url: http://www.baidu.com
186
+ -
74
187
  user_agent: Mozilla/5.0 (compatible; Baiduspider/2.0; +http://www.baidu.com/search
75
- name: 'Baidu Spider'
76
- -
188
+ bot:
189
+ name: Baidu Spider
190
+ category: Search bot
191
+ url: http://www.baidu.com/search/spider.htm
192
+ producer:
193
+ name: Baidu
194
+ url: http://www.baidu.com
195
+ -
196
+ user_agent: Mozilla/5.0 (compatible; Baiduspider/2.0; +http://www.baidu.com/search/spider.html)
197
+ bot:
198
+ name: Baidu Spider
199
+ category: Search bot
200
+ url: http://www.baidu.com/search/spider.htm
201
+ producer:
202
+ name: Baidu
203
+ url: http://www.baidu.com
204
+ -
77
205
  user_agent: Mozilla/5.0 (Linux;u;Android 2.3.7;zh-cn;) AppleWebKit/533.1 (KHTML,like Gecko) Version/4.0 Mobile Safari/533.1 (compatible; +http://www.baidu.com/search/spider.html)
78
- name: 'Baidu Spider'
79
- -
206
+ bot:
207
+ name: Baidu Spider
208
+ category: Search bot
209
+ url: http://www.baidu.com/search/spider.htm
210
+ producer:
211
+ name: Baidu
212
+ url: http://www.baidu.com
213
+ -
80
214
  user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1; zh-CN; rv:1.9.2.8;baidu Transcoder) Gecko/20100722 Firefox/3.6.8 ( .NET CLR 3.5.30729)
81
- name: 'Baidu Spider'
82
- -
83
- user_agent: Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.0; baidu Transcoder;)
84
- name: 'Baidu Spider'
85
- -
86
- user_agent: Baiduspider-image+(+http://www.baidu.com/search/spider.htm)
87
- name: 'Baidu Spider'
88
- -
89
- user_agent: Baiduspider+(+http://www.baidu.com/search/spider.htm)
90
- name: 'Baidu Spider'
91
- -
92
- user_agent: Mozilla/5.0 (compatible; Baiduspider/2.0; +http://www.baidu.com/search/spider.html)
93
- name: 'Baidu Spider'
94
- -
95
- user_agent: Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/534+ (KHTML, like Gecko) BingPreview/1.0b
96
- name: 'BingBot'
97
- -
215
+ bot:
216
+ name: Baidu Spider
217
+ category: Search bot
218
+ url: http://www.baidu.com/search/spider.htm
219
+ producer:
220
+ name: Baidu
221
+ url: http://www.baidu.com
222
+ -
223
+ user_agent: Mozilla/5.0 (compatible; BazQux/2.4; +https://bazqux.com/fetcher; 2 subscribers)
224
+ bot:
225
+ name: BazQux Reader
226
+ url: https://bazqux.com/fetcher
227
+ category: Feed Fetcher
228
+ producer:
229
+ name:
230
+ url:
231
+ -
98
232
  user_agent: Mozilla/5.0 (compatible; bingbot/2.0; +http://www.bing.com/bingbot.htm)
99
- name: 'BingBot'
100
- -
233
+ bot:
234
+ name: BingBot
235
+ category: Search bot
236
+ url: http://search.msn.com/msnbot.htmn
237
+ producer:
238
+ name: Microsoft Corporation
239
+ url: http://www.microsoft.com
240
+ -
241
+ user_agent: Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/534+ (KHTML, like Gecko) BingPreview/1.0b
242
+ bot:
243
+ name: BingBot
244
+ category: Search bot
245
+ url: http://search.msn.com/msnbot.htmn
246
+ producer:
247
+ name: Microsoft Corporation
248
+ url: http://www.microsoft.com
249
+ -
101
250
  user_agent: msnbot-media/1.1 (+http://search.msn.com/msnbot.htm)
102
- name: 'BingBot'
103
- -
104
- user_agent: MSNBot/Nutch-1.5.1
105
- name: 'BingBot'
106
- -
107
- user_agent: msnbot/2.0b v1394720947.6703
108
- name: 'BingBot'
109
- -
251
+ bot:
252
+ name: BingBot
253
+ category: Search bot
254
+ url: http://search.msn.com/msnbot.htmn
255
+ producer:
256
+ name: Microsoft Corporation
257
+ url: http://www.microsoft.com
258
+ -
259
+ user_agent: msnbot-NewsBlogs/2.0b (+http://search.msn.com/msnbot.htm)
260
+ bot:
261
+ name: BingBot
262
+ category: Search bot
263
+ url: http://search.msn.com/msnbot.htmn
264
+ producer:
265
+ name: Microsoft Corporation
266
+ url: http://www.microsoft.com
267
+ -
110
268
  user_agent: msnbot/1.1 (+http://search.msn.com/msnbot.htm)
111
- name: 'BingBot'
112
- -
269
+ bot:
270
+ name: BingBot
271
+ category: Search bot
272
+ url: http://search.msn.com/msnbot.htmn
273
+ producer:
274
+ name: Microsoft Corporation
275
+ url: http://www.microsoft.com
276
+ -
113
277
  user_agent: msnbot/2.0b (+http://search.msn.com/msnbot.htm)
114
- name: 'BingBot'
115
- -
116
- user_agent: msnbot-NewsBlogs/2.0b (+http://search.msn.com/msnbot.htm)
117
- name: 'BingBot'
118
- -
278
+ bot:
279
+ name: BingBot
280
+ category: Search bot
281
+ url: http://search.msn.com/msnbot.htmn
282
+ producer:
283
+ name: Microsoft Corporation
284
+ url: http://www.microsoft.com
285
+ -
286
+ user_agent: msnbot/2.0b v1394720947.6703
287
+ bot:
288
+ name: BingBot
289
+ category: Search bot
290
+ url: http://search.msn.com/msnbot.htmn
291
+ producer:
292
+ name: Microsoft Corporation
293
+ url: http://www.microsoft.com
294
+ -
295
+ user_agent: MSNBot/Nutch-1.5.1
296
+ bot:
297
+ name: BingBot
298
+ category: Search bot
299
+ url: http://search.msn.com/msnbot.htmn
300
+ producer:
301
+ name: Microsoft Corporation
302
+ url: http://www.microsoft.com
303
+ -
119
304
  user_agent: Mozilla/5.0 (compatible; Blekkobot; ScoutJet; +http://blekko.com/about/blekkobot)
120
- name: 'Blekkobot'
121
- -
122
- user_agent: Mozilla/5.0 (compatible; BLEXBot/1.0; +http://webmeup-crawler.com/)
123
- name: 'BLEXBot Crawler'
124
- -
305
+ bot:
306
+ name: Blekkobot
307
+ category: Search bot
308
+ url: http://blekko.com/about/blekkobot
309
+ producer:
310
+ name: Blekko
311
+ url: http://blekko.com
312
+ -
313
+ user_agent: Bloglovin/1.0 (http://www.bloglovin.com; 1 subscribers)
314
+ bot:
315
+ name: Bloglovin
316
+ url: http://www.bloglovin.com
317
+ category: Feed Fetcher
318
+ producer:
319
+ name:
320
+ url:
321
+ -
322
+ user_agent: Blogtrottr/2.0
323
+ bot:
324
+ name: Blogtrottr
325
+ url:
326
+ category: Feed Fetcher
327
+ producer:
328
+ name: Blogtrottr Ltd
329
+ url: https://blogtrottr.com/
330
+ -
125
331
  user_agent: Mozilla/5.0 (compatible; BountiiBot/1.1; +http://bountii.com/contact.php)
126
- name: 'Bountii Bot'
127
- -
128
- user_agent: Mozilla/5.0 (Macintosh; Butterfly/1.0; +http://labs.topsy.com/butterfly/) Gecko/2009032608 Firefox/3.0.8
129
- name: 'Butterfly Robot'
130
- -
131
- user_agent: Mozilla/5.0 (compatible; Butterfly/1.0; +http://labs.topsy.com/butterfly/) Gecko/2009032608 Firefox/3.0.8
132
- name: 'Butterfly Robot'
133
- -
332
+ bot:
333
+ name: Bountii Bot
334
+ category: Search bot
335
+ url: http://bountii.com/contact.php
336
+ producer:
337
+ name: Bountii Inc.
338
+ url: http://bountii.com
339
+ -
134
340
  user_agent: Browsershots
135
- name: 'Browsershots'
136
- -
341
+ bot:
342
+ name: Browsershots
343
+ category: Service Agent
344
+ url: http://browsershots.org/faq
345
+ producer:
346
+ name: Browsershots.org
347
+ url: http://browsershots.org
348
+ -
349
+ user_agent: Mozilla/5.0 (compatible; Butterfly/1.0; +http://labs.topsy.com/butterfly/) Gecko/2009032608 Firefox/3.0.8
350
+ bot:
351
+ name: Butterfly Robot
352
+ category: Search bot
353
+ url: http://labs.topsy.com/butterfly
354
+ producer:
355
+ name: Topsy Labs
356
+ url: http://labs.topsy.com
357
+ -
358
+ user_agent: Mozilla/5.0 (Macintosh; Butterfly/1.0; +http://labs.topsy.com/butterfly/) Gecko/2009032608 Firefox/3.0.8
359
+ bot:
360
+ name: Butterfly Robot
361
+ category: Search bot
362
+ url: http://labs.topsy.com/butterfly
363
+ producer:
364
+ name: Topsy Labs
365
+ url: http://labs.topsy.com
366
+ -
137
367
  user_agent: Mozilla/5.0 (compatible; CareerBot/1.1; +http://www.career-x.de/bot.html)
138
- name: 'CareerBot'
139
- -
140
- user_agent: CCBot/2.0 (http://commoncrawl.org/faq/)
141
- name: 'ccBot crawler'
142
- -
368
+ bot:
369
+ name: CareerBot
370
+ category: Crawler
371
+ url: http://www.career-x.de/bot.html
372
+ producer:
373
+ name: career-x GmbH
374
+ url: http://www.career-x.de
375
+ -
143
376
  user_agent: Cliqzbot/0.1 (+http://cliqz.com/company/cliqzbot)
144
- name: 'Cliqzbot'
145
- -
377
+ bot:
378
+ name: Cliqzbot
379
+ category: Crawler
380
+ url: http://cliqz.com/company/cliqzbot
381
+ producer:
382
+ name: 10betterpages GmbH
383
+ url: http://cliqz.com
384
+ -
146
385
  user_agent: Mozilla/5.0 (compatible; CloudFlare-AlwaysOnline/1.0; +http://www.cloudflare.com/always-online) AppleWebKit/534.34
147
- name: 'CloudFlare Always Online'
148
- -
386
+ bot:
387
+ name: CloudFlare Always Online
388
+ category: Site Monitor
389
+ url: http://www.cloudflare.com/always-online
390
+ producer:
391
+ name: CloudFlare
392
+ url: http://www.cloudflare.com
393
+ -
394
+ user_agent: CommaFeed/1.0 (http://www.commafeed.com)
395
+ bot:
396
+ name: CommaFeed
397
+ url: http://www.commafeed.com
398
+ category: Feed Fetcher
399
+ producer:
400
+ name:
401
+ url:
402
+ -
403
+ user_agent: Mozilla/5.0 (compatible; coccoc/1.0; +http://help.coccoc.com/)
404
+ bot:
405
+ name: Cốc Cốc Bot
406
+ url: http://help.coccoc.com/
407
+ category: Search bot
408
+ producer:
409
+ name: Cốc Cốc
410
+ url: http://coccoc.com/
411
+ -
412
+ user_agent: Mozilla/5.0 (compatible; MSIE or Firefox mutant; not on Windows server;) Daumoa/4.0;
413
+ bot:
414
+ name: Daum
415
+ category: Search bot
416
+ url: http://tab.search.daum.net/aboutWebSearch_en.html
417
+ producer:
418
+ name: Daum Communications Corp.
419
+ url: http://www.kakaocorp.com/main
420
+ -
421
+ user_agent: Mozilla/5.0 (compatible; MSIE or Firefox mutant;) Daum 4.1
422
+ bot:
423
+ name: Daum
424
+ category: Search bot
425
+ url: http://tab.search.daum.net/aboutWebSearch_en.html
426
+ producer:
427
+ name: Daum Communications Corp.
428
+ url: http://www.kakaocorp.com/main
429
+ -
149
430
  user_agent: Mozilla/5.0 (compatible; Dazoobot/0.1; +http://dazoo.fr)
150
- name: 'Dazoobot'
151
- -
431
+ bot:
432
+ name: Dazoobot
433
+ category: Search bot
434
+ url:
435
+ producer:
436
+ name: DAZOO.FR
437
+ url: http://dazoo.fr
438
+ -
152
439
  user_agent: Mozilla/5.0 (compatible; discobot/1.0; +http://discoveryengine.com/discobot.html)
153
- name: 'Discobot'
154
- -
440
+ bot:
441
+ name: Discobot
442
+ category: Search bot
443
+ url: http://discoveryengine.com/discobot.html
444
+ producer:
445
+ name: Discovery Engine
446
+ url: http://discoveryengine.com
447
+ -
448
+ user_agent: 'Domain Re-Animator Bot (http://domainreanimator.com) - support@domainreanimator.com'
449
+ bot:
450
+ name: Domain Re-Animator Bot
451
+ category: Crawler
452
+ url:
453
+ producer:
454
+ name: Domain Re-Animator, LLC
455
+ url: http://domainreanimator.com
456
+ -
457
+ user_agent: support@domainreanimator.com
458
+ bot:
459
+ name: Domain Re-Animator Bot
460
+ category: Crawler
461
+ url:
462
+ producer:
463
+ name: Domain Re-Animator, LLC
464
+ url: http://domainreanimator.com
465
+ -
155
466
  user_agent: dotbot
156
- name: 'DotBot'
157
- -
467
+ bot:
468
+ name: DotBot
469
+ category: Crawler
470
+ url: http://www.opensiteexplorer.org/dotbot
471
+ producer:
472
+ name: SEOmoz, Inc.
473
+ url: http://moz.com/
474
+ -
475
+ user_agent: EMail Exractor
476
+ bot:
477
+ name: EMail Exractor
478
+ category: Crawler
479
+ url:
480
+ producer:
481
+ name:
482
+ url:
483
+ -
158
484
  user_agent: Mozilla/5.0 (compatible; EasouSpider; +http://www.easou.com/search/spider.html)
159
- name: 'Easou Spider'
160
- -
485
+ bot:
486
+ name: Easou Spider
487
+ category: Search bot
488
+ url: http://www.easou.com/search/spider.html
489
+ producer:
490
+ name: easou ICP
491
+ url: http://www.easou.com
492
+ -
161
493
  user_agent: Mozilla/5.0 (iPhone; U; CPU iPhone OS 3_0 like Mac OS X; en-us; EasouSpider; +http://www.easou.com/search/spider.html)
162
- name: 'Easou Spider'
163
- -
164
- user_agent: EMail Exractor
165
- name: 'EMail Exractor'
166
- -
167
- user_agent: Mozilla/5.0 (compatible; Exabot/3.0; +http://www.exabot.com/go/robot)
168
- name: 'ExaBot'
169
- -
494
+ bot:
495
+ name: Easou Spider
496
+ category: Search bot
497
+ url: http://www.easou.com/search/spider.html
498
+ producer:
499
+ name: easou ICP
500
+ url: http://www.easou.com
501
+ -
170
502
  user_agent: Mozilla/5.0 (compatible; Exabot/3.0 (BiggerBetter); +http://www.exabot.com/go/robot)
171
- name: 'ExaBot'
172
- -
503
+ bot:
504
+ name: ExaBot
505
+ category: Crawler
506
+ url: http://www.exabot.com/go/robot
507
+ producer:
508
+ name: Dassault Systèmes
509
+ url: http://www.3ds.com
510
+ -
511
+ user_agent: Mozilla/5.0 (compatible; Exabot/3.0; +http://www.exabot.com/go/robot)
512
+ bot:
513
+ name: ExaBot
514
+ category: Crawler
515
+ url: http://www.exabot.com/go/robot
516
+ producer:
517
+ name: Dassault Systèmes
518
+ url: http://www.3ds.com
519
+ -
173
520
  user_agent: Mozilla/5.0 (compatible; Konqueror/3.5; Linux) KHTML/3.5.5 (like Gecko) (Exabot-Thumbnails)
174
- name: 'ExaBot'
175
- -
521
+ bot:
522
+ name: ExaBot
523
+ category: Crawler
524
+ url: http://www.exabot.com/go/robot
525
+ producer:
526
+ name: Dassault Systèmes
527
+ url: http://www.3ds.com
528
+ -
176
529
  user_agent: ExactSeek Crawler (nutch 1.4)/Nutch-1.4 (ExactSeek Crawler; http://www.exactseek.com)
177
- name: 'ExactSeek Crawler'
178
- -
530
+ bot:
531
+ name: ExactSeek Crawler
532
+ category: Search bot
533
+ url: http://www.exactseek.com
534
+ producer:
535
+ name: Jayde Online, Inc.
536
+ url: http://www.jaydeonlineinc.com
537
+ -
179
538
  user_agent: Mozilla/5.0 (compatible; Ezooms/1.0; help@moz.com)
180
- name: 'Ezooms'
181
- -
539
+ bot:
540
+ name: Ezooms
541
+ category: Crawler
542
+ url:
543
+ producer:
544
+ name: SEOmoz, Inc.
545
+ url: http://moz.com/
546
+ -
182
547
  user_agent: facebookexternalhit/1.1 (+http://www.facebook.com/externalhit_uatext.php)
183
- name: 'Facebook External Hit'
184
- -
548
+ bot:
549
+ name: Facebook External Hit
550
+ category: Social Media Agent
551
+ url: https://www.facebook.com/externalhit_uatext.php
552
+ producer:
553
+ name: Facebook
554
+ url: http://www.facebook.com
555
+ -
185
556
  user_agent: facebookplatform/1.0 (+http://developers.facebook.com)
186
- name: 'Facebook External Hit'
187
- -
557
+ bot:
558
+ name: Facebook External Hit
559
+ category: Social Media Agent
560
+ url: https://www.facebook.com/externalhit_uatext.php
561
+ producer:
562
+ name: Facebook
563
+ url: http://www.facebook.com
564
+ -
565
+ user_agent: Feed Wrangler/1.0 (3 subscribers; feed-id=248559; http://feedwrangler.net; Allow like Gecko)
566
+ bot:
567
+ name: Feed Wrangler
568
+ url: https://feedwrangler.net/
569
+ category: Feed Fetcher
570
+ producer:
571
+ name: 'David Smith & Developing Perspective, LLC'
572
+ url: https://david-smith.org
573
+ -
574
+ user_agent: FeedBurner/1.0 (http://www.FeedBurner.com)
575
+ bot:
576
+ name: FeedBurner
577
+ url: http://www.feedburner.com
578
+ category: Feed Fetcher
579
+ producer:
580
+ name:
581
+ url:
582
+ -
583
+ user_agent: 'Feedbin - 9 subscribers'
584
+ bot:
585
+ name: Feedbin
586
+ url: http://feedbin.com/
587
+ category: Feed Fetcher
588
+ producer:
589
+ name:
590
+ url:
591
+ -
592
+ user_agent: Feedly/1.0 (+http://www.feedly.com/fetcher.html; like FeedFetcher-Google)
593
+ bot:
594
+ name: Feedly
595
+ url: http://www.feedly.com
596
+ category: Feed Fetcher
597
+ producer:
598
+ name:
599
+ url:
600
+ -
601
+ user_agent: FeedlyApp/1.0 (http://www.feedly.com)
602
+ bot:
603
+ name: Feedly
604
+ url: http://www.feedly.com
605
+ category: Feed Fetcher
606
+ producer:
607
+ name:
608
+ url:
609
+ -
610
+ user_agent: FeedlyBot/1.0 (http://feedly.com)
611
+ bot:
612
+ name: Feedly
613
+ url: http://www.feedly.com
614
+ category: Feed Fetcher
615
+ producer:
616
+ name:
617
+ url:
618
+ -
619
+ user_agent: MetaFeedly/1.0 (http://www.feedly.com)
620
+ bot:
621
+ name: Feedly
622
+ url: http://www.feedly.com
623
+ category: Feed Fetcher
624
+ producer:
625
+ name:
626
+ url:
627
+ -
628
+ user_agent: Feedspot http://www.feedspot.com
629
+ bot:
630
+ name: Feedspot
631
+ url: http://www.feedspot.com
632
+ category: Feed Fetcher
633
+ producer:
634
+ name:
635
+ url:
636
+ -
637
+ user_agent: Fever/1.38 (Feed Parser; http://feedafever.com; Allow like Gecko)
638
+ bot:
639
+ name: Fever
640
+ url: http://feedafever.com/
641
+ category: Feed Fetcher
642
+ producer:
643
+ name:
644
+ url:
645
+ -
646
+ user_agent: niki-bot
647
+ bot:
648
+ name: Generic Bot
649
+ -
650
+ user_agent: StatusCake Error Detector Crawler V0.01
651
+ bot:
652
+ name: Generic Bot
653
+ -
188
654
  user_agent: Mozilla/5.0 (compatible; Genieo/1.0 http://www.genieo.com/webfilter.html)
189
- name: 'Genieo Web filter'
190
- -
655
+ bot:
656
+ name: Genieo Web filter
657
+ category:
658
+ url: http://www.genieo.com/webfilter.html
659
+ producer:
660
+ name: Genieo
661
+ url: http://www.genieo.com
662
+ -
663
+ user_agent: Mozilla/5.0 (compatible; Gluten Free Crawler/1.0; +http://glutenfreepleasure.com/)
664
+ bot:
665
+ name: Gluten Free Crawler
666
+ category: Crawler
667
+ url: http://glutenfreepleasure.com/
668
+ producer:
669
+ name:
670
+ url:
671
+ -
672
+ user_agent: Mozilla/5.0 (Windows NT 5.1; rv:11.0) Gecko Firefox/11.0 (via ggpht.com GoogleImageProxy)
673
+ bot:
674
+ name: Gmail Image Proxy
675
+ category: Crawler
676
+ url:
677
+ producer:
678
+ name: Google Inc.
679
+ url: http://www.google.com
680
+ -
191
681
  user_agent: DoCoMo/2.0 P900i(c100;TB;W24H11) (compatible; ichiro/mobile goo; +http://search.goo.ne.jp/option/use/sub4/sub4-1/)
192
- name: 'Goo'
193
- -
682
+ bot:
683
+ name: Goo
684
+ category: Search bot
685
+ url: http://search.goo.ne.jp/option/use/sub4/sub4-1
686
+ producer:
687
+ name: NTT Resonant
688
+ url: http://goo.ne.jp
689
+ -
194
690
  user_agent: Mozilla/5.0 (iPhone; U; CPU iPhone OS 4_0_1 like Mac OS X; en-us) AppleWebKit/537.4 (KHTML, like Gecko; Google Page Speed Insights) Version/4.0.5 Mobile/8A306 Safari/6531.22.7
195
- name: 'Google PageSpeed Insights'
196
- -
691
+ bot:
692
+ name: Google PageSpeed Insights
693
+ category: Site Monitor
694
+ url: http://developers.google.com/speed/pagespeed/insights/
695
+ producer:
696
+ name: Google Inc.
697
+ url: http://www.google.com
698
+ -
699
+ user_agent: Mozilla/5.0 (Windows NT 5.1) AppleWebKit/535.1 (KHTML, like Gecko) Chrome/14.0.835.202 Safari/535.1 google_partner_monitoring FWSzVTDDBz14547302713138T
700
+ bot:
701
+ name: Google Partner Monitoring
702
+ category: Site Monitor
703
+ url:
704
+ producer:
705
+ name: Google Inc.
706
+ url: http://www.google.com
707
+ -
708
+ user_agent: AdsBot-Google (+http://www.google.com/adsbot.html)
709
+ bot:
710
+ name: Googlebot
711
+ category: Search bot
712
+ url: http://www.google.com/bot.html
713
+ producer:
714
+ name: Google Inc.
715
+ url: http://www.google.com
716
+ -
717
+ user_agent: AdsBot-Google-Mobile (+http://www.google.com/mobile/adsbot.html) Mozilla (iPhone; U; CPU iPhone OS 3 0 like Mac OS X) AppleWebKit (KHTML, like Gecko) Mobile Safari
718
+ bot:
719
+ name: Googlebot
720
+ category: Search bot
721
+ url: http://www.google.com/bot.html
722
+ producer:
723
+ name: Google Inc.
724
+ url: http://www.google.com
725
+ -
726
+ user_agent: DoCoMo/2.0 N905i(c100;TB;W24H16) (compatible; Googlebot-Mobile/2.1; +http://www.google.com/bot.html)
727
+ bot:
728
+ name: Googlebot
729
+ category: Search bot
730
+ url: http://www.google.com/bot.html
731
+ producer:
732
+ name: Google Inc.
733
+ url: http://www.google.com
734
+ -
735
+ user_agent: Feedfetcher-Google; (+http://www.google.com/feedfetcher.html; 19 subscribers; feed-id=13965549748850348809)
736
+ bot:
737
+ name: Googlebot
738
+ category: Search bot
739
+ url: http://www.google.com/bot.html
740
+ producer:
741
+ name: Google Inc.
742
+ url: http://www.google.com
743
+ -
744
+ user_agent: Feedfetcher-Google; (+http://www.google.com/feedfetcher.html; 2 subscribers; feed-id=17860707833818568603)
745
+ bot:
746
+ name: Googlebot
747
+ category: Search bot
748
+ url: http://www.google.com/bot.html
749
+ producer:
750
+ name: Google Inc.
751
+ url: http://www.google.com
752
+ -
753
+ user_agent: Feedfetcher-Google; (+http://www.google.com/feedfetcher.html; 375 subscribers; feed-id=15381863289700640853)
754
+ bot:
755
+ name: Googlebot
756
+ category: Search bot
757
+ url: http://www.google.com/bot.html
758
+ producer:
759
+ name: Google Inc.
760
+ url: http://www.google.com
761
+ -
762
+ user_agent: Googlebot (gocrawl v0.4)
763
+ bot:
764
+ name: Googlebot
765
+ category: Search bot
766
+ url: http://www.google.com/bot.html
767
+ producer:
768
+ name: Google Inc.
769
+ url: http://www.google.com
770
+ -
771
+ user_agent: Googlebot-Image/1.0
772
+ bot:
773
+ name: Googlebot
774
+ category: Search bot
775
+ url: http://www.google.com/bot.html
776
+ producer:
777
+ name: Google Inc.
778
+ url: http://www.google.com
779
+ -
780
+ user_agent: Googlebot-News (2.3.3, ruby 1.9.3 (2013-11-22))
781
+ bot:
782
+ name: Googlebot
783
+ category: Search bot
784
+ url: http://www.google.com/bot.html
785
+ producer:
786
+ name: Google Inc.
787
+ url: http://www.google.com
788
+ -
789
+ user_agent: Googlebot-Video/1.0
790
+ bot:
791
+ name: Googlebot
792
+ category: Search bot
793
+ url: http://www.google.com/bot.html
794
+ producer:
795
+ name: Google Inc.
796
+ url: http://www.google.com
797
+ -
197
798
  user_agent: Googlebot/2.1 (http://www.googlebot.com/bot.html)
198
- name: 'Googlebot'
199
- -
799
+ bot:
800
+ name: Googlebot
801
+ category: Search bot
802
+ url: http://www.google.com/bot.html
803
+ producer:
804
+ name: Google Inc.
805
+ url: http://www.google.com
806
+ -
200
807
  user_agent: Googlebot/Nutch-1.7
201
- name: 'Googlebot'
202
- -
203
- user_agent: Mozilla/5.0 AppleWebKit/537.36 (KHTML, like Gecko; compatible; Googlebot/2.1; +http://www.google.com/bot.html) Safari/537.36
204
- name: 'Googlebot'
205
- -
808
+ bot:
809
+ name: Googlebot
810
+ category: Search bot
811
+ url: http://www.google.com/bot.html
812
+ producer:
813
+ name: Google Inc.
814
+ url: http://www.google.com
815
+ -
816
+ user_agent: GoogleProducer; (+http://goo.gl/7y4SX)
817
+ bot:
818
+ name: Googlebot
819
+ category: Search bot
820
+ url: http://www.google.com/bot.html
821
+ producer:
822
+ name: Google Inc.
823
+ url: http://www.google.com
824
+ -
825
+ user_agent: Mediapartners-Google
826
+ bot:
827
+ name: Googlebot
828
+ category: Search bot
829
+ url: http://www.google.com/bot.html
830
+ producer:
831
+ name: Google Inc.
832
+ url: http://www.google.com
833
+ -
834
+ user_agent: Mozilla/5.0 (compatible) Feedfetcher-Google;(+http://www.google.com/feedfetcher.html)
835
+ bot:
836
+ name: Googlebot
837
+ category: Search bot
838
+ url: http://www.google.com/bot.html
839
+ producer:
840
+ name: Google Inc.
841
+ url: http://www.google.com
842
+ -
206
843
  user_agent: Mozilla/5.0 (compatible; Googlebot/2.1; +http://www.google.com/bot.html)
207
- name: 'Googlebot'
208
- -
844
+ bot:
845
+ name: Googlebot
846
+ category: Search bot
847
+ url: http://www.google.com/bot.html
848
+ producer:
849
+ name: Google Inc.
850
+ url: http://www.google.com
851
+ -
209
852
  user_agent: Mozilla/5.0 (iPhone; CPU iPhone OS 6_0 like Mac OS X) AppleWebKit/536.26 (KHTML, like Gecko) Version/6.0 Mobile/10A5376e Safari/8536.25 (compatible; Googlebot-Mobile/2.1; +http://www.google.com/bot.html)
210
- name: 'Googlebot'
211
- -
212
- user_agent: Googlebot-Image/1.0
213
- name: 'Googlebot'
214
- -
215
- user_agent: Googlebot-Video/1.0
216
- name: 'Googlebot'
217
- -
218
- user_agent: Googlebot (gocrawl v0.4)
219
- name: 'Googlebot'
220
- -
221
- user_agent: Googlebot-News (2.3.3, ruby 1.9.3 (2013-11-22))
222
- name: 'Googlebot'
223
- -
224
- user_agent: DoCoMo/2.0 N905i(c100;TB;W24H16) (compatible; Googlebot-Mobile/2.1; +http://www.google.com/bot.html)
225
- name: 'Googlebot'
226
- -
227
- user_agent: SAMSUNG-SGH-E250/1.0 Profile/MIDP-2.0 Configuration/CLDC-1.1 UP.Browser/6.2.3.3.c.1.101 (GUI) MMP/2.0 (compatible; Googlebot-Mobile/2.1; +http://www.google.com/bot.html)
228
- name: 'Googlebot'
229
- -
230
- user_agent: Mozilla/5.0 (compatible) Feedfetcher-Google;(+http://www.google.com/feedfetcher.html)
231
- name: 'Googlebot'
232
- -
233
- user_agent: Feedfetcher-Google; (+http://www.google.com/feedfetcher.html; 2 subscribers; feed-id=17860707833818568603)
234
- name: 'Googlebot'
235
- -
236
- user_agent: Feedfetcher-Google; (+http://www.google.com/feedfetcher.html; 19 subscribers; feed-id=13965549748850348809)
237
- name: 'Googlebot'
238
- -
239
- user_agent: Feedfetcher-Google; (+http://www.google.com/feedfetcher.html; 375 subscribers; feed-id=15381863289700640853)
240
- name: 'Googlebot'
241
- -
853
+ bot:
854
+ name: Googlebot
855
+ category: Search bot
856
+ url: http://www.google.com/bot.html
857
+ producer:
858
+ name: Google Inc.
859
+ url: http://www.google.com
860
+ -
861
+ user_agent: Mozilla/5.0 (Linux; Android 4.0.4; Galaxy Nexus Build/IMM76B) AppleWebKit/537.36 (KHTML, like Gecko; Google-Publisher-Plugin) Chrome/27.0.1453 Mobile Safari/537.36
862
+ bot:
863
+ name: Googlebot
864
+ category: Search bot
865
+ url: http://www.google.com/bot.html
866
+ producer:
867
+ name: Google Inc.
868
+ url: http://www.google.com
869
+ -
242
870
  user_agent: Mozilla/5.0 (Windows NT 6.1; rv:6.0) Gecko/20110814 Firefox/6.0 Google (+https://developers.google.com/+/web/snippet/)
243
- name: 'Googlebot'
244
- -
245
- user_agent: GoogleProducer; (+http://goo.gl/7y4SX)
246
- name: 'Googlebot'
247
- -
871
+ bot:
872
+ name: Googlebot
873
+ category: Search bot
874
+ url: http://www.google.com/bot.html
875
+ producer:
876
+ name: Google Inc.
877
+ url: http://www.google.com
878
+ -
248
879
  user_agent: Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko; Google Web Preview) Chrome/27.0.1453 Safari/537.36
249
- name: 'Googlebot'
250
- -
251
- user_agent: AdsBot-Google-Mobile (+http://www.google.com/mobile/adsbot.html) Mozilla (iPhone; U; CPU iPhone OS 3 0 like Mac OS X) AppleWebKit (KHTML, like Gecko) Mobile Safari
252
- name: 'Googlebot'
253
- -
254
- user_agent: AdsBot-Google (+http://www.google.com/adsbot.html)
255
- name: 'Googlebot'
256
- -
257
- user_agent: Mediapartners-Google
258
- name: 'Googlebot'
259
- -
880
+ bot:
881
+ name: Googlebot
882
+ category: Search bot
883
+ url: http://www.google.com/bot.html
884
+ producer:
885
+ name: Google Inc.
886
+ url: http://www.google.com
887
+ -
888
+ user_agent: Mozilla/5.0 AppleWebKit/537.36 (KHTML, like Gecko; compatible; Googlebot/2.1; +http://www.google.com/bot.html) Safari/537.36
889
+ bot:
890
+ name: Googlebot
891
+ category: Search bot
892
+ url: http://www.google.com/bot.html
893
+ producer:
894
+ name: Google Inc.
895
+ url: http://www.google.com
896
+ -
897
+ user_agent: SAMSUNG-SGH-E250/1.0 Profile/MIDP-2.0 Configuration/CLDC-1.1 UP.Browser/6.2.3.3.c.1.101 (GUI) MMP/2.0 (compatible; Googlebot-Mobile/2.1; +http://www.google.com/bot.html)
898
+ bot:
899
+ name: Googlebot
900
+ category: Search bot
901
+ url: http://www.google.com/bot.html
902
+ producer:
903
+ name: Google Inc.
904
+ url: http://www.google.com
905
+ -
906
+ user_agent: HTTPMon/1.0b (http://www.httpmon.com)
907
+ bot:
908
+ name: HTTPMon
909
+ category: Site Monitor
910
+ url: http://www.httpmon.com
911
+ producer:
912
+ name: towards GmbH
913
+ url: http://www.towards.ch/
914
+ -
915
+ user_agent: 'flieder - neofonie heritrix/1.14.3 (+http://spider.neofonie.de)'
916
+ bot:
917
+ name: Heritrix
918
+ category: Crawler
919
+ url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
920
+ producer:
921
+ name: The Internet Archive
922
+ url: http://www.archive.org
923
+ -
924
+ user_agent: Mozilla/5.0 (compatible; heritrix/1.14.4 +http://webarhive.nlc.gov.cn)
925
+ bot:
926
+ name: Heritrix
927
+ category: Crawler
928
+ url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
929
+ producer:
930
+ name: The Internet Archive
931
+ url: http://www.archive.org
932
+ -
260
933
  user_agent: Mozilla/5.0 (compatible; heritrix/1.14.4 +http://www.dla-marbach.de)
261
- name: 'Heritrix'
262
- -
263
- user_agent: Mozilla/5.0 (compatible; worio bot heritrix/1.10.0 +http://worio.com)
264
- name: 'Heritrix'
265
- -
266
- user_agent: Mozilla/5.0 (compatible; heritrix/3.1.1 +http://www.baidu.com)
267
- name: 'Heritrix'
268
- -
269
- user_agent: flieder - neofonie heritrix/1.14.3 (+http://spider.neofonie.de)
270
- name: 'Heritrix'
271
- -
934
+ bot:
935
+ name: Heritrix
936
+ category: Crawler
937
+ url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
938
+ producer:
939
+ name: The Internet Archive
940
+ url: http://www.archive.org
941
+ -
272
942
  user_agent: mozilla/5.0 (compatible; heritrix/1.3.0 http://archive.crawler.org)
273
- name: 'Heritrix'
274
- -
275
- user_agent: Mozilla/5.0 (compatible; heritrix/3.1.2-SNAPSHOT-20130207.001528 +http://webarchiv.cz/kontakty/)
276
- name: 'Heritrix'
277
- -
278
- user_agent: Mozilla/5.0 (compatible; heritrix/1.14.4 +http://webarhive.nlc.gov.cn)
279
- name: 'Heritrix'
280
- -
943
+ bot:
944
+ name: Heritrix
945
+ category: Crawler
946
+ url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
947
+ producer:
948
+ name: The Internet Archive
949
+ url: http://www.archive.org
950
+ -
951
+ user_agent: Mozilla/5.0 (compatible; heritrix/3.1.1 +http://www.baidu.com)
952
+ bot:
953
+ name: Heritrix
954
+ category: Crawler
955
+ url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
956
+ producer:
957
+ name: The Internet Archive
958
+ url: http://www.archive.org
959
+ -
281
960
  user_agent: Mozilla/5.0 (compatible; heritrix/3.1.1 +http://www.run4dom.com)
282
- name: 'Heritrix'
283
- -
284
- user_agent: HTTPMon/1.0b (http://www.httpmon.com)
285
- name: 'HTTPMon'
286
- -
961
+ bot:
962
+ name: Heritrix
963
+ category: Crawler
964
+ url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
965
+ producer:
966
+ name: The Internet Archive
967
+ url: http://www.archive.org
968
+ -
969
+ user_agent: Mozilla/5.0 (compatible; heritrix/3.1.2-SNAPSHOT-20130207.001528 +http://webarchiv.cz/kontakty/)
970
+ bot:
971
+ name: Heritrix
972
+ category: Crawler
973
+ url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
974
+ producer:
975
+ name: The Internet Archive
976
+ url: http://www.archive.org
977
+ -
978
+ user_agent: Mozilla/5.0 (compatible; worio bot heritrix/1.10.0 +http://worio.com)
979
+ bot:
980
+ name: Heritrix
981
+ category: Crawler
982
+ url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
983
+ producer:
984
+ name: The Internet Archive
985
+ url: http://www.archive.org
986
+ -
987
+ user_agent: HubPages V0.2.2 (http://hubpages.com/help/crawlingpolicy)
988
+ bot:
989
+ name: HubPages
990
+ category: Crawler
991
+ url: http://hubpages.com/help/crawlingpolicy
992
+ producer:
993
+ name: HubPages
994
+ url: http://hubpages.com/
995
+ -
996
+ user_agent: ICC-Crawler/2.0 (Mozilla-compatible; ; http://www.nict.go.jp/en/univ-com/plan/crawl.html)
997
+ bot:
998
+ name: ICC-Crawler
999
+ category: Crawler
1000
+ url: http://www.nict.go.jp/en/univ-com/plan/crawl.html
1001
+ producer:
1002
+ name:
1003
+ url:
1004
+ -
287
1005
  user_agent: iisbot/1.0 (+http://www.iis.net/iisbot.html)
288
- name: 'IIS Site Analysis'
289
- -
290
- user_agent: Mozilla/5.0 (iPhone; U; CPU iPhone OS 4_1 like Mac OS X; en-us) AppleWebKit/532.9 (KHTML, like Gecko) Version/4.0.5 Mobile/8B117 Safari/6531.22.7 (compatible; linkdexbot-mobile/2.1; +http://www.linkdex.com/about/bots/)
291
- name: 'Linkdex Bot'
292
- -
293
- user_agent: Mozilla/5.0 (compatible; linkdexbot/2.0; +http://www.linkdex.com/about/bots/)
294
- name: 'Linkdex Bot'
295
- -
1006
+ bot:
1007
+ name: IIS Site Analysis
1008
+ category: Crawler
1009
+ url: http://www.iis.net/iisbot.html
1010
+ producer:
1011
+ name: Microsoft Corporation
1012
+ url: http://www.microsoft.com
1013
+ -
1014
+ user_agent: kouio.com RSS reader
1015
+ bot:
1016
+ name: Kouio
1017
+ url: http://kouio.com/
1018
+ category: Feed Fetcher
1019
+ producer:
1020
+ name:
1021
+ url:
1022
+ -
1023
+ user_agent: 'kouio.com RSS reader - 6 subscribers'
1024
+ bot:
1025
+ name: Kouio
1026
+ url: http://kouio.com/
1027
+ category: Feed Fetcher
1028
+ producer:
1029
+ name:
1030
+ url:
1031
+ -
1032
+ user_agent: 'ltx71 - (http://ltx71.com/)'
1033
+ bot:
1034
+ name: LTX71
1035
+ url: http://ltx71.com/
1036
+ producer:
1037
+ name:
1038
+ url:
1039
+ -
1040
+ user_agent: larbin_2.6.3 larbin2.6.3@unspecified.mail
1041
+ bot:
1042
+ name: Larbin web crawler
1043
+ category: Crawler
1044
+ url: http://larbin.sourceforge.net
1045
+ producer:
1046
+ name:
1047
+ url:
1048
+ -
296
1049
  user_agent: linkdex.com/v2.0 and linkdex.com/v2.1
297
- name: 'Linkdex Bot'
298
- -
1050
+ bot:
1051
+ name: Linkdex Bot
1052
+ category: Search bot
1053
+ url: http://www.linkdex.com/bots
1054
+ producer:
1055
+ name: Mojeek Ltd.
1056
+ url: http://www.mojeek.com
1057
+ -
1058
+ user_agent: Mozilla/5.0 (compatible; linkdexbot/2.0; +http://www.linkdex.com/about/bots/)
1059
+ bot:
1060
+ name: Linkdex Bot
1061
+ category: Search bot
1062
+ url: http://www.linkdex.com/bots
1063
+ producer:
1064
+ name: Mojeek Ltd.
1065
+ url: http://www.mojeek.com
1066
+ -
1067
+ user_agent: Mozilla/5.0 (iPhone; U; CPU iPhone OS 4_1 like Mac OS X; en-us) AppleWebKit/532.9 (KHTML, like Gecko) Version/4.0.5 Mobile/8B117 Safari/6531.22.7 (compatible; linkdexbot-mobile/2.1; +http://www.linkdex.com/about/bots/)
1068
+ bot:
1069
+ name: Linkdex Bot
1070
+ category: Search bot
1071
+ url: http://www.linkdex.com/bots
1072
+ producer:
1073
+ name: Mojeek Ltd.
1074
+ url: http://www.mojeek.com
1075
+ -
299
1076
  user_agent: LinkedInBot/1.0 (compatible; Mozilla/5.0; Jakarta Commons-HttpClient/3.1 +http://www.linkedin.com)
300
- name: 'LinkedIn Bot'
301
- -
1077
+ bot:
1078
+ name: LinkedIn Bot
1079
+ category: Social Media Agent
1080
+ url: http://www.linkedin.com
1081
+ producer:
1082
+ name: LinkedIn
1083
+ url: http://www.linkedin.com
1084
+ -
1085
+ user_agent: Mozilla/5.0 (compatible; MJ12bot/v1.4.4; http://www.majestic12.co.uk/bot.php?+)
1086
+ bot:
1087
+ name: MJ12 Bot
1088
+ category: Search bot
1089
+ url: http://majestic12.co.uk/bot.php
1090
+ producer:
1091
+ name: Majestic-12
1092
+ url: http://majestic12.co.uk
1093
+ -
1094
+ user_agent: magpie-crawler/1.1 (U; Linux amd64; en-GB; +http://www.brandwatch.net)
1095
+ bot:
1096
+ name: Magpie-Crawler
1097
+ category: Social Media Agent
1098
+ url: http://www.brandwatch.com/magpie-crawler/
1099
+ producer:
1100
+ name: Brandwatch
1101
+ url: http://www.brandwatch.com
1102
+ -
1103
+ user_agent: MagpieRSS/0.72 (+http://magpierss.sf.net)
1104
+ bot:
1105
+ name: MagpieRSS
1106
+ url: http://magpierss.sourceforge.net/
1107
+ category: Feed Parser
1108
+ producer:
1109
+ name:
1110
+ url:
1111
+ -
302
1112
  user_agent: Mozilla/5.0 (compatible; Linux x86_64; Mail.RU_Bot/2.0; +http://go.mail.ru/help/robots)
303
- name: 'Mail.Ru Bot'
304
- -
1113
+ bot:
1114
+ name: Mail.Ru Bot
1115
+ category: Search bot
1116
+ url: http://help.mail.ru/webmaster/indexing/robots/types_robots
1117
+ producer:
1118
+ name: Mail.Ru Group
1119
+ url: http://corp.mail.ru
1120
+ -
305
1121
  user_agent: Mozilla/5.0 (compatible; Linux x86_64; Mail.RU_Bot/Fast/2.0; +http://go.mail.ru/help/robots)
306
- name: 'Mail.Ru Bot'
307
- -
308
- user_agent: magpie-crawler/1.1 (U; Linux amd64; en-GB; +http://www.brandwatch.net)
309
- name: 'Magpie-Crawler'
310
- -
1122
+ bot:
1123
+ name: Mail.Ru Bot
1124
+ category: Search bot
1125
+ url: http://help.mail.ru/webmaster/indexing/robots/types_robots
1126
+ producer:
1127
+ name: Mail.Ru Group
1128
+ url: http://corp.mail.ru
1129
+ -
311
1130
  user_agent: Mozilla/5.0 (compatible; meanpathbot/1.0; +http://www.meanpath.com/meanpathbot.html)
312
- name: 'Meanpath Bot'
313
- -
1131
+ bot:
1132
+ name: Meanpath Bot
1133
+ category: Search bot
1134
+ url: http://www.meanpath.com/meanpathbot.html
1135
+ producer:
1136
+ name: Meanpath
1137
+ url: http://www.meanpath.com
1138
+ -
314
1139
  user_agent: Mozilla/5.0 (compatible; MixrankBot; crawler@mixrank.com)
315
- name: 'Mixrank Bot'
316
- -
317
- user_agent: Mozilla/5.0 (compatible; MJ12bot/v1.4.4; http://www.majestic12.co.uk/bot.php?+)
318
- name: 'MJ12 Bot'
319
- -
1140
+ bot:
1141
+ name: Mixrank Bot
1142
+ category: Crawler
1143
+ url: http://mixrank.com
1144
+ producer:
1145
+ name: Online Media Group, Inc.
1146
+ url:
1147
+ -
320
1148
  user_agent: Mozilla/5.0 (compatible; MojeekBot/0.6; http://www.mojeek.com/bot.html)
321
- name: 'MojeekBot'
322
- -
1149
+ bot:
1150
+ name: MojeekBot
1151
+ category: Search bot
1152
+ url: http://www.mojeek.com/bot.html
1153
+ producer:
1154
+ name: Mojeek Ltd.
1155
+ url: http://www.mojeek.com
1156
+ -
1157
+ user_agent: 'Mozilla/5.0 (compatible; www.monitor.us - free monitoring service; http://www.monitor.us)'
1158
+ bot:
1159
+ name: Monitor.Us
1160
+ category: Site Monitor
1161
+ url: http://www.monitor.us
1162
+ producer:
1163
+ name: Monitor.Us
1164
+ url: http://www.monitor.us
1165
+ -
1166
+ user_agent: nlcrawler/1.0 (+http://northernlight.com/)
1167
+ bot:
1168
+ name: NLCrawler
1169
+ category: Crawler
1170
+ url:
1171
+ producer:
1172
+ name: Northern Light
1173
+ url: http://northernlight.com
1174
+ -
323
1175
  user_agent: NalezenCzBot/1.0 (http://www.nalezen.cz/about-crawler)
324
- name: 'NalezenCzBot'
325
- -
1176
+ bot:
1177
+ name: NalezenCzBot
1178
+ category: Crawler
1179
+ url: http://www.nalezen.cz/about-crawler
1180
+ producer:
1181
+ name: Jaroslav Kuboš
1182
+ url:
1183
+ -
1184
+ user_agent: NetLyzer FastProbe
1185
+ bot:
1186
+ name: NetLyzer FastProbe
1187
+ -
326
1188
  user_agent: Mozilla/4.0 (compatible; Netcraft Web Server Survey)
327
- name: 'Netcraft Survey Bot'
328
- -
329
- user_agent: nlcrawler/1.0 (+http://northernlight.com/)
330
- name: 'NLCrawler'
331
- -
1189
+ bot:
1190
+ name: Netcraft Survey Bot
1191
+ category: Search bot
1192
+ url:
1193
+ producer:
1194
+ name: Netcraft
1195
+ url: http://www.netcraft.com
1196
+ -
1197
+ user_agent: Netvibes (http://www.netvibes.com)
1198
+ bot:
1199
+ name: Netvibes
1200
+ url: http://www.netvibes.com/
1201
+ category: Feed Fetcher
1202
+ producer:
1203
+ name:
1204
+ url:
1205
+ -
1206
+ user_agent: 'Netvibes (http://www.netvibes.com/; 8 subscribers; feedID: 2244192)'
1207
+ bot:
1208
+ name: Netvibes
1209
+ url: http://www.netvibes.com/
1210
+ category: Feed Fetcher
1211
+ producer:
1212
+ name:
1213
+ url:
1214
+ -
1215
+ user_agent: 'NewsBlur Favicon Fetcher - 7 subscribers - http://www.newsblur.com/site/1948420/analytics-piwik (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)'
1216
+ bot:
1217
+ name: NewsBlur
1218
+ url: http://www.newsblur.com
1219
+ category: Feed Fetcher
1220
+ producer:
1221
+ name:
1222
+ url:
1223
+ -
1224
+ user_agent: 'NewsBlur Feed Fetcher - 7 subscribers - http://www.newsblur.com/site/1948420/analytics-piwik (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)'
1225
+ bot:
1226
+ name: NewsBlur
1227
+ url: http://www.newsblur.com
1228
+ category: Feed Fetcher
1229
+ producer:
1230
+ name:
1231
+ url:
1232
+ -
1233
+ user_agent: NewsBlur Feed Finder (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)
1234
+ bot:
1235
+ name: NewsBlur
1236
+ url: http://www.newsblur.com
1237
+ category: Feed Fetcher
1238
+ producer:
1239
+ name:
1240
+ url:
1241
+ -
1242
+ user_agent: 'NewsBlur Page Fetcher - 7 subscribers - http://www.newsblur.com/site/3966817/analytics-piwik (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)'
1243
+ bot:
1244
+ name: NewsBlur
1245
+ url: http://www.newsblur.com
1246
+ category: Feed Fetcher
1247
+ producer:
1248
+ name:
1249
+ url:
1250
+ -
1251
+ user_agent: NewsGatorOnline/2.0 (http://www.newsgator.com; 2 subscribers)
1252
+ bot:
1253
+ name: NewsGator
1254
+ url: http://www.newsgator.com
1255
+ category: Feed Fetcher
1256
+ producer:
1257
+ name:
1258
+ url:
1259
+ -
1260
+ user_agent: 5acd734a-1ed3-4a17-ad9d-0b09ae7bc2d2/Nutch-1.7
1261
+ bot:
1262
+ name: Nutch-based Bot
1263
+ category: Crawler
1264
+ url: https://nutch.apache.org
1265
+ producer:
1266
+ name: The Apache Software Foundation
1267
+ url: http://www.apache.org/foundation/
1268
+ -
1269
+ user_agent: CB/Nutch-1.7
1270
+ bot:
1271
+ name: Nutch-based Bot
1272
+ category: Crawler
1273
+ url: https://nutch.apache.org
1274
+ producer:
1275
+ name: The Apache Software Foundation
1276
+ url: http://www.apache.org/foundation/
1277
+ -
1278
+ user_agent: Mozilla/5.0 (compatible; summers;)/Nutch-1.7
1279
+ bot:
1280
+ name: Nutch-based Bot
1281
+ category: Crawler
1282
+ url: https://nutch.apache.org
1283
+ producer:
1284
+ name: The Apache Software Foundation
1285
+ url: http://www.apache.org/foundation/
1286
+ -
1287
+ user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1; zh-CN; rv:1.9.2.8) Firefox/3.6.8/Nutch-1.7
1288
+ bot:
1289
+ name: Nutch-based Bot
1290
+ category: Crawler
1291
+ url: https://nutch.apache.org
1292
+ producer:
1293
+ name: The Apache Software Foundation
1294
+ url: http://www.apache.org/foundation/
1295
+ -
1296
+ user_agent: My Nutch Spider/Nutch-1.6
1297
+ bot:
1298
+ name: Nutch-based Bot
1299
+ category: Crawler
1300
+ url: https://nutch.apache.org
1301
+ producer:
1302
+ name: The Apache Software Foundation
1303
+ url: http://www.apache.org/foundation/
1304
+ -
1305
+ user_agent: MySpider/Nutch-2.2
1306
+ bot:
1307
+ name: Nutch-based Bot
1308
+ category: Crawler
1309
+ url: https://nutch.apache.org
1310
+ producer:
1311
+ name: The Apache Software Foundation
1312
+ url: http://www.apache.org/foundation/
1313
+ -
1314
+ user_agent: Nutch12/Nutch-1.2
1315
+ bot:
1316
+ name: Nutch-based Bot
1317
+ category: Crawler
1318
+ url: https://nutch.apache.org
1319
+ producer:
1320
+ name: The Apache Software Foundation
1321
+ url: http://www.apache.org/foundation/
1322
+ -
1323
+ user_agent: NutchSpider/Nutch-1.4
1324
+ bot:
1325
+ name: Nutch-based Bot
1326
+ category: Crawler
1327
+ url: https://nutch.apache.org
1328
+ producer:
1329
+ name: The Apache Software Foundation
1330
+ url: http://www.apache.org/foundation/
1331
+ -
1332
+ user_agent: spider/Nutch-1.5.1 (spider; http://www.xxx.com)
1333
+ bot:
1334
+ name: Nutch-based Bot
1335
+ category: Crawler
1336
+ url: https://nutch.apache.org
1337
+ producer:
1338
+ name: The Apache Software Foundation
1339
+ url: http://www.apache.org/foundation/
1340
+ -
1341
+ user_agent: Spider/Nutch-2.3-SNAPSHOT (Webcrawler)
1342
+ bot:
1343
+ name: Nutch-based Bot
1344
+ category: Crawler
1345
+ url: https://nutch.apache.org
1346
+ producer:
1347
+ name: The Apache Software Foundation
1348
+ url: http://www.apache.org/foundation/
1349
+ -
1350
+ user_agent: testnutch/Nutch-1.8
1351
+ bot:
1352
+ name: Nutch-based Bot
1353
+ category: Crawler
1354
+ url: https://nutch.apache.org
1355
+ producer:
1356
+ name: The Apache Software Foundation
1357
+ url: http://www.apache.org/foundation/
1358
+ -
1359
+ user_agent: Your Nutch Spider/Nutch-2.2.1
1360
+ bot:
1361
+ name: Nutch-based Bot
1362
+ category: Crawler
1363
+ url: https://nutch.apache.org
1364
+ producer:
1365
+ name: The Apache Software Foundation
1366
+ url: http://www.apache.org/foundation/
1367
+ -
1368
+ user_agent: your sipder name/Nutch-1.7
1369
+ bot:
1370
+ name: Nutch-based Bot
1371
+ category: Crawler
1372
+ url: https://nutch.apache.org
1373
+ producer:
1374
+ name: The Apache Software Foundation
1375
+ url: http://www.apache.org/foundation/
1376
+ -
332
1377
  user_agent: omgilibot/0.3 +http://www.omgili.com/Crawler.html
333
- name: 'Omgili bot'
334
- -
335
- user_agent: Mozilla/5.0 (compatible; OpenindexSpider; +http://www.openindex.io/en/webmasters/spider.html)
336
- name: 'Openindex Spider'
337
- -
1378
+ bot:
1379
+ name: Omgili bot
1380
+ category: Search bot
1381
+ url: http://www.omgili.com/Crawler.html
1382
+ producer:
1383
+ name: Omgili
1384
+ url: http://www.omgili.com
1385
+ -
338
1386
  user_agent: Mozilla/5.0 (compatible; spbot/4.0.9; +http://OpenLinkProfiler.org/bot )
339
- name: 'OpenLinkProfiler'
340
- -
1387
+ bot:
1388
+ name: OpenLinkProfiler
1389
+ category: Crawler
1390
+ url: http://openlinkprofiler.org/bot
1391
+ producer:
1392
+ name: Axandra GmbH
1393
+ url: http://www.axandra.com
1394
+ -
341
1395
  user_agent: OpenWebSpider v0.1.4 (http://www.openwebspider.org/)
342
- name: 'OpenWebSpider'
343
- -
1396
+ bot:
1397
+ name: OpenWebSpider
1398
+ category: Crawler
1399
+ url: http://www.openwebspider.org
1400
+ producer:
1401
+ name: OpenWebSpider Lab
1402
+ url: http://lab.openwebspider.org
1403
+ -
1404
+ user_agent: Mozilla/5.0 (compatible; OpenindexSpider; +http://www.openindex.io/en/webmasters/spider.html)
1405
+ bot:
1406
+ name: Openindex Spider
1407
+ category: Search bot
1408
+ url: http://www.openindex.io/en/webmasters/spider.html
1409
+ producer:
1410
+ name: Openindex B.V.
1411
+ url: http://www.openindex.io
1412
+ -
1413
+ user_agent: Mozilla/5.0 (compatible; OrangeBot-Collector/2.0; support.orangebot@orange.com)
1414
+ bot:
1415
+ name: Orange Bot
1416
+ category: Search bot
1417
+ url: http://lemoteur.orange.fr
1418
+ producer:
1419
+ name: Orange
1420
+ url: http://www.orange.fr
1421
+ -
1422
+ user_agent: Mozilla/5.0 (compatible; OrangeBot/2.0; support.orangebot@orange.com)
1423
+ bot:
1424
+ name: Orange Bot
1425
+ category: Search bot
1426
+ url: http://lemoteur.orange.fr
1427
+ producer:
1428
+ name: Orange
1429
+ url: http://www.orange.fr
1430
+ -
1431
+ user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1; fr; rv:1.8.1) VoilaBot BETA 1.2 (support.voilabot@orange-ftgroup.com)
1432
+ bot:
1433
+ name: Orange Bot
1434
+ category: Search bot
1435
+ url: http://lemoteur.orange.fr
1436
+ producer:
1437
+ name: Orange
1438
+ url: http://www.orange.fr
1439
+ -
1440
+ user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1;fr;rv:1.8.1) VoilaBotCollector BETA 0.1 (http://www.voila.com/)
1441
+ bot:
1442
+ name: Orange Bot
1443
+ category: Search bot
1444
+ url: http://lemoteur.orange.fr
1445
+ producer:
1446
+ name: Orange
1447
+ url: http://www.orange.fr
1448
+ -
1449
+ user_agent: Mozilla/5.0 (Java) outbrain
1450
+ bot:
1451
+ name: Outbrain
1452
+ category: Crawler
1453
+ url:
1454
+ producer:
1455
+ name: Outbrain
1456
+ url: http://www.outbrain.com/
1457
+ -
1458
+ user_agent: Mozilla/5.0 (compatible; phpservermon/3.1.1; +http://www.phpservermonitor.org)
1459
+ bot:
1460
+ name: PHP Server Monitor
1461
+ category: Site Monitor
1462
+ url: https://github.com/phpservermon/phpservermon
1463
+ producer:
1464
+ name: PHP Server Monitor
1465
+ url: http://www.phpservermonitor.org/
1466
+ -
344
1467
  user_agent: Mozilla/5.0 (compatible; PaperLiBot/2.1; http://support.paper.li/entries/20023257-what-is-paper-li)
345
- name: 'PaperLiBot'
346
- -
347
- user_agent: psbot/0.1 (+http://www.picsearch.com/bot.html)
348
- name: 'Picsearch bot'
349
- -
1468
+ bot:
1469
+ name: PaperLiBot
1470
+ category: Search bot
1471
+ url: http://support.paper.li/entries/20023257-what-is-paper-li
1472
+ producer:
1473
+ name: Smallrivers SA
1474
+ url: http://www.paper.li
1475
+ -
350
1476
  user_agent: psbot-page (+http://www.picsearch.com/bot.html)
351
- name: 'Picsearch bot'
352
- -
1477
+ bot:
1478
+ name: Picsearch bot
1479
+ category: Search bot
1480
+ url: http://www.picsearch.com/bot.html
1481
+ producer:
1482
+ name: Picsearch
1483
+ url: http://www.picsearch.com
1484
+ -
1485
+ user_agent: psbot/0.1 (+http://www.picsearch.com/bot.html)
1486
+ bot:
1487
+ name: Picsearch bot
1488
+ category: Search bot
1489
+ url: http://www.picsearch.com/bot.html
1490
+ producer:
1491
+ name: Picsearch
1492
+ url: http://www.picsearch.com
1493
+ -
353
1494
  user_agent: Pingdom.com_bot_version_1.4_(http://www.pingdom.com/)
354
- name: 'Pingdom Bot'
355
- -
1495
+ bot:
1496
+ name: Pingdom Bot
1497
+ category: Site Monitor
1498
+ url:
1499
+ producer:
1500
+ name: Pingdom AB
1501
+ url: https://www.pingdom.com
1502
+ -
1503
+ user_agent: Pinterest/0.2 (+http://www.pinterest.com/)
1504
+ bot:
1505
+ name: Pinterest
1506
+ url:
1507
+ category: Crawler
1508
+ producer:
1509
+ name: Pinterest
1510
+ url: http://www.pinterest.com/
1511
+ -
356
1512
  user_agent: QuerySeekerSpider ( http://queryseeker.com/bot.html )
357
- name: 'QuerySeekerSpider'
358
- -
1513
+ bot:
1514
+ name: QuerySeekerSpider
1515
+ category: Crawler
1516
+ url: http://queryseeker.com/bot.html
1517
+ producer:
1518
+ name: QueryEye Inc.
1519
+ url: http://queryeye.com
1520
+ -
1521
+ user_agent: ROI Hunter; https://api-dev.roihunter.com
1522
+ bot:
1523
+ name: ROI Hunter
1524
+ category: Crawler
1525
+ url:
1526
+ producer:
1527
+ name: Roihunter a.s.
1528
+ url: http://roihunter.com/
1529
+ -
359
1530
  user_agent: Mozilla/5.0 (compatible; redditbot/1.0; +http://www.reddit.com/feedback)
360
- name: 'Reddit Bot'
361
- -
1531
+ bot:
1532
+ name: Reddit Bot
1533
+ category: Social Media Agent
1534
+ url: http://www.reddit.com/feedback
1535
+ producer:
1536
+ name: reddit inc.
1537
+ url: http://www.reddit.com
1538
+ -
362
1539
  user_agent: Mozilla/5.0 (compatible; rogerBot/1.0; UrlCrawler; http://www.seomoz.org/dp/rogerbot)
363
- name: 'Rogerbot'
364
- -
1540
+ bot:
1541
+ name: Rogerbot
1542
+ category: Crawler
1543
+ url: http://moz.com/help/pro/what-is-rogerbot-
1544
+ producer:
1545
+ name: SEOmoz, Inc.
1546
+ url: http://moz.com/
1547
+ -
365
1548
  user_agent: rogerbot/1.0 (http://moz.com/help/pro/what-is-rogerbot-, rogerbot-crawler+shiny@moz.com)
366
- name: 'Rogerbot'
367
- -
1549
+ bot:
1550
+ name: Rogerbot
1551
+ category: Crawler
1552
+ url: http://moz.com/help/pro/what-is-rogerbot-
1553
+ producer:
1554
+ name: SEOmoz, Inc.
1555
+ url: http://moz.com/
1556
+ -
368
1557
  user_agent: rogerbot/1.0 (http://www.moz.com/dp/rogerbot, rogerbot-crawler@moz.com)
369
- name: 'Rogerbot'
370
- -
1558
+ bot:
1559
+ name: Rogerbot
1560
+ category: Crawler
1561
+ url: http://moz.com/help/pro/what-is-rogerbot-
1562
+ producer:
1563
+ name: SEOmoz, Inc.
1564
+ url: http://moz.com/
1565
+ -
1566
+ user_agent: SEOENGWorldBot/1.0 (+http://www.seoengine.com/seoengbot.htm)
1567
+ bot:
1568
+ name: SEOENGBot
1569
+ category: Crawler
1570
+ url: http://www.seoengine.com/seoengbot.htm
1571
+ producer:
1572
+ name: SEO Engine
1573
+ url: http://www.seoengine.com
1574
+ -
1575
+ user_agent: Mozilla/5.0 (compatible; SISTRIX Crawler; http://crawler.sistrix.net/)
1576
+ bot:
1577
+ name: SISTRIX Crawler
1578
+ category: Crawler
1579
+ url: http://crawler.sistrix.net
1580
+ producer:
1581
+ name: SISTRIX GmbH
1582
+ url: http://www.sistrix.de
1583
+ -
1584
+ user_agent: Scrapy/1.0.3.post6+g2d688cd (+http://scrapy.org)
1585
+ bot:
1586
+ name: Scrapy
1587
+ category: Crawler
1588
+ url: http://scrapy.org
1589
+ -
371
1590
  user_agent: Screaming Frog SEO Spider/2.22
372
- name: 'Screaming Frog SEO Spider'
373
- -
1591
+ bot:
1592
+ name: Screaming Frog SEO Spider
1593
+ category: Crawler
1594
+ url: http://www.screamingfrog.co.uk/seo-spider
1595
+ producer:
1596
+ name: Screaming Frog Ltd
1597
+ url: http://www.screamingfrog.co.uk
1598
+ -
374
1599
  user_agent: ScreenerBot Crawler Beta 2.0 (+http://www.ScreenerBot.com)
375
- name: 'ScreenerBot'
376
- -
1600
+ bot:
1601
+ name: ScreenerBot
1602
+ category: Crawler
1603
+ url: http://www.screenerbot.com
1604
+ producer:
1605
+ name:
1606
+ url:
1607
+ -
377
1608
  user_agent: Mozilla/5.0 (compatible; SemrushBot/0.97; +http://www.semrush.com/bot.html)
378
- name: 'Semrush Bot'
379
- -
1609
+ bot:
1610
+ name: Semrush Bot
1611
+ category: Crawler
1612
+ url: http://www.semrush.com/bot.html
1613
+ producer:
1614
+ name: SEMrush
1615
+ url: http://www.semrush.com
1616
+ -
380
1617
  user_agent: SensikaBot/x.33 (+http://sensika.com)
381
- name: 'Sensika Bot'
382
- -
383
- user_agent: SEOENGWorldBot/1.0 (+http://www.seoengine.com/seoengbot.htm)
384
- name: 'SEOENGBot'
385
- -
1618
+ bot:
1619
+ name: Sensika Bot
1620
+ category:
1621
+ url:
1622
+ producer:
1623
+ name: Sensika
1624
+ url: http://sensika.com
1625
+ -
1626
+ user_agent: Server Density Service Monitoring v2
1627
+ bot:
1628
+ name: Server Density
1629
+ -
386
1630
  user_agent: Mozilla/5.0 (compatible; SeznamBot/3.1-test1; +http://fulltext.sblog.cz/)
387
- name: 'Seznam Bot'
388
- -
1631
+ bot:
1632
+ name: Seznam Bot
1633
+ category: Search bot
1634
+ url: http://www.mapy.cz/cz/seznambot.html
1635
+ producer:
1636
+ name: Seznam.cz, a.s.
1637
+ url: http://www.seznam.cz/
1638
+ -
389
1639
  user_agent: Mozilla/5.0 (compatible; SeznamBot/3.2-test1; +http://fulltext.sblog.cz/)
390
- name: 'Seznam Bot'
391
- -
392
- user_agent: SeznamBot/3.0 (+http://fulltext.sblog.cz/)
393
- name: 'Seznam Bot'
394
- -
1640
+ bot:
1641
+ name: Seznam Bot
1642
+ category: Search bot
1643
+ url: http://www.mapy.cz/cz/seznambot.html
1644
+ producer:
1645
+ name: Seznam.cz, a.s.
1646
+ url: http://www.seznam.cz/
1647
+ -
395
1648
  user_agent: Mozilla/5.0 (compatible; SeznamBot/3.2; +http://fulltext.sblog.cz/)
396
- name: 'Seznam Bot'
397
- -
1649
+ bot:
1650
+ name: Seznam Bot
1651
+ category: Search bot
1652
+ url: http://www.mapy.cz/cz/seznambot.html
1653
+ producer:
1654
+ name: Seznam.cz, a.s.
1655
+ url: http://www.seznam.cz/
1656
+ -
1657
+ user_agent: SeznamBot/3.0 (+http://fulltext.sblog.cz/)
1658
+ bot:
1659
+ name: Seznam Bot
1660
+ category: Search bot
1661
+ url: http://www.mapy.cz/cz/seznambot.html
1662
+ producer:
1663
+ name: Seznam.cz, a.s.
1664
+ url: http://www.seznam.cz/
1665
+ -
398
1666
  user_agent: ShopWiki/1.0 ( +http://www.shopwiki.com/wiki/Help:Bot)
399
- name: 'ShopWiki'
400
- -
401
- user_agent: Mozilla/5.0 (compatible; SISTRIX Crawler; http://crawler.sistrix.net/)
402
- name: 'SISTRIX Crawler'
403
- -
404
- user_agent: Sogou web spider/4.0(+http://www.sogou.com/docs/help/webmasters.htm#07)
405
- name: 'Sogou Spider'
406
- -
407
- user_agent: Sogou inst spider/4.0(+http://www.sogou.com/docs/help/webmasters.htm#07)
408
- name: 'Sogou Spider'
409
- -
410
- user_agent: Sogou Pic Spider/3.0(+http://www.sogou.com/docs/help/webmasters.htm#07)
411
- name: 'Sogou Spider'
412
- -
1667
+ bot:
1668
+ name: ShopWiki
1669
+ category: Search tools
1670
+ url: http://www.shopwiki.com/wiki/Help:Bot
1671
+ producer:
1672
+ name: ShopWiki Corp.
1673
+ url: http://www.shopwiki.com
1674
+ -
1675
+ user_agent: SilverReader/1.0; http://silverreader.com
1676
+ bot:
1677
+ name: SilverReader
1678
+ url: http://silverreader.com
1679
+ category: Feed Fetcher
1680
+ producer:
1681
+ name:
1682
+ url:
1683
+ -
1684
+ user_agent: freshrss/0.8-dev (Linux; http://freshrss.org) SimplePie/1.4-dev-FreshRSS
1685
+ bot:
1686
+ name: SimplePie
1687
+ url: http://www.simplepie.org
1688
+ category: Feed Parser
1689
+ producer:
1690
+ name:
1691
+ url:
1692
+ -
1693
+ user_agent: SimplePie/1.2.1-dev (Feed Parser; http://simplepie.org; Allow like Gecko) Build/20130514092120
1694
+ bot:
1695
+ name: SimplePie
1696
+ url: http://www.simplepie.org
1697
+ category: Feed Parser
1698
+ producer:
1699
+ name:
1700
+ url:
1701
+ -
1702
+ user_agent: SimplePie/1.3.1 (Feed Parser; http://simplepie.org; Allow like Gecko) Build/20121030175911
1703
+ bot:
1704
+ name: SimplePie
1705
+ url: http://www.simplepie.org
1706
+ category: Feed Parser
1707
+ producer:
1708
+ name:
1709
+ url:
1710
+ -
1711
+ user_agent: Site24x7
1712
+ bot:
1713
+ name: Site24x7 Website Monitoring
1714
+ category: Site Monitor
1715
+ url: https://www.site24x7.com/site24x7-faq.html
1716
+ producer:
1717
+ name: Site24x7
1718
+ url: https://www.site24x7.com
1719
+ -
1720
+ user_agent: Mozilla/5.0 (Windows NT 6.1; WOW64) SkypeUriPreview Preview/0.5
1721
+ bot:
1722
+ name: Skype URI Preview
1723
+ category: Service Agent
1724
+ url:
1725
+ producer:
1726
+ name: Skype Communications S.à.r.l.
1727
+ url: https://www.skype.com
1728
+ -
1729
+ user_agent: Slackbot-LinkExpanding 1.0 (+https://api.slack.com/robots)
1730
+ bot:
1731
+ name: Slackbot
1732
+ category: Crawler
1733
+ url: https://api.slack.com/robots
1734
+ producer:
1735
+ name: Slack Technologies
1736
+ url: http://slack.com
1737
+ -
413
1738
  user_agent: New-Sogou-Spider/1.0 (compatible; MSIE 5.5; Windows 98)
414
- name: 'Sogou Spider'
415
- -
1739
+ bot:
1740
+ name: Sogou Spider
1741
+ category: Search bot
1742
+ url: http://www.sogou.com/docs/help/webmasters.htm
1743
+ producer:
1744
+ name: Sohu, Inc.
1745
+ url: http://www.sogou.com
1746
+ -
1747
+ user_agent: Sogou inst spider/4.0(+http://www.sogou.com/docs/help/webmasters.htm
1748
+ bot:
1749
+ name: Sogou Spider
1750
+ category: Search bot
1751
+ url: http://www.sogou.com/docs/help/webmasters.htm
1752
+ producer:
1753
+ name: Sohu, Inc.
1754
+ url: http://www.sogou.com
1755
+ -
1756
+ user_agent: Sogou Pic Spider/3.0(+http://www.sogou.com/docs/help/webmasters.htm
1757
+ bot:
1758
+ name: Sogou Spider
1759
+ category: Search bot
1760
+ url: http://www.sogou.com/docs/help/webmasters.htm
1761
+ producer:
1762
+ name: Sohu, Inc.
1763
+ url: http://www.sogou.com
1764
+ -
1765
+ user_agent: Sogou web spider/4.0(+http://www.sogou.com/docs/help/webmasters.htm
1766
+ bot:
1767
+ name: Sogou Spider
1768
+ category: Search bot
1769
+ url: http://www.sogou.com/docs/help/webmasters.htm
1770
+ producer:
1771
+ name: Sohu, Inc.
1772
+ url: http://www.sogou.com
1773
+ -
416
1774
  user_agent: Sosospider+(+http://help.soso.com/webspider.htm)
417
- name: 'Soso Spider'
418
- -
419
- user_agent: 'Superfeedr bot/2.0 http://superfeedr.com - Make your feeds realtime: get in touch!'
420
- name: 'Superfeedr Bot'
421
- -
1775
+ bot:
1776
+ name: Soso Spider
1777
+ category: Search bot
1778
+ url: http://help.soso.com/webspider.htm
1779
+ producer:
1780
+ name: Tencent Holdings
1781
+ url: http://www.soso.com
1782
+ -
422
1783
  user_agent: Mozilla/5.0 (X11; U; Linux x86_64; en-US; rv:1.9.0.19; aggregator:Spinn3r (Spinn3r 3.1); http://spinn3r.com/robot) Gecko/2010040121 Firefox/3.0.19
423
- name: 'Spinn3r'
424
- -
1784
+ bot:
1785
+ name: Spinn3r
1786
+ category: Crawler
1787
+ url: http://spinn3r.com/robot
1788
+ producer:
1789
+ name: Tailrank Inc
1790
+ url: http://spinn3r.com
1791
+ -
425
1792
  user_agent: Mozilla/5.0 (compatible; SputnikBot/2.2)
426
- name: 'Sputnik Bot'
427
- -
1793
+ bot:
1794
+ name: Sputnik Bot
1795
+ category:
1796
+ url:
1797
+ producer:
1798
+ name:
1799
+ url:
1800
+ -
428
1801
  user_agent: Mozilla/5.0 (compatible; SputnikImageBot/2.2)
429
- name: 'Sputnik Bot'
430
- -
1802
+ bot:
1803
+ name: Sputnik Bot
1804
+ category:
1805
+ url:
1806
+ producer:
1807
+ name:
1808
+ url:
1809
+ -
1810
+ user_agent: 'Superfeedr bot/2.0 http://superfeedr.com - Make your feeds realtime: get in touch!'
1811
+ bot:
1812
+ name: Superfeedr Bot
1813
+ category: Feed Fetcher
1814
+ url:
1815
+ producer:
1816
+ name: Superfeedr
1817
+ url: https://superfeedr.com/
1818
+ -
431
1819
  user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1; en; rv:1.9.0.13) Gecko/2009073022 Firefox/3.5.2 (.NET CLR 3.5.30729) SurveyBot/2.3 (DomainTools)
432
- name: 'Survey Bot'
433
- -
1820
+ bot:
1821
+ name: Survey Bot
1822
+ category: Search bot
1823
+ url: http://www.domaintools.com/webmasters/surveybot.php
1824
+ producer:
1825
+ name: Domain Tools
1826
+ url: http://www.domaintools.com
1827
+ -
1828
+ user_agent: TelegramBot (like TwitterBot)
1829
+ bot:
1830
+ name: TelgramBot
1831
+ url: https://telegram.org/blog/bot-revolution
1832
+ -
434
1833
  user_agent: TinEye-bot/0.02 (see http://www.tineye.com/crawler.html)
435
- name: 'TinEye Crawler'
436
- -
1834
+ bot:
1835
+ name: TinEye Crawler
1836
+ category: Search bot
1837
+ url: http://www.tineye.com/crawler.html
1838
+ producer:
1839
+ name: Idée Inc.
1840
+ url: http://ideeinc.com
1841
+ -
1842
+ user_agent: Tiny Tiny RSS/1.10 (http://tt-rss.org/)
1843
+ bot:
1844
+ name: Tiny Tiny RSS
1845
+ url: http://tt-rss.org
1846
+ category: Feed Fetcher
1847
+ producer:
1848
+ name:
1849
+ url:
1850
+ -
1851
+ user_agent: Tiny Tiny RSS/1.11.4c63934 (http://tt-rss.org/)
1852
+ bot:
1853
+ name: Tiny Tiny RSS
1854
+ url: http://tt-rss.org
1855
+ category: Feed Fetcher
1856
+ producer:
1857
+ name:
1858
+ url:
1859
+ -
437
1860
  user_agent: TurnitinBot/3.0 (http://www.turnitin.com/robot/crawlerinfo.html)
438
- name: 'TurnitinBot'
439
- -
440
- user_agent: TweetedTimes Bot/1.0 (Mozilla/5.0 Compatible, +http://tweetedtimes.com)
441
- name: 'TweetedTimes Bot'
442
- -
1861
+ bot:
1862
+ name: TurnitinBot
1863
+ category: Crawler
1864
+ url: http://www.turnitin.com/robot/crawlerinfo.html
1865
+ producer:
1866
+ name: iParadigms, LLC.
1867
+ url: http://www.turnitin.com
1868
+ -
443
1869
  user_agent: Mozilla/5.0 (compatible; TweetedTimes Bot/1.0; +http://tweetedtimes.com)
444
- name: 'TweetedTimes Bot'
445
- -
1870
+ bot:
1871
+ name: TweetedTimes Bot
1872
+ category: Crawler
1873
+ url: http://tweetedtimes.com
1874
+ producer:
1875
+ name: TweetedTimes
1876
+ url: http://tweetedtimes.com/
1877
+ -
1878
+ user_agent: TweetedTimes Bot/1.0 (Mozilla/5.0 Compatible, +http://tweetedtimes.com)
1879
+ bot:
1880
+ name: TweetedTimes Bot
1881
+ category: Crawler
1882
+ url: http://tweetedtimes.com
1883
+ producer:
1884
+ name: TweetedTimes
1885
+ url: http://tweetedtimes.com/
1886
+ -
446
1887
  user_agent: Mozilla/5.0 (compatible; TweetmemeBot/3.0; +http://tweetmeme.com/)
447
- name: 'Tweetmeme Bot'
448
- -
1888
+ bot:
1889
+ name: Tweetmeme Bot
1890
+ category: Crawler
1891
+ url: http://tweetmeme.com/
1892
+ producer:
1893
+ name: Mediasift
1894
+ url:
1895
+ -
449
1896
  user_agent: Twitterbot/1.0
450
- name: 'Twitterbot'
451
- -
452
- user_agent: Mozilla/5.0+(compatible; UptimeRobot/2.0; http://www.uptimerobot.com/)
453
- name: 'Uptime Robot'
454
- -
1897
+ bot:
1898
+ name: Twitterbot
1899
+ category: Social Media Agent
1900
+ url: https://dev.twitter.com/docs/cards/getting-started
1901
+ producer:
1902
+ name: Twitter
1903
+ url: http://www.twitter.com
1904
+ -
455
1905
  user_agent: Mozilla/5.0 (compatible; URLAppendBot/1.0; +http://www.profound.net/urlappendbot.html)
456
- name: 'URLAppendBot'
457
- -
1906
+ bot:
1907
+ name: URLAppendBot
1908
+ category: Crawler
1909
+ url: http://www.profound.net/urlappendbot.html
1910
+ producer:
1911
+ name: Profound Networks
1912
+ url: http://www.profound.net
1913
+ -
1914
+ user_agent: Mozilla/5.0+(compatible; UptimeRobot/2.0; http://www.uptimerobot.com/)
1915
+ bot:
1916
+ name: Uptime Robot
1917
+ category: Site Monitor
1918
+ url:
1919
+ producer:
1920
+ name: Uptime Robot
1921
+ url: http://uptimerobot.com
1922
+ -
458
1923
  user_agent: Mozilla/5.0 (compatible; VSMCrawler; http://www.visualsitemapper.com/crawler/)
459
- name: 'Visual Site Mapper Crawler'
460
- -
461
- user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1;fr;rv:1.8.1) VoilaBotCollector BETA 0.1 (http://www.voila.com/)
462
- name: 'Voila Bot'
463
- -
464
- user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1; fr; rv:1.8.1) VoilaBot BETA 1.2 (support.voilabot@orange-ftgroup.com)
465
- name: 'Voila Bot'
466
- -
467
- user_agent: Jigsaw/2.3.0 W3C_CSS_Validator_JFouffa/2.0 (See <http://validator.w3.org/services>)
468
- name: 'W3C CSS Validator'
469
- -
1924
+ bot:
1925
+ name: Visual Site Mapper Crawler
1926
+ category: Crawler
1927
+ url: http://www.visualsitemapper.com/crawler
1928
+ producer:
1929
+ name: Alentum Software Ltd.
1930
+ url: http://www.alentum.com
1931
+ -
1932
+ user_agent: 'Jigsaw/2.3.0 W3C_CSS_Validator_JFouffa/2.0 (See <http://validator.w3.org/services>)'
1933
+ bot:
1934
+ name: W3C CSS Validator
1935
+ category: Validator
1936
+ url: http://jigsaw.w3.org/css-validator
1937
+ producer:
1938
+ name: W3C
1939
+ url: http://www.w3.org
1940
+ -
470
1941
  user_agent: W3C_I18n-Checker/1.0 (http://validator.w3.org/services)
471
- name: 'W3C I18N Checker'
472
- -
473
- user_agent: W3C-checklink/4.0 [4.4] libwww-perl/5.803
474
- name: 'W3C Link Checker'
475
- -
1942
+ bot:
1943
+ name: W3C I18N Checker
1944
+ category: Validator
1945
+ url: http://validator.w3.org/i18n-checker
1946
+ producer:
1947
+ name: W3C
1948
+ url: http://www.w3.org
1949
+ -
1950
+ user_agent: 'W3C-checklink/4.0 [4.4] libwww-perl/5.803'
1951
+ bot:
1952
+ name: W3C Link Checker
1953
+ category: Validator
1954
+ url: http://validator.w3.org/checklink
1955
+ producer:
1956
+ name: W3C
1957
+ url: http://www.w3.org
1958
+ -
476
1959
  user_agent: W3C-checklink/4.81 libwww-perl/5.836
477
- name: 'W3C Link Checker'
478
- -
1960
+ bot:
1961
+ name: W3C Link Checker
1962
+ category: Validator
1963
+ url: http://validator.w3.org/checklink
1964
+ producer:
1965
+ name: W3C
1966
+ url: http://www.w3.org
1967
+ -
479
1968
  user_agent: W3C_Validator/1.3 http://validator.w3.org/services
480
- name: 'W3C Markup Validation Service'
481
- -
1969
+ bot:
1970
+ name: W3C Markup Validation Service
1971
+ category: Validator
1972
+ url: http://validator.w3.org/services
1973
+ producer:
1974
+ name: W3C
1975
+ url: http://www.w3.org
1976
+ -
482
1977
  user_agent: W3C_Validator/1.767
483
- name: 'W3C Markup Validation Service'
484
- -
1978
+ bot:
1979
+ name: W3C Markup Validation Service
1980
+ category: Validator
1981
+ url: http://validator.w3.org/services
1982
+ producer:
1983
+ name: W3C
1984
+ url: http://www.w3.org
1985
+ -
485
1986
  user_agent: W3C-mobileOK/DDC-1.0 (see http://www.w3.org/2006/07/mobileok-ddc)
486
- name: 'W3C MobileOK Checker'
487
- -
1987
+ bot:
1988
+ name: W3C MobileOK Checker
1989
+ category: Validator
1990
+ url: http://validator.w3.org/mobile
1991
+ producer:
1992
+ name: W3C
1993
+ url: http://www.w3.org
1994
+ -
488
1995
  user_agent: W3C_Unicorn/1.0 (http://validator.w3.org/services)
489
- name: 'W3C Unified Validator'
490
- -
491
- user_agent: WebbCrawler 1.0 ( http://badcheese.com/crawler.html )
492
- name: 'WebbCrawler'
493
- -
1996
+ bot:
1997
+ name: W3C Unified Validator
1998
+ category: Validator
1999
+ url: http://validator.w3.org/unicorn
2000
+ producer:
2001
+ name: W3C
2002
+ url: http://www.w3.org
2003
+ -
494
2004
  user_agent: WeSEE:Search/0.1 (Alpha, http://www.wesee.com/en/support/bot/)
495
- name: 'WeSEE:Search'
496
- -
2005
+ bot:
2006
+ name: WeSEE:Search
2007
+ category: Search bot
2008
+ url: http://www.wesee.com/bot
2009
+ producer:
2010
+ name: WeSEE Ltd
2011
+ url: http://www.wesee.com
2012
+ -
2013
+ user_agent: websitepulse checker/1.1 (compatible; MSIE 5.5; Netscape 4.75; Linux)
2014
+ bot:
2015
+ name: WebSitePulse
2016
+ category: Site Monitor
2017
+ url: http://badcheese.com/crawler.html
2018
+ producer:
2019
+ name: WebSitePulse
2020
+ url: http://www.websitepulse.com/
2021
+ -
2022
+ user_agent: WebbCrawler 1.0 ( http://badcheese.com/crawler.html )
2023
+ bot:
2024
+ name: WebbCrawler
2025
+ category: Crawler
2026
+ url: http://badcheese.com/crawler.html
2027
+ producer:
2028
+ name: Steve Webb
2029
+ url: http://badcheese.com
2030
+ -
497
2031
  user_agent: Wotbox/2.01 (+http://www.wotbox.com/bot/)
498
- name: 'Wotbox'
499
- -
500
- user_agent: yacybot (freeworld/global; x86 Windows XP 5.1; java 1.7.0_21; GMT+04:00/ru) http://yacy.net/bot.html
501
- name: 'YaCy'
502
- -
2032
+ bot:
2033
+ name: Wotbox
2034
+ category: Search bot
2035
+ url: http://www.wotbox.com/bot/
2036
+ producer:
2037
+ name: Wotbox
2038
+ url: http://www.wotbox.com
2039
+ -
503
2040
  user_agent: yacybot (freeworld/global; amd64 Linux 3.2.0-4-amd64; java 1.7.0_25; Europe/en) http://yacy.net/bot.html
504
- name: 'YaCy'
505
- -
2041
+ bot:
2042
+ name: YaCy
2043
+ category: Search bot
2044
+ url: http://yacy.net/bot.html
2045
+ producer:
2046
+ name: YaCy
2047
+ url: http://yacy.net
2048
+ -
2049
+ user_agent: yacybot (freeworld/global; x86 Windows XP 5.1; java 1.7.0_21; GMT+04:00/ru) http://yacy.net/bot.html
2050
+ bot:
2051
+ name: YaCy
2052
+ category: Search bot
2053
+ url: http://yacy.net/bot.html
2054
+ producer:
2055
+ name: YaCy
2056
+ url: http://yacy.net
2057
+ -
2058
+ user_agent: Mozilla/5.0 (compatible; Yahoo Ad monitoring; https://help.yahoo.com/kb/yahoo-ad-monitoring-SLN24857.html)
2059
+ bot:
2060
+ name: Yahoo Gemini
2061
+ category: Crawler
2062
+ url: https://help.yahoo.com/kb/yahoo-ad-monitoring-SLN24857.html
2063
+ producer:
2064
+ name: Yahoo! Inc.
2065
+ url: http://www.yahoo.com
2066
+ -
2067
+ user_agent: Mozilla/5.0 (compatible; Yahoo Link Preview; https://help.yahoo.com/kb/mail/yahoo-link-preview-SLN23615.html)
2068
+ bot:
2069
+ name: Yahoo! Link Preview
2070
+ category: Crawler
2071
+ url: https://help.yahoo.com/kb/mail/yahoo-link-preview-SLN23615.html
2072
+ producer:
2073
+ name: Yahoo! Inc.
2074
+ url: http://www.yahoo.com
2075
+ -
2076
+ user_agent: Yahoo:LinkExpander:Slingstone
2077
+ bot:
2078
+ name: Yahoo! Link Preview
2079
+ category: Crawler
2080
+ url: https://help.yahoo.com/kb/mail/yahoo-link-preview-SLN23615.html
2081
+ producer:
2082
+ name: Yahoo! Inc.
2083
+ url: http://www.yahoo.com
2084
+ -
506
2085
  user_agent: Mozilla/5.0 (compatible; Yahoo! Slurp/3.0; http://help.yahoo.com/help/us/ysearch/slurp) NOT Firefox/3.5
507
- name: 'Yahoo! Slurp'
508
- -
2086
+ bot:
2087
+ name: Yahoo! Slurp
2088
+ category: Search bot
2089
+ url: http://help.yahoo.com/ysearch/slurp
2090
+ producer:
2091
+ name: Yahoo! Inc.
2092
+ url: http://www.yahoo.com
2093
+ -
509
2094
  user_agent: Mozilla/5.0 (compatible; Yahoo! Slurp; http://help.yahoo.com/help/us/ysearch/slurp)
510
- name: 'Yahoo! Slurp'
511
- -
512
- user_agent: Mozilla/5.0 (compatible; YandexImages/3.0; +http://yandex.com/bots)
513
- name: 'Yandex Bot'
514
- -
2095
+ bot:
2096
+ name: Yahoo! Slurp
2097
+ category: Search bot
2098
+ url: http://help.yahoo.com/ysearch/slurp
2099
+ producer:
2100
+ name: Yahoo! Inc.
2101
+ url: http://www.yahoo.com
2102
+ -
2103
+ user_agent: Mozilla/5.0 (compatible; Linux i686; Yandex.Gazeta Bot/1.0; +http://gazeta.yandex.ru)
2104
+ bot:
2105
+ name: Yandex Bot
2106
+ category: Search bot
2107
+ url: http://www.yandex.com/bots
2108
+ producer:
2109
+ name: Yandex LLC
2110
+ url: http://company.yandex.com
2111
+ -
2112
+ user_agent: Mozilla/5.0 (compatible; YaDirectFetcher/1.0; +http://yandex.com/bots)
2113
+ bot:
2114
+ name: Yandex Bot
2115
+ category: Search bot
2116
+ url: http://www.yandex.com/bots
2117
+ producer:
2118
+ name: Yandex LLC
2119
+ url: http://company.yandex.com
2120
+ -
515
2121
  user_agent: Mozilla/5.0 (compatible; YandexAntivirus/2.0; +http://yandex.com/bots)
516
- name: 'Yandex Bot'
517
- -
518
- user_agent: Mozilla/5.0 (compatible; YandexDirect/3.0; +http://yandex.com/bots)
519
- name: 'Yandex Bot'
520
- -
521
- user_agent: Mozilla/5.0 (compatible; YandexBot/3.0; +http://yandex.com/bots)
522
- name: 'Yandex Bot'
523
- -
524
- user_agent: Mozilla/5.0 (compatible; YandexBlogs/0.99; robot; B; +http://yandex.com/bots)
525
- name: 'Yandex Bot'
526
- -
527
- user_agent: Mozilla/5.0 (compatible; YandexMetrika/2.0; +http://yandex.com/bots)
528
- name: 'Yandex Bot'
529
- -
530
- user_agent: Mozilla/5.0 (compatible; YandexImageResizer/2.0; +http://yandex.com/bots)
531
- name: 'Yandex Bot'
532
- -
2122
+ bot:
2123
+ name: Yandex Bot
2124
+ category: Search bot
2125
+ url: http://www.yandex.com/bots
2126
+ producer:
2127
+ name: Yandex LLC
2128
+ url: http://company.yandex.com
2129
+ -
533
2130
  user_agent: Mozilla/5.0 (compatible; YandexAntivirus/2.0; +http://yandex.com/bots)
534
- name: 'Yandex Bot'
535
- -
2131
+ bot:
2132
+ name: Yandex Bot
2133
+ category: Search bot
2134
+ url: http://www.yandex.com/bots
2135
+ producer:
2136
+ name: Yandex LLC
2137
+ url: http://company.yandex.com
2138
+ -
2139
+ user_agent: Mozilla/5.0 (compatible; YandexBlogs/0.99; robot; B; +http://yandex.com/bots)
2140
+ bot:
2141
+ name: Yandex Bot
2142
+ category: Search bot
2143
+ url: http://www.yandex.com/bots
2144
+ producer:
2145
+ name: Yandex LLC
2146
+ url: http://company.yandex.com
2147
+ -
536
2148
  user_agent: Mozilla/5.0 (compatible; YandexBlogs/0.99; robot; B; +http://yandex.com/bots)
537
- name: 'Yandex Bot'
538
- -
2149
+ bot:
2150
+ name: Yandex Bot
2151
+ category: Search bot
2152
+ url: http://www.yandex.com/bots
2153
+ producer:
2154
+ name: Yandex LLC
2155
+ url: http://company.yandex.com
2156
+ -
2157
+ user_agent: Mozilla/5.0 (compatible; YandexBot/3.0; +http://yandex.com/bots)
2158
+ bot:
2159
+ name: Yandex Bot
2160
+ category: Search bot
2161
+ url: http://www.yandex.com/bots
2162
+ producer:
2163
+ name: Yandex LLC
2164
+ url: http://company.yandex.com
2165
+ -
2166
+ user_agent: Mozilla/5.0 (compatible; YandexDirect/3.0; +http://yandex.com/bots)
2167
+ bot:
2168
+ name: Yandex Bot
2169
+ category: Search bot
2170
+ url: http://www.yandex.com/bots
2171
+ producer:
2172
+ name: Yandex LLC
2173
+ url: http://company.yandex.com
2174
+ -
539
2175
  user_agent: Mozilla/5.0 (compatible; YandexFavicons/1.0; +http://yandex.com/bots)
540
- name: 'Yandex Bot'
541
- -
542
- user_agent: Mozilla/5.0 (compatible; YandexNewslinks; +http://yandex.com/bots)
543
- name: 'Yandex Bot'
544
- -
2176
+ bot:
2177
+ name: Yandex Bot
2178
+ category: Search bot
2179
+ url: http://www.yandex.com/bots
2180
+ producer:
2181
+ name: Yandex LLC
2182
+ url: http://company.yandex.com
2183
+ -
2184
+ user_agent: Mozilla/5.0 (compatible; YandexImageResizer/2.0; +http://yandex.com/bots)
2185
+ bot:
2186
+ name: Yandex Bot
2187
+ category: Search bot
2188
+ url: http://www.yandex.com/bots
2189
+ producer:
2190
+ name: Yandex LLC
2191
+ url: http://company.yandex.com
2192
+ -
2193
+ user_agent: Mozilla/5.0 (compatible; YandexImages/3.0; +http://yandex.com/bots)
2194
+ bot:
2195
+ name: Yandex Bot
2196
+ category: Search bot
2197
+ url: http://www.yandex.com/bots
2198
+ producer:
2199
+ name: Yandex LLC
2200
+ url: http://company.yandex.com
2201
+ -
2202
+ user_agent: Mozilla/5.0 (compatible; YandexMetrika/2.0; +http://yandex.com/bots)
2203
+ bot:
2204
+ name: Yandex Bot
2205
+ category: Search bot
2206
+ url: http://www.yandex.com/bots
2207
+ producer:
2208
+ name: Yandex LLC
2209
+ url: http://company.yandex.com
2210
+ -
545
2211
  user_agent: Mozilla/5.0 (compatible; YandexNews/3.0; +http://yandex.com/bots)
546
- name: 'Yandex Bot'
547
- -
548
- user_agent: Mozilla/5.0 (compatible; Linux i686; Yandex.Gazeta Bot/1.0; +http://gazeta.yandex.ru)
549
- name: 'Yandex Bot'
550
- -
2212
+ bot:
2213
+ name: Yandex Bot
2214
+ category: Search bot
2215
+ url: http://www.yandex.com/bots
2216
+ producer:
2217
+ name: Yandex LLC
2218
+ url: http://company.yandex.com
2219
+ -
2220
+ user_agent: Mozilla/5.0 (compatible; YandexNewslinks; +http://yandex.com/bots)
2221
+ bot:
2222
+ name: Yandex Bot
2223
+ category: Search bot
2224
+ url: http://www.yandex.com/bots
2225
+ producer:
2226
+ name: Yandex LLC
2227
+ url: http://company.yandex.com
2228
+ -
551
2229
  user_agent: Yeti/1.1 (Naver Corp.; http://help.naver.com/robots/)
552
- name: 'Yeti/Naverbot'
553
- -
2230
+ bot:
2231
+ name: Yeti/Naverbot
2232
+ category: Search bot
2233
+ url: http://help.naver.com/robots/
2234
+ producer:
2235
+ name: Naver
2236
+ url: http://www.naver.com
2237
+ -
554
2238
  user_agent: Mozilla/5.0 (compatible; YoudaoBot/1.0; http://www.youdao.com/help/webmaster/spider/; )
555
- name: 'Youdao Bot'
556
- -
557
- user_agent: Mozilla/5.0 (compatible; YRSpider; +http://www.yunyun.com/SiteInfo.php?r=about)
558
- name: 'Yunyun Bot'
559
- -
2239
+ bot:
2240
+ name: Youdao Bot
2241
+ category: Search bot
2242
+ url: http://www.youdao.com/help/webmaster/spider
2243
+ producer:
2244
+ name: NetEase, Inc.
2245
+ url: http://corp.163.com
2246
+ -
2247
+ user_agent: YOURLS v1.5.1 +http://yourls.org/ (running on http://fhort.com)
2248
+ bot:
2249
+ name: Yourls
2250
+ category: Crawler
2251
+ url: http://yourls.org
2252
+ -
560
2253
  user_agent: Mozilla/5.0 (compatible; YRSpider; +http://www.yunrang.com/yrspider.html)
561
- name: 'Yunyun Bot'
562
- -
2254
+ bot:
2255
+ name: Yunyun Bot
2256
+ category: Search bot
2257
+ url: http://www.yunyun.com/SiteInfo.php?r=about
2258
+ producer:
2259
+ name: YunYun
2260
+ url: http://www.yunyun.com
2261
+ -
2262
+ user_agent: Mozilla/5.0 (compatible; YRSpider; +http://www.yunyun.com/SiteInfo.php?r=about)
2263
+ bot:
2264
+ name: Yunyun Bot
2265
+ category: Search bot
2266
+ url: http://www.yunyun.com/SiteInfo.php?r=about
2267
+ producer:
2268
+ name: YunYun
2269
+ url: http://www.yunyun.com
2270
+ -
563
2271
  user_agent: Mozilla/5.0 (compatible; YYSpider; +http://www.yunyun.com/spider.html)
564
- name: 'Yunyun Bot'
565
- -
2272
+ bot:
2273
+ name: Yunyun Bot
2274
+ category: Search bot
2275
+ url: http://www.yunyun.com/SiteInfo.php?r=about
2276
+ producer:
2277
+ name: YunYun
2278
+ url: http://www.yunyun.com
2279
+ -
2280
+ user_agent: Zao/0.1 (http://www.kototol.org/zao)
2281
+ bot:
2282
+ name: Zao
2283
+ category: Crawler
2284
+ -
566
2285
  user_agent: Zookabot/2.5;++http://zookabot.com
567
- name: 'Zookabot'
568
- -
2286
+ bot:
2287
+ name: Zookabot
2288
+ category: Crawler
2289
+ url: http://zookabot.com
2290
+ producer:
2291
+ name: Hwacha ApS
2292
+ url: http://hwacha.dk
2293
+ -
569
2294
  user_agent: Mozilla/5.0 (compatible; ZumBot/1.0; http://help.zum.com/inquiry)
570
- name: 'ZumBot'
571
- -
2295
+ bot:
2296
+ name: ZumBot
2297
+ category: Search bot
2298
+ url: http://help.zum.com/inquiry
2299
+ producer:
2300
+ name: ZUM internet
2301
+ url: http://www.zuminternet.com/
2302
+ -
572
2303
  user_agent: ZumBot/1.0 (ZUM Search; http://help.zum.com/inquiry)
573
- name: 'ZumBot'
574
- -
575
- user_agent: Your Nutch Spider/Nutch-2.2.1
576
- name: 'Nutch-based Bot'
577
- -
578
- user_agent: Nutch12/Nutch-1.2
579
- name: 'Nutch-based Bot'
580
- -
581
- user_agent: spider/Nutch-1.5.1 (spider; http://www.xxx.com)
582
- name: 'Nutch-based Bot'
583
- -
584
- user_agent: MySpider/Nutch-2.2
585
- name: 'Nutch-based Bot'
586
- -
587
- user_agent: My Nutch Spider/Nutch-1.6
588
- name: 'Nutch-based Bot'
589
- -
590
- user_agent: NutchSpider/Nutch-1.4
591
- name: 'Nutch-based Bot'
592
- -
593
- user_agent: testnutch/Nutch-1.8
594
- name: 'Nutch-based Bot'
595
- -
596
- user_agent: Spider/Nutch-2.3-SNAPSHOT (Webcrawler)
597
- name: 'Nutch-based Bot'
598
- -
599
- user_agent: your sipder name/Nutch-1.7
600
- name: 'Nutch-based Bot'
601
- -
602
- user_agent: 5acd734a-1ed3-4a17-ad9d-0b09ae7bc2d2/Nutch-1.7
603
- name: 'Nutch-based Bot'
604
- -
605
- user_agent: Mozilla/5.0 (compatible; summers;)/Nutch-1.7
606
- name: 'Nutch-based Bot'
607
- -
608
- user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1; zh-CN; rv:1.9.2.8) Firefox/3.6.8/Nutch-1.7
609
- name: 'Nutch-based Bot'
610
- -
611
- user_agent: CB/Nutch-1.7
612
- name: 'Nutch-based Bot'
613
- -
614
- user_agent: StatusCake Error Detector Crawler V0.01
615
- name: 'Generic Bot'
616
- -
617
- user_agent: niki-bot
618
- name: 'Generic Bot'
619
-
620
-
621
- -
622
- user_agent: Bloglovin/1.0 (http://www.bloglovin.com; 1 subscribers)
623
- name: 'Bloglovin'
624
- -
625
- user_agent: CommaFeed/1.0 (http://www.commafeed.com)
626
- name: 'CommaFeed'
627
- -
628
- user_agent: FeedBurner/1.0 (http://www.FeedBurner.com)
629
- name: 'FeedBurner'
630
- -
631
- user_agent: Feedbin - 9 subscribers
632
- name: 'Feedbin'
633
- -
634
- user_agent: Feedly/1.0 (+http://www.feedly.com/fetcher.html; like FeedFetcher-Google)
635
- name: 'Feedly'
636
- -
637
- user_agent: FeedlyBot/1.0 (http://feedly.com)
638
- name: 'Feedly'
639
- -
640
- user_agent: FeedlyApp/1.0 (http://www.feedly.com)
641
- name: 'Feedly'
642
- -
643
- user_agent: MetaFeedly/1.0 (http://www.feedly.com)
644
- name: 'Feedly'
645
- -
646
- user_agent: Feedspot http://www.feedspot.com
647
- name: 'Feedspot'
648
- -
649
- user_agent: Fever/1.38 (Feed Parser; http://feedafever.com; Allow like Gecko)
650
- name: 'Fever'
651
- -
652
- user_agent: kouio.com RSS reader
653
- name: 'Kouio'
654
- -
655
- user_agent: kouio.com RSS reader - 6 subscribers
656
- name: 'Kouio'
657
- -
658
- user_agent: MagpieRSS/0.72 (+http://magpierss.sf.net)
659
- name: 'MagpieRSS'
660
- -
661
- user_agent: Netvibes (http://www.netvibes.com)
662
- name: 'Netvibes'
663
- -
664
- user_agent: 'Netvibes (http://www.netvibes.com/; 8 subscribers; feedID: 2244192)'
665
- name: 'Netvibes'
666
- -
667
- user_agent: NewsBlur Feed Fetcher - 7 subscribers - http://www.newsblur.com/site/1948420/analytics-piwik (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)
668
- name: 'NewsBlur'
669
- -
670
- user_agent: NewsBlur Feed Finder (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)
671
- name: 'NewsBlur'
672
- -
673
- user_agent: NewsBlur Page Fetcher - 7 subscribers - http://www.newsblur.com/site/3966817/analytics-piwik (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)
674
- name: 'NewsBlur'
675
- -
676
- user_agent: NewsBlur Favicon Fetcher - 7 subscribers - http://www.newsblur.com/site/1948420/analytics-piwik (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)
677
- name: 'NewsBlur'
678
- -
679
- user_agent: NewsGatorOnline/2.0 (http://www.newsgator.com; 2 subscribers)
680
- name: 'NewsGator'
681
- -
682
- user_agent: SilverReader/1.0; http://silverreader.com
683
- name: 'SilverReader'
684
- -
685
- user_agent: SimplePie/1.3.1 (Feed Parser; http://simplepie.org; Allow like Gecko) Build/20121030175911
686
- name: 'SimplePie'
687
- -
688
- user_agent: freshrss/0.8-dev (Linux; http://freshrss.org) SimplePie/1.4-dev-FreshRSS
689
- name: 'SimplePie'
690
- -
691
- user_agent: SimplePie/1.2.1-dev (Feed Parser; http://simplepie.org; Allow like Gecko) Build/20130514092120
692
- name: 'SimplePie'
693
- -
694
- user_agent: 'Tiny Tiny RSS/1.10 (http://tt-rss.org/)'
695
- name: 'Tiny Tiny RSS'
696
- -
697
- user_agent: 'Tiny Tiny RSS/1.11.4c63934 (http://tt-rss.org/)'
698
- name: 'Tiny Tiny RSS'
699
- -
700
- user_agent: 'Mozilla/5.0 (compatible; Yahoo Ad monitoring; https://help.yahoo.com/kb/yahoo-ad-monitoring-SLN24857.html)'
701
- name: 'Yahoo Gemini'
702
- -
703
- user_agent: 'Mozilla/5.0 (Java) outbrain'
704
- name: 'Outbrain'
705
- -
706
- user_agent: 'HubPages V0.2.2 (http://hubpages.com/help/crawlingpolicy)'
707
- name: 'HubPages'
708
- -
709
- user_agent: 'ADmantX Platform Semantic Analyzer - ADmantX Inc. - www.admantx.com - support@admantx.com'
710
- name: 'ADMantX'
711
- -
712
- user_agent: 'Pinterest/0.2 (+http://www.pinterest.com/)'
713
- name: 'Pinterest'
714
- -
715
- user_agent: 'Server Density Service Monitoring v2'
716
- name: 'Server Density'
717
- -
718
- user_agent: 'Site24x7'
719
- name: 'Site24x7 Website Monitoring'
720
- -
721
- user_agent: 'Mozilla/5.0 (compatible; www.monitor.us - free monitoring service; http://www.monitor.us)'
722
- name: 'Monitor.Us'
723
-
2304
+ bot:
2305
+ name: ZumBot
2306
+ category: Search bot
2307
+ url: http://help.zum.com/inquiry
2308
+ producer:
2309
+ name: ZUM internet
2310
+ url: http://www.zuminternet.com/
2311
+ -
2312
+ user_agent: AhrefsBot.Feeds v0.1; http://ahrefs.com/
2313
+ bot:
2314
+ name: aHrefs Bot
2315
+ category: Crawler
2316
+ url: http://ahrefs.com/robot
2317
+ producer:
2318
+ name: Ahrefs Pte Ltd
2319
+ url: http://ahrefs.com/robot
2320
+ -
2321
+ user_agent: Mozilla/5.0 (compatible; AhrefsBot/3.1; +http://ahrefs.com/robot/
2322
+ bot:
2323
+ name: aHrefs Bot
2324
+ category: Crawler
2325
+ url: http://ahrefs.com/robot
2326
+ producer:
2327
+ name: Ahrefs Pte Ltd
2328
+ url: http://ahrefs.com/robot
2329
+ -
2330
+ user_agent: Mozilla/5.0 (compatible; AhrefsBot/5.0; +http://ahrefs.com/robot/)
2331
+ bot:
2332
+ name: aHrefs Bot
2333
+ category: Crawler
2334
+ url: http://ahrefs.com/robot
2335
+ producer:
2336
+ name: Ahrefs Pte Ltd
2337
+ url: http://ahrefs.com/robot
2338
+ -
2339
+ user_agent: 'Mozilla/5.0 (compatible; AhrefsBot/5.0; +http://ahrefs.com/robot/) AppEngine-Google; (+http://code.google.com/appengine; appid: s~proxyfile1-hrd)'
2340
+ bot:
2341
+ name: aHrefs Bot
2342
+ category: Crawler
2343
+ url: http://ahrefs.com/robot
2344
+ producer:
2345
+ name: Ahrefs Pte Ltd
2346
+ url: http://ahrefs.com/robot
2347
+ -
2348
+ user_agent: Mozilla/5.0 (compatible; archive.org_bot +http://www.archive.org/details/archive.org_bot)
2349
+ bot:
2350
+ name: archive.org bot
2351
+ category: Crawler
2352
+ url: http://www.archive.org/details/archive.org_bot
2353
+ producer:
2354
+ name: The Internet Archive
2355
+ url: http://www.archive.org
2356
+ -
2357
+ user_agent: Mozilla/5.0 (compatible; archive.org_bot/3.3.0 +http://pandora.nla.gov.au/crawl.html)
2358
+ bot:
2359
+ name: archive.org bot
2360
+ category: Crawler
2361
+ url: http://www.archive.org/details/archive.org_bot
2362
+ producer:
2363
+ name: The Internet Archive
2364
+ url: http://www.archive.org
2365
+ -
2366
+ user_agent: Mozilla/5.0 (compatible; archive.org_bot; Archive-It; +http://archive-it.org/files/site-owners.html)
2367
+ bot:
2368
+ name: archive.org bot
2369
+ category: Crawler
2370
+ url: http://www.archive.org/details/archive.org_bot
2371
+ producer:
2372
+ name: The Internet Archive
2373
+ url: http://www.archive.org
2374
+ -
2375
+ user_agent: Mozilla/5.0 (compatible; archive.org_bot; Wayback Machine Live Record; +http://archive.org/details/archive.org_bot)
2376
+ bot:
2377
+ name: archive.org bot
2378
+ category: Crawler
2379
+ url: http://www.archive.org/details/archive.org_bot
2380
+ producer:
2381
+ name: The Internet Archive
2382
+ url: http://www.archive.org
2383
+ -
2384
+ user_agent: Mozilla/5.0 (compatible; heritrix/3.1.2-SNAPSHOT-20131029-0036 +http://archive.org/details/archive.org_bot)
2385
+ bot:
2386
+ name: archive.org bot
2387
+ category: Crawler
2388
+ url: http://www.archive.org/details/archive.org_bot
2389
+ producer:
2390
+ name: The Internet Archive
2391
+ url: http://www.archive.org
2392
+ -
2393
+ user_agent: Mozilla/5.0 (compatible; special_archiver/3.1.1 +http://www.archive.org/details/archive.org_bot)
2394
+ bot:
2395
+ name: archive.org bot
2396
+ category: Crawler
2397
+ url: http://www.archive.org/details/archive.org_bot
2398
+ producer:
2399
+ name: The Internet Archive
2400
+ url: http://www.archive.org
2401
+ -
2402
+ user_agent: Mozilla/5.0 (compatible; special_archiver/3.2.0 +http://www.loc.gov/webarchiving/notice_to_webmasters.html)
2403
+ bot:
2404
+ name: archive.org bot
2405
+ category: Crawler
2406
+ url: http://www.archive.org/details/archive.org_bot
2407
+ producer:
2408
+ name: The Internet Archive
2409
+ url: http://www.archive.org
2410
+ -
2411
+ user_agent: CCBot/2.0 (http://commoncrawl.org/faq/)
2412
+ bot:
2413
+ name: ccBot crawler
2414
+ category: Crawler
2415
+ url: http://commoncrawl.org/faq/
2416
+ producer:
2417
+ name: reddit inc.
2418
+ url: http://www.reddit.com