device_detector 0.7.0 → 0.8.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (72) hide show
  1. checksums.yaml +4 -4
  2. data/Gemfile +4 -0
  3. data/Rakefile +12 -6
  4. data/device_detector.gemspec +1 -1
  5. data/lib/device_detector.rb +65 -4
  6. data/lib/device_detector/client.rb +6 -6
  7. data/lib/device_detector/device.rb +62 -31
  8. data/lib/device_detector/memory_cache.rb +1 -1
  9. data/lib/device_detector/metadata_extractor.rb +4 -13
  10. data/lib/device_detector/model_extractor.rb +10 -1
  11. data/lib/device_detector/name_extractor.rb +1 -1
  12. data/lib/device_detector/os.rb +141 -5
  13. data/lib/device_detector/parser.rb +23 -12
  14. data/lib/device_detector/version.rb +1 -1
  15. data/lib/device_detector/version_extractor.rb +1 -1
  16. data/regexes/bots.yml +36 -1
  17. data/regexes/{browser_engines.yml → client/browser_engine.yml} +4 -1
  18. data/regexes/{browsers.yml → client/browsers.yml} +31 -27
  19. data/regexes/{feed_readers.yml → client/feed_readers.yml} +0 -1
  20. data/regexes/{libraries.yml → client/libraries.yml} +1 -1
  21. data/regexes/{mediaplayers.yml → client/mediaplayers.yml} +1 -1
  22. data/regexes/{mobile_apps.yml → client/mobile_apps.yml} +0 -1
  23. data/regexes/{pim.yml → client/pim.yml} +1 -1
  24. data/regexes/{devices → device}/cameras.yml +1 -1
  25. data/regexes/{devices → device}/car_browsers.yml +0 -1
  26. data/regexes/{devices → device}/consoles.yml +0 -1
  27. data/regexes/{devices → device}/mobiles.yml +193 -49
  28. data/regexes/{devices/portable_media_players.yml → device/portable_media_player.yml} +0 -1
  29. data/regexes/{devices → device}/televisions.yml +0 -3
  30. data/regexes/oss.yml +105 -102
  31. data/regexes/vendorfragments.yml +70 -0
  32. data/spec/device_detector/bot_fixtures_spec.rb +30 -0
  33. data/spec/device_detector/client_fixtures_spec.rb +31 -0
  34. data/spec/device_detector/concrete_user_agent_spec.rb +41 -1
  35. data/spec/device_detector/detector_fixtures_spec.rb +56 -0
  36. data/spec/device_detector/device_fixtures_spec.rb +36 -0
  37. data/spec/device_detector/device_spec.rb +3 -3
  38. data/spec/device_detector/memory_cache_spec.rb +1 -1
  39. data/spec/device_detector/model_extractor_spec.rb +7 -7
  40. data/spec/device_detector/os_fixtures_spec.rb +26 -0
  41. data/spec/device_detector/version_extractor_spec.rb +10 -10
  42. data/spec/device_detector_spec.rb +1 -1
  43. data/spec/fixtures/client/browser.yml +986 -0
  44. data/spec/fixtures/client/feed_reader.yml +180 -0
  45. data/spec/fixtures/client/library.yml +78 -0
  46. data/spec/fixtures/client/mediaplayer.yml +144 -0
  47. data/spec/fixtures/client/mobile_app.yml +24 -0
  48. data/spec/fixtures/client/pim.yml +90 -0
  49. data/spec/fixtures/detector/bots.yml +716 -0
  50. data/spec/fixtures/detector/camera.yml +91 -0
  51. data/spec/fixtures/detector/car_browser.yml +19 -0
  52. data/spec/fixtures/detector/console.yml +253 -0
  53. data/spec/fixtures/detector/desktop.yml +4568 -0
  54. data/spec/fixtures/detector/feature_phone.yml +719 -0
  55. data/spec/fixtures/detector/feed_reader.yml +462 -0
  56. data/spec/fixtures/detector/mediaplayer.yml +141 -0
  57. data/spec/fixtures/detector/mobile_apps.yml +32 -0
  58. data/spec/fixtures/detector/phablet.yml +1095 -0
  59. data/spec/fixtures/detector/portable_media_player.yml +145 -0
  60. data/spec/fixtures/detector/smart_display.yml +19 -0
  61. data/spec/fixtures/detector/smartphone.yml +28673 -0
  62. data/spec/fixtures/detector/tablet.yml +13201 -0
  63. data/spec/fixtures/detector/tv.yml +1380 -0
  64. data/spec/fixtures/detector/unknown.yml +3536 -0
  65. data/spec/fixtures/device/camera.yml +18 -0
  66. data/spec/fixtures/device/car_browser.yml +6 -0
  67. data/spec/fixtures/device/console.yml +72 -0
  68. data/spec/fixtures/parser/bots.yml +2055 -0
  69. data/spec/fixtures/parser/oss.yml +607 -0
  70. data/spec/fixtures/parser/vendorfragments.yml +156 -0
  71. data/spec/spec_helper.rb +6 -2
  72. metadata +84 -17
@@ -0,0 +1,18 @@
1
+ -
2
+ user_agent: Mozilla/5.0 (Linux; U; Android 4.0; de-DE; EK-GC100 Build/IMM76D) AppleWebKit/534.30 (KHTML, like Gecko) Version/4.0 Mobile Safari/534.30
3
+ device:
4
+ type: 8
5
+ brand: SA
6
+ model: GALAXY Camera
7
+ -
8
+ user_agent: Mozilla/5.0 (Linux; Android 4.1.2; EK-GC100 Build/JZO54K) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/28.0.1500.63 Mobile Safari/537.36 OPR/15.0.1162.60140
9
+ device:
10
+ type: 8
11
+ brand: SA
12
+ model: GALAXY Camera
13
+ -
14
+ user_agent: Mozilla/5.0 (Linux; U; Android 2.3.3; ja-jp; COOLPIX S800c Build/CP01_WW) AppleWebKit/533.1 (KHTML, like Gecko) Version/4.0 Mobile Safari/533.1
15
+ device:
16
+ type: 8
17
+ brand: NN
18
+ model: Coolpix S800c
@@ -0,0 +1,6 @@
1
+ -
2
+ user_agent: Mozilla/5.0 (X11; u; Linux; C) AppleWebKit /533.3 (Khtml, like Gheko) QtCarBrowser Safari/533.3
3
+ device:
4
+ type: 6
5
+ brand: TA
6
+ model: Model S
@@ -0,0 +1,72 @@
1
+ -
2
+ user_agent: Mozilla/5.0 (Linux; Android 4.1.1; ARCHOS GAMEPAD Build/JRO03H) AppleWebKit/535.19 (KHTML, like Gecko) Chrome/18.0.1025.166 Safari/535.19
3
+ device:
4
+ type: 4
5
+ brand: AR
6
+ model: Gamepad
7
+ -
8
+ user_agent: Mozilla/5.0 (compatible; MSIE 9.0; Windows NT 6.1; Trident/5.0; Xbox)
9
+ device:
10
+ type: 4
11
+ brand: MS
12
+ model: Xbox 360
13
+ -
14
+ user_agent: Mozilla/5.0 (compatible; MSIE 10.0; Windows NT 6.2; Trident/6.0; Xbox; Xbox One)
15
+ device:
16
+ type: 4
17
+ brand: MS
18
+ model: Xbox One
19
+ -
20
+ user_agent: Mozilla/5.0 (Nintendo 3DS; U; ; en) Version/1.7498.EU
21
+ device:
22
+ type: 4
23
+ brand: NI
24
+ model: 3DS
25
+ -
26
+ user_agent: Bunjalloo/0.7.6(Nintendo DS;U;en)
27
+ device:
28
+ type: 4
29
+ brand: NI
30
+ model: DS
31
+ -
32
+ user_agent: Opera/9.30 (Nintendo Wii; U; ; 3642; en)
33
+ device:
34
+ type: 4
35
+ brand: NI
36
+ model: Wii
37
+ -
38
+ user_agent: Mozilla/5.0 (Nintendo WiiU) AppleWebKit/534.52 (KHTML, like Gecko) NX/2.1.0.8.21 NintendoBrowser/1.0.0.7494.US
39
+ device:
40
+ type: 4
41
+ brand: NI
42
+ model: WiiU
43
+ -
44
+ user_agent: Mozilla/5.0 (Linux; U; Android OUYA 4.1.2; en-us; OUYA Build/JZO54L-OUYA) AppleWebKit/534.30 (KHTML, like Gecko) Version/4.0 Safari/534.30
45
+ device:
46
+ type: 4
47
+ brand: OU
48
+ model: OUYA
49
+ -
50
+ user_agent: Mozilla/5.0 (PLAYSTATION 3 4.46) AppleWebKit/531.22.8 (KHTML, like Gecko)
51
+ device:
52
+ type: 4
53
+ brand: SO
54
+ model: PlayStation 3
55
+ -
56
+ user_agent: Mozilla/5.0 (PlayStation 4 1.52) AppleWebKit/536.26 (KHTML, like Gecko)
57
+ device:
58
+ type: 4
59
+ brand: SO
60
+ model: PlayStation 4
61
+ -
62
+ user_agent: Mozilla/4.0 (PlayStation Portable); 2.00)
63
+ device:
64
+ type: 4
65
+ brand: SO
66
+ model: PlayStation Portable
67
+ -
68
+ user_agent: Mozilla/5.0 (PlayStation Vita 3.01) AppleWebKit/536.26 (KHTML, like Gecko) Silk/3.2
69
+ device:
70
+ type: 4
71
+ brand: SO
72
+ model: PlayStation Vita
@@ -0,0 +1,2055 @@
1
+ -
2
+ user_agent: Mozilla/5.0 (compatible; MSIE 9.0; Windows NT 6.1; Trident/5.0); 360Spider
3
+ bot:
4
+ name: '360Spider'
5
+ category: 'Search bot'
6
+ url: 'http://www.so.com/help/help_3_2.html'
7
+ producer:
8
+ name: 'Online Media Group, Inc.'
9
+ url: ''
10
+ -
11
+ user_agent: Mozilla/5.0 (Windows NT 6.1) AppleWebKit/537.1 (KHTML, like Gecko) Chrome/21.0.1180.89 Safari/537.1; 360Spider
12
+ bot:
13
+ name: '360Spider'
14
+ category: 'Search bot'
15
+ url: 'http://www.so.com/help/help_3_2.html'
16
+ producer:
17
+ name: 'Online Media Group, Inc.'
18
+ url: ''
19
+ -
20
+ user_agent: Mozilla/4.0 (compatible; MSIE 8.0; Windows NT 6.1; Trident/4.0; SLCC2; .NET CLR 2.0.50727; .NET CLR 3.5.30729; .NET CLR 3.0.30729; Media Center PC 6.0; MDDR; .NET4.0C; .NET4.0E; .NET CLR 1.1.4322; Tablet PC 2.0); 360Spider
21
+ bot:
22
+ name: '360Spider'
23
+ category: 'Search bot'
24
+ url: 'http://www.so.com/help/help_3_2.html'
25
+ producer:
26
+ name: 'Online Media Group, Inc.'
27
+ url: ''
28
+ -
29
+ user_agent: 360spider-image
30
+ bot:
31
+ name: '360Spider'
32
+ category: 'Search bot'
33
+ url: 'http://www.so.com/help/help_3_2.html'
34
+ producer:
35
+ name: 'Online Media Group, Inc.'
36
+ url: ''
37
+ -
38
+ user_agent: Aboundex/0.3 (http://www.aboundex.com/crawler/)
39
+ bot:
40
+ name: 'Aboundexbot'
41
+ category: 'Search bot'
42
+ url: 'http://www.aboundex.com/crawler/'
43
+ producer:
44
+ name: 'Aboundex.com'
45
+ url: 'http://www.aboundex.com'
46
+ -
47
+ user_agent: Mozilla/5.0 (compatible; AcoonBot/4.11.1; +http://www.acoon.de/robot.asp)
48
+ bot:
49
+ name: 'Acoon'
50
+ category: 'Search bot'
51
+ url: 'http://www.acoon.de/robot.asp'
52
+ producer:
53
+ name: 'Acoon GmbH'
54
+ url: 'http://www.acoon.de'
55
+ -
56
+ user_agent: AddThis.com robot tech.support@clearspring.com
57
+ bot:
58
+ name: 'AddThis.com'
59
+ category: 'Social Media Agent'
60
+ url: ''
61
+ producer:
62
+ name: 'Clearspring Technologies, Inc.'
63
+ url: 'http://www.clearspring.com'
64
+ -
65
+ user_agent: Mozilla/5.0 (compatible; AhrefsBot/3.1; +http://ahrefs.com/robot/
66
+ bot:
67
+ name: 'aHrefs Bot'
68
+ category: 'Crawler'
69
+ url: 'http://ahrefs.com/robot'
70
+ producer:
71
+ name: 'Ahrefs Pte Ltd'
72
+ url: 'http://ahrefs.com/robot'
73
+ -
74
+ user_agent: Mozilla/5.0 (compatible; AhrefsBot/5.0; +http://ahrefs.com/robot/)
75
+ bot:
76
+ name: 'aHrefs Bot'
77
+ category: 'Crawler'
78
+ url: 'http://ahrefs.com/robot'
79
+ producer:
80
+ name: 'Ahrefs Pte Ltd'
81
+ url: 'http://ahrefs.com/robot'
82
+ -
83
+ user_agent: 'Mozilla/5.0 (compatible; AhrefsBot/5.0; +http://ahrefs.com/robot/) AppEngine-Google; (+http://code.google.com/appengine; appid: s~proxyfile1-hrd)'
84
+ bot:
85
+ name: 'aHrefs Bot'
86
+ category: 'Crawler'
87
+ url: 'http://ahrefs.com/robot'
88
+ producer:
89
+ name: 'Ahrefs Pte Ltd'
90
+ url: 'http://ahrefs.com/robot'
91
+ -
92
+ user_agent: AhrefsBot.Feeds v0.1; http://ahrefs.com/
93
+ bot:
94
+ name: 'aHrefs Bot'
95
+ category: 'Crawler'
96
+ url: 'http://ahrefs.com/robot'
97
+ producer:
98
+ name: 'Ahrefs Pte Ltd'
99
+ url: 'http://ahrefs.com/robot'
100
+ -
101
+ user_agent: ia_archiver (+http://www.alexa.com/site/help/webmasters; crawler@alexa.com)
102
+ bot:
103
+ name: 'Alexa Crawler'
104
+ category: 'Search bot'
105
+ url: 'https://alexa.zendesk.com/hc/en-us/sections/200100794-Crawlers'
106
+ producer:
107
+ name: 'Alexa Internet'
108
+ url: 'http://www.alexa.com'
109
+ -
110
+ user_agent: AmorankSpider/0.1; +http://amorank.com/webcrawler.html
111
+ bot:
112
+ name: 'Amorank Spider'
113
+ category: 'Crawler'
114
+ url: 'http://amorank.com/webcrawler.html'
115
+ producer:
116
+ name: 'Amorank'
117
+ url: 'http://www.amorank.com'
118
+ -
119
+ user_agent: Curious George - www.analyticsseo.com/crawler
120
+ bot:
121
+ name: 'Analytics SEO Crawler'
122
+ category: 'Crawler'
123
+ url: 'http://www.analyticsseo.com/crawler'
124
+ producer:
125
+ name: 'Analytics SEO'
126
+ url: 'http://www.analyticsseo.com'
127
+ -
128
+ user_agent: Mozilla/5.0 (compatible; special_archiver/3.1.1 +http://www.archive.org/details/archive.org_bot)
129
+ bot:
130
+ name: 'archive.org bot'
131
+ category: 'Crawler'
132
+ url: 'http://www.archive.org/details/archive.org_bot'
133
+ producer:
134
+ name: 'The Internet Archive'
135
+ url: 'http://www.archive.org'
136
+ -
137
+ user_agent: Mozilla/5.0 (compatible; special_archiver/3.2.0 +http://www.loc.gov/webarchiving/notice_to_webmasters.html)
138
+ bot:
139
+ name: 'archive.org bot'
140
+ category: 'Crawler'
141
+ url: 'http://www.archive.org/details/archive.org_bot'
142
+ producer:
143
+ name: 'The Internet Archive'
144
+ url: 'http://www.archive.org'
145
+ -
146
+ user_agent: Mozilla/5.0 (compatible; archive.org_bot; Wayback Machine Live Record; +http://archive.org/details/archive.org_bot)
147
+ bot:
148
+ name: 'archive.org bot'
149
+ category: 'Crawler'
150
+ url: 'http://www.archive.org/details/archive.org_bot'
151
+ producer:
152
+ name: 'The Internet Archive'
153
+ url: 'http://www.archive.org'
154
+ -
155
+ user_agent: Mozilla/5.0 (compatible; archive.org_bot/3.3.0 +http://pandora.nla.gov.au/crawl.html)
156
+ bot:
157
+ name: 'archive.org bot'
158
+ category: 'Crawler'
159
+ url: 'http://www.archive.org/details/archive.org_bot'
160
+ producer:
161
+ name: 'The Internet Archive'
162
+ url: 'http://www.archive.org'
163
+ -
164
+ user_agent: Mozilla/5.0 (compatible; archive.org_bot; Archive-It; +http://archive-it.org/files/site-owners.html)
165
+ bot:
166
+ name: 'archive.org bot'
167
+ category: 'Crawler'
168
+ url: 'http://www.archive.org/details/archive.org_bot'
169
+ producer:
170
+ name: 'The Internet Archive'
171
+ url: 'http://www.archive.org'
172
+ -
173
+ user_agent: Mozilla/5.0 (compatible; archive.org_bot +http://www.archive.org/details/archive.org_bot)
174
+ bot:
175
+ name: 'archive.org bot'
176
+ category: 'Crawler'
177
+ url: 'http://www.archive.org/details/archive.org_bot'
178
+ producer:
179
+ name: 'The Internet Archive'
180
+ url: 'http://www.archive.org'
181
+ -
182
+ user_agent: Mozilla/5.0 (compatible; heritrix/3.1.2-SNAPSHOT-20131029-0036 +http://archive.org/details/archive.org_bot)
183
+ bot:
184
+ name: 'archive.org bot'
185
+ category: 'Crawler'
186
+ url: 'http://www.archive.org/details/archive.org_bot'
187
+ producer:
188
+ name: 'The Internet Archive'
189
+ url: 'http://www.archive.org'
190
+ -
191
+ user_agent: Mozilla/2.0 (compatible; Ask Jeeves/Teoma)
192
+ bot:
193
+ name: 'Ask Jeeves'
194
+ category: 'Search bot'
195
+ url: ''
196
+ producer:
197
+ name: 'Ask Jeeves Inc.'
198
+ url: 'http://www.ask.com'
199
+ -
200
+ user_agent: Backlink-Ceck.de (+http://www.backlink-check.de/bot.html)
201
+ bot:
202
+ name: 'Backlink-Ceck.de'
203
+ category: 'Crawler'
204
+ url: 'http://www.backlink-check.de/bot.html'
205
+ producer:
206
+ name: 'Mediagreen Medienservice'
207
+ url: 'http://www.backlink-check.de'
208
+ -
209
+ user_agent: BacklinkCrawler (http://www.backlinktest.com/crawler.html)
210
+ bot:
211
+ name: 'BacklinkCrawler'
212
+ category: 'Crawler'
213
+ url: 'http://www.backlinktest.com/crawler.html'
214
+ producer:
215
+ name: '2.0Promotion GbR'
216
+ url: 'http://www.backlinktest.com'
217
+ -
218
+ user_agent: Mozilla/5.0 (compatible; Baiduspider/2.0; +http://www.baidu.com/search
219
+ bot:
220
+ name: 'Baidu Spider'
221
+ category: 'Search bot'
222
+ url: 'http://www.baidu.com/search/spider.htm'
223
+ producer:
224
+ name: 'Baidu'
225
+ url: 'http://www.baidu.com'
226
+ -
227
+ user_agent: Mozilla/5.0 (Linux;u;Android 2.3.7;zh-cn;) AppleWebKit/533.1 (KHTML,like Gecko) Version/4.0 Mobile Safari/533.1 (compatible; +http://www.baidu.com/search/spider.html)
228
+ bot:
229
+ name: 'Baidu Spider'
230
+ category: 'Search bot'
231
+ url: 'http://www.baidu.com/search/spider.htm'
232
+ producer:
233
+ name: 'Baidu'
234
+ url: 'http://www.baidu.com'
235
+ -
236
+ user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1; zh-CN; rv:1.9.2.8;baidu Transcoder) Gecko/20100722 Firefox/3.6.8 ( .NET CLR 3.5.30729)
237
+ bot:
238
+ name: 'Baidu Spider'
239
+ category: 'Search bot'
240
+ url: 'http://www.baidu.com/search/spider.htm'
241
+ producer:
242
+ name: 'Baidu'
243
+ url: 'http://www.baidu.com'
244
+ -
245
+ user_agent: Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.0; baidu Transcoder;)
246
+ bot:
247
+ name: 'Baidu Spider'
248
+ category: 'Search bot'
249
+ url: 'http://www.baidu.com/search/spider.htm'
250
+ producer:
251
+ name: 'Baidu'
252
+ url: 'http://www.baidu.com'
253
+ -
254
+ user_agent: Baiduspider-image+(+http://www.baidu.com/search/spider.htm)
255
+ bot:
256
+ name: 'Baidu Spider'
257
+ category: 'Search bot'
258
+ url: 'http://www.baidu.com/search/spider.htm'
259
+ producer:
260
+ name: 'Baidu'
261
+ url: 'http://www.baidu.com'
262
+ -
263
+ user_agent: Baiduspider+(+http://www.baidu.com/search/spider.htm)
264
+ bot:
265
+ name: 'Baidu Spider'
266
+ category: 'Search bot'
267
+ url: 'http://www.baidu.com/search/spider.htm'
268
+ producer:
269
+ name: 'Baidu'
270
+ url: 'http://www.baidu.com'
271
+ -
272
+ user_agent: Mozilla/5.0 (compatible; Baiduspider/2.0; +http://www.baidu.com/search/spider.html)
273
+ bot:
274
+ name: 'Baidu Spider'
275
+ category: 'Search bot'
276
+ url: 'http://www.baidu.com/search/spider.htm'
277
+ producer:
278
+ name: 'Baidu'
279
+ url: 'http://www.baidu.com'
280
+ -
281
+ user_agent: Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/534+ (KHTML, like Gecko) BingPreview/1.0b
282
+ bot:
283
+ name: 'BingBot'
284
+ category: 'Search bot'
285
+ url: 'http://search.msn.com/msnbot.htmn'
286
+ producer:
287
+ name: 'Microsoft Corporation'
288
+ url: 'http://www.microsoft.com'
289
+ -
290
+ user_agent: Mozilla/5.0 (compatible; bingbot/2.0; +http://www.bing.com/bingbot.htm)
291
+ bot:
292
+ name: 'BingBot'
293
+ category: 'Search bot'
294
+ url: 'http://search.msn.com/msnbot.htmn'
295
+ producer:
296
+ name: 'Microsoft Corporation'
297
+ url: 'http://www.microsoft.com'
298
+ -
299
+ user_agent: msnbot-media/1.1 (+http://search.msn.com/msnbot.htm)
300
+ bot:
301
+ name: 'BingBot'
302
+ category: 'Search bot'
303
+ url: 'http://search.msn.com/msnbot.htmn'
304
+ producer:
305
+ name: 'Microsoft Corporation'
306
+ url: 'http://www.microsoft.com'
307
+ -
308
+ user_agent: MSNBot/Nutch-1.5.1
309
+ bot:
310
+ name: 'BingBot'
311
+ category: 'Search bot'
312
+ url: 'http://search.msn.com/msnbot.htmn'
313
+ producer:
314
+ name: 'Microsoft Corporation'
315
+ url: 'http://www.microsoft.com'
316
+ -
317
+ user_agent: msnbot/2.0b v1394720947.6703
318
+ bot:
319
+ name: 'BingBot'
320
+ category: 'Search bot'
321
+ url: 'http://search.msn.com/msnbot.htmn'
322
+ producer:
323
+ name: 'Microsoft Corporation'
324
+ url: 'http://www.microsoft.com'
325
+ -
326
+ user_agent: msnbot/1.1 (+http://search.msn.com/msnbot.htm)
327
+ bot:
328
+ name: 'BingBot'
329
+ category: 'Search bot'
330
+ url: 'http://search.msn.com/msnbot.htmn'
331
+ producer:
332
+ name: 'Microsoft Corporation'
333
+ url: 'http://www.microsoft.com'
334
+ -
335
+ user_agent: msnbot/2.0b (+http://search.msn.com/msnbot.htm)
336
+ bot:
337
+ name: 'BingBot'
338
+ category: 'Search bot'
339
+ url: 'http://search.msn.com/msnbot.htmn'
340
+ producer:
341
+ name: 'Microsoft Corporation'
342
+ url: 'http://www.microsoft.com'
343
+ -
344
+ user_agent: msnbot-NewsBlogs/2.0b (+http://search.msn.com/msnbot.htm)
345
+ bot:
346
+ name: 'BingBot'
347
+ category: 'Search bot'
348
+ url: 'http://search.msn.com/msnbot.htmn'
349
+ producer:
350
+ name: 'Microsoft Corporation'
351
+ url: 'http://www.microsoft.com'
352
+ -
353
+ user_agent: Mozilla/5.0 (compatible; Blekkobot; ScoutJet; +http://blekko.com/about/blekkobot)
354
+ bot:
355
+ name: 'Blekkobot'
356
+ category: 'Search bot'
357
+ url: 'http://blekko.com/about/blekkobot'
358
+ producer:
359
+ name: 'Blekko'
360
+ url: 'http://blekko.com'
361
+ -
362
+ user_agent: Mozilla/5.0 (compatible; BLEXBot/1.0; +http://webmeup-crawler.com/)
363
+ bot:
364
+ name: 'BLEXBot Crawler'
365
+ category: 'Crawler'
366
+ url: 'http://webmeup-crawler.com'
367
+ producer:
368
+ name: 'WebMeUp'
369
+ url: 'http://webmeup.com'
370
+ -
371
+ user_agent: Bloglovin/1.0 (http://www.bloglovin.com; 1 subscribers)
372
+ bot:
373
+ name: 'Bloglovin'
374
+ url: 'http://www.bloglovin.com'
375
+ category: 'Feed Fetcher'
376
+ producer:
377
+ name: ''
378
+ url: ''
379
+ -
380
+ user_agent: Mozilla/5.0 (compatible; BountiiBot/1.1; +http://bountii.com/contact.php)
381
+ bot:
382
+ name: 'Bountii Bot'
383
+ category: 'Search bot'
384
+ url: 'http://bountii.com/contact.php'
385
+ producer:
386
+ name: 'Bountii Inc.'
387
+ url: 'http://bountii.com'
388
+ -
389
+ user_agent: Mozilla/5.0 (Macintosh; Butterfly/1.0; +http://labs.topsy.com/butterfly/) Gecko/2009032608 Firefox/3.0.8
390
+ bot:
391
+ name: 'Butterfly Robot'
392
+ category: 'Search bot'
393
+ url: 'http://labs.topsy.com/butterfly'
394
+ producer:
395
+ name: 'Topsy Labs'
396
+ url: 'http://labs.topsy.com'
397
+ -
398
+ user_agent: Mozilla/5.0 (compatible; Butterfly/1.0; +http://labs.topsy.com/butterfly/) Gecko/2009032608 Firefox/3.0.8
399
+ bot:
400
+ name: 'Butterfly Robot'
401
+ category: 'Search bot'
402
+ url: 'http://labs.topsy.com/butterfly'
403
+ producer:
404
+ name: 'Topsy Labs'
405
+ url: 'http://labs.topsy.com'
406
+ -
407
+ user_agent: Browsershots
408
+ bot:
409
+ name: 'Browsershots'
410
+ category: 'Service Agent'
411
+ url: 'http://browsershots.org/faq'
412
+ producer:
413
+ name: 'Browsershots.org'
414
+ url: 'http://browsershots.org'
415
+ -
416
+ user_agent: Mozilla/5.0 (compatible; CareerBot/1.1; +http://www.career-x.de/bot.html)
417
+ bot:
418
+ name: 'CareerBot'
419
+ category: 'Crawler'
420
+ url: 'http://www.career-x.de/bot.html'
421
+ producer:
422
+ name: 'career-x GmbH'
423
+ url: 'http://www.career-x.de'
424
+ -
425
+ user_agent: CCBot/2.0 (http://commoncrawl.org/faq/)
426
+ bot:
427
+ name: 'ccBot crawler'
428
+ category: 'Crawler'
429
+ url: 'http://commoncrawl.org/faq/'
430
+ producer:
431
+ name: 'reddit inc.'
432
+ url: 'http://www.reddit.com'
433
+ -
434
+ user_agent: Cliqzbot/0.1 (+http://cliqz.com/company/cliqzbot)
435
+ bot:
436
+ name: 'Cliqzbot'
437
+ category: 'Crawler'
438
+ url: 'http://cliqz.com/company/cliqzbot'
439
+ producer:
440
+ name: '10betterpages GmbH'
441
+ url: 'http://cliqz.com'
442
+ -
443
+ user_agent: CommaFeed/1.0 (http://www.commafeed.com)
444
+ bot:
445
+ name: 'CommaFeed'
446
+ url: 'http://www.commafeed.com'
447
+ category: 'Feed Fetcher'
448
+ producer:
449
+ name: ''
450
+ url: ''
451
+ -
452
+ user_agent: Mozilla/5.0 (compatible; Dazoobot/0.1; +http://dazoo.fr)
453
+ bot:
454
+ name: 'Dazoobot'
455
+ category: 'Search bot'
456
+ url: ''
457
+ producer:
458
+ name: 'DAZOO.FR'
459
+ url: 'http://dazoo.fr'
460
+ -
461
+ user_agent: Mozilla/5.0 (compatible; discobot/1.0; +http://discoveryengine.com/discobot.html)
462
+ bot:
463
+ name: 'Discobot'
464
+ category: 'Search bot'
465
+ url: 'http://discoveryengine.com/discobot.html'
466
+ producer:
467
+ name: 'Discovery Engine'
468
+ url: 'http://discoveryengine.com'
469
+ -
470
+ user_agent: dotbot
471
+ bot:
472
+ name: 'DotBot'
473
+ category: 'Crawler'
474
+ url: 'http://www.opensiteexplorer.org/dotbot'
475
+ producer:
476
+ name: 'SEOmoz, Inc.'
477
+ url: 'http://moz.com/'
478
+ -
479
+ user_agent: Mozilla/5.0 (compatible; EasouSpider; +http://www.easou.com/search/spider.html)
480
+ bot:
481
+ name: 'Easou Spider'
482
+ category: 'Search bot'
483
+ url: 'http://www.easou.com/search/spider.html'
484
+ producer:
485
+ name: 'easou ICP'
486
+ url: 'http://www.easou.com'
487
+ -
488
+ user_agent: Mozilla/5.0 (iPhone; U; CPU iPhone OS 3_0 like Mac OS X; en-us; EasouSpider; +http://www.easou.com/search/spider.html)
489
+ bot:
490
+ name: 'Easou Spider'
491
+ category: 'Search bot'
492
+ url: 'http://www.easou.com/search/spider.html'
493
+ producer:
494
+ name: 'easou ICP'
495
+ url: 'http://www.easou.com'
496
+ -
497
+ user_agent: EMail Exractor
498
+ bot:
499
+ name: 'EMail Exractor'
500
+ category: 'Crawler'
501
+ url: ''
502
+ producer:
503
+ name: ''
504
+ url: ''
505
+ -
506
+ user_agent: Mozilla/5.0 (compatible; Exabot/3.0; +http://www.exabot.com/go/robot)
507
+ bot:
508
+ name: 'ExaBot'
509
+ category: 'Crawler'
510
+ url: 'http://www.exabot.com/go/robot'
511
+ producer:
512
+ name: 'Dassault Systèmes'
513
+ url: 'http://www.3ds.com'
514
+ -
515
+ user_agent: Mozilla/5.0 (compatible; Exabot/3.0 (BiggerBetter); +http://www.exabot.com/go/robot)
516
+ bot:
517
+ name: 'ExaBot'
518
+ category: 'Crawler'
519
+ url: 'http://www.exabot.com/go/robot'
520
+ producer:
521
+ name: 'Dassault Systèmes'
522
+ url: 'http://www.3ds.com'
523
+ -
524
+ user_agent: Mozilla/5.0 (compatible; Konqueror/3.5; Linux) KHTML/3.5.5 (like Gecko) (Exabot-Thumbnails)
525
+ bot:
526
+ name: 'ExaBot'
527
+ category: 'Crawler'
528
+ url: 'http://www.exabot.com/go/robot'
529
+ producer:
530
+ name: 'Dassault Systèmes'
531
+ url: 'http://www.3ds.com'
532
+ -
533
+ user_agent: ExactSeek Crawler (nutch 1.4)/Nutch-1.4 (ExactSeek Crawler; http://www.exactseek.com)
534
+ bot:
535
+ name: 'ExactSeek Crawler'
536
+ category: 'Search bot'
537
+ url: 'http://www.exactseek.com'
538
+ producer:
539
+ name: 'Jayde Online, Inc.'
540
+ url: 'http://www.jaydeonlineinc.com'
541
+ -
542
+ user_agent: Mozilla/5.0 (compatible; Ezooms/1.0; help@moz.com)
543
+ bot:
544
+ name: 'Ezooms'
545
+ category: 'Crawler'
546
+ url: ''
547
+ producer:
548
+ name: 'SEOmoz, Inc.'
549
+ url: 'http://moz.com/'
550
+ -
551
+ user_agent: facebookexternalhit/1.1 (+http://www.facebook.com/externalhit_uatext.php)
552
+ bot:
553
+ name: 'Facebook External Hit'
554
+ category: 'Social Media Agent'
555
+ url: 'https://www.facebook.com/externalhit_uatext.php'
556
+ producer:
557
+ name: 'Facebook'
558
+ url: 'http://www.facebook.com'
559
+ -
560
+ user_agent: facebookplatform/1.0 (+http://developers.facebook.com)
561
+ bot:
562
+ name: 'Facebook External Hit'
563
+ category: 'Social Media Agent'
564
+ url: 'https://www.facebook.com/externalhit_uatext.php'
565
+ producer:
566
+ name: 'Facebook'
567
+ url: 'http://www.facebook.com'
568
+ -
569
+ user_agent: Feedbin - 9 subscribers
570
+ bot:
571
+ name: 'Feedbin'
572
+ url: 'http://feedbin.com/'
573
+ category: 'Feed Fetcher'
574
+ producer:
575
+ name: ''
576
+ url: ''
577
+ -
578
+ user_agent: FeedBurner/1.0 (http://www.FeedBurner.com)
579
+ bot:
580
+ name: 'FeedBurner'
581
+ url: 'http://www.feedburner.com'
582
+ category: 'Feed Fetcher'
583
+ producer:
584
+ name: ''
585
+ url: ''
586
+ -
587
+ user_agent: Feedly/1.0 (+http://www.feedly.com/fetcher.html; like FeedFetcher-Google)
588
+ bot:
589
+ name: 'Feedly'
590
+ url: 'http://www.feedly.com'
591
+ category: 'Feed Fetcher'
592
+ producer:
593
+ name: ''
594
+ url: ''
595
+ -
596
+ user_agent: FeedlyBot/1.0 (http://feedly.com)
597
+ bot:
598
+ name: 'Feedly'
599
+ url: 'http://www.feedly.com'
600
+ category: 'Feed Fetcher'
601
+ producer:
602
+ name: ''
603
+ url: ''
604
+ -
605
+ user_agent: FeedlyApp/1.0 (http://www.feedly.com)
606
+ bot:
607
+ name: 'Feedly'
608
+ url: 'http://www.feedly.com'
609
+ category: 'Feed Fetcher'
610
+ producer:
611
+ name: ''
612
+ url: ''
613
+ -
614
+ user_agent: MetaFeedly/1.0 (http://www.feedly.com)
615
+ bot:
616
+ name: 'Feedly'
617
+ url: 'http://www.feedly.com'
618
+ category: 'Feed Fetcher'
619
+ producer:
620
+ name: ''
621
+ url: ''
622
+ -
623
+ user_agent: Feedspot http://www.feedspot.com
624
+ bot:
625
+ name: 'Feedspot'
626
+ url: 'http://www.feedspot.com'
627
+ category: 'Feed Fetcher'
628
+ producer:
629
+ name: ''
630
+ url: ''
631
+ -
632
+ user_agent: Fever/1.38 (Feed Parser; http://feedafever.com; Allow like Gecko)
633
+ bot:
634
+ name: 'Fever'
635
+ url: 'http://feedafever.com/'
636
+ category: 'Feed Fetcher'
637
+ producer:
638
+ name: ''
639
+ url: ''
640
+ -
641
+ user_agent: Mozilla/5.0 (compatible; Genieo/1.0 http://www.genieo.com/webfilter.html)
642
+ bot:
643
+ name: 'Genieo Web filter'
644
+ category: ''
645
+ url: 'http://www.genieo.com/webfilter.html'
646
+ producer:
647
+ name: 'Genieo'
648
+ url: 'http://www.genieo.com'
649
+ -
650
+ user_agent: DoCoMo/2.0 P900i(c100;TB;W24H11) (compatible; ichiro/mobile goo; +http://search.goo.ne.jp/option/use/sub4/sub4-1/)
651
+ bot:
652
+ name: 'Goo'
653
+ category: 'Search bot'
654
+ url: 'http://search.goo.ne.jp/option/use/sub4/sub4-1'
655
+ producer:
656
+ name: 'NTT Resonant'
657
+ url: 'http://goo.ne.jp'
658
+ -
659
+ user_agent: Googlebot/2.1 (http://www.googlebot.com/bot.html)
660
+ bot:
661
+ name: 'Googlebot'
662
+ category: 'Search bot'
663
+ url: 'http://www.google.com/bot.html'
664
+ producer:
665
+ name: 'Google Inc.'
666
+ url: 'http://www.google.com'
667
+ -
668
+ user_agent: Googlebot/Nutch-1.7
669
+ bot:
670
+ name: 'Googlebot'
671
+ category: 'Search bot'
672
+ url: 'http://www.google.com/bot.html'
673
+ producer:
674
+ name: 'Google Inc.'
675
+ url: 'http://www.google.com'
676
+ -
677
+ user_agent: Mozilla/5.0 AppleWebKit/537.36 (KHTML, like Gecko; compatible; Googlebot/2.1; +http://www.google.com/bot.html) Safari/537.36
678
+ bot:
679
+ name: 'Googlebot'
680
+ category: 'Search bot'
681
+ url: 'http://www.google.com/bot.html'
682
+ producer:
683
+ name: 'Google Inc.'
684
+ url: 'http://www.google.com'
685
+ -
686
+ user_agent: Mozilla/5.0 (compatible; Googlebot/2.1; +http://www.google.com/bot.html)
687
+ bot:
688
+ name: 'Googlebot'
689
+ category: 'Search bot'
690
+ url: 'http://www.google.com/bot.html'
691
+ producer:
692
+ name: 'Google Inc.'
693
+ url: 'http://www.google.com'
694
+ -
695
+ user_agent: Mozilla/5.0 (iPhone; CPU iPhone OS 6_0 like Mac OS X) AppleWebKit/536.26 (KHTML, like Gecko) Version/6.0 Mobile/10A5376e Safari/8536.25 (compatible; Googlebot-Mobile/2.1; +http://www.google.com/bot.html)
696
+ bot:
697
+ name: 'Googlebot'
698
+ category: 'Search bot'
699
+ url: 'http://www.google.com/bot.html'
700
+ producer:
701
+ name: 'Google Inc.'
702
+ url: 'http://www.google.com'
703
+ -
704
+ user_agent: Googlebot-Image/1.0
705
+ bot:
706
+ name: 'Googlebot'
707
+ category: 'Search bot'
708
+ url: 'http://www.google.com/bot.html'
709
+ producer:
710
+ name: 'Google Inc.'
711
+ url: 'http://www.google.com'
712
+ -
713
+ user_agent: Googlebot (gocrawl v0.4)
714
+ bot:
715
+ name: 'Googlebot'
716
+ category: 'Search bot'
717
+ url: 'http://www.google.com/bot.html'
718
+ producer:
719
+ name: 'Google Inc.'
720
+ url: 'http://www.google.com'
721
+ -
722
+ user_agent: Googlebot-News (2.3.3, ruby 1.9.3 (2013-11-22))
723
+ bot:
724
+ name: 'Googlebot'
725
+ category: 'Search bot'
726
+ url: 'http://www.google.com/bot.html'
727
+ producer:
728
+ name: 'Google Inc.'
729
+ url: 'http://www.google.com'
730
+ -
731
+ user_agent: DoCoMo/2.0 N905i(c100;TB;W24H16) (compatible; Googlebot-Mobile/2.1; +http://www.google.com/bot.html)
732
+ bot:
733
+ name: 'Googlebot'
734
+ category: 'Search bot'
735
+ url: 'http://www.google.com/bot.html'
736
+ producer:
737
+ name: 'Google Inc.'
738
+ url: 'http://www.google.com'
739
+ -
740
+ user_agent: SAMSUNG-SGH-E250/1.0 Profile/MIDP-2.0 Configuration/CLDC-1.1 UP.Browser/6.2.3.3.c.1.101 (GUI) MMP/2.0 (compatible; Googlebot-Mobile/2.1; +http://www.google.com/bot.html)
741
+ bot:
742
+ name: 'Googlebot'
743
+ category: 'Search bot'
744
+ url: 'http://www.google.com/bot.html'
745
+ producer:
746
+ name: 'Google Inc.'
747
+ url: 'http://www.google.com'
748
+ -
749
+ user_agent: Mozilla/5.0 (compatible) Feedfetcher-Google;(+http://www.google.com/feedfetcher.html)
750
+ bot:
751
+ name: 'Googlebot'
752
+ category: 'Search bot'
753
+ url: 'http://www.google.com/bot.html'
754
+ producer:
755
+ name: 'Google Inc.'
756
+ url: 'http://www.google.com'
757
+ -
758
+ user_agent: Feedfetcher-Google; (+http://www.google.com/feedfetcher.html; 2 subscribers; feed-id=17860707833818568603)
759
+ bot:
760
+ name: 'Googlebot'
761
+ category: 'Search bot'
762
+ url: 'http://www.google.com/bot.html'
763
+ producer:
764
+ name: 'Google Inc.'
765
+ url: 'http://www.google.com'
766
+ -
767
+ user_agent: Feedfetcher-Google; (+http://www.google.com/feedfetcher.html; 19 subscribers; feed-id=13965549748850348809)
768
+ bot:
769
+ name: 'Googlebot'
770
+ category: 'Search bot'
771
+ url: 'http://www.google.com/bot.html'
772
+ producer:
773
+ name: 'Google Inc.'
774
+ url: 'http://www.google.com'
775
+ -
776
+ user_agent: Feedfetcher-Google; (+http://www.google.com/feedfetcher.html; 375 subscribers; feed-id=15381863289700640853)
777
+ bot:
778
+ name: 'Googlebot'
779
+ category: 'Search bot'
780
+ url: 'http://www.google.com/bot.html'
781
+ producer:
782
+ name: 'Google Inc.'
783
+ url: 'http://www.google.com'
784
+ -
785
+ user_agent: Mozilla/5.0 (Windows NT 6.1; rv:6.0) Gecko/20110814 Firefox/6.0 Google (+https://developers.google.com/+/web/snippet/)
786
+ bot:
787
+ name: 'Googlebot'
788
+ category: 'Search bot'
789
+ url: 'http://www.google.com/bot.html'
790
+ producer:
791
+ name: 'Google Inc.'
792
+ url: 'http://www.google.com'
793
+ -
794
+ user_agent: GoogleProducer; (+http://goo.gl/7y4SX)
795
+ bot:
796
+ name: 'Googlebot'
797
+ category: 'Search bot'
798
+ url: 'http://www.google.com/bot.html'
799
+ producer:
800
+ name: 'Google Inc.'
801
+ url: 'http://www.google.com'
802
+ -
803
+ user_agent: Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko; Google Web Preview) Chrome/27.0.1453 Safari/537.36
804
+ bot:
805
+ name: 'Googlebot'
806
+ category: 'Search bot'
807
+ url: 'http://www.google.com/bot.html'
808
+ producer:
809
+ name: 'Google Inc.'
810
+ url: 'http://www.google.com'
811
+ -
812
+ user_agent: AdsBot-Google-Mobile (+http://www.google.com/mobile/adsbot.html) Mozilla (iPhone; U; CPU iPhone OS 3 0 like Mac OS X) AppleWebKit (KHTML, like Gecko) Mobile Safari
813
+ bot:
814
+ name: 'Googlebot'
815
+ category: 'Search bot'
816
+ url: 'http://www.google.com/bot.html'
817
+ producer:
818
+ name: 'Google Inc.'
819
+ url: 'http://www.google.com'
820
+ -
821
+ user_agent: AdsBot-Google (+http://www.google.com/adsbot.html)
822
+ bot:
823
+ name: 'Googlebot'
824
+ category: 'Search bot'
825
+ url: 'http://www.google.com/bot.html'
826
+ producer:
827
+ name: 'Google Inc.'
828
+ url: 'http://www.google.com'
829
+ -
830
+ user_agent: Mediapartners-Google
831
+ bot:
832
+ name: 'Googlebot'
833
+ category: 'Search bot'
834
+ url: 'http://www.google.com/bot.html'
835
+ producer:
836
+ name: 'Google Inc.'
837
+ url: 'http://www.google.com'
838
+ -
839
+ user_agent: Mozilla/5.0 (compatible; heritrix/1.14.4 +http://www.dla-marbach.de)
840
+ bot:
841
+ name: 'Heritrix'
842
+ category: 'Crawler'
843
+ url: 'https://webarchive.jira.com/wiki/display/Heritrix/Heritrix'
844
+ producer:
845
+ name: 'The Internet Archive'
846
+ url: 'http://www.archive.org'
847
+ -
848
+ user_agent: Mozilla/5.0 (compatible; worio bot heritrix/1.10.0 +http://worio.com)
849
+ bot:
850
+ name: 'Heritrix'
851
+ category: 'Crawler'
852
+ url: 'https://webarchive.jira.com/wiki/display/Heritrix/Heritrix'
853
+ producer:
854
+ name: 'The Internet Archive'
855
+ url: 'http://www.archive.org'
856
+ -
857
+ user_agent: Mozilla/5.0 (compatible; heritrix/3.1.1 +http://www.baidu.com)
858
+ bot:
859
+ name: 'Heritrix'
860
+ category: 'Crawler'
861
+ url: 'https://webarchive.jira.com/wiki/display/Heritrix/Heritrix'
862
+ producer:
863
+ name: 'The Internet Archive'
864
+ url: 'http://www.archive.org'
865
+ -
866
+ user_agent: flieder - neofonie heritrix/1.14.3 (+http://spider.neofonie.de)
867
+ bot:
868
+ name: 'Heritrix'
869
+ category: 'Crawler'
870
+ url: 'https://webarchive.jira.com/wiki/display/Heritrix/Heritrix'
871
+ producer:
872
+ name: 'The Internet Archive'
873
+ url: 'http://www.archive.org'
874
+ -
875
+ user_agent: mozilla/5.0 (compatible; heritrix/1.3.0 http://archive.crawler.org)
876
+ bot:
877
+ name: 'Heritrix'
878
+ category: 'Crawler'
879
+ url: 'https://webarchive.jira.com/wiki/display/Heritrix/Heritrix'
880
+ producer:
881
+ name: 'The Internet Archive'
882
+ url: 'http://www.archive.org'
883
+ -
884
+ user_agent: Mozilla/5.0 (compatible; heritrix/3.1.2-SNAPSHOT-20130207.001528 +http://webarchiv.cz/kontakty/)
885
+ bot:
886
+ name: 'Heritrix'
887
+ category: 'Crawler'
888
+ url: 'https://webarchive.jira.com/wiki/display/Heritrix/Heritrix'
889
+ producer:
890
+ name: 'The Internet Archive'
891
+ url: 'http://www.archive.org'
892
+ -
893
+ user_agent: Mozilla/5.0 (compatible; heritrix/1.14.4 +http://webarhive.nlc.gov.cn)
894
+ bot:
895
+ name: 'Heritrix'
896
+ category: 'Crawler'
897
+ url: 'https://webarchive.jira.com/wiki/display/Heritrix/Heritrix'
898
+ producer:
899
+ name: 'The Internet Archive'
900
+ url: 'http://www.archive.org'
901
+ -
902
+ user_agent: Mozilla/5.0 (compatible; heritrix/3.1.1 +http://www.run4dom.com)
903
+ bot:
904
+ name: 'Heritrix'
905
+ category: 'Crawler'
906
+ url: 'https://webarchive.jira.com/wiki/display/Heritrix/Heritrix'
907
+ producer:
908
+ name: 'The Internet Archive'
909
+ url: 'http://www.archive.org'
910
+ -
911
+ user_agent: HTTPMon/1.0b (http://www.httpmon.com)
912
+ bot:
913
+ name: 'HTTPMon'
914
+ category: 'Site Monitor'
915
+ url: 'http://www.httpmon.com'
916
+ producer:
917
+ name: 'towards GmbH'
918
+ url: 'http://www.towards.ch/'
919
+ -
920
+ user_agent: iisbot/1.0 (+http://www.iis.net/iisbot.html)
921
+ bot:
922
+ name: 'IIS Site Analysis'
923
+ category: 'crawler'
924
+ url: 'http://www.iis.net/iisbot.html'
925
+ producer:
926
+ name: 'Microsoft Corporation'
927
+ url: 'http://www.microsoft.com'
928
+ -
929
+ user_agent: kouio.com RSS reader
930
+ bot:
931
+ name: 'Kouio'
932
+ url: 'http://kouio.com/'
933
+ category: 'Feed Fetcher'
934
+ producer:
935
+ name: ''
936
+ url: ''
937
+ -
938
+ user_agent: kouio.com RSS reader - 6 subscribers
939
+ bot:
940
+ name: 'Kouio'
941
+ url: 'http://kouio.com/'
942
+ category: 'Feed Fetcher'
943
+ producer:
944
+ name: ''
945
+ url: ''
946
+ -
947
+ user_agent: Mozilla/5.0 (iPhone; U; CPU iPhone OS 4_1 like Mac OS X; en-us) AppleWebKit/532.9 (KHTML, like Gecko) Version/4.0.5 Mobile/8B117 Safari/6531.22.7 (compatible; linkdexbot-mobile/2.1; +http://www.linkdex.com/about/bots/)
948
+ bot:
949
+ name: 'Linkdex Bot'
950
+ category: 'Search bot'
951
+ url: 'http://www.linkdex.com/bots'
952
+ producer:
953
+ name: 'Mojeek Ltd.'
954
+ url: 'http://www.mojeek.com'
955
+ -
956
+ user_agent: Mozilla/5.0 (compatible; linkdexbot/2.0; +http://www.linkdex.com/about/bots/)
957
+ bot:
958
+ name: 'Linkdex Bot'
959
+ category: 'Search bot'
960
+ url: 'http://www.linkdex.com/bots'
961
+ producer:
962
+ name: 'Mojeek Ltd.'
963
+ url: 'http://www.mojeek.com'
964
+ -
965
+ user_agent: linkdex.com/v2.0 and linkdex.com/v2.1
966
+ bot:
967
+ name: 'Linkdex Bot'
968
+ category: 'Search bot'
969
+ url: 'http://www.linkdex.com/bots'
970
+ producer:
971
+ name: 'Mojeek Ltd.'
972
+ url: 'http://www.mojeek.com'
973
+ -
974
+ user_agent: LinkedInBot/1.0 (compatible; Mozilla/5.0; Jakarta Commons-HttpClient/3.1 +http://www.linkedin.com)
975
+ bot:
976
+ name: 'LinkedIn Bot'
977
+ category: 'Social Media Agent'
978
+ url: 'http://www.linkedin.com'
979
+ producer:
980
+ name: 'LinkedIn'
981
+ url: 'http://www.linkedin.com'
982
+ -
983
+ user_agent: Mozilla/5.0 (compatible; Linux x86_64; Mail.RU_Bot/2.0; +http://go.mail.ru/help/robots)
984
+ bot:
985
+ name: 'Mail.Ru Bot'
986
+ category: 'Search bot'
987
+ url: 'http://help.mail.ru/webmaster/indexing/robots/types_robots'
988
+ producer:
989
+ name: 'Mail.Ru Group'
990
+ url: 'http://corp.mail.ru'
991
+ -
992
+ user_agent: Mozilla/5.0 (compatible; Linux x86_64; Mail.RU_Bot/Fast/2.0; +http://go.mail.ru/help/robots)
993
+ bot:
994
+ name: 'Mail.Ru Bot'
995
+ category: 'Search bot'
996
+ url: 'http://help.mail.ru/webmaster/indexing/robots/types_robots'
997
+ producer:
998
+ name: 'Mail.Ru Group'
999
+ url: 'http://corp.mail.ru'
1000
+ -
1001
+ user_agent: magpie-crawler/1.1 (U; Linux amd64; en-GB; +http://www.brandwatch.net)
1002
+ bot:
1003
+ name: 'Magpie-Crawler'
1004
+ category: 'Social Media Agent'
1005
+ url: 'http://www.brandwatch.com/magpie-crawler/'
1006
+ producer:
1007
+ name: 'Brandwatch'
1008
+ url: 'http://www.brandwatch.com'
1009
+ -
1010
+ user_agent: MagpieRSS/0.72 (+http://magpierss.sf.net)
1011
+ bot:
1012
+ name: 'MagpieRSS'
1013
+ url: 'http://magpierss.sourceforge.net/'
1014
+ category: 'Feed Parser'
1015
+ producer:
1016
+ name: ''
1017
+ url: ''
1018
+ -
1019
+ user_agent: Mozilla/5.0 (compatible; meanpathbot/1.0; +http://www.meanpath.com/meanpathbot.html)
1020
+ bot:
1021
+ name: 'Meanpath Bot'
1022
+ category: 'Search bot'
1023
+ url: 'http://www.meanpath.com/meanpathbot.html'
1024
+ producer:
1025
+ name: 'Meanpath'
1026
+ url: 'http://www.meanpath.com'
1027
+ -
1028
+ user_agent: Mozilla/5.0 (compatible; MixrankBot; crawler@mixrank.com)
1029
+ bot:
1030
+ name: 'Mixrank Bot'
1031
+ category: 'Crawler'
1032
+ url: 'http://mixrank.com'
1033
+ producer:
1034
+ name: 'Online Media Group, Inc.'
1035
+ url: ''
1036
+ -
1037
+ user_agent: Mozilla/5.0 (compatible; MJ12bot/v1.4.4; http://www.majestic12.co.uk/bot.php?+)
1038
+ bot:
1039
+ name: 'MJ12 Bot'
1040
+ category: 'Search bot'
1041
+ url: 'http://majestic12.co.uk/bot.php'
1042
+ producer:
1043
+ name: 'Majestic-12'
1044
+ url: 'http://majestic12.co.uk'
1045
+ -
1046
+ user_agent: Mozilla/5.0 (compatible; MojeekBot/0.6; http://www.mojeek.com/bot.html)
1047
+ bot:
1048
+ name: 'MojeekBot'
1049
+ category: 'Search bot'
1050
+ url: 'http://www.mojeek.com/bot.html'
1051
+ producer:
1052
+ name: 'Mojeek Ltd.'
1053
+ url: 'http://www.mojeek.com'
1054
+ -
1055
+ user_agent: NalezenCzBot/1.0 (http://www.nalezen.cz/about-crawler)
1056
+ bot:
1057
+ name: 'NalezenCzBot'
1058
+ category: 'Crawler'
1059
+ url: 'http://www.nalezen.cz/about-crawler'
1060
+ producer:
1061
+ name: 'Jaroslav Kuboš'
1062
+ url: ''
1063
+ -
1064
+ user_agent: Mozilla/4.0 (compatible; Netcraft Web Server Survey)
1065
+ bot:
1066
+ name: 'Netcraft Survey Bot'
1067
+ category: 'Search bot'
1068
+ url: ''
1069
+ producer:
1070
+ name: 'Netcraft'
1071
+ url: 'http://www.netcraft.com'
1072
+ -
1073
+ user_agent: Netvibes (http://www.netvibes.com)
1074
+ bot:
1075
+ name: 'Netvibes'
1076
+ url: 'http://www.netvibes.com/'
1077
+ category: 'Feed Fetcher'
1078
+ producer:
1079
+ name: ''
1080
+ url: ''
1081
+ -
1082
+ user_agent: 'Netvibes (http://www.netvibes.com/; 8 subscribers; feedID: 2244192)'
1083
+ bot:
1084
+ name: 'Netvibes'
1085
+ url: 'http://www.netvibes.com/'
1086
+ category: 'Feed Fetcher'
1087
+ producer:
1088
+ name: ''
1089
+ url: ''
1090
+ -
1091
+ user_agent: NewsBlur Feed Fetcher - 7 subscribers - http://www.newsblur.com/site/1948420/analytics-piwik (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)
1092
+ bot:
1093
+ name: 'NewsBlur'
1094
+ url: 'http://www.newsblur.com'
1095
+ category: 'Feed Fetcher'
1096
+ producer:
1097
+ name: ''
1098
+ url: ''
1099
+ -
1100
+ user_agent: NewsBlur Feed Finder (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)
1101
+ bot:
1102
+ name: 'NewsBlur'
1103
+ url: 'http://www.newsblur.com'
1104
+ category: 'Feed Fetcher'
1105
+ producer:
1106
+ name: ''
1107
+ url: ''
1108
+ -
1109
+ user_agent: NewsBlur Page Fetcher - 7 subscribers - http://www.newsblur.com/site/3966817/analytics-piwik (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)
1110
+ bot:
1111
+ name: 'NewsBlur'
1112
+ url: 'http://www.newsblur.com'
1113
+ category: 'Feed Fetcher'
1114
+ producer:
1115
+ name: ''
1116
+ url: ''
1117
+ -
1118
+ user_agent: NewsBlur Favicon Fetcher - 7 subscribers - http://www.newsblur.com/site/1948420/analytics-piwik (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)
1119
+ bot:
1120
+ name: 'NewsBlur'
1121
+ url: 'http://www.newsblur.com'
1122
+ category: 'Feed Fetcher'
1123
+ producer:
1124
+ name: ''
1125
+ url: ''
1126
+ -
1127
+ user_agent: NewsGatorOnline/2.0 (http://www.newsgator.com; 2 subscribers)
1128
+ bot:
1129
+ name: NewsGator
1130
+ url: 'http://www.newsgator.com'
1131
+ category: 'Feed Fetcher'
1132
+ producer:
1133
+ name: ''
1134
+ url: ''
1135
+ -
1136
+ user_agent: nlcrawler/1.0 (+http://northernlight.com/)
1137
+ bot:
1138
+ name: 'NLCrawler'
1139
+ category: 'Crawler'
1140
+ url: ''
1141
+ producer:
1142
+ name: 'Northern Light'
1143
+ url: 'http://northernlight.com'
1144
+ -
1145
+ user_agent: omgilibot/0.3 +http://www.omgili.com/Crawler.html
1146
+ bot:
1147
+ name: 'Omgili bot'
1148
+ category: 'Search bot'
1149
+ url: 'http://www.omgili.com/Crawler.html'
1150
+ producer:
1151
+ name: 'Omgili'
1152
+ url: 'http://www.omgili.com'
1153
+ -
1154
+ user_agent: Mozilla/5.0 (compatible; OpenindexSpider; +http://www.openindex.io/en/webmasters/spider.html)
1155
+ bot:
1156
+ name: 'Openindex Spider'
1157
+ category: 'Search bot'
1158
+ url: 'http://www.openindex.io/en/webmasters/spider.html'
1159
+ producer:
1160
+ name: 'Openindex B.V.'
1161
+ url: 'http://www.openindex.io'
1162
+ -
1163
+ user_agent: Mozilla/5.0 (compatible; spbot/4.0.9; +http://OpenLinkProfiler.org/bot )
1164
+ bot:
1165
+ name: 'OpenLinkProfiler'
1166
+ category: 'Crawler'
1167
+ url: 'http://openlinkprofiler.org/bot'
1168
+ producer:
1169
+ name: 'Axandra GmbH'
1170
+ url: 'http://www.axandra.com'
1171
+ -
1172
+ user_agent: OpenWebSpider v0.1.4 (http://www.openwebspider.org/)
1173
+ bot:
1174
+ name: 'OpenWebSpider'
1175
+ category: 'Crawler'
1176
+ url: 'http://www.openwebspider.org'
1177
+ producer:
1178
+ name: 'OpenWebSpider Lab'
1179
+ url: 'http://lab.openwebspider.org'
1180
+ -
1181
+ user_agent: Mozilla/5.0 (compatible; PaperLiBot/2.1; http://support.paper.li/entries/20023257-what-is-paper-li)
1182
+ bot:
1183
+ name: 'PaperLiBot'
1184
+ category: 'Search bot'
1185
+ url: 'http://support.paper.li/entries/20023257-what-is-paper-li'
1186
+ producer:
1187
+ name: 'Smallrivers SA'
1188
+ url: 'http://www.paper.li'
1189
+ -
1190
+ user_agent: psbot/0.1 (+http://www.picsearch.com/bot.html)
1191
+ bot:
1192
+ name: 'Picsearch bot'
1193
+ category: 'Search bot'
1194
+ url: 'http://www.picsearch.com/bot.html'
1195
+ producer:
1196
+ name: 'Picsearch'
1197
+ url: 'http://www.picsearch.com'
1198
+ -
1199
+ user_agent: psbot-page (+http://www.picsearch.com/bot.html)
1200
+ bot:
1201
+ name: 'Picsearch bot'
1202
+ category: 'Search bot'
1203
+ url: 'http://www.picsearch.com/bot.html'
1204
+ producer:
1205
+ name: 'Picsearch'
1206
+ url: 'http://www.picsearch.com'
1207
+ -
1208
+ user_agent: Pingdom.com_bot_version_1.4_(http://www.pingdom.com/)
1209
+ bot:
1210
+ name: 'Pingdom Bot'
1211
+ category: 'Site Monitors'
1212
+ url: ''
1213
+ producer:
1214
+ name: 'Pingdom AB'
1215
+ url: 'https://www.pingdom.com'
1216
+ -
1217
+ user_agent: QuerySeekerSpider ( http://queryseeker.com/bot.html )
1218
+ bot:
1219
+ name: 'QuerySeekerSpider'
1220
+ category: 'Crawler'
1221
+ url: 'http://queryseeker.com/bot.html'
1222
+ producer:
1223
+ name: 'QueryEye Inc.'
1224
+ url: 'http://queryeye.com'
1225
+ -
1226
+ user_agent: Mozilla/5.0 (compatible; redditbot/1.0; +http://www.reddit.com/feedback)
1227
+ bot:
1228
+ name: 'Reddit Bot'
1229
+ category: 'Social Media Agent'
1230
+ url: 'http://www.reddit.com/feedback'
1231
+ producer:
1232
+ name: 'reddit inc.'
1233
+ url: 'http://www.reddit.com'
1234
+ -
1235
+ user_agent: Mozilla/5.0 (compatible; rogerBot/1.0; UrlCrawler; http://www.seomoz.org/dp/rogerbot)
1236
+ bot:
1237
+ name: 'Rogerbot'
1238
+ category: 'Crawler'
1239
+ url: 'http://moz.com/help/pro/what-is-rogerbot-'
1240
+ producer:
1241
+ name: 'SEOmoz, Inc.'
1242
+ url: 'http://moz.com/'
1243
+ -
1244
+ user_agent: rogerbot/1.0 (http://moz.com/help/pro/what-is-rogerbot-, rogerbot-crawler+shiny@moz.com)
1245
+ bot:
1246
+ name: 'Rogerbot'
1247
+ category: 'Crawler'
1248
+ url: 'http://moz.com/help/pro/what-is-rogerbot-'
1249
+ producer:
1250
+ name: 'SEOmoz, Inc.'
1251
+ url: 'http://moz.com/'
1252
+ -
1253
+ user_agent: rogerbot/1.0 (http://www.moz.com/dp/rogerbot, rogerbot-crawler@moz.com)
1254
+ bot:
1255
+ name: 'Rogerbot'
1256
+ category: 'Crawler'
1257
+ url: 'http://moz.com/help/pro/what-is-rogerbot-'
1258
+ producer:
1259
+ name: 'SEOmoz, Inc.'
1260
+ url: 'http://moz.com/'
1261
+ -
1262
+ user_agent: Screaming Frog SEO Spider/2.22
1263
+ bot:
1264
+ name: 'Screaming Frog SEO Spider'
1265
+ category: 'Crawler'
1266
+ url: 'http://www.screamingfrog.co.uk/seo-spider'
1267
+ producer:
1268
+ name: 'Screaming Frog Ltd'
1269
+ url: 'http://www.screamingfrog.co.uk'
1270
+ -
1271
+ user_agent: ScreenerBot Crawler Beta 2.0 (+http://www.ScreenerBot.com)
1272
+ bot:
1273
+ name: 'ScreenerBot'
1274
+ category: 'Crawler'
1275
+ url: 'http://www.screenerbot.com'
1276
+ producer:
1277
+ name: ''
1278
+ url: ''
1279
+ -
1280
+ user_agent: Mozilla/5.0 (compatible; SemrushBot/0.97; +http://www.semrush.com/bot.html)
1281
+ bot:
1282
+ name: 'Semrush Bot'
1283
+ category: 'Crawler'
1284
+ url: 'http://www.semrush.com/bot.html'
1285
+ producer:
1286
+ name: 'SEMrush'
1287
+ url: 'http://www.semrush.com'
1288
+ -
1289
+ user_agent: SensikaBot/x.33 (+http://sensika.com)
1290
+ bot:
1291
+ name: 'Sensika Bot'
1292
+ category: ''
1293
+ url: ''
1294
+ producer:
1295
+ name: 'Sensika'
1296
+ url: 'http://sensika.com'
1297
+ -
1298
+ user_agent: SEOENGWorldBot/1.0 (+http://www.seoengine.com/seoengbot.htm)
1299
+ bot:
1300
+ name: 'SEOENGBot'
1301
+ category: 'Crawler'
1302
+ url: 'http://www.seoengine.com/seoengbot.htm'
1303
+ producer:
1304
+ name: 'SEO Engine'
1305
+ url: 'http://www.seoengine.com'
1306
+ -
1307
+ user_agent: Mozilla/5.0 (compatible; SeznamBot/3.1-test1; +http://fulltext.sblog.cz/)
1308
+ bot:
1309
+ name: 'Seznam Bot'
1310
+ category: 'Search bot'
1311
+ url: 'http://www.mapy.cz/cz/seznambot.html'
1312
+ producer:
1313
+ name: 'Seznam.cz, a.s.'
1314
+ url: 'http://www.seznam.cz/'
1315
+ -
1316
+ user_agent: Mozilla/5.0 (compatible; SeznamBot/3.2-test1; +http://fulltext.sblog.cz/)
1317
+ bot:
1318
+ name: 'Seznam Bot'
1319
+ category: 'Search bot'
1320
+ url: 'http://www.mapy.cz/cz/seznambot.html'
1321
+ producer:
1322
+ name: 'Seznam.cz, a.s.'
1323
+ url: 'http://www.seznam.cz/'
1324
+ -
1325
+ user_agent: SeznamBot/3.0 (+http://fulltext.sblog.cz/)
1326
+ bot:
1327
+ name: 'Seznam Bot'
1328
+ category: 'Search bot'
1329
+ url: 'http://www.mapy.cz/cz/seznambot.html'
1330
+ producer:
1331
+ name: 'Seznam.cz, a.s.'
1332
+ url: 'http://www.seznam.cz/'
1333
+ -
1334
+ user_agent: Mozilla/5.0 (compatible; SeznamBot/3.2; +http://fulltext.sblog.cz/)
1335
+ bot:
1336
+ name: 'Seznam Bot'
1337
+ category: 'Search bot'
1338
+ url: 'http://www.mapy.cz/cz/seznambot.html'
1339
+ producer:
1340
+ name: 'Seznam.cz, a.s.'
1341
+ url: 'http://www.seznam.cz/'
1342
+ -
1343
+ user_agent: ShopWiki/1.0 ( +http://www.shopwiki.com/wiki/Help:Bot)
1344
+ bot:
1345
+ name: 'ShopWiki'
1346
+ category: 'Search tools'
1347
+ url: 'http://www.shopwiki.com/wiki/Help:Bot'
1348
+ producer:
1349
+ name: 'ShopWiki Corp.'
1350
+ url: 'http://www.shopwiki.com'
1351
+ -
1352
+ user_agent: SilverReader/1.0; http://silverreader.com
1353
+ bot:
1354
+ name: 'SilverReader'
1355
+ url: 'http://silverreader.com'
1356
+ category: 'Feed Fetcher'
1357
+ producer:
1358
+ name: ''
1359
+ url: ''
1360
+ -
1361
+ user_agent: SimplePie/1.3.1 (Feed Parser; http://simplepie.org; Allow like Gecko) Build/20121030175911
1362
+ bot:
1363
+ name: 'SimplePie'
1364
+ url: 'http://www.simplepie.org'
1365
+ category: 'Feed Parser'
1366
+ producer:
1367
+ name: ''
1368
+ url: ''
1369
+ -
1370
+ user_agent: freshrss/0.8-dev (Linux; http://freshrss.org) SimplePie/1.4-dev-FreshRSS
1371
+ bot:
1372
+ name: 'SimplePie'
1373
+ url: 'http://www.simplepie.org'
1374
+ category: 'Feed Parser'
1375
+ producer:
1376
+ name: ''
1377
+ url: ''
1378
+ -
1379
+ user_agent: SimplePie/1.2.1-dev (Feed Parser; http://simplepie.org; Allow like Gecko) Build/20130514092120
1380
+ bot:
1381
+ name: 'SimplePie'
1382
+ url: 'http://www.simplepie.org'
1383
+ category: 'Feed Parser'
1384
+ producer:
1385
+ name: ''
1386
+ url: ''
1387
+ -
1388
+ user_agent: Mozilla/5.0 (compatible; SISTRIX Crawler; http://crawler.sistrix.net/)
1389
+ bot:
1390
+ name: 'SISTRIX Crawler'
1391
+ category: 'Crawler'
1392
+ url: 'http://crawler.sistrix.net'
1393
+ producer:
1394
+ name: 'SISTRIX GmbH'
1395
+ url: 'http://www.sistrix.de'
1396
+ -
1397
+ user_agent: Sogou web spider/4.0(+http://www.sogou.com/docs/help/webmasters.htm#07)
1398
+ bot:
1399
+ name: 'Sogou Spider'
1400
+ category: 'Search bot'
1401
+ url: 'http://www.sogou.com/docs/help/webmasters.htm'
1402
+ producer:
1403
+ name: 'Sohu, Inc.'
1404
+ url: 'http://www.sogou.com'
1405
+ -
1406
+ user_agent: Sogou inst spider/4.0(+http://www.sogou.com/docs/help/webmasters.htm#07)
1407
+ bot:
1408
+ name: 'Sogou Spider'
1409
+ category: 'Search bot'
1410
+ url: 'http://www.sogou.com/docs/help/webmasters.htm'
1411
+ producer:
1412
+ name: 'Sohu, Inc.'
1413
+ url: 'http://www.sogou.com'
1414
+ -
1415
+ user_agent: Sogou Pic Spider/3.0(+http://www.sogou.com/docs/help/webmasters.htm#07)
1416
+ bot:
1417
+ name: 'Sogou Spider'
1418
+ category: 'Search bot'
1419
+ url: 'http://www.sogou.com/docs/help/webmasters.htm'
1420
+ producer:
1421
+ name: 'Sohu, Inc.'
1422
+ url: 'http://www.sogou.com'
1423
+ -
1424
+ user_agent: New-Sogou-Spider/1.0 (compatible; MSIE 5.5; Windows 98)
1425
+ bot:
1426
+ name: 'Sogou Spider'
1427
+ category: 'Search bot'
1428
+ url: 'http://www.sogou.com/docs/help/webmasters.htm'
1429
+ producer:
1430
+ name: 'Sohu, Inc.'
1431
+ url: 'http://www.sogou.com'
1432
+ -
1433
+ user_agent: Sosospider+(+http://help.soso.com/webspider.htm)
1434
+ bot:
1435
+ name: 'Soso Spider'
1436
+ category: 'Search bot'
1437
+ url: 'http://help.soso.com/webspider.htm'
1438
+ producer:
1439
+ name: 'Tencent Holdings'
1440
+ url: 'http://www.soso.com'
1441
+ -
1442
+ user_agent: 'Superfeedr bot/2.0 http://superfeedr.com - Make your feeds realtime: get in touch!'
1443
+ bot:
1444
+ name: 'Superfeedr Bot'
1445
+ category: 'Feed Fetcher'
1446
+ url: ''
1447
+ producer:
1448
+ name: 'Superfeedr'
1449
+ url: 'https://superfeedr.com/'
1450
+ -
1451
+ user_agent: Mozilla/5.0 (X11; U; Linux x86_64; en-US; rv:1.9.0.19; aggregator:Spinn3r (Spinn3r 3.1); http://spinn3r.com/robot) Gecko/2010040121 Firefox/3.0.19
1452
+ bot:
1453
+ name: 'Spinn3r'
1454
+ category: 'Crawler'
1455
+ url: 'http://spinn3r.com/robot'
1456
+ producer:
1457
+ name: 'Tailrank Inc'
1458
+ url: 'http://spinn3r.com'
1459
+ -
1460
+ user_agent: Mozilla/5.0 (compatible; SputnikBot/2.2)
1461
+ bot:
1462
+ name: 'Sputnik Bot'
1463
+ category: ''
1464
+ url: ''
1465
+ producer:
1466
+ name: ''
1467
+ url: ''
1468
+ -
1469
+ user_agent: Mozilla/5.0 (compatible; SputnikImageBot/2.2)
1470
+ bot:
1471
+ name: 'Sputnik Bot'
1472
+ category: ''
1473
+ url: ''
1474
+ producer:
1475
+ name: ''
1476
+ url: ''
1477
+ -
1478
+ user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1; en; rv:1.9.0.13) Gecko/2009073022 Firefox/3.5.2 (.NET CLR 3.5.30729) SurveyBot/2.3 (DomainTools)
1479
+ bot:
1480
+ name: 'Survey Bot'
1481
+ category: 'Search bot'
1482
+ url: 'http://www.domaintools.com/webmasters/surveybot.php'
1483
+ producer:
1484
+ name: 'Domain Tools'
1485
+ url: 'http://www.domaintools.com'
1486
+ -
1487
+ user_agent: TinEye-bot/0.02 (see http://www.tineye.com/crawler.html)
1488
+ bot:
1489
+ name: 'TinEye Crawler'
1490
+ category: 'Search bot'
1491
+ url: 'http://www.tineye.com/crawler.html'
1492
+ producer:
1493
+ name: 'Idée Inc.'
1494
+ url: 'http://ideeinc.com'
1495
+ -
1496
+ user_agent: 'Tiny Tiny RSS/1.10 (http://tt-rss.org/)'
1497
+ bot:
1498
+ name: 'Tiny Tiny RSS'
1499
+ url: 'http://tt-rss.org'
1500
+ category: 'Feed Fetcher'
1501
+ producer:
1502
+ name: ''
1503
+ url: ''
1504
+ -
1505
+ user_agent: 'Tiny Tiny RSS/1.11.4c63934 (http://tt-rss.org/)'
1506
+ bot:
1507
+ name: 'Tiny Tiny RSS'
1508
+ url: 'http://tt-rss.org'
1509
+ category: 'Feed Fetcher'
1510
+ producer:
1511
+ name: ''
1512
+ url: ''
1513
+ -
1514
+ user_agent: TurnitinBot/3.0 (http://www.turnitin.com/robot/crawlerinfo.html)
1515
+ bot:
1516
+ name: 'TurnitinBot'
1517
+ category: 'Crawler'
1518
+ url: 'http://www.turnitin.com/robot/crawlerinfo.html'
1519
+ producer:
1520
+ name: 'iParadigms, LLC.'
1521
+ url: 'http://www.turnitin.com'
1522
+ -
1523
+ user_agent: TweetedTimes Bot/1.0 (Mozilla/5.0 Compatible, +http://tweetedtimes.com)
1524
+ bot:
1525
+ name: 'TweetedTimes Bot'
1526
+ category: 'Crawler'
1527
+ url: 'http://tweetedtimes.com'
1528
+ producer:
1529
+ name: 'TweetedTimes'
1530
+ url: 'http://tweetedtimes.com/'
1531
+ -
1532
+ user_agent: Mozilla/5.0 (compatible; TweetedTimes Bot/1.0; +http://tweetedtimes.com)
1533
+ bot:
1534
+ name: 'TweetedTimes Bot'
1535
+ category: 'Crawler'
1536
+ url: 'http://tweetedtimes.com'
1537
+ producer:
1538
+ name: 'TweetedTimes'
1539
+ url: 'http://tweetedtimes.com/'
1540
+ -
1541
+ user_agent: Mozilla/5.0 (compatible; TweetmemeBot/3.0; +http://tweetmeme.com/)
1542
+ bot:
1543
+ name: 'Tweetmeme Bot'
1544
+ category: 'Crawler'
1545
+ url: 'http://tweetmeme.com/'
1546
+ producer:
1547
+ name: 'Mediasift'
1548
+ url: ''
1549
+ -
1550
+ user_agent: Twitterbot/1.0
1551
+ bot:
1552
+ name: 'Twitterbot'
1553
+ category: 'Social Media Agent'
1554
+ url: 'https://dev.twitter.com/docs/cards/getting-started'
1555
+ producer:
1556
+ name: 'Twitter'
1557
+ url: 'http://www.twitter.com'
1558
+ -
1559
+ user_agent: Mozilla/5.0+(compatible; UptimeRobot/2.0; http://www.uptimerobot.com/)
1560
+ bot:
1561
+ name: 'Uptime Robot'
1562
+ category: 'Site Monitor'
1563
+ url: ''
1564
+ producer:
1565
+ name: 'Uptime Robot'
1566
+ url: 'http://uptimerobot.com'
1567
+ -
1568
+ user_agent: Mozilla/5.0 (compatible; URLAppendBot/1.0; +http://www.profound.net/urlappendbot.html)
1569
+ bot:
1570
+ name: 'URLAppendBot'
1571
+ category: 'Crawler'
1572
+ url: 'http://www.profound.net/urlappendbot.html'
1573
+ producer:
1574
+ name: 'Profound Networks'
1575
+ url: 'http://www.profound.net'
1576
+ -
1577
+ user_agent: Mozilla/5.0 (compatible; VSMCrawler; http://www.visualsitemapper.com/crawler/)
1578
+ bot:
1579
+ name: 'Visual Site Mapper Crawler'
1580
+ category: 'Crawler'
1581
+ url: 'http://www.visualsitemapper.com/crawler'
1582
+ producer:
1583
+ name: 'Alentum Software Ltd.'
1584
+ url: 'http://www.alentum.com'
1585
+ -
1586
+ user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1;fr;rv:1.8.1) VoilaBotCollector BETA 0.1 (http://www.voila.com/)
1587
+ bot:
1588
+ name: 'Voila Bot'
1589
+ category: 'Search bot'
1590
+ url: 'http://www.voila.fr'
1591
+ producer:
1592
+ name: ''
1593
+ url: ''
1594
+ -
1595
+ user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1; fr; rv:1.8.1) VoilaBot BETA 1.2 (support.voilabot@orange-ftgroup.com)
1596
+ bot:
1597
+ name: 'Voila Bot'
1598
+ category: 'Search bot'
1599
+ url: 'http://www.voila.fr'
1600
+ producer:
1601
+ name: ''
1602
+ url: ''
1603
+ -
1604
+ user_agent: Jigsaw/2.3.0 W3C_CSS_Validator_JFouffa/2.0 (See <http://validator.w3.org/services>)
1605
+ bot:
1606
+ name: 'W3C CSS Validator'
1607
+ category: 'Validator'
1608
+ url: 'http://jigsaw.w3.org/css-validator'
1609
+ producer:
1610
+ name: 'W3C'
1611
+ url: 'http://www.w3.org'
1612
+ -
1613
+ user_agent: W3C_I18n-Checker/1.0 (http://validator.w3.org/services)
1614
+ bot:
1615
+ name: 'W3C I18N Checker'
1616
+ category: 'Validator'
1617
+ url: 'http://validator.w3.org/i18n-checker'
1618
+ producer:
1619
+ name: 'W3C'
1620
+ url: 'http://www.w3.org'
1621
+ -
1622
+ user_agent: W3C-checklink/4.0 [4.4] libwww-perl/5.803
1623
+ bot:
1624
+ name: 'W3C Link Checker'
1625
+ category: 'Validator'
1626
+ url: 'http://validator.w3.org/checklink'
1627
+ producer:
1628
+ name: 'W3C'
1629
+ url: 'http://www.w3.org'
1630
+ -
1631
+ user_agent: W3C-checklink/4.81 libwww-perl/5.836
1632
+ bot:
1633
+ name: 'W3C Link Checker'
1634
+ category: 'Validator'
1635
+ url: 'http://validator.w3.org/checklink'
1636
+ producer:
1637
+ name: 'W3C'
1638
+ url: 'http://www.w3.org'
1639
+ -
1640
+ user_agent: W3C_Validator/1.3 http://validator.w3.org/services
1641
+ bot:
1642
+ name: 'W3C Markup Validation Service'
1643
+ category: 'Validator'
1644
+ url: 'http://validator.w3.org/services'
1645
+ producer:
1646
+ name: 'W3C'
1647
+ url: 'http://www.w3.org'
1648
+ -
1649
+ user_agent: W3C_Validator/1.767
1650
+ bot:
1651
+ name: 'W3C Markup Validation Service'
1652
+ category: 'Validator'
1653
+ url: 'http://validator.w3.org/services'
1654
+ producer:
1655
+ name: 'W3C'
1656
+ url: 'http://www.w3.org'
1657
+ -
1658
+ user_agent: W3C-mobileOK/DDC-1.0 (see http://www.w3.org/2006/07/mobileok-ddc)
1659
+ bot:
1660
+ name: 'W3C MobileOK Checker'
1661
+ category: 'Validator'
1662
+ url: 'http://validator.w3.org/mobile'
1663
+ producer:
1664
+ name: 'W3C'
1665
+ url: 'http://www.w3.org'
1666
+ -
1667
+ user_agent: W3C_Unicorn/1.0 (http://validator.w3.org/services)
1668
+ bot:
1669
+ name: 'W3C Unified Validator'
1670
+ category: 'Validator'
1671
+ url: 'http://validator.w3.org/unicorn'
1672
+ producer:
1673
+ name: 'W3C'
1674
+ url: 'http://www.w3.org'
1675
+ -
1676
+ user_agent: WebbCrawler 1.0 ( http://badcheese.com/crawler.html )
1677
+ bot:
1678
+ name: 'WebbCrawler'
1679
+ category: 'Crawler'
1680
+ url: 'http://badcheese.com/crawler.html'
1681
+ producer:
1682
+ name: 'Steve Webb'
1683
+ url: 'http://badcheese.com'
1684
+ -
1685
+ user_agent: WeSEE:Search/0.1 (Alpha, http://www.wesee.com/en/support/bot/)
1686
+ bot:
1687
+ name: 'WeSEE:Search'
1688
+ category: 'Search bot'
1689
+ url: 'http://www.wesee.com/bot'
1690
+ producer:
1691
+ name: 'WeSEE Ltd'
1692
+ url: 'http://www.wesee.com'
1693
+ -
1694
+ user_agent: Wotbox/2.01 (+http://www.wotbox.com/bot/)
1695
+ bot:
1696
+ name: 'Wotbox'
1697
+ category: 'Search bot'
1698
+ url: 'http://www.wotbox.com/bot/'
1699
+ producer:
1700
+ name: 'Wotbox'
1701
+ url: 'http://www.wotbox.com'
1702
+ -
1703
+ user_agent: yacybot (freeworld/global; x86 Windows XP 5.1; java 1.7.0_21; GMT+04:00/ru) http://yacy.net/bot.html
1704
+ bot:
1705
+ name: 'YaCy'
1706
+ category: 'Search bot'
1707
+ url: 'http://yacy.net/bot.html'
1708
+ producer:
1709
+ name: 'YaCy'
1710
+ url: 'http://yacy.net'
1711
+ -
1712
+ user_agent: yacybot (freeworld/global; amd64 Linux 3.2.0-4-amd64; java 1.7.0_25; Europe/en) http://yacy.net/bot.html
1713
+ bot:
1714
+ name: 'YaCy'
1715
+ category: 'Search bot'
1716
+ url: 'http://yacy.net/bot.html'
1717
+ producer:
1718
+ name: 'YaCy'
1719
+ url: 'http://yacy.net'
1720
+ -
1721
+ user_agent: Mozilla/5.0 (compatible; Yahoo! Slurp/3.0; http://help.yahoo.com/help/us/ysearch/slurp) NOT Firefox/3.5
1722
+ bot:
1723
+ name: 'Yahoo! Slurp'
1724
+ category: 'Search bot'
1725
+ url: 'http://help.yahoo.com/ysearch/slurp'
1726
+ producer:
1727
+ name: 'Yahoo! Inc.'
1728
+ url: 'http://www.yahoo.com'
1729
+ -
1730
+ user_agent: Mozilla/5.0 (compatible; Yahoo! Slurp; http://help.yahoo.com/help/us/ysearch/slurp)
1731
+ bot:
1732
+ name: 'Yahoo! Slurp'
1733
+ category: 'Search bot'
1734
+ url: 'http://help.yahoo.com/ysearch/slurp'
1735
+ producer:
1736
+ name: 'Yahoo! Inc.'
1737
+ url: 'http://www.yahoo.com'
1738
+ -
1739
+ user_agent: Mozilla/5.0 (compatible; YandexImages/3.0; +http://yandex.com/bots)
1740
+ bot:
1741
+ name: 'Yandex Bot'
1742
+ category: 'Search bot'
1743
+ url: 'http://www.yandex.com/bots'
1744
+ producer:
1745
+ name: 'Yandex LLC'
1746
+ url: 'http://company.yandex.com'
1747
+ -
1748
+ user_agent: Mozilla/5.0 (compatible; YandexAntivirus/2.0; +http://yandex.com/bots)
1749
+ bot:
1750
+ name: 'Yandex Bot'
1751
+ category: 'Search bot'
1752
+ url: 'http://www.yandex.com/bots'
1753
+ producer:
1754
+ name: 'Yandex LLC'
1755
+ url: 'http://company.yandex.com'
1756
+ -
1757
+ user_agent: Mozilla/5.0 (compatible; YandexDirect/3.0; +http://yandex.com/bots)
1758
+ bot:
1759
+ name: 'Yandex Bot'
1760
+ category: 'Search bot'
1761
+ url: 'http://www.yandex.com/bots'
1762
+ producer:
1763
+ name: 'Yandex LLC'
1764
+ url: 'http://company.yandex.com'
1765
+ -
1766
+ user_agent: Mozilla/5.0 (compatible; YandexBot/3.0; +http://yandex.com/bots)
1767
+ bot:
1768
+ name: 'Yandex Bot'
1769
+ category: 'Search bot'
1770
+ url: 'http://www.yandex.com/bots'
1771
+ producer:
1772
+ name: 'Yandex LLC'
1773
+ url: 'http://company.yandex.com'
1774
+ -
1775
+ user_agent: Mozilla/5.0 (compatible; YandexBlogs/0.99; robot; B; +http://yandex.com/bots)
1776
+ bot:
1777
+ name: 'Yandex Bot'
1778
+ category: 'Search bot'
1779
+ url: 'http://www.yandex.com/bots'
1780
+ producer:
1781
+ name: 'Yandex LLC'
1782
+ url: 'http://company.yandex.com'
1783
+ -
1784
+ user_agent: Mozilla/5.0 (compatible; YandexMetrika/2.0; +http://yandex.com/bots)
1785
+ bot:
1786
+ name: 'Yandex Bot'
1787
+ category: 'Search bot'
1788
+ url: 'http://www.yandex.com/bots'
1789
+ producer:
1790
+ name: 'Yandex LLC'
1791
+ url: 'http://company.yandex.com'
1792
+ -
1793
+ user_agent: Mozilla/5.0 (compatible; YandexImageResizer/2.0; +http://yandex.com/bots)
1794
+ bot:
1795
+ name: 'Yandex Bot'
1796
+ category: 'Search bot'
1797
+ url: 'http://www.yandex.com/bots'
1798
+ producer:
1799
+ name: 'Yandex LLC'
1800
+ url: 'http://company.yandex.com'
1801
+ -
1802
+ user_agent: Mozilla/5.0 (compatible; YandexAntivirus/2.0; +http://yandex.com/bots)
1803
+ bot:
1804
+ name: 'Yandex Bot'
1805
+ category: 'Search bot'
1806
+ url: 'http://www.yandex.com/bots'
1807
+ producer:
1808
+ name: 'Yandex LLC'
1809
+ url: 'http://company.yandex.com'
1810
+ -
1811
+ user_agent: Mozilla/5.0 (compatible; YandexBlogs/0.99; robot; B; +http://yandex.com/bots)
1812
+ bot:
1813
+ name: 'Yandex Bot'
1814
+ category: 'Search bot'
1815
+ url: 'http://www.yandex.com/bots'
1816
+ producer:
1817
+ name: 'Yandex LLC'
1818
+ url: 'http://company.yandex.com'
1819
+ -
1820
+ user_agent: Mozilla/5.0 (compatible; YandexFavicons/1.0; +http://yandex.com/bots)
1821
+ bot:
1822
+ name: 'Yandex Bot'
1823
+ category: 'Search bot'
1824
+ url: 'http://www.yandex.com/bots'
1825
+ producer:
1826
+ name: 'Yandex LLC'
1827
+ url: 'http://company.yandex.com'
1828
+ -
1829
+ user_agent: Mozilla/5.0 (compatible; YandexNewslinks; +http://yandex.com/bots)
1830
+ bot:
1831
+ name: 'Yandex Bot'
1832
+ category: 'Search bot'
1833
+ url: 'http://www.yandex.com/bots'
1834
+ producer:
1835
+ name: 'Yandex LLC'
1836
+ url: 'http://company.yandex.com'
1837
+ -
1838
+ user_agent: Mozilla/5.0 (compatible; YandexNews/3.0; +http://yandex.com/bots)
1839
+ bot:
1840
+ name: 'Yandex Bot'
1841
+ category: 'Search bot'
1842
+ url: 'http://www.yandex.com/bots'
1843
+ producer:
1844
+ name: 'Yandex LLC'
1845
+ url: 'http://company.yandex.com'
1846
+ -
1847
+ user_agent: Mozilla/5.0 (compatible; Linux i686; Yandex.Gazeta Bot/1.0; +http://gazeta.yandex.ru)
1848
+ bot:
1849
+ name: 'Yandex Bot'
1850
+ category: 'Search bot'
1851
+ url: 'http://www.yandex.com/bots'
1852
+ producer:
1853
+ name: 'Yandex LLC'
1854
+ url: 'http://company.yandex.com'
1855
+ -
1856
+ user_agent: Yeti/1.1 (Naver Corp.; http://help.naver.com/robots/)
1857
+ bot:
1858
+ name: 'Yeti/Naverbot'
1859
+ category: 'Search bot'
1860
+ url: 'http://help.naver.com/robots/'
1861
+ producer:
1862
+ name: 'Naver'
1863
+ url: 'http://www.naver.com'
1864
+ -
1865
+ user_agent: Mozilla/5.0 (compatible; YoudaoBot/1.0; http://www.youdao.com/help/webmaster/spider/; )
1866
+ bot:
1867
+ name: 'Youdao Bot'
1868
+ category: 'Search bot'
1869
+ url: 'http://www.youdao.com/help/webmaster/spider'
1870
+ producer:
1871
+ name: 'NetEase, Inc.'
1872
+ url: 'http://corp.163.com'
1873
+ -
1874
+ user_agent: Mozilla/5.0 (compatible; YRSpider; +http://www.yunyun.com/SiteInfo.php?r=about)
1875
+ bot:
1876
+ name: 'Yunyun Bot'
1877
+ category: 'Search bot'
1878
+ url: 'http://www.yunyun.com/SiteInfo.php?r=about'
1879
+ producer:
1880
+ name: 'YunYun'
1881
+ url: 'http://www.yunyun.com'
1882
+ -
1883
+ user_agent: Mozilla/5.0 (compatible; YRSpider; +http://www.yunrang.com/yrspider.html)
1884
+ bot:
1885
+ name: 'Yunyun Bot'
1886
+ category: 'Search bot'
1887
+ url: 'http://www.yunyun.com/SiteInfo.php?r=about'
1888
+ producer:
1889
+ name: 'YunYun'
1890
+ url: 'http://www.yunyun.com'
1891
+ -
1892
+ user_agent: Mozilla/5.0 (compatible; YYSpider; +http://www.yunyun.com/spider.html)
1893
+ bot:
1894
+ name: 'Yunyun Bot'
1895
+ category: 'Search bot'
1896
+ url: 'http://www.yunyun.com/SiteInfo.php?r=about'
1897
+ producer:
1898
+ name: 'YunYun'
1899
+ url: 'http://www.yunyun.com'
1900
+ -
1901
+ user_agent: Zookabot/2.5;++http://zookabot.com
1902
+ bot:
1903
+ name: 'Zookabot'
1904
+ category: 'Crawler'
1905
+ url: 'http://zookabot.com'
1906
+ producer:
1907
+ name: 'Hwacha ApS'
1908
+ url: 'http://hwacha.dk'
1909
+ -
1910
+ user_agent: Mozilla/5.0 (compatible; ZumBot/1.0; http://help.zum.com/inquiry)
1911
+ bot:
1912
+ name: 'ZumBot'
1913
+ category: 'Search bot'
1914
+ url: 'http://help.zum.com/inquiry'
1915
+ producer:
1916
+ name: 'ZUM internet'
1917
+ url: 'http://www.zuminternet.com/'
1918
+ -
1919
+ user_agent: ZumBot/1.0 (ZUM Search; http://help.zum.com/inquiry)
1920
+ bot:
1921
+ name: 'ZumBot'
1922
+ category: 'Search bot'
1923
+ url: 'http://help.zum.com/inquiry'
1924
+ producer:
1925
+ name: 'ZUM internet'
1926
+ url: 'http://www.zuminternet.com/'
1927
+ -
1928
+ user_agent: Your Nutch Spider/Nutch-2.2.1
1929
+ bot:
1930
+ name: 'Nutch-based Bot'
1931
+ category: 'crawler'
1932
+ url: 'https://nutch.apache.org'
1933
+ producer:
1934
+ name: 'The Apache Software Foundation'
1935
+ url: 'http://www.apache.org/foundation/'
1936
+ -
1937
+ user_agent: Nutch12/Nutch-1.2
1938
+ bot:
1939
+ name: 'Nutch-based Bot'
1940
+ category: 'crawler'
1941
+ url: 'https://nutch.apache.org'
1942
+ producer:
1943
+ name: 'The Apache Software Foundation'
1944
+ url: 'http://www.apache.org/foundation/'
1945
+ -
1946
+ user_agent: spider/Nutch-1.5.1 (spider; http://www.xxx.com)
1947
+ bot:
1948
+ name: 'Nutch-based Bot'
1949
+ category: 'crawler'
1950
+ url: 'https://nutch.apache.org'
1951
+ producer:
1952
+ name: 'The Apache Software Foundation'
1953
+ url: 'http://www.apache.org/foundation/'
1954
+ -
1955
+ user_agent: MySpider/Nutch-2.2
1956
+ bot:
1957
+ name: 'Nutch-based Bot'
1958
+ category: 'crawler'
1959
+ url: 'https://nutch.apache.org'
1960
+ producer:
1961
+ name: 'The Apache Software Foundation'
1962
+ url: 'http://www.apache.org/foundation/'
1963
+ -
1964
+ user_agent: My Nutch Spider/Nutch-1.6
1965
+ bot:
1966
+ name: 'Nutch-based Bot'
1967
+ category: 'crawler'
1968
+ url: 'https://nutch.apache.org'
1969
+ producer:
1970
+ name: 'The Apache Software Foundation'
1971
+ url: 'http://www.apache.org/foundation/'
1972
+ -
1973
+ user_agent: NutchSpider/Nutch-1.4
1974
+ bot:
1975
+ name: 'Nutch-based Bot'
1976
+ category: 'crawler'
1977
+ url: 'https://nutch.apache.org'
1978
+ producer:
1979
+ name: 'The Apache Software Foundation'
1980
+ url: 'http://www.apache.org/foundation/'
1981
+ -
1982
+ user_agent: testnutch/Nutch-1.8
1983
+ bot:
1984
+ name: 'Nutch-based Bot'
1985
+ category: 'crawler'
1986
+ url: 'https://nutch.apache.org'
1987
+ producer:
1988
+ name: 'The Apache Software Foundation'
1989
+ url: 'http://www.apache.org/foundation/'
1990
+ -
1991
+ user_agent: Spider/Nutch-2.3-SNAPSHOT (Webcrawler)
1992
+ bot:
1993
+ name: 'Nutch-based Bot'
1994
+ category: 'crawler'
1995
+ url: 'https://nutch.apache.org'
1996
+ producer:
1997
+ name: 'The Apache Software Foundation'
1998
+ url: 'http://www.apache.org/foundation/'
1999
+ -
2000
+ user_agent: your sipder name/Nutch-1.7
2001
+ bot:
2002
+ name: 'Nutch-based Bot'
2003
+ category: 'crawler'
2004
+ url: 'https://nutch.apache.org'
2005
+ producer:
2006
+ name: 'The Apache Software Foundation'
2007
+ url: 'http://www.apache.org/foundation/'
2008
+ -
2009
+ user_agent: 5acd734a-1ed3-4a17-ad9d-0b09ae7bc2d2/Nutch-1.7
2010
+ bot:
2011
+ name: 'Nutch-based Bot'
2012
+ category: 'crawler'
2013
+ url: 'https://nutch.apache.org'
2014
+ producer:
2015
+ name: 'The Apache Software Foundation'
2016
+ url: 'http://www.apache.org/foundation/'
2017
+ -
2018
+ user_agent: Mozilla/5.0 (compatible; summers;)/Nutch-1.7
2019
+ bot:
2020
+ name: 'Nutch-based Bot'
2021
+ category: 'crawler'
2022
+ url: 'https://nutch.apache.org'
2023
+ producer:
2024
+ name: 'The Apache Software Foundation'
2025
+ url: 'http://www.apache.org/foundation/'
2026
+ -
2027
+ user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1; zh-CN; rv:1.9.2.8) Firefox/3.6.8/Nutch-1.7
2028
+ bot:
2029
+ name: 'Nutch-based Bot'
2030
+ category: 'crawler'
2031
+ url: 'https://nutch.apache.org'
2032
+ producer:
2033
+ name: 'The Apache Software Foundation'
2034
+ url: 'http://www.apache.org/foundation/'
2035
+ -
2036
+ user_agent: CB/Nutch-1.7
2037
+ bot:
2038
+ name: 'Nutch-based Bot'
2039
+ category: 'crawler'
2040
+ url: 'https://nutch.apache.org'
2041
+ producer:
2042
+ name: 'The Apache Software Foundation'
2043
+ url: 'http://www.apache.org/foundation/'
2044
+ -
2045
+ user_agent: NetLyzer FastProbe
2046
+ bot:
2047
+ name: 'NetLyzer FastProbe'
2048
+ -
2049
+ user_agent: StatusCake Error Detector Crawler V0.01
2050
+ bot:
2051
+ name: 'Generic Bot'
2052
+ -
2053
+ user_agent: niki-bot
2054
+ bot:
2055
+ name: 'Generic Bot'