device_detector 1.0.0 → 1.1.3
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +5 -5
- data/CHANGELOG.md +58 -4
- data/README.md +57 -21
- data/lib/device_detector/bot.rb +2 -2
- data/lib/device_detector/browser.rb +691 -0
- data/lib/device_detector/client.rb +11 -2
- data/lib/device_detector/client_hint.rb +249 -0
- data/lib/device_detector/device.rb +1954 -23
- data/lib/device_detector/memory_cache.rb +26 -19
- data/lib/device_detector/metadata_extractor.rb +7 -8
- data/lib/device_detector/model_extractor.rb +3 -3
- data/lib/device_detector/name_extractor.rb +2 -2
- data/lib/device_detector/os.rb +289 -112
- data/lib/device_detector/parser.rb +49 -13
- data/lib/device_detector/vendor_fragment.rb +25 -0
- data/lib/device_detector/version.rb +3 -1
- data/lib/device_detector/version_extractor.rb +29 -2
- data/lib/device_detector.rb +192 -44
- data/regexes/bots.yml +3399 -91
- data/regexes/client/browser_engine.yml +28 -4
- data/regexes/client/browsers.yml +2697 -408
- data/regexes/client/feed_readers.yml +60 -22
- data/regexes/client/hints/apps.yml +150 -0
- data/regexes/client/hints/browsers.yml +292 -0
- data/regexes/client/libraries.yml +598 -4
- data/regexes/client/mediaplayers.yml +110 -5
- data/regexes/client/mobile_apps.yml +2451 -14
- data/regexes/client/pim.yml +128 -3
- data/regexes/device/cameras.yml +6 -6
- data/regexes/device/car_browsers.yml +39 -3
- data/regexes/device/consoles.yml +40 -6
- data/regexes/device/mobiles.yml +38844 -2907
- data/regexes/device/notebooks.yml +127 -0
- data/regexes/device/portable_media_player.yml +75 -12
- data/regexes/device/shell_tv.yml +145 -0
- data/regexes/device/televisions.yml +981 -40
- data/regexes/oss.yml +1560 -311
- data/regexes/vendorfragments.yml +6 -2
- metadata +31 -105
- data/.gitignore +0 -14
- data/.travis.yml +0 -18
- data/Gemfile +0 -8
- data/Rakefile +0 -79
- data/device_detector.gemspec +0 -26
- data/spec/device_detector/bot_fixtures_spec.rb +0 -30
- data/spec/device_detector/client_fixtures_spec.rb +0 -31
- data/spec/device_detector/concrete_user_agent_spec.rb +0 -136
- data/spec/device_detector/detector_fixtures_spec.rb +0 -60
- data/spec/device_detector/device_fixtures_spec.rb +0 -36
- data/spec/device_detector/device_spec.rb +0 -151
- data/spec/device_detector/memory_cache_spec.rb +0 -116
- data/spec/device_detector/model_extractor_spec.rb +0 -63
- data/spec/device_detector/os_fixtures_spec.rb +0 -26
- data/spec/device_detector/version_extractor_spec.rb +0 -80
- data/spec/device_detector_spec.rb +0 -198
- data/spec/fixtures/client/browser.yml +0 -1313
- data/spec/fixtures/client/feed_reader.yml +0 -187
- data/spec/fixtures/client/library.yml +0 -84
- data/spec/fixtures/client/mediaplayer.yml +0 -168
- data/spec/fixtures/client/mobile_app.yml +0 -30
- data/spec/fixtures/client/pim.yml +0 -96
- data/spec/fixtures/detector/bots.yml +0 -2418
- data/spec/fixtures/detector/camera.yml +0 -115
- data/spec/fixtures/detector/car_browser.yml +0 -20
- data/spec/fixtures/detector/console.yml +0 -267
- data/spec/fixtures/detector/desktop.yml +0 -4828
- data/spec/fixtures/detector/feature_phone.yml +0 -782
- data/spec/fixtures/detector/feed_reader.yml +0 -486
- data/spec/fixtures/detector/mediaplayer.yml +0 -179
- data/spec/fixtures/detector/mobile_apps.yml +0 -149
- data/spec/fixtures/detector/phablet.yml +0 -2140
- data/spec/fixtures/detector/portable_media_player.yml +0 -153
- data/spec/fixtures/detector/smart_display.yml +0 -58
- data/spec/fixtures/detector/smartphone-1.yml +0 -9469
- data/spec/fixtures/detector/smartphone-2.yml +0 -9414
- data/spec/fixtures/detector/smartphone-3.yml +0 -9396
- data/spec/fixtures/detector/smartphone-4.yml +0 -5742
- data/spec/fixtures/detector/smartphone.yml +0 -9411
- data/spec/fixtures/detector/tablet-1.yml +0 -9495
- data/spec/fixtures/detector/tablet-2.yml +0 -248
- data/spec/fixtures/detector/tablet.yml +0 -9484
- data/spec/fixtures/detector/tv.yml +0 -2582
- data/spec/fixtures/detector/unknown.yml +0 -3196
- data/spec/fixtures/device/camera.yml +0 -18
- data/spec/fixtures/device/car_browser.yml +0 -6
- data/spec/fixtures/device/console.yml +0 -78
- data/spec/fixtures/parser/oss.yml +0 -800
- data/spec/fixtures/parser/vendorfragments.yml +0 -162
- data/spec/spec_helper.rb +0 -9
@@ -1,2418 +0,0 @@
|
|
1
|
-
---
|
2
|
-
-
|
3
|
-
user_agent: 360spider-image
|
4
|
-
bot:
|
5
|
-
name: 360Spider
|
6
|
-
category: Search bot
|
7
|
-
url: http://www.so.com/help/help_3_2.html
|
8
|
-
producer:
|
9
|
-
name: Online Media Group, Inc.
|
10
|
-
url:
|
11
|
-
-
|
12
|
-
user_agent: Mozilla/4.0 (compatible; MSIE 8.0; Windows NT 6.1; Trident/4.0; SLCC2; .NET CLR 2.0.50727; .NET CLR 3.5.30729; .NET CLR 3.0.30729; Media Center PC 6.0; MDDR; .NET4.0C; .NET4.0E; .NET CLR 1.1.4322; Tablet PC 2.0); 360Spider
|
13
|
-
bot:
|
14
|
-
name: 360Spider
|
15
|
-
category: Search bot
|
16
|
-
url: http://www.so.com/help/help_3_2.html
|
17
|
-
producer:
|
18
|
-
name: Online Media Group, Inc.
|
19
|
-
url:
|
20
|
-
-
|
21
|
-
user_agent: Mozilla/5.0 (compatible; MSIE 9.0; Windows NT 6.1; Trident/5.0); 360Spider
|
22
|
-
bot:
|
23
|
-
name: 360Spider
|
24
|
-
category: Search bot
|
25
|
-
url: http://www.so.com/help/help_3_2.html
|
26
|
-
producer:
|
27
|
-
name: Online Media Group, Inc.
|
28
|
-
url:
|
29
|
-
-
|
30
|
-
user_agent: Mozilla/5.0 (Windows NT 6.1) AppleWebKit/537.1 (KHTML, like Gecko) Chrome/21.0.1180.89 Safari/537.1; 360Spider
|
31
|
-
bot:
|
32
|
-
name: 360Spider
|
33
|
-
category: Search bot
|
34
|
-
url: http://www.so.com/help/help_3_2.html
|
35
|
-
producer:
|
36
|
-
name: Online Media Group, Inc.
|
37
|
-
url:
|
38
|
-
-
|
39
|
-
user_agent: 'ADmantX Platform Semantic Analyzer - ADmantX Inc. - www.admantx.com - support@admantx.com'
|
40
|
-
bot:
|
41
|
-
name: ADMantX
|
42
|
-
-
|
43
|
-
user_agent: Aboundex/0.3 (http://www.aboundex.com/crawler/)
|
44
|
-
bot:
|
45
|
-
name: Aboundexbot
|
46
|
-
category: Search bot
|
47
|
-
url: http://www.aboundex.com/crawler/
|
48
|
-
producer:
|
49
|
-
name: Aboundex.com
|
50
|
-
url: http://www.aboundex.com
|
51
|
-
-
|
52
|
-
user_agent: Mozilla/5.0 (compatible; AcoonBot/4.11.1; +http://www.acoon.de/robot.asp)
|
53
|
-
bot:
|
54
|
-
name: Acoon
|
55
|
-
category: Search bot
|
56
|
-
url: http://www.acoon.de/robot.asp
|
57
|
-
producer:
|
58
|
-
name: Acoon GmbH
|
59
|
-
url: http://www.acoon.de
|
60
|
-
-
|
61
|
-
user_agent: AddThis.com robot tech.support@clearspring.com
|
62
|
-
bot:
|
63
|
-
name: AddThis.com
|
64
|
-
category: Social Media Agent
|
65
|
-
url:
|
66
|
-
producer:
|
67
|
-
name: Clearspring Technologies, Inc.
|
68
|
-
url: http://www.clearspring.com
|
69
|
-
-
|
70
|
-
user_agent: ia_archiver (+http://www.alexa.com/site/help/webmasters; crawler@alexa.com)
|
71
|
-
bot:
|
72
|
-
name: Alexa Crawler
|
73
|
-
category: Search bot
|
74
|
-
url: https://alexa.zendesk.com/hc/en-us/sections/200100794-Crawlers
|
75
|
-
producer:
|
76
|
-
name: Alexa Internet
|
77
|
-
url: http://www.alexa.com
|
78
|
-
-
|
79
|
-
user_agent: AmorankSpider/0.1; +http://amorank.com/webcrawler.html
|
80
|
-
bot:
|
81
|
-
name: Amorank Spider
|
82
|
-
category: Crawler
|
83
|
-
url: http://amorank.com/webcrawler.html
|
84
|
-
producer:
|
85
|
-
name: Amorank
|
86
|
-
url: http://www.amorank.com
|
87
|
-
-
|
88
|
-
user_agent: 'Curious George - www.analyticsseo.com/crawler'
|
89
|
-
bot:
|
90
|
-
name: Analytics SEO Crawler
|
91
|
-
category: Crawler
|
92
|
-
url: http://www.analyticsseo.com/crawler
|
93
|
-
producer:
|
94
|
-
name: Analytics SEO
|
95
|
-
url: http://www.analyticsseo.com
|
96
|
-
-
|
97
|
-
user_agent: Mozilla/5.0 (Macintosh; Intel Mac OS X 10_10 _1) AppleWebKit/600.2.5 (KHTML, like Gecko) Version/8.0.2 Safari/600.2.5 (Applebot/0.1; +http://www.apple.com/go/applebot)
|
98
|
-
bot:
|
99
|
-
name: Applebot
|
100
|
-
category: Crawler
|
101
|
-
url: http://www.apple.com/go/applebot
|
102
|
-
producer:
|
103
|
-
name: Apple Inc
|
104
|
-
url: http://www.apple.com
|
105
|
-
-
|
106
|
-
user_agent: Mozilla/5.0 (Macintosh; Intel Mac OS X 10_10_1) AppleWebKit/600.2.5 (KHTML, like Gecko) Version/8.0.2 Safari/600.2.5 (Applebot/0.1)
|
107
|
-
bot:
|
108
|
-
name: Applebot
|
109
|
-
category: Crawler
|
110
|
-
url: http://www.apple.com/go/applebot
|
111
|
-
producer:
|
112
|
-
name: Apple Inc
|
113
|
-
url: http://www.apple.com
|
114
|
-
-
|
115
|
-
user_agent: Mozilla/2.0 (compatible; Ask Jeeves/Teoma)
|
116
|
-
bot:
|
117
|
-
name: Ask Jeeves
|
118
|
-
category: Search bot
|
119
|
-
url:
|
120
|
-
producer:
|
121
|
-
name: Ask Jeeves Inc.
|
122
|
-
url: http://www.ask.com
|
123
|
-
-
|
124
|
-
user_agent: Mozilla/5.0 (compatible; BLEXBot/1.0; +http://webmeup-crawler.com/)
|
125
|
-
bot:
|
126
|
-
name: BLEXBot Crawler
|
127
|
-
category: Crawler
|
128
|
-
url: http://webmeup-crawler.com
|
129
|
-
producer:
|
130
|
-
name: WebMeUp
|
131
|
-
url: http://webmeup.com
|
132
|
-
-
|
133
|
-
user_agent: BUbiNG (+http://law.di.unimi.it/BUbiNG.html)
|
134
|
-
bot:
|
135
|
-
name: BUbiNG
|
136
|
-
category: Crawler
|
137
|
-
url: http://law.di.unimi.it/BUbiNG.html
|
138
|
-
producer:
|
139
|
-
name:
|
140
|
-
url:
|
141
|
-
-
|
142
|
-
user_agent: Backlink-Ceck.de (+http://www.backlink-check.de/bot.html)
|
143
|
-
bot:
|
144
|
-
name: Backlink-Ceck.de
|
145
|
-
category: Crawler
|
146
|
-
url: http://www.backlink-check.de/bot.html
|
147
|
-
producer:
|
148
|
-
name: Mediagreen Medienservice
|
149
|
-
url: http://www.backlink-check.de
|
150
|
-
-
|
151
|
-
user_agent: BacklinkCrawler (http://www.backlinktest.com/crawler.html)
|
152
|
-
bot:
|
153
|
-
name: BacklinkCrawler
|
154
|
-
category: Crawler
|
155
|
-
url: http://www.backlinktest.com/crawler.html
|
156
|
-
producer:
|
157
|
-
name: 2.0Promotion GbR
|
158
|
-
url: http://www.backlinktest.com
|
159
|
-
-
|
160
|
-
user_agent: Baiduspider+(+http://www.baidu.com/search/spider.htm)
|
161
|
-
bot:
|
162
|
-
name: Baidu Spider
|
163
|
-
category: Search bot
|
164
|
-
url: http://www.baidu.com/search/spider.htm
|
165
|
-
producer:
|
166
|
-
name: Baidu
|
167
|
-
url: http://www.baidu.com
|
168
|
-
-
|
169
|
-
user_agent: Baiduspider-image+(+http://www.baidu.com/search/spider.htm)
|
170
|
-
bot:
|
171
|
-
name: Baidu Spider
|
172
|
-
category: Search bot
|
173
|
-
url: http://www.baidu.com/search/spider.htm
|
174
|
-
producer:
|
175
|
-
name: Baidu
|
176
|
-
url: http://www.baidu.com
|
177
|
-
-
|
178
|
-
user_agent: Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.0; baidu Transcoder;)
|
179
|
-
bot:
|
180
|
-
name: Baidu Spider
|
181
|
-
category: Search bot
|
182
|
-
url: http://www.baidu.com/search/spider.htm
|
183
|
-
producer:
|
184
|
-
name: Baidu
|
185
|
-
url: http://www.baidu.com
|
186
|
-
-
|
187
|
-
user_agent: Mozilla/5.0 (compatible; Baiduspider/2.0; +http://www.baidu.com/search
|
188
|
-
bot:
|
189
|
-
name: Baidu Spider
|
190
|
-
category: Search bot
|
191
|
-
url: http://www.baidu.com/search/spider.htm
|
192
|
-
producer:
|
193
|
-
name: Baidu
|
194
|
-
url: http://www.baidu.com
|
195
|
-
-
|
196
|
-
user_agent: Mozilla/5.0 (compatible; Baiduspider/2.0; +http://www.baidu.com/search/spider.html)
|
197
|
-
bot:
|
198
|
-
name: Baidu Spider
|
199
|
-
category: Search bot
|
200
|
-
url: http://www.baidu.com/search/spider.htm
|
201
|
-
producer:
|
202
|
-
name: Baidu
|
203
|
-
url: http://www.baidu.com
|
204
|
-
-
|
205
|
-
user_agent: Mozilla/5.0 (Linux;u;Android 2.3.7;zh-cn;) AppleWebKit/533.1 (KHTML,like Gecko) Version/4.0 Mobile Safari/533.1 (compatible; +http://www.baidu.com/search/spider.html)
|
206
|
-
bot:
|
207
|
-
name: Baidu Spider
|
208
|
-
category: Search bot
|
209
|
-
url: http://www.baidu.com/search/spider.htm
|
210
|
-
producer:
|
211
|
-
name: Baidu
|
212
|
-
url: http://www.baidu.com
|
213
|
-
-
|
214
|
-
user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1; zh-CN; rv:1.9.2.8;baidu Transcoder) Gecko/20100722 Firefox/3.6.8 ( .NET CLR 3.5.30729)
|
215
|
-
bot:
|
216
|
-
name: Baidu Spider
|
217
|
-
category: Search bot
|
218
|
-
url: http://www.baidu.com/search/spider.htm
|
219
|
-
producer:
|
220
|
-
name: Baidu
|
221
|
-
url: http://www.baidu.com
|
222
|
-
-
|
223
|
-
user_agent: Mozilla/5.0 (compatible; BazQux/2.4; +https://bazqux.com/fetcher; 2 subscribers)
|
224
|
-
bot:
|
225
|
-
name: BazQux Reader
|
226
|
-
url: https://bazqux.com/fetcher
|
227
|
-
category: Feed Fetcher
|
228
|
-
producer:
|
229
|
-
name:
|
230
|
-
url:
|
231
|
-
-
|
232
|
-
user_agent: Mozilla/5.0 (compatible; bingbot/2.0; +http://www.bing.com/bingbot.htm)
|
233
|
-
bot:
|
234
|
-
name: BingBot
|
235
|
-
category: Search bot
|
236
|
-
url: http://search.msn.com/msnbot.htmn
|
237
|
-
producer:
|
238
|
-
name: Microsoft Corporation
|
239
|
-
url: http://www.microsoft.com
|
240
|
-
-
|
241
|
-
user_agent: Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/534+ (KHTML, like Gecko) BingPreview/1.0b
|
242
|
-
bot:
|
243
|
-
name: BingBot
|
244
|
-
category: Search bot
|
245
|
-
url: http://search.msn.com/msnbot.htmn
|
246
|
-
producer:
|
247
|
-
name: Microsoft Corporation
|
248
|
-
url: http://www.microsoft.com
|
249
|
-
-
|
250
|
-
user_agent: msnbot-media/1.1 (+http://search.msn.com/msnbot.htm)
|
251
|
-
bot:
|
252
|
-
name: BingBot
|
253
|
-
category: Search bot
|
254
|
-
url: http://search.msn.com/msnbot.htmn
|
255
|
-
producer:
|
256
|
-
name: Microsoft Corporation
|
257
|
-
url: http://www.microsoft.com
|
258
|
-
-
|
259
|
-
user_agent: msnbot-NewsBlogs/2.0b (+http://search.msn.com/msnbot.htm)
|
260
|
-
bot:
|
261
|
-
name: BingBot
|
262
|
-
category: Search bot
|
263
|
-
url: http://search.msn.com/msnbot.htmn
|
264
|
-
producer:
|
265
|
-
name: Microsoft Corporation
|
266
|
-
url: http://www.microsoft.com
|
267
|
-
-
|
268
|
-
user_agent: msnbot/1.1 (+http://search.msn.com/msnbot.htm)
|
269
|
-
bot:
|
270
|
-
name: BingBot
|
271
|
-
category: Search bot
|
272
|
-
url: http://search.msn.com/msnbot.htmn
|
273
|
-
producer:
|
274
|
-
name: Microsoft Corporation
|
275
|
-
url: http://www.microsoft.com
|
276
|
-
-
|
277
|
-
user_agent: msnbot/2.0b (+http://search.msn.com/msnbot.htm)
|
278
|
-
bot:
|
279
|
-
name: BingBot
|
280
|
-
category: Search bot
|
281
|
-
url: http://search.msn.com/msnbot.htmn
|
282
|
-
producer:
|
283
|
-
name: Microsoft Corporation
|
284
|
-
url: http://www.microsoft.com
|
285
|
-
-
|
286
|
-
user_agent: msnbot/2.0b v1394720947.6703
|
287
|
-
bot:
|
288
|
-
name: BingBot
|
289
|
-
category: Search bot
|
290
|
-
url: http://search.msn.com/msnbot.htmn
|
291
|
-
producer:
|
292
|
-
name: Microsoft Corporation
|
293
|
-
url: http://www.microsoft.com
|
294
|
-
-
|
295
|
-
user_agent: MSNBot/Nutch-1.5.1
|
296
|
-
bot:
|
297
|
-
name: BingBot
|
298
|
-
category: Search bot
|
299
|
-
url: http://search.msn.com/msnbot.htmn
|
300
|
-
producer:
|
301
|
-
name: Microsoft Corporation
|
302
|
-
url: http://www.microsoft.com
|
303
|
-
-
|
304
|
-
user_agent: Mozilla/5.0 (compatible; Blekkobot; ScoutJet; +http://blekko.com/about/blekkobot)
|
305
|
-
bot:
|
306
|
-
name: Blekkobot
|
307
|
-
category: Search bot
|
308
|
-
url: http://blekko.com/about/blekkobot
|
309
|
-
producer:
|
310
|
-
name: Blekko
|
311
|
-
url: http://blekko.com
|
312
|
-
-
|
313
|
-
user_agent: Bloglovin/1.0 (http://www.bloglovin.com; 1 subscribers)
|
314
|
-
bot:
|
315
|
-
name: Bloglovin
|
316
|
-
url: http://www.bloglovin.com
|
317
|
-
category: Feed Fetcher
|
318
|
-
producer:
|
319
|
-
name:
|
320
|
-
url:
|
321
|
-
-
|
322
|
-
user_agent: Blogtrottr/2.0
|
323
|
-
bot:
|
324
|
-
name: Blogtrottr
|
325
|
-
url:
|
326
|
-
category: Feed Fetcher
|
327
|
-
producer:
|
328
|
-
name: Blogtrottr Ltd
|
329
|
-
url: https://blogtrottr.com/
|
330
|
-
-
|
331
|
-
user_agent: Mozilla/5.0 (compatible; BountiiBot/1.1; +http://bountii.com/contact.php)
|
332
|
-
bot:
|
333
|
-
name: Bountii Bot
|
334
|
-
category: Search bot
|
335
|
-
url: http://bountii.com/contact.php
|
336
|
-
producer:
|
337
|
-
name: Bountii Inc.
|
338
|
-
url: http://bountii.com
|
339
|
-
-
|
340
|
-
user_agent: Browsershots
|
341
|
-
bot:
|
342
|
-
name: Browsershots
|
343
|
-
category: Service Agent
|
344
|
-
url: http://browsershots.org/faq
|
345
|
-
producer:
|
346
|
-
name: Browsershots.org
|
347
|
-
url: http://browsershots.org
|
348
|
-
-
|
349
|
-
user_agent: Mozilla/5.0 (compatible; Butterfly/1.0; +http://labs.topsy.com/butterfly/) Gecko/2009032608 Firefox/3.0.8
|
350
|
-
bot:
|
351
|
-
name: Butterfly Robot
|
352
|
-
category: Search bot
|
353
|
-
url: http://labs.topsy.com/butterfly
|
354
|
-
producer:
|
355
|
-
name: Topsy Labs
|
356
|
-
url: http://labs.topsy.com
|
357
|
-
-
|
358
|
-
user_agent: Mozilla/5.0 (Macintosh; Butterfly/1.0; +http://labs.topsy.com/butterfly/) Gecko/2009032608 Firefox/3.0.8
|
359
|
-
bot:
|
360
|
-
name: Butterfly Robot
|
361
|
-
category: Search bot
|
362
|
-
url: http://labs.topsy.com/butterfly
|
363
|
-
producer:
|
364
|
-
name: Topsy Labs
|
365
|
-
url: http://labs.topsy.com
|
366
|
-
-
|
367
|
-
user_agent: Mozilla/5.0 (compatible; CareerBot/1.1; +http://www.career-x.de/bot.html)
|
368
|
-
bot:
|
369
|
-
name: CareerBot
|
370
|
-
category: Crawler
|
371
|
-
url: http://www.career-x.de/bot.html
|
372
|
-
producer:
|
373
|
-
name: career-x GmbH
|
374
|
-
url: http://www.career-x.de
|
375
|
-
-
|
376
|
-
user_agent: Cliqzbot/0.1 (+http://cliqz.com/company/cliqzbot)
|
377
|
-
bot:
|
378
|
-
name: Cliqzbot
|
379
|
-
category: Crawler
|
380
|
-
url: http://cliqz.com/company/cliqzbot
|
381
|
-
producer:
|
382
|
-
name: 10betterpages GmbH
|
383
|
-
url: http://cliqz.com
|
384
|
-
-
|
385
|
-
user_agent: Mozilla/5.0 (compatible; CloudFlare-AlwaysOnline/1.0; +http://www.cloudflare.com/always-online) AppleWebKit/534.34
|
386
|
-
bot:
|
387
|
-
name: CloudFlare Always Online
|
388
|
-
category: Site Monitor
|
389
|
-
url: http://www.cloudflare.com/always-online
|
390
|
-
producer:
|
391
|
-
name: CloudFlare
|
392
|
-
url: http://www.cloudflare.com
|
393
|
-
-
|
394
|
-
user_agent: CommaFeed/1.0 (http://www.commafeed.com)
|
395
|
-
bot:
|
396
|
-
name: CommaFeed
|
397
|
-
url: http://www.commafeed.com
|
398
|
-
category: Feed Fetcher
|
399
|
-
producer:
|
400
|
-
name:
|
401
|
-
url:
|
402
|
-
-
|
403
|
-
user_agent: Mozilla/5.0 (compatible; coccoc/1.0; +http://help.coccoc.com/)
|
404
|
-
bot:
|
405
|
-
name: Cốc Cốc Bot
|
406
|
-
url: http://help.coccoc.com/
|
407
|
-
category: Search bot
|
408
|
-
producer:
|
409
|
-
name: Cốc Cốc
|
410
|
-
url: http://coccoc.com/
|
411
|
-
-
|
412
|
-
user_agent: Mozilla/5.0 (compatible; MSIE or Firefox mutant; not on Windows server;) Daumoa/4.0;
|
413
|
-
bot:
|
414
|
-
name: Daum
|
415
|
-
category: Search bot
|
416
|
-
url: http://tab.search.daum.net/aboutWebSearch_en.html
|
417
|
-
producer:
|
418
|
-
name: Daum Communications Corp.
|
419
|
-
url: http://www.kakaocorp.com/main
|
420
|
-
-
|
421
|
-
user_agent: Mozilla/5.0 (compatible; MSIE or Firefox mutant;) Daum 4.1
|
422
|
-
bot:
|
423
|
-
name: Daum
|
424
|
-
category: Search bot
|
425
|
-
url: http://tab.search.daum.net/aboutWebSearch_en.html
|
426
|
-
producer:
|
427
|
-
name: Daum Communications Corp.
|
428
|
-
url: http://www.kakaocorp.com/main
|
429
|
-
-
|
430
|
-
user_agent: Mozilla/5.0 (compatible; Dazoobot/0.1; +http://dazoo.fr)
|
431
|
-
bot:
|
432
|
-
name: Dazoobot
|
433
|
-
category: Search bot
|
434
|
-
url:
|
435
|
-
producer:
|
436
|
-
name: DAZOO.FR
|
437
|
-
url: http://dazoo.fr
|
438
|
-
-
|
439
|
-
user_agent: Mozilla/5.0 (compatible; discobot/1.0; +http://discoveryengine.com/discobot.html)
|
440
|
-
bot:
|
441
|
-
name: Discobot
|
442
|
-
category: Search bot
|
443
|
-
url: http://discoveryengine.com/discobot.html
|
444
|
-
producer:
|
445
|
-
name: Discovery Engine
|
446
|
-
url: http://discoveryengine.com
|
447
|
-
-
|
448
|
-
user_agent: 'Domain Re-Animator Bot (http://domainreanimator.com) - support@domainreanimator.com'
|
449
|
-
bot:
|
450
|
-
name: Domain Re-Animator Bot
|
451
|
-
category: Crawler
|
452
|
-
url:
|
453
|
-
producer:
|
454
|
-
name: Domain Re-Animator, LLC
|
455
|
-
url: http://domainreanimator.com
|
456
|
-
-
|
457
|
-
user_agent: support@domainreanimator.com
|
458
|
-
bot:
|
459
|
-
name: Domain Re-Animator Bot
|
460
|
-
category: Crawler
|
461
|
-
url:
|
462
|
-
producer:
|
463
|
-
name: Domain Re-Animator, LLC
|
464
|
-
url: http://domainreanimator.com
|
465
|
-
-
|
466
|
-
user_agent: dotbot
|
467
|
-
bot:
|
468
|
-
name: DotBot
|
469
|
-
category: Crawler
|
470
|
-
url: http://www.opensiteexplorer.org/dotbot
|
471
|
-
producer:
|
472
|
-
name: SEOmoz, Inc.
|
473
|
-
url: http://moz.com/
|
474
|
-
-
|
475
|
-
user_agent: EMail Exractor
|
476
|
-
bot:
|
477
|
-
name: EMail Exractor
|
478
|
-
category: Crawler
|
479
|
-
url:
|
480
|
-
producer:
|
481
|
-
name:
|
482
|
-
url:
|
483
|
-
-
|
484
|
-
user_agent: Mozilla/5.0 (compatible; EasouSpider; +http://www.easou.com/search/spider.html)
|
485
|
-
bot:
|
486
|
-
name: Easou Spider
|
487
|
-
category: Search bot
|
488
|
-
url: http://www.easou.com/search/spider.html
|
489
|
-
producer:
|
490
|
-
name: easou ICP
|
491
|
-
url: http://www.easou.com
|
492
|
-
-
|
493
|
-
user_agent: Mozilla/5.0 (iPhone; U; CPU iPhone OS 3_0 like Mac OS X; en-us; EasouSpider; +http://www.easou.com/search/spider.html)
|
494
|
-
bot:
|
495
|
-
name: Easou Spider
|
496
|
-
category: Search bot
|
497
|
-
url: http://www.easou.com/search/spider.html
|
498
|
-
producer:
|
499
|
-
name: easou ICP
|
500
|
-
url: http://www.easou.com
|
501
|
-
-
|
502
|
-
user_agent: Mozilla/5.0 (compatible; Exabot/3.0 (BiggerBetter); +http://www.exabot.com/go/robot)
|
503
|
-
bot:
|
504
|
-
name: ExaBot
|
505
|
-
category: Crawler
|
506
|
-
url: http://www.exabot.com/go/robot
|
507
|
-
producer:
|
508
|
-
name: Dassault Systèmes
|
509
|
-
url: http://www.3ds.com
|
510
|
-
-
|
511
|
-
user_agent: Mozilla/5.0 (compatible; Exabot/3.0; +http://www.exabot.com/go/robot)
|
512
|
-
bot:
|
513
|
-
name: ExaBot
|
514
|
-
category: Crawler
|
515
|
-
url: http://www.exabot.com/go/robot
|
516
|
-
producer:
|
517
|
-
name: Dassault Systèmes
|
518
|
-
url: http://www.3ds.com
|
519
|
-
-
|
520
|
-
user_agent: Mozilla/5.0 (compatible; Konqueror/3.5; Linux) KHTML/3.5.5 (like Gecko) (Exabot-Thumbnails)
|
521
|
-
bot:
|
522
|
-
name: ExaBot
|
523
|
-
category: Crawler
|
524
|
-
url: http://www.exabot.com/go/robot
|
525
|
-
producer:
|
526
|
-
name: Dassault Systèmes
|
527
|
-
url: http://www.3ds.com
|
528
|
-
-
|
529
|
-
user_agent: ExactSeek Crawler (nutch 1.4)/Nutch-1.4 (ExactSeek Crawler; http://www.exactseek.com)
|
530
|
-
bot:
|
531
|
-
name: ExactSeek Crawler
|
532
|
-
category: Search bot
|
533
|
-
url: http://www.exactseek.com
|
534
|
-
producer:
|
535
|
-
name: Jayde Online, Inc.
|
536
|
-
url: http://www.jaydeonlineinc.com
|
537
|
-
-
|
538
|
-
user_agent: Mozilla/5.0 (compatible; Ezooms/1.0; help@moz.com)
|
539
|
-
bot:
|
540
|
-
name: Ezooms
|
541
|
-
category: Crawler
|
542
|
-
url:
|
543
|
-
producer:
|
544
|
-
name: SEOmoz, Inc.
|
545
|
-
url: http://moz.com/
|
546
|
-
-
|
547
|
-
user_agent: facebookexternalhit/1.1 (+http://www.facebook.com/externalhit_uatext.php)
|
548
|
-
bot:
|
549
|
-
name: Facebook External Hit
|
550
|
-
category: Social Media Agent
|
551
|
-
url: https://www.facebook.com/externalhit_uatext.php
|
552
|
-
producer:
|
553
|
-
name: Facebook
|
554
|
-
url: http://www.facebook.com
|
555
|
-
-
|
556
|
-
user_agent: facebookplatform/1.0 (+http://developers.facebook.com)
|
557
|
-
bot:
|
558
|
-
name: Facebook External Hit
|
559
|
-
category: Social Media Agent
|
560
|
-
url: https://www.facebook.com/externalhit_uatext.php
|
561
|
-
producer:
|
562
|
-
name: Facebook
|
563
|
-
url: http://www.facebook.com
|
564
|
-
-
|
565
|
-
user_agent: Feed Wrangler/1.0 (3 subscribers; feed-id=248559; http://feedwrangler.net; Allow like Gecko)
|
566
|
-
bot:
|
567
|
-
name: Feed Wrangler
|
568
|
-
url: https://feedwrangler.net/
|
569
|
-
category: Feed Fetcher
|
570
|
-
producer:
|
571
|
-
name: 'David Smith & Developing Perspective, LLC'
|
572
|
-
url: https://david-smith.org
|
573
|
-
-
|
574
|
-
user_agent: FeedBurner/1.0 (http://www.FeedBurner.com)
|
575
|
-
bot:
|
576
|
-
name: FeedBurner
|
577
|
-
url: http://www.feedburner.com
|
578
|
-
category: Feed Fetcher
|
579
|
-
producer:
|
580
|
-
name:
|
581
|
-
url:
|
582
|
-
-
|
583
|
-
user_agent: 'Feedbin - 9 subscribers'
|
584
|
-
bot:
|
585
|
-
name: Feedbin
|
586
|
-
url: http://feedbin.com/
|
587
|
-
category: Feed Fetcher
|
588
|
-
producer:
|
589
|
-
name:
|
590
|
-
url:
|
591
|
-
-
|
592
|
-
user_agent: Feedly/1.0 (+http://www.feedly.com/fetcher.html; like FeedFetcher-Google)
|
593
|
-
bot:
|
594
|
-
name: Feedly
|
595
|
-
url: http://www.feedly.com
|
596
|
-
category: Feed Fetcher
|
597
|
-
producer:
|
598
|
-
name:
|
599
|
-
url:
|
600
|
-
-
|
601
|
-
user_agent: FeedlyApp/1.0 (http://www.feedly.com)
|
602
|
-
bot:
|
603
|
-
name: Feedly
|
604
|
-
url: http://www.feedly.com
|
605
|
-
category: Feed Fetcher
|
606
|
-
producer:
|
607
|
-
name:
|
608
|
-
url:
|
609
|
-
-
|
610
|
-
user_agent: FeedlyBot/1.0 (http://feedly.com)
|
611
|
-
bot:
|
612
|
-
name: Feedly
|
613
|
-
url: http://www.feedly.com
|
614
|
-
category: Feed Fetcher
|
615
|
-
producer:
|
616
|
-
name:
|
617
|
-
url:
|
618
|
-
-
|
619
|
-
user_agent: MetaFeedly/1.0 (http://www.feedly.com)
|
620
|
-
bot:
|
621
|
-
name: Feedly
|
622
|
-
url: http://www.feedly.com
|
623
|
-
category: Feed Fetcher
|
624
|
-
producer:
|
625
|
-
name:
|
626
|
-
url:
|
627
|
-
-
|
628
|
-
user_agent: Feedspot http://www.feedspot.com
|
629
|
-
bot:
|
630
|
-
name: Feedspot
|
631
|
-
url: http://www.feedspot.com
|
632
|
-
category: Feed Fetcher
|
633
|
-
producer:
|
634
|
-
name:
|
635
|
-
url:
|
636
|
-
-
|
637
|
-
user_agent: Fever/1.38 (Feed Parser; http://feedafever.com; Allow like Gecko)
|
638
|
-
bot:
|
639
|
-
name: Fever
|
640
|
-
url: http://feedafever.com/
|
641
|
-
category: Feed Fetcher
|
642
|
-
producer:
|
643
|
-
name:
|
644
|
-
url:
|
645
|
-
-
|
646
|
-
user_agent: niki-bot
|
647
|
-
bot:
|
648
|
-
name: Generic Bot
|
649
|
-
-
|
650
|
-
user_agent: StatusCake Error Detector Crawler V0.01
|
651
|
-
bot:
|
652
|
-
name: Generic Bot
|
653
|
-
-
|
654
|
-
user_agent: Mozilla/5.0 (compatible; Genieo/1.0 http://www.genieo.com/webfilter.html)
|
655
|
-
bot:
|
656
|
-
name: Genieo Web filter
|
657
|
-
category:
|
658
|
-
url: http://www.genieo.com/webfilter.html
|
659
|
-
producer:
|
660
|
-
name: Genieo
|
661
|
-
url: http://www.genieo.com
|
662
|
-
-
|
663
|
-
user_agent: Mozilla/5.0 (compatible; Gluten Free Crawler/1.0; +http://glutenfreepleasure.com/)
|
664
|
-
bot:
|
665
|
-
name: Gluten Free Crawler
|
666
|
-
category: Crawler
|
667
|
-
url: http://glutenfreepleasure.com/
|
668
|
-
producer:
|
669
|
-
name:
|
670
|
-
url:
|
671
|
-
-
|
672
|
-
user_agent: Mozilla/5.0 (Windows NT 5.1; rv:11.0) Gecko Firefox/11.0 (via ggpht.com GoogleImageProxy)
|
673
|
-
bot:
|
674
|
-
name: Gmail Image Proxy
|
675
|
-
category: Crawler
|
676
|
-
url:
|
677
|
-
producer:
|
678
|
-
name: Google Inc.
|
679
|
-
url: http://www.google.com
|
680
|
-
-
|
681
|
-
user_agent: DoCoMo/2.0 P900i(c100;TB;W24H11) (compatible; ichiro/mobile goo; +http://search.goo.ne.jp/option/use/sub4/sub4-1/)
|
682
|
-
bot:
|
683
|
-
name: Goo
|
684
|
-
category: Search bot
|
685
|
-
url: http://search.goo.ne.jp/option/use/sub4/sub4-1
|
686
|
-
producer:
|
687
|
-
name: NTT Resonant
|
688
|
-
url: http://goo.ne.jp
|
689
|
-
-
|
690
|
-
user_agent: Mozilla/5.0 (iPhone; U; CPU iPhone OS 4_0_1 like Mac OS X; en-us) AppleWebKit/537.4 (KHTML, like Gecko; Google Page Speed Insights) Version/4.0.5 Mobile/8A306 Safari/6531.22.7
|
691
|
-
bot:
|
692
|
-
name: Google PageSpeed Insights
|
693
|
-
category: Site Monitor
|
694
|
-
url: http://developers.google.com/speed/pagespeed/insights/
|
695
|
-
producer:
|
696
|
-
name: Google Inc.
|
697
|
-
url: http://www.google.com
|
698
|
-
-
|
699
|
-
user_agent: Mozilla/5.0 (Windows NT 5.1) AppleWebKit/535.1 (KHTML, like Gecko) Chrome/14.0.835.202 Safari/535.1 google_partner_monitoring FWSzVTDDBz14547302713138T
|
700
|
-
bot:
|
701
|
-
name: Google Partner Monitoring
|
702
|
-
category: Site Monitor
|
703
|
-
url:
|
704
|
-
producer:
|
705
|
-
name: Google Inc.
|
706
|
-
url: http://www.google.com
|
707
|
-
-
|
708
|
-
user_agent: AdsBot-Google (+http://www.google.com/adsbot.html)
|
709
|
-
bot:
|
710
|
-
name: Googlebot
|
711
|
-
category: Search bot
|
712
|
-
url: http://www.google.com/bot.html
|
713
|
-
producer:
|
714
|
-
name: Google Inc.
|
715
|
-
url: http://www.google.com
|
716
|
-
-
|
717
|
-
user_agent: AdsBot-Google-Mobile (+http://www.google.com/mobile/adsbot.html) Mozilla (iPhone; U; CPU iPhone OS 3 0 like Mac OS X) AppleWebKit (KHTML, like Gecko) Mobile Safari
|
718
|
-
bot:
|
719
|
-
name: Googlebot
|
720
|
-
category: Search bot
|
721
|
-
url: http://www.google.com/bot.html
|
722
|
-
producer:
|
723
|
-
name: Google Inc.
|
724
|
-
url: http://www.google.com
|
725
|
-
-
|
726
|
-
user_agent: DoCoMo/2.0 N905i(c100;TB;W24H16) (compatible; Googlebot-Mobile/2.1; +http://www.google.com/bot.html)
|
727
|
-
bot:
|
728
|
-
name: Googlebot
|
729
|
-
category: Search bot
|
730
|
-
url: http://www.google.com/bot.html
|
731
|
-
producer:
|
732
|
-
name: Google Inc.
|
733
|
-
url: http://www.google.com
|
734
|
-
-
|
735
|
-
user_agent: Feedfetcher-Google; (+http://www.google.com/feedfetcher.html; 19 subscribers; feed-id=13965549748850348809)
|
736
|
-
bot:
|
737
|
-
name: Googlebot
|
738
|
-
category: Search bot
|
739
|
-
url: http://www.google.com/bot.html
|
740
|
-
producer:
|
741
|
-
name: Google Inc.
|
742
|
-
url: http://www.google.com
|
743
|
-
-
|
744
|
-
user_agent: Feedfetcher-Google; (+http://www.google.com/feedfetcher.html; 2 subscribers; feed-id=17860707833818568603)
|
745
|
-
bot:
|
746
|
-
name: Googlebot
|
747
|
-
category: Search bot
|
748
|
-
url: http://www.google.com/bot.html
|
749
|
-
producer:
|
750
|
-
name: Google Inc.
|
751
|
-
url: http://www.google.com
|
752
|
-
-
|
753
|
-
user_agent: Feedfetcher-Google; (+http://www.google.com/feedfetcher.html; 375 subscribers; feed-id=15381863289700640853)
|
754
|
-
bot:
|
755
|
-
name: Googlebot
|
756
|
-
category: Search bot
|
757
|
-
url: http://www.google.com/bot.html
|
758
|
-
producer:
|
759
|
-
name: Google Inc.
|
760
|
-
url: http://www.google.com
|
761
|
-
-
|
762
|
-
user_agent: Googlebot (gocrawl v0.4)
|
763
|
-
bot:
|
764
|
-
name: Googlebot
|
765
|
-
category: Search bot
|
766
|
-
url: http://www.google.com/bot.html
|
767
|
-
producer:
|
768
|
-
name: Google Inc.
|
769
|
-
url: http://www.google.com
|
770
|
-
-
|
771
|
-
user_agent: Googlebot-Image/1.0
|
772
|
-
bot:
|
773
|
-
name: Googlebot
|
774
|
-
category: Search bot
|
775
|
-
url: http://www.google.com/bot.html
|
776
|
-
producer:
|
777
|
-
name: Google Inc.
|
778
|
-
url: http://www.google.com
|
779
|
-
-
|
780
|
-
user_agent: Googlebot-News (2.3.3, ruby 1.9.3 (2013-11-22))
|
781
|
-
bot:
|
782
|
-
name: Googlebot
|
783
|
-
category: Search bot
|
784
|
-
url: http://www.google.com/bot.html
|
785
|
-
producer:
|
786
|
-
name: Google Inc.
|
787
|
-
url: http://www.google.com
|
788
|
-
-
|
789
|
-
user_agent: Googlebot-Video/1.0
|
790
|
-
bot:
|
791
|
-
name: Googlebot
|
792
|
-
category: Search bot
|
793
|
-
url: http://www.google.com/bot.html
|
794
|
-
producer:
|
795
|
-
name: Google Inc.
|
796
|
-
url: http://www.google.com
|
797
|
-
-
|
798
|
-
user_agent: Googlebot/2.1 (http://www.googlebot.com/bot.html)
|
799
|
-
bot:
|
800
|
-
name: Googlebot
|
801
|
-
category: Search bot
|
802
|
-
url: http://www.google.com/bot.html
|
803
|
-
producer:
|
804
|
-
name: Google Inc.
|
805
|
-
url: http://www.google.com
|
806
|
-
-
|
807
|
-
user_agent: Googlebot/Nutch-1.7
|
808
|
-
bot:
|
809
|
-
name: Googlebot
|
810
|
-
category: Search bot
|
811
|
-
url: http://www.google.com/bot.html
|
812
|
-
producer:
|
813
|
-
name: Google Inc.
|
814
|
-
url: http://www.google.com
|
815
|
-
-
|
816
|
-
user_agent: GoogleProducer; (+http://goo.gl/7y4SX)
|
817
|
-
bot:
|
818
|
-
name: Googlebot
|
819
|
-
category: Search bot
|
820
|
-
url: http://www.google.com/bot.html
|
821
|
-
producer:
|
822
|
-
name: Google Inc.
|
823
|
-
url: http://www.google.com
|
824
|
-
-
|
825
|
-
user_agent: Mediapartners-Google
|
826
|
-
bot:
|
827
|
-
name: Googlebot
|
828
|
-
category: Search bot
|
829
|
-
url: http://www.google.com/bot.html
|
830
|
-
producer:
|
831
|
-
name: Google Inc.
|
832
|
-
url: http://www.google.com
|
833
|
-
-
|
834
|
-
user_agent: Mozilla/5.0 (compatible) Feedfetcher-Google;(+http://www.google.com/feedfetcher.html)
|
835
|
-
bot:
|
836
|
-
name: Googlebot
|
837
|
-
category: Search bot
|
838
|
-
url: http://www.google.com/bot.html
|
839
|
-
producer:
|
840
|
-
name: Google Inc.
|
841
|
-
url: http://www.google.com
|
842
|
-
-
|
843
|
-
user_agent: Mozilla/5.0 (compatible; Googlebot/2.1; +http://www.google.com/bot.html)
|
844
|
-
bot:
|
845
|
-
name: Googlebot
|
846
|
-
category: Search bot
|
847
|
-
url: http://www.google.com/bot.html
|
848
|
-
producer:
|
849
|
-
name: Google Inc.
|
850
|
-
url: http://www.google.com
|
851
|
-
-
|
852
|
-
user_agent: Mozilla/5.0 (iPhone; CPU iPhone OS 6_0 like Mac OS X) AppleWebKit/536.26 (KHTML, like Gecko) Version/6.0 Mobile/10A5376e Safari/8536.25 (compatible; Googlebot-Mobile/2.1; +http://www.google.com/bot.html)
|
853
|
-
bot:
|
854
|
-
name: Googlebot
|
855
|
-
category: Search bot
|
856
|
-
url: http://www.google.com/bot.html
|
857
|
-
producer:
|
858
|
-
name: Google Inc.
|
859
|
-
url: http://www.google.com
|
860
|
-
-
|
861
|
-
user_agent: Mozilla/5.0 (Linux; Android 4.0.4; Galaxy Nexus Build/IMM76B) AppleWebKit/537.36 (KHTML, like Gecko; Google-Publisher-Plugin) Chrome/27.0.1453 Mobile Safari/537.36
|
862
|
-
bot:
|
863
|
-
name: Googlebot
|
864
|
-
category: Search bot
|
865
|
-
url: http://www.google.com/bot.html
|
866
|
-
producer:
|
867
|
-
name: Google Inc.
|
868
|
-
url: http://www.google.com
|
869
|
-
-
|
870
|
-
user_agent: Mozilla/5.0 (Windows NT 6.1; rv:6.0) Gecko/20110814 Firefox/6.0 Google (+https://developers.google.com/+/web/snippet/)
|
871
|
-
bot:
|
872
|
-
name: Googlebot
|
873
|
-
category: Search bot
|
874
|
-
url: http://www.google.com/bot.html
|
875
|
-
producer:
|
876
|
-
name: Google Inc.
|
877
|
-
url: http://www.google.com
|
878
|
-
-
|
879
|
-
user_agent: Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko; Google Web Preview) Chrome/27.0.1453 Safari/537.36
|
880
|
-
bot:
|
881
|
-
name: Googlebot
|
882
|
-
category: Search bot
|
883
|
-
url: http://www.google.com/bot.html
|
884
|
-
producer:
|
885
|
-
name: Google Inc.
|
886
|
-
url: http://www.google.com
|
887
|
-
-
|
888
|
-
user_agent: Mozilla/5.0 AppleWebKit/537.36 (KHTML, like Gecko; compatible; Googlebot/2.1; +http://www.google.com/bot.html) Safari/537.36
|
889
|
-
bot:
|
890
|
-
name: Googlebot
|
891
|
-
category: Search bot
|
892
|
-
url: http://www.google.com/bot.html
|
893
|
-
producer:
|
894
|
-
name: Google Inc.
|
895
|
-
url: http://www.google.com
|
896
|
-
-
|
897
|
-
user_agent: SAMSUNG-SGH-E250/1.0 Profile/MIDP-2.0 Configuration/CLDC-1.1 UP.Browser/6.2.3.3.c.1.101 (GUI) MMP/2.0 (compatible; Googlebot-Mobile/2.1; +http://www.google.com/bot.html)
|
898
|
-
bot:
|
899
|
-
name: Googlebot
|
900
|
-
category: Search bot
|
901
|
-
url: http://www.google.com/bot.html
|
902
|
-
producer:
|
903
|
-
name: Google Inc.
|
904
|
-
url: http://www.google.com
|
905
|
-
-
|
906
|
-
user_agent: HTTPMon/1.0b (http://www.httpmon.com)
|
907
|
-
bot:
|
908
|
-
name: HTTPMon
|
909
|
-
category: Site Monitor
|
910
|
-
url: http://www.httpmon.com
|
911
|
-
producer:
|
912
|
-
name: towards GmbH
|
913
|
-
url: http://www.towards.ch/
|
914
|
-
-
|
915
|
-
user_agent: 'flieder - neofonie heritrix/1.14.3 (+http://spider.neofonie.de)'
|
916
|
-
bot:
|
917
|
-
name: Heritrix
|
918
|
-
category: Crawler
|
919
|
-
url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
|
920
|
-
producer:
|
921
|
-
name: The Internet Archive
|
922
|
-
url: http://www.archive.org
|
923
|
-
-
|
924
|
-
user_agent: Mozilla/5.0 (compatible; heritrix/1.14.4 +http://webarhive.nlc.gov.cn)
|
925
|
-
bot:
|
926
|
-
name: Heritrix
|
927
|
-
category: Crawler
|
928
|
-
url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
|
929
|
-
producer:
|
930
|
-
name: The Internet Archive
|
931
|
-
url: http://www.archive.org
|
932
|
-
-
|
933
|
-
user_agent: Mozilla/5.0 (compatible; heritrix/1.14.4 +http://www.dla-marbach.de)
|
934
|
-
bot:
|
935
|
-
name: Heritrix
|
936
|
-
category: Crawler
|
937
|
-
url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
|
938
|
-
producer:
|
939
|
-
name: The Internet Archive
|
940
|
-
url: http://www.archive.org
|
941
|
-
-
|
942
|
-
user_agent: mozilla/5.0 (compatible; heritrix/1.3.0 http://archive.crawler.org)
|
943
|
-
bot:
|
944
|
-
name: Heritrix
|
945
|
-
category: Crawler
|
946
|
-
url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
|
947
|
-
producer:
|
948
|
-
name: The Internet Archive
|
949
|
-
url: http://www.archive.org
|
950
|
-
-
|
951
|
-
user_agent: Mozilla/5.0 (compatible; heritrix/3.1.1 +http://www.baidu.com)
|
952
|
-
bot:
|
953
|
-
name: Heritrix
|
954
|
-
category: Crawler
|
955
|
-
url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
|
956
|
-
producer:
|
957
|
-
name: The Internet Archive
|
958
|
-
url: http://www.archive.org
|
959
|
-
-
|
960
|
-
user_agent: Mozilla/5.0 (compatible; heritrix/3.1.1 +http://www.run4dom.com)
|
961
|
-
bot:
|
962
|
-
name: Heritrix
|
963
|
-
category: Crawler
|
964
|
-
url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
|
965
|
-
producer:
|
966
|
-
name: The Internet Archive
|
967
|
-
url: http://www.archive.org
|
968
|
-
-
|
969
|
-
user_agent: Mozilla/5.0 (compatible; heritrix/3.1.2-SNAPSHOT-20130207.001528 +http://webarchiv.cz/kontakty/)
|
970
|
-
bot:
|
971
|
-
name: Heritrix
|
972
|
-
category: Crawler
|
973
|
-
url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
|
974
|
-
producer:
|
975
|
-
name: The Internet Archive
|
976
|
-
url: http://www.archive.org
|
977
|
-
-
|
978
|
-
user_agent: Mozilla/5.0 (compatible; worio bot heritrix/1.10.0 +http://worio.com)
|
979
|
-
bot:
|
980
|
-
name: Heritrix
|
981
|
-
category: Crawler
|
982
|
-
url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
|
983
|
-
producer:
|
984
|
-
name: The Internet Archive
|
985
|
-
url: http://www.archive.org
|
986
|
-
-
|
987
|
-
user_agent: HubPages V0.2.2 (http://hubpages.com/help/crawlingpolicy)
|
988
|
-
bot:
|
989
|
-
name: HubPages
|
990
|
-
category: Crawler
|
991
|
-
url: http://hubpages.com/help/crawlingpolicy
|
992
|
-
producer:
|
993
|
-
name: HubPages
|
994
|
-
url: http://hubpages.com/
|
995
|
-
-
|
996
|
-
user_agent: ICC-Crawler/2.0 (Mozilla-compatible; ; http://www.nict.go.jp/en/univ-com/plan/crawl.html)
|
997
|
-
bot:
|
998
|
-
name: ICC-Crawler
|
999
|
-
category: Crawler
|
1000
|
-
url: http://www.nict.go.jp/en/univ-com/plan/crawl.html
|
1001
|
-
producer:
|
1002
|
-
name:
|
1003
|
-
url:
|
1004
|
-
-
|
1005
|
-
user_agent: iisbot/1.0 (+http://www.iis.net/iisbot.html)
|
1006
|
-
bot:
|
1007
|
-
name: IIS Site Analysis
|
1008
|
-
category: Crawler
|
1009
|
-
url: http://www.iis.net/iisbot.html
|
1010
|
-
producer:
|
1011
|
-
name: Microsoft Corporation
|
1012
|
-
url: http://www.microsoft.com
|
1013
|
-
-
|
1014
|
-
user_agent: kouio.com RSS reader
|
1015
|
-
bot:
|
1016
|
-
name: Kouio
|
1017
|
-
url: http://kouio.com/
|
1018
|
-
category: Feed Fetcher
|
1019
|
-
producer:
|
1020
|
-
name:
|
1021
|
-
url:
|
1022
|
-
-
|
1023
|
-
user_agent: 'kouio.com RSS reader - 6 subscribers'
|
1024
|
-
bot:
|
1025
|
-
name: Kouio
|
1026
|
-
url: http://kouio.com/
|
1027
|
-
category: Feed Fetcher
|
1028
|
-
producer:
|
1029
|
-
name:
|
1030
|
-
url:
|
1031
|
-
-
|
1032
|
-
user_agent: 'ltx71 - (http://ltx71.com/)'
|
1033
|
-
bot:
|
1034
|
-
name: LTX71
|
1035
|
-
url: http://ltx71.com/
|
1036
|
-
producer:
|
1037
|
-
name:
|
1038
|
-
url:
|
1039
|
-
-
|
1040
|
-
user_agent: larbin_2.6.3 larbin2.6.3@unspecified.mail
|
1041
|
-
bot:
|
1042
|
-
name: Larbin web crawler
|
1043
|
-
category: Crawler
|
1044
|
-
url: http://larbin.sourceforge.net
|
1045
|
-
producer:
|
1046
|
-
name:
|
1047
|
-
url:
|
1048
|
-
-
|
1049
|
-
user_agent: linkdex.com/v2.0 and linkdex.com/v2.1
|
1050
|
-
bot:
|
1051
|
-
name: Linkdex Bot
|
1052
|
-
category: Search bot
|
1053
|
-
url: http://www.linkdex.com/bots
|
1054
|
-
producer:
|
1055
|
-
name: Mojeek Ltd.
|
1056
|
-
url: http://www.mojeek.com
|
1057
|
-
-
|
1058
|
-
user_agent: Mozilla/5.0 (compatible; linkdexbot/2.0; +http://www.linkdex.com/about/bots/)
|
1059
|
-
bot:
|
1060
|
-
name: Linkdex Bot
|
1061
|
-
category: Search bot
|
1062
|
-
url: http://www.linkdex.com/bots
|
1063
|
-
producer:
|
1064
|
-
name: Mojeek Ltd.
|
1065
|
-
url: http://www.mojeek.com
|
1066
|
-
-
|
1067
|
-
user_agent: Mozilla/5.0 (iPhone; U; CPU iPhone OS 4_1 like Mac OS X; en-us) AppleWebKit/532.9 (KHTML, like Gecko) Version/4.0.5 Mobile/8B117 Safari/6531.22.7 (compatible; linkdexbot-mobile/2.1; +http://www.linkdex.com/about/bots/)
|
1068
|
-
bot:
|
1069
|
-
name: Linkdex Bot
|
1070
|
-
category: Search bot
|
1071
|
-
url: http://www.linkdex.com/bots
|
1072
|
-
producer:
|
1073
|
-
name: Mojeek Ltd.
|
1074
|
-
url: http://www.mojeek.com
|
1075
|
-
-
|
1076
|
-
user_agent: LinkedInBot/1.0 (compatible; Mozilla/5.0; Jakarta Commons-HttpClient/3.1 +http://www.linkedin.com)
|
1077
|
-
bot:
|
1078
|
-
name: LinkedIn Bot
|
1079
|
-
category: Social Media Agent
|
1080
|
-
url: http://www.linkedin.com
|
1081
|
-
producer:
|
1082
|
-
name: LinkedIn
|
1083
|
-
url: http://www.linkedin.com
|
1084
|
-
-
|
1085
|
-
user_agent: Mozilla/5.0 (compatible; MJ12bot/v1.4.4; http://www.majestic12.co.uk/bot.php?+)
|
1086
|
-
bot:
|
1087
|
-
name: MJ12 Bot
|
1088
|
-
category: Search bot
|
1089
|
-
url: http://majestic12.co.uk/bot.php
|
1090
|
-
producer:
|
1091
|
-
name: Majestic-12
|
1092
|
-
url: http://majestic12.co.uk
|
1093
|
-
-
|
1094
|
-
user_agent: magpie-crawler/1.1 (U; Linux amd64; en-GB; +http://www.brandwatch.net)
|
1095
|
-
bot:
|
1096
|
-
name: Magpie-Crawler
|
1097
|
-
category: Social Media Agent
|
1098
|
-
url: http://www.brandwatch.com/magpie-crawler/
|
1099
|
-
producer:
|
1100
|
-
name: Brandwatch
|
1101
|
-
url: http://www.brandwatch.com
|
1102
|
-
-
|
1103
|
-
user_agent: MagpieRSS/0.72 (+http://magpierss.sf.net)
|
1104
|
-
bot:
|
1105
|
-
name: MagpieRSS
|
1106
|
-
url: http://magpierss.sourceforge.net/
|
1107
|
-
category: Feed Parser
|
1108
|
-
producer:
|
1109
|
-
name:
|
1110
|
-
url:
|
1111
|
-
-
|
1112
|
-
user_agent: Mozilla/5.0 (compatible; Linux x86_64; Mail.RU_Bot/2.0; +http://go.mail.ru/help/robots)
|
1113
|
-
bot:
|
1114
|
-
name: Mail.Ru Bot
|
1115
|
-
category: Search bot
|
1116
|
-
url: http://help.mail.ru/webmaster/indexing/robots/types_robots
|
1117
|
-
producer:
|
1118
|
-
name: Mail.Ru Group
|
1119
|
-
url: http://corp.mail.ru
|
1120
|
-
-
|
1121
|
-
user_agent: Mozilla/5.0 (compatible; Linux x86_64; Mail.RU_Bot/Fast/2.0; +http://go.mail.ru/help/robots)
|
1122
|
-
bot:
|
1123
|
-
name: Mail.Ru Bot
|
1124
|
-
category: Search bot
|
1125
|
-
url: http://help.mail.ru/webmaster/indexing/robots/types_robots
|
1126
|
-
producer:
|
1127
|
-
name: Mail.Ru Group
|
1128
|
-
url: http://corp.mail.ru
|
1129
|
-
-
|
1130
|
-
user_agent: Mozilla/5.0 (compatible; meanpathbot/1.0; +http://www.meanpath.com/meanpathbot.html)
|
1131
|
-
bot:
|
1132
|
-
name: Meanpath Bot
|
1133
|
-
category: Search bot
|
1134
|
-
url: http://www.meanpath.com/meanpathbot.html
|
1135
|
-
producer:
|
1136
|
-
name: Meanpath
|
1137
|
-
url: http://www.meanpath.com
|
1138
|
-
-
|
1139
|
-
user_agent: Mozilla/5.0 (compatible; MixrankBot; crawler@mixrank.com)
|
1140
|
-
bot:
|
1141
|
-
name: Mixrank Bot
|
1142
|
-
category: Crawler
|
1143
|
-
url: http://mixrank.com
|
1144
|
-
producer:
|
1145
|
-
name: Online Media Group, Inc.
|
1146
|
-
url:
|
1147
|
-
-
|
1148
|
-
user_agent: Mozilla/5.0 (compatible; MojeekBot/0.6; http://www.mojeek.com/bot.html)
|
1149
|
-
bot:
|
1150
|
-
name: MojeekBot
|
1151
|
-
category: Search bot
|
1152
|
-
url: http://www.mojeek.com/bot.html
|
1153
|
-
producer:
|
1154
|
-
name: Mojeek Ltd.
|
1155
|
-
url: http://www.mojeek.com
|
1156
|
-
-
|
1157
|
-
user_agent: 'Mozilla/5.0 (compatible; www.monitor.us - free monitoring service; http://www.monitor.us)'
|
1158
|
-
bot:
|
1159
|
-
name: Monitor.Us
|
1160
|
-
category: Site Monitor
|
1161
|
-
url: http://www.monitor.us
|
1162
|
-
producer:
|
1163
|
-
name: Monitor.Us
|
1164
|
-
url: http://www.monitor.us
|
1165
|
-
-
|
1166
|
-
user_agent: nlcrawler/1.0 (+http://northernlight.com/)
|
1167
|
-
bot:
|
1168
|
-
name: NLCrawler
|
1169
|
-
category: Crawler
|
1170
|
-
url:
|
1171
|
-
producer:
|
1172
|
-
name: Northern Light
|
1173
|
-
url: http://northernlight.com
|
1174
|
-
-
|
1175
|
-
user_agent: NalezenCzBot/1.0 (http://www.nalezen.cz/about-crawler)
|
1176
|
-
bot:
|
1177
|
-
name: NalezenCzBot
|
1178
|
-
category: Crawler
|
1179
|
-
url: http://www.nalezen.cz/about-crawler
|
1180
|
-
producer:
|
1181
|
-
name: Jaroslav Kuboš
|
1182
|
-
url:
|
1183
|
-
-
|
1184
|
-
user_agent: NetLyzer FastProbe
|
1185
|
-
bot:
|
1186
|
-
name: NetLyzer FastProbe
|
1187
|
-
-
|
1188
|
-
user_agent: Mozilla/4.0 (compatible; Netcraft Web Server Survey)
|
1189
|
-
bot:
|
1190
|
-
name: Netcraft Survey Bot
|
1191
|
-
category: Search bot
|
1192
|
-
url:
|
1193
|
-
producer:
|
1194
|
-
name: Netcraft
|
1195
|
-
url: http://www.netcraft.com
|
1196
|
-
-
|
1197
|
-
user_agent: Netvibes (http://www.netvibes.com)
|
1198
|
-
bot:
|
1199
|
-
name: Netvibes
|
1200
|
-
url: http://www.netvibes.com/
|
1201
|
-
category: Feed Fetcher
|
1202
|
-
producer:
|
1203
|
-
name:
|
1204
|
-
url:
|
1205
|
-
-
|
1206
|
-
user_agent: 'Netvibes (http://www.netvibes.com/; 8 subscribers; feedID: 2244192)'
|
1207
|
-
bot:
|
1208
|
-
name: Netvibes
|
1209
|
-
url: http://www.netvibes.com/
|
1210
|
-
category: Feed Fetcher
|
1211
|
-
producer:
|
1212
|
-
name:
|
1213
|
-
url:
|
1214
|
-
-
|
1215
|
-
user_agent: 'NewsBlur Favicon Fetcher - 7 subscribers - http://www.newsblur.com/site/1948420/analytics-piwik (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)'
|
1216
|
-
bot:
|
1217
|
-
name: NewsBlur
|
1218
|
-
url: http://www.newsblur.com
|
1219
|
-
category: Feed Fetcher
|
1220
|
-
producer:
|
1221
|
-
name:
|
1222
|
-
url:
|
1223
|
-
-
|
1224
|
-
user_agent: 'NewsBlur Feed Fetcher - 7 subscribers - http://www.newsblur.com/site/1948420/analytics-piwik (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)'
|
1225
|
-
bot:
|
1226
|
-
name: NewsBlur
|
1227
|
-
url: http://www.newsblur.com
|
1228
|
-
category: Feed Fetcher
|
1229
|
-
producer:
|
1230
|
-
name:
|
1231
|
-
url:
|
1232
|
-
-
|
1233
|
-
user_agent: NewsBlur Feed Finder (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)
|
1234
|
-
bot:
|
1235
|
-
name: NewsBlur
|
1236
|
-
url: http://www.newsblur.com
|
1237
|
-
category: Feed Fetcher
|
1238
|
-
producer:
|
1239
|
-
name:
|
1240
|
-
url:
|
1241
|
-
-
|
1242
|
-
user_agent: 'NewsBlur Page Fetcher - 7 subscribers - http://www.newsblur.com/site/3966817/analytics-piwik (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)'
|
1243
|
-
bot:
|
1244
|
-
name: NewsBlur
|
1245
|
-
url: http://www.newsblur.com
|
1246
|
-
category: Feed Fetcher
|
1247
|
-
producer:
|
1248
|
-
name:
|
1249
|
-
url:
|
1250
|
-
-
|
1251
|
-
user_agent: NewsGatorOnline/2.0 (http://www.newsgator.com; 2 subscribers)
|
1252
|
-
bot:
|
1253
|
-
name: NewsGator
|
1254
|
-
url: http://www.newsgator.com
|
1255
|
-
category: Feed Fetcher
|
1256
|
-
producer:
|
1257
|
-
name:
|
1258
|
-
url:
|
1259
|
-
-
|
1260
|
-
user_agent: 5acd734a-1ed3-4a17-ad9d-0b09ae7bc2d2/Nutch-1.7
|
1261
|
-
bot:
|
1262
|
-
name: Nutch-based Bot
|
1263
|
-
category: Crawler
|
1264
|
-
url: https://nutch.apache.org
|
1265
|
-
producer:
|
1266
|
-
name: The Apache Software Foundation
|
1267
|
-
url: http://www.apache.org/foundation/
|
1268
|
-
-
|
1269
|
-
user_agent: CB/Nutch-1.7
|
1270
|
-
bot:
|
1271
|
-
name: Nutch-based Bot
|
1272
|
-
category: Crawler
|
1273
|
-
url: https://nutch.apache.org
|
1274
|
-
producer:
|
1275
|
-
name: The Apache Software Foundation
|
1276
|
-
url: http://www.apache.org/foundation/
|
1277
|
-
-
|
1278
|
-
user_agent: Mozilla/5.0 (compatible; summers;)/Nutch-1.7
|
1279
|
-
bot:
|
1280
|
-
name: Nutch-based Bot
|
1281
|
-
category: Crawler
|
1282
|
-
url: https://nutch.apache.org
|
1283
|
-
producer:
|
1284
|
-
name: The Apache Software Foundation
|
1285
|
-
url: http://www.apache.org/foundation/
|
1286
|
-
-
|
1287
|
-
user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1; zh-CN; rv:1.9.2.8) Firefox/3.6.8/Nutch-1.7
|
1288
|
-
bot:
|
1289
|
-
name: Nutch-based Bot
|
1290
|
-
category: Crawler
|
1291
|
-
url: https://nutch.apache.org
|
1292
|
-
producer:
|
1293
|
-
name: The Apache Software Foundation
|
1294
|
-
url: http://www.apache.org/foundation/
|
1295
|
-
-
|
1296
|
-
user_agent: My Nutch Spider/Nutch-1.6
|
1297
|
-
bot:
|
1298
|
-
name: Nutch-based Bot
|
1299
|
-
category: Crawler
|
1300
|
-
url: https://nutch.apache.org
|
1301
|
-
producer:
|
1302
|
-
name: The Apache Software Foundation
|
1303
|
-
url: http://www.apache.org/foundation/
|
1304
|
-
-
|
1305
|
-
user_agent: MySpider/Nutch-2.2
|
1306
|
-
bot:
|
1307
|
-
name: Nutch-based Bot
|
1308
|
-
category: Crawler
|
1309
|
-
url: https://nutch.apache.org
|
1310
|
-
producer:
|
1311
|
-
name: The Apache Software Foundation
|
1312
|
-
url: http://www.apache.org/foundation/
|
1313
|
-
-
|
1314
|
-
user_agent: Nutch12/Nutch-1.2
|
1315
|
-
bot:
|
1316
|
-
name: Nutch-based Bot
|
1317
|
-
category: Crawler
|
1318
|
-
url: https://nutch.apache.org
|
1319
|
-
producer:
|
1320
|
-
name: The Apache Software Foundation
|
1321
|
-
url: http://www.apache.org/foundation/
|
1322
|
-
-
|
1323
|
-
user_agent: NutchSpider/Nutch-1.4
|
1324
|
-
bot:
|
1325
|
-
name: Nutch-based Bot
|
1326
|
-
category: Crawler
|
1327
|
-
url: https://nutch.apache.org
|
1328
|
-
producer:
|
1329
|
-
name: The Apache Software Foundation
|
1330
|
-
url: http://www.apache.org/foundation/
|
1331
|
-
-
|
1332
|
-
user_agent: spider/Nutch-1.5.1 (spider; http://www.xxx.com)
|
1333
|
-
bot:
|
1334
|
-
name: Nutch-based Bot
|
1335
|
-
category: Crawler
|
1336
|
-
url: https://nutch.apache.org
|
1337
|
-
producer:
|
1338
|
-
name: The Apache Software Foundation
|
1339
|
-
url: http://www.apache.org/foundation/
|
1340
|
-
-
|
1341
|
-
user_agent: Spider/Nutch-2.3-SNAPSHOT (Webcrawler)
|
1342
|
-
bot:
|
1343
|
-
name: Nutch-based Bot
|
1344
|
-
category: Crawler
|
1345
|
-
url: https://nutch.apache.org
|
1346
|
-
producer:
|
1347
|
-
name: The Apache Software Foundation
|
1348
|
-
url: http://www.apache.org/foundation/
|
1349
|
-
-
|
1350
|
-
user_agent: testnutch/Nutch-1.8
|
1351
|
-
bot:
|
1352
|
-
name: Nutch-based Bot
|
1353
|
-
category: Crawler
|
1354
|
-
url: https://nutch.apache.org
|
1355
|
-
producer:
|
1356
|
-
name: The Apache Software Foundation
|
1357
|
-
url: http://www.apache.org/foundation/
|
1358
|
-
-
|
1359
|
-
user_agent: Your Nutch Spider/Nutch-2.2.1
|
1360
|
-
bot:
|
1361
|
-
name: Nutch-based Bot
|
1362
|
-
category: Crawler
|
1363
|
-
url: https://nutch.apache.org
|
1364
|
-
producer:
|
1365
|
-
name: The Apache Software Foundation
|
1366
|
-
url: http://www.apache.org/foundation/
|
1367
|
-
-
|
1368
|
-
user_agent: your sipder name/Nutch-1.7
|
1369
|
-
bot:
|
1370
|
-
name: Nutch-based Bot
|
1371
|
-
category: Crawler
|
1372
|
-
url: https://nutch.apache.org
|
1373
|
-
producer:
|
1374
|
-
name: The Apache Software Foundation
|
1375
|
-
url: http://www.apache.org/foundation/
|
1376
|
-
-
|
1377
|
-
user_agent: omgilibot/0.3 +http://www.omgili.com/Crawler.html
|
1378
|
-
bot:
|
1379
|
-
name: Omgili bot
|
1380
|
-
category: Search bot
|
1381
|
-
url: http://www.omgili.com/Crawler.html
|
1382
|
-
producer:
|
1383
|
-
name: Omgili
|
1384
|
-
url: http://www.omgili.com
|
1385
|
-
-
|
1386
|
-
user_agent: Mozilla/5.0 (compatible; spbot/4.0.9; +http://OpenLinkProfiler.org/bot )
|
1387
|
-
bot:
|
1388
|
-
name: OpenLinkProfiler
|
1389
|
-
category: Crawler
|
1390
|
-
url: http://openlinkprofiler.org/bot
|
1391
|
-
producer:
|
1392
|
-
name: Axandra GmbH
|
1393
|
-
url: http://www.axandra.com
|
1394
|
-
-
|
1395
|
-
user_agent: OpenWebSpider v0.1.4 (http://www.openwebspider.org/)
|
1396
|
-
bot:
|
1397
|
-
name: OpenWebSpider
|
1398
|
-
category: Crawler
|
1399
|
-
url: http://www.openwebspider.org
|
1400
|
-
producer:
|
1401
|
-
name: OpenWebSpider Lab
|
1402
|
-
url: http://lab.openwebspider.org
|
1403
|
-
-
|
1404
|
-
user_agent: Mozilla/5.0 (compatible; OpenindexSpider; +http://www.openindex.io/en/webmasters/spider.html)
|
1405
|
-
bot:
|
1406
|
-
name: Openindex Spider
|
1407
|
-
category: Search bot
|
1408
|
-
url: http://www.openindex.io/en/webmasters/spider.html
|
1409
|
-
producer:
|
1410
|
-
name: Openindex B.V.
|
1411
|
-
url: http://www.openindex.io
|
1412
|
-
-
|
1413
|
-
user_agent: Mozilla/5.0 (compatible; OrangeBot-Collector/2.0; support.orangebot@orange.com)
|
1414
|
-
bot:
|
1415
|
-
name: Orange Bot
|
1416
|
-
category: Search bot
|
1417
|
-
url: http://lemoteur.orange.fr
|
1418
|
-
producer:
|
1419
|
-
name: Orange
|
1420
|
-
url: http://www.orange.fr
|
1421
|
-
-
|
1422
|
-
user_agent: Mozilla/5.0 (compatible; OrangeBot/2.0; support.orangebot@orange.com)
|
1423
|
-
bot:
|
1424
|
-
name: Orange Bot
|
1425
|
-
category: Search bot
|
1426
|
-
url: http://lemoteur.orange.fr
|
1427
|
-
producer:
|
1428
|
-
name: Orange
|
1429
|
-
url: http://www.orange.fr
|
1430
|
-
-
|
1431
|
-
user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1; fr; rv:1.8.1) VoilaBot BETA 1.2 (support.voilabot@orange-ftgroup.com)
|
1432
|
-
bot:
|
1433
|
-
name: Orange Bot
|
1434
|
-
category: Search bot
|
1435
|
-
url: http://lemoteur.orange.fr
|
1436
|
-
producer:
|
1437
|
-
name: Orange
|
1438
|
-
url: http://www.orange.fr
|
1439
|
-
-
|
1440
|
-
user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1;fr;rv:1.8.1) VoilaBotCollector BETA 0.1 (http://www.voila.com/)
|
1441
|
-
bot:
|
1442
|
-
name: Orange Bot
|
1443
|
-
category: Search bot
|
1444
|
-
url: http://lemoteur.orange.fr
|
1445
|
-
producer:
|
1446
|
-
name: Orange
|
1447
|
-
url: http://www.orange.fr
|
1448
|
-
-
|
1449
|
-
user_agent: Mozilla/5.0 (Java) outbrain
|
1450
|
-
bot:
|
1451
|
-
name: Outbrain
|
1452
|
-
category: Crawler
|
1453
|
-
url:
|
1454
|
-
producer:
|
1455
|
-
name: Outbrain
|
1456
|
-
url: http://www.outbrain.com/
|
1457
|
-
-
|
1458
|
-
user_agent: Mozilla/5.0 (compatible; phpservermon/3.1.1; +http://www.phpservermonitor.org)
|
1459
|
-
bot:
|
1460
|
-
name: PHP Server Monitor
|
1461
|
-
category: Site Monitor
|
1462
|
-
url: https://github.com/phpservermon/phpservermon
|
1463
|
-
producer:
|
1464
|
-
name: PHP Server Monitor
|
1465
|
-
url: http://www.phpservermonitor.org/
|
1466
|
-
-
|
1467
|
-
user_agent: Mozilla/5.0 (compatible; PaperLiBot/2.1; http://support.paper.li/entries/20023257-what-is-paper-li)
|
1468
|
-
bot:
|
1469
|
-
name: PaperLiBot
|
1470
|
-
category: Search bot
|
1471
|
-
url: http://support.paper.li/entries/20023257-what-is-paper-li
|
1472
|
-
producer:
|
1473
|
-
name: Smallrivers SA
|
1474
|
-
url: http://www.paper.li
|
1475
|
-
-
|
1476
|
-
user_agent: psbot-page (+http://www.picsearch.com/bot.html)
|
1477
|
-
bot:
|
1478
|
-
name: Picsearch bot
|
1479
|
-
category: Search bot
|
1480
|
-
url: http://www.picsearch.com/bot.html
|
1481
|
-
producer:
|
1482
|
-
name: Picsearch
|
1483
|
-
url: http://www.picsearch.com
|
1484
|
-
-
|
1485
|
-
user_agent: psbot/0.1 (+http://www.picsearch.com/bot.html)
|
1486
|
-
bot:
|
1487
|
-
name: Picsearch bot
|
1488
|
-
category: Search bot
|
1489
|
-
url: http://www.picsearch.com/bot.html
|
1490
|
-
producer:
|
1491
|
-
name: Picsearch
|
1492
|
-
url: http://www.picsearch.com
|
1493
|
-
-
|
1494
|
-
user_agent: Pingdom.com_bot_version_1.4_(http://www.pingdom.com/)
|
1495
|
-
bot:
|
1496
|
-
name: Pingdom Bot
|
1497
|
-
category: Site Monitor
|
1498
|
-
url:
|
1499
|
-
producer:
|
1500
|
-
name: Pingdom AB
|
1501
|
-
url: https://www.pingdom.com
|
1502
|
-
-
|
1503
|
-
user_agent: Pinterest/0.2 (+http://www.pinterest.com/)
|
1504
|
-
bot:
|
1505
|
-
name: Pinterest
|
1506
|
-
url:
|
1507
|
-
category: Crawler
|
1508
|
-
producer:
|
1509
|
-
name: Pinterest
|
1510
|
-
url: http://www.pinterest.com/
|
1511
|
-
-
|
1512
|
-
user_agent: QuerySeekerSpider ( http://queryseeker.com/bot.html )
|
1513
|
-
bot:
|
1514
|
-
name: QuerySeekerSpider
|
1515
|
-
category: Crawler
|
1516
|
-
url: http://queryseeker.com/bot.html
|
1517
|
-
producer:
|
1518
|
-
name: QueryEye Inc.
|
1519
|
-
url: http://queryeye.com
|
1520
|
-
-
|
1521
|
-
user_agent: ROI Hunter; https://api-dev.roihunter.com
|
1522
|
-
bot:
|
1523
|
-
name: ROI Hunter
|
1524
|
-
category: Crawler
|
1525
|
-
url:
|
1526
|
-
producer:
|
1527
|
-
name: Roihunter a.s.
|
1528
|
-
url: http://roihunter.com/
|
1529
|
-
-
|
1530
|
-
user_agent: Mozilla/5.0 (compatible; redditbot/1.0; +http://www.reddit.com/feedback)
|
1531
|
-
bot:
|
1532
|
-
name: Reddit Bot
|
1533
|
-
category: Social Media Agent
|
1534
|
-
url: http://www.reddit.com/feedback
|
1535
|
-
producer:
|
1536
|
-
name: reddit inc.
|
1537
|
-
url: http://www.reddit.com
|
1538
|
-
-
|
1539
|
-
user_agent: Mozilla/5.0 (compatible; rogerBot/1.0; UrlCrawler; http://www.seomoz.org/dp/rogerbot)
|
1540
|
-
bot:
|
1541
|
-
name: Rogerbot
|
1542
|
-
category: Crawler
|
1543
|
-
url: http://moz.com/help/pro/what-is-rogerbot-
|
1544
|
-
producer:
|
1545
|
-
name: SEOmoz, Inc.
|
1546
|
-
url: http://moz.com/
|
1547
|
-
-
|
1548
|
-
user_agent: rogerbot/1.0 (http://moz.com/help/pro/what-is-rogerbot-, rogerbot-crawler+shiny@moz.com)
|
1549
|
-
bot:
|
1550
|
-
name: Rogerbot
|
1551
|
-
category: Crawler
|
1552
|
-
url: http://moz.com/help/pro/what-is-rogerbot-
|
1553
|
-
producer:
|
1554
|
-
name: SEOmoz, Inc.
|
1555
|
-
url: http://moz.com/
|
1556
|
-
-
|
1557
|
-
user_agent: rogerbot/1.0 (http://www.moz.com/dp/rogerbot, rogerbot-crawler@moz.com)
|
1558
|
-
bot:
|
1559
|
-
name: Rogerbot
|
1560
|
-
category: Crawler
|
1561
|
-
url: http://moz.com/help/pro/what-is-rogerbot-
|
1562
|
-
producer:
|
1563
|
-
name: SEOmoz, Inc.
|
1564
|
-
url: http://moz.com/
|
1565
|
-
-
|
1566
|
-
user_agent: SEOENGWorldBot/1.0 (+http://www.seoengine.com/seoengbot.htm)
|
1567
|
-
bot:
|
1568
|
-
name: SEOENGBot
|
1569
|
-
category: Crawler
|
1570
|
-
url: http://www.seoengine.com/seoengbot.htm
|
1571
|
-
producer:
|
1572
|
-
name: SEO Engine
|
1573
|
-
url: http://www.seoengine.com
|
1574
|
-
-
|
1575
|
-
user_agent: Mozilla/5.0 (compatible; SISTRIX Crawler; http://crawler.sistrix.net/)
|
1576
|
-
bot:
|
1577
|
-
name: SISTRIX Crawler
|
1578
|
-
category: Crawler
|
1579
|
-
url: http://crawler.sistrix.net
|
1580
|
-
producer:
|
1581
|
-
name: SISTRIX GmbH
|
1582
|
-
url: http://www.sistrix.de
|
1583
|
-
-
|
1584
|
-
user_agent: Scrapy/1.0.3.post6+g2d688cd (+http://scrapy.org)
|
1585
|
-
bot:
|
1586
|
-
name: Scrapy
|
1587
|
-
category: Crawler
|
1588
|
-
url: http://scrapy.org
|
1589
|
-
-
|
1590
|
-
user_agent: Screaming Frog SEO Spider/2.22
|
1591
|
-
bot:
|
1592
|
-
name: Screaming Frog SEO Spider
|
1593
|
-
category: Crawler
|
1594
|
-
url: http://www.screamingfrog.co.uk/seo-spider
|
1595
|
-
producer:
|
1596
|
-
name: Screaming Frog Ltd
|
1597
|
-
url: http://www.screamingfrog.co.uk
|
1598
|
-
-
|
1599
|
-
user_agent: ScreenerBot Crawler Beta 2.0 (+http://www.ScreenerBot.com)
|
1600
|
-
bot:
|
1601
|
-
name: ScreenerBot
|
1602
|
-
category: Crawler
|
1603
|
-
url: http://www.screenerbot.com
|
1604
|
-
producer:
|
1605
|
-
name:
|
1606
|
-
url:
|
1607
|
-
-
|
1608
|
-
user_agent: Mozilla/5.0 (compatible; SemrushBot/0.97; +http://www.semrush.com/bot.html)
|
1609
|
-
bot:
|
1610
|
-
name: Semrush Bot
|
1611
|
-
category: Crawler
|
1612
|
-
url: http://www.semrush.com/bot.html
|
1613
|
-
producer:
|
1614
|
-
name: SEMrush
|
1615
|
-
url: http://www.semrush.com
|
1616
|
-
-
|
1617
|
-
user_agent: SensikaBot/x.33 (+http://sensika.com)
|
1618
|
-
bot:
|
1619
|
-
name: Sensika Bot
|
1620
|
-
category:
|
1621
|
-
url:
|
1622
|
-
producer:
|
1623
|
-
name: Sensika
|
1624
|
-
url: http://sensika.com
|
1625
|
-
-
|
1626
|
-
user_agent: Server Density Service Monitoring v2
|
1627
|
-
bot:
|
1628
|
-
name: Server Density
|
1629
|
-
-
|
1630
|
-
user_agent: Mozilla/5.0 (compatible; SeznamBot/3.1-test1; +http://fulltext.sblog.cz/)
|
1631
|
-
bot:
|
1632
|
-
name: Seznam Bot
|
1633
|
-
category: Search bot
|
1634
|
-
url: http://www.mapy.cz/cz/seznambot.html
|
1635
|
-
producer:
|
1636
|
-
name: Seznam.cz, a.s.
|
1637
|
-
url: http://www.seznam.cz/
|
1638
|
-
-
|
1639
|
-
user_agent: Mozilla/5.0 (compatible; SeznamBot/3.2-test1; +http://fulltext.sblog.cz/)
|
1640
|
-
bot:
|
1641
|
-
name: Seznam Bot
|
1642
|
-
category: Search bot
|
1643
|
-
url: http://www.mapy.cz/cz/seznambot.html
|
1644
|
-
producer:
|
1645
|
-
name: Seznam.cz, a.s.
|
1646
|
-
url: http://www.seznam.cz/
|
1647
|
-
-
|
1648
|
-
user_agent: Mozilla/5.0 (compatible; SeznamBot/3.2; +http://fulltext.sblog.cz/)
|
1649
|
-
bot:
|
1650
|
-
name: Seznam Bot
|
1651
|
-
category: Search bot
|
1652
|
-
url: http://www.mapy.cz/cz/seznambot.html
|
1653
|
-
producer:
|
1654
|
-
name: Seznam.cz, a.s.
|
1655
|
-
url: http://www.seznam.cz/
|
1656
|
-
-
|
1657
|
-
user_agent: SeznamBot/3.0 (+http://fulltext.sblog.cz/)
|
1658
|
-
bot:
|
1659
|
-
name: Seznam Bot
|
1660
|
-
category: Search bot
|
1661
|
-
url: http://www.mapy.cz/cz/seznambot.html
|
1662
|
-
producer:
|
1663
|
-
name: Seznam.cz, a.s.
|
1664
|
-
url: http://www.seznam.cz/
|
1665
|
-
-
|
1666
|
-
user_agent: ShopWiki/1.0 ( +http://www.shopwiki.com/wiki/Help:Bot)
|
1667
|
-
bot:
|
1668
|
-
name: ShopWiki
|
1669
|
-
category: Search tools
|
1670
|
-
url: http://www.shopwiki.com/wiki/Help:Bot
|
1671
|
-
producer:
|
1672
|
-
name: ShopWiki Corp.
|
1673
|
-
url: http://www.shopwiki.com
|
1674
|
-
-
|
1675
|
-
user_agent: SilverReader/1.0; http://silverreader.com
|
1676
|
-
bot:
|
1677
|
-
name: SilverReader
|
1678
|
-
url: http://silverreader.com
|
1679
|
-
category: Feed Fetcher
|
1680
|
-
producer:
|
1681
|
-
name:
|
1682
|
-
url:
|
1683
|
-
-
|
1684
|
-
user_agent: freshrss/0.8-dev (Linux; http://freshrss.org) SimplePie/1.4-dev-FreshRSS
|
1685
|
-
bot:
|
1686
|
-
name: SimplePie
|
1687
|
-
url: http://www.simplepie.org
|
1688
|
-
category: Feed Parser
|
1689
|
-
producer:
|
1690
|
-
name:
|
1691
|
-
url:
|
1692
|
-
-
|
1693
|
-
user_agent: SimplePie/1.2.1-dev (Feed Parser; http://simplepie.org; Allow like Gecko) Build/20130514092120
|
1694
|
-
bot:
|
1695
|
-
name: SimplePie
|
1696
|
-
url: http://www.simplepie.org
|
1697
|
-
category: Feed Parser
|
1698
|
-
producer:
|
1699
|
-
name:
|
1700
|
-
url:
|
1701
|
-
-
|
1702
|
-
user_agent: SimplePie/1.3.1 (Feed Parser; http://simplepie.org; Allow like Gecko) Build/20121030175911
|
1703
|
-
bot:
|
1704
|
-
name: SimplePie
|
1705
|
-
url: http://www.simplepie.org
|
1706
|
-
category: Feed Parser
|
1707
|
-
producer:
|
1708
|
-
name:
|
1709
|
-
url:
|
1710
|
-
-
|
1711
|
-
user_agent: Site24x7
|
1712
|
-
bot:
|
1713
|
-
name: Site24x7 Website Monitoring
|
1714
|
-
category: Site Monitor
|
1715
|
-
url: https://www.site24x7.com/site24x7-faq.html
|
1716
|
-
producer:
|
1717
|
-
name: Site24x7
|
1718
|
-
url: https://www.site24x7.com
|
1719
|
-
-
|
1720
|
-
user_agent: Mozilla/5.0 (Windows NT 6.1; WOW64) SkypeUriPreview Preview/0.5
|
1721
|
-
bot:
|
1722
|
-
name: Skype URI Preview
|
1723
|
-
category: Service Agent
|
1724
|
-
url:
|
1725
|
-
producer:
|
1726
|
-
name: Skype Communications S.à.r.l.
|
1727
|
-
url: https://www.skype.com
|
1728
|
-
-
|
1729
|
-
user_agent: Slackbot-LinkExpanding 1.0 (+https://api.slack.com/robots)
|
1730
|
-
bot:
|
1731
|
-
name: Slackbot
|
1732
|
-
category: Crawler
|
1733
|
-
url: https://api.slack.com/robots
|
1734
|
-
producer:
|
1735
|
-
name: Slack Technologies
|
1736
|
-
url: http://slack.com
|
1737
|
-
-
|
1738
|
-
user_agent: New-Sogou-Spider/1.0 (compatible; MSIE 5.5; Windows 98)
|
1739
|
-
bot:
|
1740
|
-
name: Sogou Spider
|
1741
|
-
category: Search bot
|
1742
|
-
url: http://www.sogou.com/docs/help/webmasters.htm
|
1743
|
-
producer:
|
1744
|
-
name: Sohu, Inc.
|
1745
|
-
url: http://www.sogou.com
|
1746
|
-
-
|
1747
|
-
user_agent: Sogou inst spider/4.0(+http://www.sogou.com/docs/help/webmasters.htm
|
1748
|
-
bot:
|
1749
|
-
name: Sogou Spider
|
1750
|
-
category: Search bot
|
1751
|
-
url: http://www.sogou.com/docs/help/webmasters.htm
|
1752
|
-
producer:
|
1753
|
-
name: Sohu, Inc.
|
1754
|
-
url: http://www.sogou.com
|
1755
|
-
-
|
1756
|
-
user_agent: Sogou Pic Spider/3.0(+http://www.sogou.com/docs/help/webmasters.htm
|
1757
|
-
bot:
|
1758
|
-
name: Sogou Spider
|
1759
|
-
category: Search bot
|
1760
|
-
url: http://www.sogou.com/docs/help/webmasters.htm
|
1761
|
-
producer:
|
1762
|
-
name: Sohu, Inc.
|
1763
|
-
url: http://www.sogou.com
|
1764
|
-
-
|
1765
|
-
user_agent: Sogou web spider/4.0(+http://www.sogou.com/docs/help/webmasters.htm
|
1766
|
-
bot:
|
1767
|
-
name: Sogou Spider
|
1768
|
-
category: Search bot
|
1769
|
-
url: http://www.sogou.com/docs/help/webmasters.htm
|
1770
|
-
producer:
|
1771
|
-
name: Sohu, Inc.
|
1772
|
-
url: http://www.sogou.com
|
1773
|
-
-
|
1774
|
-
user_agent: Sosospider+(+http://help.soso.com/webspider.htm)
|
1775
|
-
bot:
|
1776
|
-
name: Soso Spider
|
1777
|
-
category: Search bot
|
1778
|
-
url: http://help.soso.com/webspider.htm
|
1779
|
-
producer:
|
1780
|
-
name: Tencent Holdings
|
1781
|
-
url: http://www.soso.com
|
1782
|
-
-
|
1783
|
-
user_agent: Mozilla/5.0 (X11; U; Linux x86_64; en-US; rv:1.9.0.19; aggregator:Spinn3r (Spinn3r 3.1); http://spinn3r.com/robot) Gecko/2010040121 Firefox/3.0.19
|
1784
|
-
bot:
|
1785
|
-
name: Spinn3r
|
1786
|
-
category: Crawler
|
1787
|
-
url: http://spinn3r.com/robot
|
1788
|
-
producer:
|
1789
|
-
name: Tailrank Inc
|
1790
|
-
url: http://spinn3r.com
|
1791
|
-
-
|
1792
|
-
user_agent: Mozilla/5.0 (compatible; SputnikBot/2.2)
|
1793
|
-
bot:
|
1794
|
-
name: Sputnik Bot
|
1795
|
-
category:
|
1796
|
-
url:
|
1797
|
-
producer:
|
1798
|
-
name:
|
1799
|
-
url:
|
1800
|
-
-
|
1801
|
-
user_agent: Mozilla/5.0 (compatible; SputnikImageBot/2.2)
|
1802
|
-
bot:
|
1803
|
-
name: Sputnik Bot
|
1804
|
-
category:
|
1805
|
-
url:
|
1806
|
-
producer:
|
1807
|
-
name:
|
1808
|
-
url:
|
1809
|
-
-
|
1810
|
-
user_agent: 'Superfeedr bot/2.0 http://superfeedr.com - Make your feeds realtime: get in touch!'
|
1811
|
-
bot:
|
1812
|
-
name: Superfeedr Bot
|
1813
|
-
category: Feed Fetcher
|
1814
|
-
url:
|
1815
|
-
producer:
|
1816
|
-
name: Superfeedr
|
1817
|
-
url: https://superfeedr.com/
|
1818
|
-
-
|
1819
|
-
user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1; en; rv:1.9.0.13) Gecko/2009073022 Firefox/3.5.2 (.NET CLR 3.5.30729) SurveyBot/2.3 (DomainTools)
|
1820
|
-
bot:
|
1821
|
-
name: Survey Bot
|
1822
|
-
category: Search bot
|
1823
|
-
url: http://www.domaintools.com/webmasters/surveybot.php
|
1824
|
-
producer:
|
1825
|
-
name: Domain Tools
|
1826
|
-
url: http://www.domaintools.com
|
1827
|
-
-
|
1828
|
-
user_agent: TelegramBot (like TwitterBot)
|
1829
|
-
bot:
|
1830
|
-
name: TelgramBot
|
1831
|
-
url: https://telegram.org/blog/bot-revolution
|
1832
|
-
-
|
1833
|
-
user_agent: TinEye-bot/0.02 (see http://www.tineye.com/crawler.html)
|
1834
|
-
bot:
|
1835
|
-
name: TinEye Crawler
|
1836
|
-
category: Search bot
|
1837
|
-
url: http://www.tineye.com/crawler.html
|
1838
|
-
producer:
|
1839
|
-
name: Idée Inc.
|
1840
|
-
url: http://ideeinc.com
|
1841
|
-
-
|
1842
|
-
user_agent: Tiny Tiny RSS/1.10 (http://tt-rss.org/)
|
1843
|
-
bot:
|
1844
|
-
name: Tiny Tiny RSS
|
1845
|
-
url: http://tt-rss.org
|
1846
|
-
category: Feed Fetcher
|
1847
|
-
producer:
|
1848
|
-
name:
|
1849
|
-
url:
|
1850
|
-
-
|
1851
|
-
user_agent: Tiny Tiny RSS/1.11.4c63934 (http://tt-rss.org/)
|
1852
|
-
bot:
|
1853
|
-
name: Tiny Tiny RSS
|
1854
|
-
url: http://tt-rss.org
|
1855
|
-
category: Feed Fetcher
|
1856
|
-
producer:
|
1857
|
-
name:
|
1858
|
-
url:
|
1859
|
-
-
|
1860
|
-
user_agent: TurnitinBot/3.0 (http://www.turnitin.com/robot/crawlerinfo.html)
|
1861
|
-
bot:
|
1862
|
-
name: TurnitinBot
|
1863
|
-
category: Crawler
|
1864
|
-
url: http://www.turnitin.com/robot/crawlerinfo.html
|
1865
|
-
producer:
|
1866
|
-
name: iParadigms, LLC.
|
1867
|
-
url: http://www.turnitin.com
|
1868
|
-
-
|
1869
|
-
user_agent: Mozilla/5.0 (compatible; TweetedTimes Bot/1.0; +http://tweetedtimes.com)
|
1870
|
-
bot:
|
1871
|
-
name: TweetedTimes Bot
|
1872
|
-
category: Crawler
|
1873
|
-
url: http://tweetedtimes.com
|
1874
|
-
producer:
|
1875
|
-
name: TweetedTimes
|
1876
|
-
url: http://tweetedtimes.com/
|
1877
|
-
-
|
1878
|
-
user_agent: TweetedTimes Bot/1.0 (Mozilla/5.0 Compatible, +http://tweetedtimes.com)
|
1879
|
-
bot:
|
1880
|
-
name: TweetedTimes Bot
|
1881
|
-
category: Crawler
|
1882
|
-
url: http://tweetedtimes.com
|
1883
|
-
producer:
|
1884
|
-
name: TweetedTimes
|
1885
|
-
url: http://tweetedtimes.com/
|
1886
|
-
-
|
1887
|
-
user_agent: Mozilla/5.0 (compatible; TweetmemeBot/3.0; +http://tweetmeme.com/)
|
1888
|
-
bot:
|
1889
|
-
name: Tweetmeme Bot
|
1890
|
-
category: Crawler
|
1891
|
-
url: http://tweetmeme.com/
|
1892
|
-
producer:
|
1893
|
-
name: Mediasift
|
1894
|
-
url:
|
1895
|
-
-
|
1896
|
-
user_agent: Twitterbot/1.0
|
1897
|
-
bot:
|
1898
|
-
name: Twitterbot
|
1899
|
-
category: Social Media Agent
|
1900
|
-
url: https://dev.twitter.com/docs/cards/getting-started
|
1901
|
-
producer:
|
1902
|
-
name: Twitter
|
1903
|
-
url: http://www.twitter.com
|
1904
|
-
-
|
1905
|
-
user_agent: Mozilla/5.0 (compatible; URLAppendBot/1.0; +http://www.profound.net/urlappendbot.html)
|
1906
|
-
bot:
|
1907
|
-
name: URLAppendBot
|
1908
|
-
category: Crawler
|
1909
|
-
url: http://www.profound.net/urlappendbot.html
|
1910
|
-
producer:
|
1911
|
-
name: Profound Networks
|
1912
|
-
url: http://www.profound.net
|
1913
|
-
-
|
1914
|
-
user_agent: Mozilla/5.0+(compatible; UptimeRobot/2.0; http://www.uptimerobot.com/)
|
1915
|
-
bot:
|
1916
|
-
name: Uptime Robot
|
1917
|
-
category: Site Monitor
|
1918
|
-
url:
|
1919
|
-
producer:
|
1920
|
-
name: Uptime Robot
|
1921
|
-
url: http://uptimerobot.com
|
1922
|
-
-
|
1923
|
-
user_agent: Mozilla/5.0 (compatible; VSMCrawler; http://www.visualsitemapper.com/crawler/)
|
1924
|
-
bot:
|
1925
|
-
name: Visual Site Mapper Crawler
|
1926
|
-
category: Crawler
|
1927
|
-
url: http://www.visualsitemapper.com/crawler
|
1928
|
-
producer:
|
1929
|
-
name: Alentum Software Ltd.
|
1930
|
-
url: http://www.alentum.com
|
1931
|
-
-
|
1932
|
-
user_agent: 'Jigsaw/2.3.0 W3C_CSS_Validator_JFouffa/2.0 (See <http://validator.w3.org/services>)'
|
1933
|
-
bot:
|
1934
|
-
name: W3C CSS Validator
|
1935
|
-
category: Validator
|
1936
|
-
url: http://jigsaw.w3.org/css-validator
|
1937
|
-
producer:
|
1938
|
-
name: W3C
|
1939
|
-
url: http://www.w3.org
|
1940
|
-
-
|
1941
|
-
user_agent: W3C_I18n-Checker/1.0 (http://validator.w3.org/services)
|
1942
|
-
bot:
|
1943
|
-
name: W3C I18N Checker
|
1944
|
-
category: Validator
|
1945
|
-
url: http://validator.w3.org/i18n-checker
|
1946
|
-
producer:
|
1947
|
-
name: W3C
|
1948
|
-
url: http://www.w3.org
|
1949
|
-
-
|
1950
|
-
user_agent: 'W3C-checklink/4.0 [4.4] libwww-perl/5.803'
|
1951
|
-
bot:
|
1952
|
-
name: W3C Link Checker
|
1953
|
-
category: Validator
|
1954
|
-
url: http://validator.w3.org/checklink
|
1955
|
-
producer:
|
1956
|
-
name: W3C
|
1957
|
-
url: http://www.w3.org
|
1958
|
-
-
|
1959
|
-
user_agent: W3C-checklink/4.81 libwww-perl/5.836
|
1960
|
-
bot:
|
1961
|
-
name: W3C Link Checker
|
1962
|
-
category: Validator
|
1963
|
-
url: http://validator.w3.org/checklink
|
1964
|
-
producer:
|
1965
|
-
name: W3C
|
1966
|
-
url: http://www.w3.org
|
1967
|
-
-
|
1968
|
-
user_agent: W3C_Validator/1.3 http://validator.w3.org/services
|
1969
|
-
bot:
|
1970
|
-
name: W3C Markup Validation Service
|
1971
|
-
category: Validator
|
1972
|
-
url: http://validator.w3.org/services
|
1973
|
-
producer:
|
1974
|
-
name: W3C
|
1975
|
-
url: http://www.w3.org
|
1976
|
-
-
|
1977
|
-
user_agent: W3C_Validator/1.767
|
1978
|
-
bot:
|
1979
|
-
name: W3C Markup Validation Service
|
1980
|
-
category: Validator
|
1981
|
-
url: http://validator.w3.org/services
|
1982
|
-
producer:
|
1983
|
-
name: W3C
|
1984
|
-
url: http://www.w3.org
|
1985
|
-
-
|
1986
|
-
user_agent: W3C-mobileOK/DDC-1.0 (see http://www.w3.org/2006/07/mobileok-ddc)
|
1987
|
-
bot:
|
1988
|
-
name: W3C MobileOK Checker
|
1989
|
-
category: Validator
|
1990
|
-
url: http://validator.w3.org/mobile
|
1991
|
-
producer:
|
1992
|
-
name: W3C
|
1993
|
-
url: http://www.w3.org
|
1994
|
-
-
|
1995
|
-
user_agent: W3C_Unicorn/1.0 (http://validator.w3.org/services)
|
1996
|
-
bot:
|
1997
|
-
name: W3C Unified Validator
|
1998
|
-
category: Validator
|
1999
|
-
url: http://validator.w3.org/unicorn
|
2000
|
-
producer:
|
2001
|
-
name: W3C
|
2002
|
-
url: http://www.w3.org
|
2003
|
-
-
|
2004
|
-
user_agent: WeSEE:Search/0.1 (Alpha, http://www.wesee.com/en/support/bot/)
|
2005
|
-
bot:
|
2006
|
-
name: WeSEE:Search
|
2007
|
-
category: Search bot
|
2008
|
-
url: http://www.wesee.com/bot
|
2009
|
-
producer:
|
2010
|
-
name: WeSEE Ltd
|
2011
|
-
url: http://www.wesee.com
|
2012
|
-
-
|
2013
|
-
user_agent: websitepulse checker/1.1 (compatible; MSIE 5.5; Netscape 4.75; Linux)
|
2014
|
-
bot:
|
2015
|
-
name: WebSitePulse
|
2016
|
-
category: Site Monitor
|
2017
|
-
url: http://badcheese.com/crawler.html
|
2018
|
-
producer:
|
2019
|
-
name: WebSitePulse
|
2020
|
-
url: http://www.websitepulse.com/
|
2021
|
-
-
|
2022
|
-
user_agent: WebbCrawler 1.0 ( http://badcheese.com/crawler.html )
|
2023
|
-
bot:
|
2024
|
-
name: WebbCrawler
|
2025
|
-
category: Crawler
|
2026
|
-
url: http://badcheese.com/crawler.html
|
2027
|
-
producer:
|
2028
|
-
name: Steve Webb
|
2029
|
-
url: http://badcheese.com
|
2030
|
-
-
|
2031
|
-
user_agent: Wotbox/2.01 (+http://www.wotbox.com/bot/)
|
2032
|
-
bot:
|
2033
|
-
name: Wotbox
|
2034
|
-
category: Search bot
|
2035
|
-
url: http://www.wotbox.com/bot/
|
2036
|
-
producer:
|
2037
|
-
name: Wotbox
|
2038
|
-
url: http://www.wotbox.com
|
2039
|
-
-
|
2040
|
-
user_agent: yacybot (freeworld/global; amd64 Linux 3.2.0-4-amd64; java 1.7.0_25; Europe/en) http://yacy.net/bot.html
|
2041
|
-
bot:
|
2042
|
-
name: YaCy
|
2043
|
-
category: Search bot
|
2044
|
-
url: http://yacy.net/bot.html
|
2045
|
-
producer:
|
2046
|
-
name: YaCy
|
2047
|
-
url: http://yacy.net
|
2048
|
-
-
|
2049
|
-
user_agent: yacybot (freeworld/global; x86 Windows XP 5.1; java 1.7.0_21; GMT+04:00/ru) http://yacy.net/bot.html
|
2050
|
-
bot:
|
2051
|
-
name: YaCy
|
2052
|
-
category: Search bot
|
2053
|
-
url: http://yacy.net/bot.html
|
2054
|
-
producer:
|
2055
|
-
name: YaCy
|
2056
|
-
url: http://yacy.net
|
2057
|
-
-
|
2058
|
-
user_agent: Mozilla/5.0 (compatible; Yahoo Ad monitoring; https://help.yahoo.com/kb/yahoo-ad-monitoring-SLN24857.html)
|
2059
|
-
bot:
|
2060
|
-
name: Yahoo Gemini
|
2061
|
-
category: Crawler
|
2062
|
-
url: https://help.yahoo.com/kb/yahoo-ad-monitoring-SLN24857.html
|
2063
|
-
producer:
|
2064
|
-
name: Yahoo! Inc.
|
2065
|
-
url: http://www.yahoo.com
|
2066
|
-
-
|
2067
|
-
user_agent: Mozilla/5.0 (compatible; Yahoo Link Preview; https://help.yahoo.com/kb/mail/yahoo-link-preview-SLN23615.html)
|
2068
|
-
bot:
|
2069
|
-
name: Yahoo! Link Preview
|
2070
|
-
category: Crawler
|
2071
|
-
url: https://help.yahoo.com/kb/mail/yahoo-link-preview-SLN23615.html
|
2072
|
-
producer:
|
2073
|
-
name: Yahoo! Inc.
|
2074
|
-
url: http://www.yahoo.com
|
2075
|
-
-
|
2076
|
-
user_agent: Yahoo:LinkExpander:Slingstone
|
2077
|
-
bot:
|
2078
|
-
name: Yahoo! Link Preview
|
2079
|
-
category: Crawler
|
2080
|
-
url: https://help.yahoo.com/kb/mail/yahoo-link-preview-SLN23615.html
|
2081
|
-
producer:
|
2082
|
-
name: Yahoo! Inc.
|
2083
|
-
url: http://www.yahoo.com
|
2084
|
-
-
|
2085
|
-
user_agent: Mozilla/5.0 (compatible; Yahoo! Slurp/3.0; http://help.yahoo.com/help/us/ysearch/slurp) NOT Firefox/3.5
|
2086
|
-
bot:
|
2087
|
-
name: Yahoo! Slurp
|
2088
|
-
category: Search bot
|
2089
|
-
url: http://help.yahoo.com/ysearch/slurp
|
2090
|
-
producer:
|
2091
|
-
name: Yahoo! Inc.
|
2092
|
-
url: http://www.yahoo.com
|
2093
|
-
-
|
2094
|
-
user_agent: Mozilla/5.0 (compatible; Yahoo! Slurp; http://help.yahoo.com/help/us/ysearch/slurp)
|
2095
|
-
bot:
|
2096
|
-
name: Yahoo! Slurp
|
2097
|
-
category: Search bot
|
2098
|
-
url: http://help.yahoo.com/ysearch/slurp
|
2099
|
-
producer:
|
2100
|
-
name: Yahoo! Inc.
|
2101
|
-
url: http://www.yahoo.com
|
2102
|
-
-
|
2103
|
-
user_agent: Mozilla/5.0 (compatible; Linux i686; Yandex.Gazeta Bot/1.0; +http://gazeta.yandex.ru)
|
2104
|
-
bot:
|
2105
|
-
name: Yandex Bot
|
2106
|
-
category: Search bot
|
2107
|
-
url: http://www.yandex.com/bots
|
2108
|
-
producer:
|
2109
|
-
name: Yandex LLC
|
2110
|
-
url: http://company.yandex.com
|
2111
|
-
-
|
2112
|
-
user_agent: Mozilla/5.0 (compatible; YaDirectFetcher/1.0; +http://yandex.com/bots)
|
2113
|
-
bot:
|
2114
|
-
name: Yandex Bot
|
2115
|
-
category: Search bot
|
2116
|
-
url: http://www.yandex.com/bots
|
2117
|
-
producer:
|
2118
|
-
name: Yandex LLC
|
2119
|
-
url: http://company.yandex.com
|
2120
|
-
-
|
2121
|
-
user_agent: Mozilla/5.0 (compatible; YandexAntivirus/2.0; +http://yandex.com/bots)
|
2122
|
-
bot:
|
2123
|
-
name: Yandex Bot
|
2124
|
-
category: Search bot
|
2125
|
-
url: http://www.yandex.com/bots
|
2126
|
-
producer:
|
2127
|
-
name: Yandex LLC
|
2128
|
-
url: http://company.yandex.com
|
2129
|
-
-
|
2130
|
-
user_agent: Mozilla/5.0 (compatible; YandexAntivirus/2.0; +http://yandex.com/bots)
|
2131
|
-
bot:
|
2132
|
-
name: Yandex Bot
|
2133
|
-
category: Search bot
|
2134
|
-
url: http://www.yandex.com/bots
|
2135
|
-
producer:
|
2136
|
-
name: Yandex LLC
|
2137
|
-
url: http://company.yandex.com
|
2138
|
-
-
|
2139
|
-
user_agent: Mozilla/5.0 (compatible; YandexBlogs/0.99; robot; B; +http://yandex.com/bots)
|
2140
|
-
bot:
|
2141
|
-
name: Yandex Bot
|
2142
|
-
category: Search bot
|
2143
|
-
url: http://www.yandex.com/bots
|
2144
|
-
producer:
|
2145
|
-
name: Yandex LLC
|
2146
|
-
url: http://company.yandex.com
|
2147
|
-
-
|
2148
|
-
user_agent: Mozilla/5.0 (compatible; YandexBlogs/0.99; robot; B; +http://yandex.com/bots)
|
2149
|
-
bot:
|
2150
|
-
name: Yandex Bot
|
2151
|
-
category: Search bot
|
2152
|
-
url: http://www.yandex.com/bots
|
2153
|
-
producer:
|
2154
|
-
name: Yandex LLC
|
2155
|
-
url: http://company.yandex.com
|
2156
|
-
-
|
2157
|
-
user_agent: Mozilla/5.0 (compatible; YandexBot/3.0; +http://yandex.com/bots)
|
2158
|
-
bot:
|
2159
|
-
name: Yandex Bot
|
2160
|
-
category: Search bot
|
2161
|
-
url: http://www.yandex.com/bots
|
2162
|
-
producer:
|
2163
|
-
name: Yandex LLC
|
2164
|
-
url: http://company.yandex.com
|
2165
|
-
-
|
2166
|
-
user_agent: Mozilla/5.0 (compatible; YandexDirect/3.0; +http://yandex.com/bots)
|
2167
|
-
bot:
|
2168
|
-
name: Yandex Bot
|
2169
|
-
category: Search bot
|
2170
|
-
url: http://www.yandex.com/bots
|
2171
|
-
producer:
|
2172
|
-
name: Yandex LLC
|
2173
|
-
url: http://company.yandex.com
|
2174
|
-
-
|
2175
|
-
user_agent: Mozilla/5.0 (compatible; YandexFavicons/1.0; +http://yandex.com/bots)
|
2176
|
-
bot:
|
2177
|
-
name: Yandex Bot
|
2178
|
-
category: Search bot
|
2179
|
-
url: http://www.yandex.com/bots
|
2180
|
-
producer:
|
2181
|
-
name: Yandex LLC
|
2182
|
-
url: http://company.yandex.com
|
2183
|
-
-
|
2184
|
-
user_agent: Mozilla/5.0 (compatible; YandexImageResizer/2.0; +http://yandex.com/bots)
|
2185
|
-
bot:
|
2186
|
-
name: Yandex Bot
|
2187
|
-
category: Search bot
|
2188
|
-
url: http://www.yandex.com/bots
|
2189
|
-
producer:
|
2190
|
-
name: Yandex LLC
|
2191
|
-
url: http://company.yandex.com
|
2192
|
-
-
|
2193
|
-
user_agent: Mozilla/5.0 (compatible; YandexImages/3.0; +http://yandex.com/bots)
|
2194
|
-
bot:
|
2195
|
-
name: Yandex Bot
|
2196
|
-
category: Search bot
|
2197
|
-
url: http://www.yandex.com/bots
|
2198
|
-
producer:
|
2199
|
-
name: Yandex LLC
|
2200
|
-
url: http://company.yandex.com
|
2201
|
-
-
|
2202
|
-
user_agent: Mozilla/5.0 (compatible; YandexMetrika/2.0; +http://yandex.com/bots)
|
2203
|
-
bot:
|
2204
|
-
name: Yandex Bot
|
2205
|
-
category: Search bot
|
2206
|
-
url: http://www.yandex.com/bots
|
2207
|
-
producer:
|
2208
|
-
name: Yandex LLC
|
2209
|
-
url: http://company.yandex.com
|
2210
|
-
-
|
2211
|
-
user_agent: Mozilla/5.0 (compatible; YandexNews/3.0; +http://yandex.com/bots)
|
2212
|
-
bot:
|
2213
|
-
name: Yandex Bot
|
2214
|
-
category: Search bot
|
2215
|
-
url: http://www.yandex.com/bots
|
2216
|
-
producer:
|
2217
|
-
name: Yandex LLC
|
2218
|
-
url: http://company.yandex.com
|
2219
|
-
-
|
2220
|
-
user_agent: Mozilla/5.0 (compatible; YandexNewslinks; +http://yandex.com/bots)
|
2221
|
-
bot:
|
2222
|
-
name: Yandex Bot
|
2223
|
-
category: Search bot
|
2224
|
-
url: http://www.yandex.com/bots
|
2225
|
-
producer:
|
2226
|
-
name: Yandex LLC
|
2227
|
-
url: http://company.yandex.com
|
2228
|
-
-
|
2229
|
-
user_agent: Yeti/1.1 (Naver Corp.; http://help.naver.com/robots/)
|
2230
|
-
bot:
|
2231
|
-
name: Yeti/Naverbot
|
2232
|
-
category: Search bot
|
2233
|
-
url: http://help.naver.com/robots/
|
2234
|
-
producer:
|
2235
|
-
name: Naver
|
2236
|
-
url: http://www.naver.com
|
2237
|
-
-
|
2238
|
-
user_agent: Mozilla/5.0 (compatible; YoudaoBot/1.0; http://www.youdao.com/help/webmaster/spider/; )
|
2239
|
-
bot:
|
2240
|
-
name: Youdao Bot
|
2241
|
-
category: Search bot
|
2242
|
-
url: http://www.youdao.com/help/webmaster/spider
|
2243
|
-
producer:
|
2244
|
-
name: NetEase, Inc.
|
2245
|
-
url: http://corp.163.com
|
2246
|
-
-
|
2247
|
-
user_agent: YOURLS v1.5.1 +http://yourls.org/ (running on http://fhort.com)
|
2248
|
-
bot:
|
2249
|
-
name: Yourls
|
2250
|
-
category: Crawler
|
2251
|
-
url: http://yourls.org
|
2252
|
-
-
|
2253
|
-
user_agent: Mozilla/5.0 (compatible; YRSpider; +http://www.yunrang.com/yrspider.html)
|
2254
|
-
bot:
|
2255
|
-
name: Yunyun Bot
|
2256
|
-
category: Search bot
|
2257
|
-
url: http://www.yunyun.com/SiteInfo.php?r=about
|
2258
|
-
producer:
|
2259
|
-
name: YunYun
|
2260
|
-
url: http://www.yunyun.com
|
2261
|
-
-
|
2262
|
-
user_agent: Mozilla/5.0 (compatible; YRSpider; +http://www.yunyun.com/SiteInfo.php?r=about)
|
2263
|
-
bot:
|
2264
|
-
name: Yunyun Bot
|
2265
|
-
category: Search bot
|
2266
|
-
url: http://www.yunyun.com/SiteInfo.php?r=about
|
2267
|
-
producer:
|
2268
|
-
name: YunYun
|
2269
|
-
url: http://www.yunyun.com
|
2270
|
-
-
|
2271
|
-
user_agent: Mozilla/5.0 (compatible; YYSpider; +http://www.yunyun.com/spider.html)
|
2272
|
-
bot:
|
2273
|
-
name: Yunyun Bot
|
2274
|
-
category: Search bot
|
2275
|
-
url: http://www.yunyun.com/SiteInfo.php?r=about
|
2276
|
-
producer:
|
2277
|
-
name: YunYun
|
2278
|
-
url: http://www.yunyun.com
|
2279
|
-
-
|
2280
|
-
user_agent: Zao/0.1 (http://www.kototol.org/zao)
|
2281
|
-
bot:
|
2282
|
-
name: Zao
|
2283
|
-
category: Crawler
|
2284
|
-
-
|
2285
|
-
user_agent: Zookabot/2.5;++http://zookabot.com
|
2286
|
-
bot:
|
2287
|
-
name: Zookabot
|
2288
|
-
category: Crawler
|
2289
|
-
url: http://zookabot.com
|
2290
|
-
producer:
|
2291
|
-
name: Hwacha ApS
|
2292
|
-
url: http://hwacha.dk
|
2293
|
-
-
|
2294
|
-
user_agent: Mozilla/5.0 (compatible; ZumBot/1.0; http://help.zum.com/inquiry)
|
2295
|
-
bot:
|
2296
|
-
name: ZumBot
|
2297
|
-
category: Search bot
|
2298
|
-
url: http://help.zum.com/inquiry
|
2299
|
-
producer:
|
2300
|
-
name: ZUM internet
|
2301
|
-
url: http://www.zuminternet.com/
|
2302
|
-
-
|
2303
|
-
user_agent: ZumBot/1.0 (ZUM Search; http://help.zum.com/inquiry)
|
2304
|
-
bot:
|
2305
|
-
name: ZumBot
|
2306
|
-
category: Search bot
|
2307
|
-
url: http://help.zum.com/inquiry
|
2308
|
-
producer:
|
2309
|
-
name: ZUM internet
|
2310
|
-
url: http://www.zuminternet.com/
|
2311
|
-
-
|
2312
|
-
user_agent: AhrefsBot.Feeds v0.1; http://ahrefs.com/
|
2313
|
-
bot:
|
2314
|
-
name: aHrefs Bot
|
2315
|
-
category: Crawler
|
2316
|
-
url: http://ahrefs.com/robot
|
2317
|
-
producer:
|
2318
|
-
name: Ahrefs Pte Ltd
|
2319
|
-
url: http://ahrefs.com/robot
|
2320
|
-
-
|
2321
|
-
user_agent: Mozilla/5.0 (compatible; AhrefsBot/3.1; +http://ahrefs.com/robot/
|
2322
|
-
bot:
|
2323
|
-
name: aHrefs Bot
|
2324
|
-
category: Crawler
|
2325
|
-
url: http://ahrefs.com/robot
|
2326
|
-
producer:
|
2327
|
-
name: Ahrefs Pte Ltd
|
2328
|
-
url: http://ahrefs.com/robot
|
2329
|
-
-
|
2330
|
-
user_agent: Mozilla/5.0 (compatible; AhrefsBot/5.0; +http://ahrefs.com/robot/)
|
2331
|
-
bot:
|
2332
|
-
name: aHrefs Bot
|
2333
|
-
category: Crawler
|
2334
|
-
url: http://ahrefs.com/robot
|
2335
|
-
producer:
|
2336
|
-
name: Ahrefs Pte Ltd
|
2337
|
-
url: http://ahrefs.com/robot
|
2338
|
-
-
|
2339
|
-
user_agent: 'Mozilla/5.0 (compatible; AhrefsBot/5.0; +http://ahrefs.com/robot/) AppEngine-Google; (+http://code.google.com/appengine; appid: s~proxyfile1-hrd)'
|
2340
|
-
bot:
|
2341
|
-
name: aHrefs Bot
|
2342
|
-
category: Crawler
|
2343
|
-
url: http://ahrefs.com/robot
|
2344
|
-
producer:
|
2345
|
-
name: Ahrefs Pte Ltd
|
2346
|
-
url: http://ahrefs.com/robot
|
2347
|
-
-
|
2348
|
-
user_agent: Mozilla/5.0 (compatible; archive.org_bot +http://www.archive.org/details/archive.org_bot)
|
2349
|
-
bot:
|
2350
|
-
name: archive.org bot
|
2351
|
-
category: Crawler
|
2352
|
-
url: http://www.archive.org/details/archive.org_bot
|
2353
|
-
producer:
|
2354
|
-
name: The Internet Archive
|
2355
|
-
url: http://www.archive.org
|
2356
|
-
-
|
2357
|
-
user_agent: Mozilla/5.0 (compatible; archive.org_bot/3.3.0 +http://pandora.nla.gov.au/crawl.html)
|
2358
|
-
bot:
|
2359
|
-
name: archive.org bot
|
2360
|
-
category: Crawler
|
2361
|
-
url: http://www.archive.org/details/archive.org_bot
|
2362
|
-
producer:
|
2363
|
-
name: The Internet Archive
|
2364
|
-
url: http://www.archive.org
|
2365
|
-
-
|
2366
|
-
user_agent: Mozilla/5.0 (compatible; archive.org_bot; Archive-It; +http://archive-it.org/files/site-owners.html)
|
2367
|
-
bot:
|
2368
|
-
name: archive.org bot
|
2369
|
-
category: Crawler
|
2370
|
-
url: http://www.archive.org/details/archive.org_bot
|
2371
|
-
producer:
|
2372
|
-
name: The Internet Archive
|
2373
|
-
url: http://www.archive.org
|
2374
|
-
-
|
2375
|
-
user_agent: Mozilla/5.0 (compatible; archive.org_bot; Wayback Machine Live Record; +http://archive.org/details/archive.org_bot)
|
2376
|
-
bot:
|
2377
|
-
name: archive.org bot
|
2378
|
-
category: Crawler
|
2379
|
-
url: http://www.archive.org/details/archive.org_bot
|
2380
|
-
producer:
|
2381
|
-
name: The Internet Archive
|
2382
|
-
url: http://www.archive.org
|
2383
|
-
-
|
2384
|
-
user_agent: Mozilla/5.0 (compatible; heritrix/3.1.2-SNAPSHOT-20131029-0036 +http://archive.org/details/archive.org_bot)
|
2385
|
-
bot:
|
2386
|
-
name: archive.org bot
|
2387
|
-
category: Crawler
|
2388
|
-
url: http://www.archive.org/details/archive.org_bot
|
2389
|
-
producer:
|
2390
|
-
name: The Internet Archive
|
2391
|
-
url: http://www.archive.org
|
2392
|
-
-
|
2393
|
-
user_agent: Mozilla/5.0 (compatible; special_archiver/3.1.1 +http://www.archive.org/details/archive.org_bot)
|
2394
|
-
bot:
|
2395
|
-
name: archive.org bot
|
2396
|
-
category: Crawler
|
2397
|
-
url: http://www.archive.org/details/archive.org_bot
|
2398
|
-
producer:
|
2399
|
-
name: The Internet Archive
|
2400
|
-
url: http://www.archive.org
|
2401
|
-
-
|
2402
|
-
user_agent: Mozilla/5.0 (compatible; special_archiver/3.2.0 +http://www.loc.gov/webarchiving/notice_to_webmasters.html)
|
2403
|
-
bot:
|
2404
|
-
name: archive.org bot
|
2405
|
-
category: Crawler
|
2406
|
-
url: http://www.archive.org/details/archive.org_bot
|
2407
|
-
producer:
|
2408
|
-
name: The Internet Archive
|
2409
|
-
url: http://www.archive.org
|
2410
|
-
-
|
2411
|
-
user_agent: CCBot/2.0 (http://commoncrawl.org/faq/)
|
2412
|
-
bot:
|
2413
|
-
name: ccBot crawler
|
2414
|
-
category: Crawler
|
2415
|
-
url: http://commoncrawl.org/faq/
|
2416
|
-
producer:
|
2417
|
-
name: reddit inc.
|
2418
|
-
url: http://www.reddit.com
|