device_detector 0.8.2 → 0.9.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/.travis.yml +11 -3
- data/CHANGELOG.md +10 -5
- data/README.md +4 -4
- data/Rakefile +24 -19
- data/device_detector.gemspec +1 -1
- data/lib/device_detector.rb +25 -3
- data/lib/device_detector/device.rb +1 -1
- data/lib/device_detector/model_extractor.rb +4 -0
- data/lib/device_detector/os.rb +8 -3
- data/lib/device_detector/parser.rb +1 -1
- data/lib/device_detector/version.rb +1 -1
- data/regexes/bots.yml +211 -27
- data/regexes/client/browsers.yml +192 -58
- data/regexes/client/feed_readers.yml +6 -0
- data/regexes/client/libraries.yml +4 -0
- data/regexes/client/mediaplayers.yml +8 -4
- data/regexes/client/mobile_apps.yml +39 -4
- data/regexes/client/pim.yml +4 -0
- data/regexes/device/mobiles.yml +1803 -242
- data/regexes/device/televisions.yml +53 -11
- data/regexes/oss.yml +180 -12
- data/regexes/vendorfragments.yml +1 -0
- data/spec/device_detector/concrete_user_agent_spec.rb +36 -0
- data/spec/device_detector/detector_fixtures_spec.rb +1 -1
- data/spec/fixtures/client/browser.yml +313 -2
- data/spec/fixtures/client/feed_reader.yml +8 -1
- data/spec/fixtures/client/library.yml +7 -1
- data/spec/fixtures/client/mediaplayer.yml +6 -1
- data/spec/fixtures/client/mobile_app.yml +6 -0
- data/spec/fixtures/client/pim.yml +6 -0
- data/spec/fixtures/detector/bots.yml +2307 -612
- data/spec/fixtures/detector/camera.yml +6 -0
- data/spec/fixtures/detector/car_browser.yml +1 -0
- data/spec/fixtures/detector/console.yml +14 -0
- data/spec/fixtures/detector/desktop.yml +308 -48
- data/spec/fixtures/detector/feature_phone.yml +63 -0
- data/spec/fixtures/detector/feed_reader.yml +50 -26
- data/spec/fixtures/detector/mediaplayer.yml +28 -6
- data/spec/fixtures/detector/mobile_apps.yml +117 -0
- data/spec/fixtures/detector/phablet.yml +1066 -183
- data/spec/fixtures/detector/portable_media_player.yml +8 -0
- data/spec/fixtures/detector/smart_display.yml +39 -0
- data/spec/fixtures/detector/smartphone-1.yml +9469 -0
- data/spec/fixtures/detector/smartphone-2.yml +9414 -0
- data/spec/fixtures/detector/smartphone-3.yml +9396 -0
- data/spec/fixtures/detector/smartphone-4.yml +5742 -0
- data/spec/fixtures/detector/smartphone.yml +3446 -23680
- data/spec/fixtures/detector/tablet-1.yml +9495 -0
- data/spec/fixtures/detector/tablet-2.yml +248 -0
- data/spec/fixtures/detector/tablet.yml +2786 -7961
- data/spec/fixtures/detector/tv.yml +1376 -210
- data/spec/fixtures/detector/unknown.yml +205 -509
- data/spec/fixtures/device/console.yml +6 -0
- data/spec/fixtures/parser/oss.yml +194 -1
- data/spec/fixtures/parser/vendorfragments.yml +6 -0
- metadata +16 -6
- data/spec/fixtures/parser/bots.yml +0 -2055
@@ -25,6 +25,12 @@
|
|
25
25
|
-
|
26
26
|
useragent: Mozilla/4.0 (compatible; MSIE 7.0; Windows NT 5.1; Trident/4.0; .NET CLR 1.1.4322; .NET CLR 2.0.50727; .NET CLR 3.0.4506.2152; .NET CLR 3.5.30729; CMNTDF; InfoPath.2; .NET4.0C; .NET4.0E)
|
27
27
|
vendor: CQ
|
28
|
+
-
|
29
|
+
user_agent: Mozilla/4.0 (compatible; MSIE 7.0; Windows NT 6.2; WOW64; Trident/6.0; .NET4.0E; .NET4.0C; .NET CLR 3.5.30729; .NET CLR 2.0.50727; .NET CLR 3.0.30729; CMDTDFJS; Tablet PC 2.0)
|
30
|
+
vendor: CQ
|
31
|
+
-
|
32
|
+
user_agent: Mozilla/4.0 (compatible; MSIE 7.0; Windows NT 6.1; Trident/5.0; SLCC2; .NET CLR 2.0.50727; .NET CLR 3.5.30729; .NET CLR 3.0.30729; Media Center PC 6.0; .NET4.0C; .NET4.0E; CMDTDF; InfoPath.3)
|
33
|
+
vendor: CQ
|
28
34
|
-
|
29
35
|
useragent: Mozilla/4.0 (compatible; MSIE 7.0; Windows NT 6.1; Win64; x64; Trident/4.0; .NET CLR 2.0.50727; SLCC2; .NET CLR 3.5.30729; .NET CLR 3.0.30729; Media Center PC 6.0; MDDC; .NET4.0C; .NET4.0E)
|
30
36
|
vendor: DL
|
metadata
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: device_detector
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 0.
|
4
|
+
version: 0.9.0
|
5
5
|
platform: ruby
|
6
6
|
authors:
|
7
7
|
- Mati Sójka
|
@@ -9,7 +9,7 @@ authors:
|
|
9
9
|
autorequire:
|
10
10
|
bindir: bin
|
11
11
|
cert_chain: []
|
12
|
-
date:
|
12
|
+
date: 2016-07-28 00:00:00.000000000 Z
|
13
13
|
dependencies:
|
14
14
|
- !ruby/object:Gem::Dependency
|
15
15
|
name: minitest
|
@@ -126,20 +126,25 @@ files:
|
|
126
126
|
- spec/fixtures/detector/phablet.yml
|
127
127
|
- spec/fixtures/detector/portable_media_player.yml
|
128
128
|
- spec/fixtures/detector/smart_display.yml
|
129
|
+
- spec/fixtures/detector/smartphone-1.yml
|
130
|
+
- spec/fixtures/detector/smartphone-2.yml
|
131
|
+
- spec/fixtures/detector/smartphone-3.yml
|
132
|
+
- spec/fixtures/detector/smartphone-4.yml
|
129
133
|
- spec/fixtures/detector/smartphone.yml
|
134
|
+
- spec/fixtures/detector/tablet-1.yml
|
135
|
+
- spec/fixtures/detector/tablet-2.yml
|
130
136
|
- spec/fixtures/detector/tablet.yml
|
131
137
|
- spec/fixtures/detector/tv.yml
|
132
138
|
- spec/fixtures/detector/unknown.yml
|
133
139
|
- spec/fixtures/device/camera.yml
|
134
140
|
- spec/fixtures/device/car_browser.yml
|
135
141
|
- spec/fixtures/device/console.yml
|
136
|
-
- spec/fixtures/parser/bots.yml
|
137
142
|
- spec/fixtures/parser/oss.yml
|
138
143
|
- spec/fixtures/parser/vendorfragments.yml
|
139
144
|
- spec/spec_helper.rb
|
140
145
|
homepage: http://podigee.github.io/device_detector
|
141
146
|
licenses:
|
142
|
-
-
|
147
|
+
- LGPL-3.0
|
143
148
|
metadata: {}
|
144
149
|
post_install_message:
|
145
150
|
rdoc_options: []
|
@@ -157,7 +162,7 @@ required_rubygems_version: !ruby/object:Gem::Requirement
|
|
157
162
|
version: '0'
|
158
163
|
requirements: []
|
159
164
|
rubyforge_project:
|
160
|
-
rubygems_version: 2.
|
165
|
+
rubygems_version: 2.5.1
|
161
166
|
signing_key:
|
162
167
|
specification_version: 4
|
163
168
|
summary: Precise and fast user agent parser and device detector
|
@@ -191,14 +196,19 @@ test_files:
|
|
191
196
|
- spec/fixtures/detector/phablet.yml
|
192
197
|
- spec/fixtures/detector/portable_media_player.yml
|
193
198
|
- spec/fixtures/detector/smart_display.yml
|
199
|
+
- spec/fixtures/detector/smartphone-1.yml
|
200
|
+
- spec/fixtures/detector/smartphone-2.yml
|
201
|
+
- spec/fixtures/detector/smartphone-3.yml
|
202
|
+
- spec/fixtures/detector/smartphone-4.yml
|
194
203
|
- spec/fixtures/detector/smartphone.yml
|
204
|
+
- spec/fixtures/detector/tablet-1.yml
|
205
|
+
- spec/fixtures/detector/tablet-2.yml
|
195
206
|
- spec/fixtures/detector/tablet.yml
|
196
207
|
- spec/fixtures/detector/tv.yml
|
197
208
|
- spec/fixtures/detector/unknown.yml
|
198
209
|
- spec/fixtures/device/camera.yml
|
199
210
|
- spec/fixtures/device/car_browser.yml
|
200
211
|
- spec/fixtures/device/console.yml
|
201
|
-
- spec/fixtures/parser/bots.yml
|
202
212
|
- spec/fixtures/parser/oss.yml
|
203
213
|
- spec/fixtures/parser/vendorfragments.yml
|
204
214
|
- spec/spec_helper.rb
|
@@ -1,2055 +0,0 @@
|
|
1
|
-
-
|
2
|
-
user_agent: Mozilla/5.0 (compatible; MSIE 9.0; Windows NT 6.1; Trident/5.0); 360Spider
|
3
|
-
bot:
|
4
|
-
name: '360Spider'
|
5
|
-
category: 'Search bot'
|
6
|
-
url: 'http://www.so.com/help/help_3_2.html'
|
7
|
-
producer:
|
8
|
-
name: 'Online Media Group, Inc.'
|
9
|
-
url: ''
|
10
|
-
-
|
11
|
-
user_agent: Mozilla/5.0 (Windows NT 6.1) AppleWebKit/537.1 (KHTML, like Gecko) Chrome/21.0.1180.89 Safari/537.1; 360Spider
|
12
|
-
bot:
|
13
|
-
name: '360Spider'
|
14
|
-
category: 'Search bot'
|
15
|
-
url: 'http://www.so.com/help/help_3_2.html'
|
16
|
-
producer:
|
17
|
-
name: 'Online Media Group, Inc.'
|
18
|
-
url: ''
|
19
|
-
-
|
20
|
-
user_agent: Mozilla/4.0 (compatible; MSIE 8.0; Windows NT 6.1; Trident/4.0; SLCC2; .NET CLR 2.0.50727; .NET CLR 3.5.30729; .NET CLR 3.0.30729; Media Center PC 6.0; MDDR; .NET4.0C; .NET4.0E; .NET CLR 1.1.4322; Tablet PC 2.0); 360Spider
|
21
|
-
bot:
|
22
|
-
name: '360Spider'
|
23
|
-
category: 'Search bot'
|
24
|
-
url: 'http://www.so.com/help/help_3_2.html'
|
25
|
-
producer:
|
26
|
-
name: 'Online Media Group, Inc.'
|
27
|
-
url: ''
|
28
|
-
-
|
29
|
-
user_agent: 360spider-image
|
30
|
-
bot:
|
31
|
-
name: '360Spider'
|
32
|
-
category: 'Search bot'
|
33
|
-
url: 'http://www.so.com/help/help_3_2.html'
|
34
|
-
producer:
|
35
|
-
name: 'Online Media Group, Inc.'
|
36
|
-
url: ''
|
37
|
-
-
|
38
|
-
user_agent: Aboundex/0.3 (http://www.aboundex.com/crawler/)
|
39
|
-
bot:
|
40
|
-
name: 'Aboundexbot'
|
41
|
-
category: 'Search bot'
|
42
|
-
url: 'http://www.aboundex.com/crawler/'
|
43
|
-
producer:
|
44
|
-
name: 'Aboundex.com'
|
45
|
-
url: 'http://www.aboundex.com'
|
46
|
-
-
|
47
|
-
user_agent: Mozilla/5.0 (compatible; AcoonBot/4.11.1; +http://www.acoon.de/robot.asp)
|
48
|
-
bot:
|
49
|
-
name: 'Acoon'
|
50
|
-
category: 'Search bot'
|
51
|
-
url: 'http://www.acoon.de/robot.asp'
|
52
|
-
producer:
|
53
|
-
name: 'Acoon GmbH'
|
54
|
-
url: 'http://www.acoon.de'
|
55
|
-
-
|
56
|
-
user_agent: AddThis.com robot tech.support@clearspring.com
|
57
|
-
bot:
|
58
|
-
name: 'AddThis.com'
|
59
|
-
category: 'Social Media Agent'
|
60
|
-
url: ''
|
61
|
-
producer:
|
62
|
-
name: 'Clearspring Technologies, Inc.'
|
63
|
-
url: 'http://www.clearspring.com'
|
64
|
-
-
|
65
|
-
user_agent: Mozilla/5.0 (compatible; AhrefsBot/3.1; +http://ahrefs.com/robot/
|
66
|
-
bot:
|
67
|
-
name: 'aHrefs Bot'
|
68
|
-
category: 'Crawler'
|
69
|
-
url: 'http://ahrefs.com/robot'
|
70
|
-
producer:
|
71
|
-
name: 'Ahrefs Pte Ltd'
|
72
|
-
url: 'http://ahrefs.com/robot'
|
73
|
-
-
|
74
|
-
user_agent: Mozilla/5.0 (compatible; AhrefsBot/5.0; +http://ahrefs.com/robot/)
|
75
|
-
bot:
|
76
|
-
name: 'aHrefs Bot'
|
77
|
-
category: 'Crawler'
|
78
|
-
url: 'http://ahrefs.com/robot'
|
79
|
-
producer:
|
80
|
-
name: 'Ahrefs Pte Ltd'
|
81
|
-
url: 'http://ahrefs.com/robot'
|
82
|
-
-
|
83
|
-
user_agent: 'Mozilla/5.0 (compatible; AhrefsBot/5.0; +http://ahrefs.com/robot/) AppEngine-Google; (+http://code.google.com/appengine; appid: s~proxyfile1-hrd)'
|
84
|
-
bot:
|
85
|
-
name: 'aHrefs Bot'
|
86
|
-
category: 'Crawler'
|
87
|
-
url: 'http://ahrefs.com/robot'
|
88
|
-
producer:
|
89
|
-
name: 'Ahrefs Pte Ltd'
|
90
|
-
url: 'http://ahrefs.com/robot'
|
91
|
-
-
|
92
|
-
user_agent: AhrefsBot.Feeds v0.1; http://ahrefs.com/
|
93
|
-
bot:
|
94
|
-
name: 'aHrefs Bot'
|
95
|
-
category: 'Crawler'
|
96
|
-
url: 'http://ahrefs.com/robot'
|
97
|
-
producer:
|
98
|
-
name: 'Ahrefs Pte Ltd'
|
99
|
-
url: 'http://ahrefs.com/robot'
|
100
|
-
-
|
101
|
-
user_agent: ia_archiver (+http://www.alexa.com/site/help/webmasters; crawler@alexa.com)
|
102
|
-
bot:
|
103
|
-
name: 'Alexa Crawler'
|
104
|
-
category: 'Search bot'
|
105
|
-
url: 'https://alexa.zendesk.com/hc/en-us/sections/200100794-Crawlers'
|
106
|
-
producer:
|
107
|
-
name: 'Alexa Internet'
|
108
|
-
url: 'http://www.alexa.com'
|
109
|
-
-
|
110
|
-
user_agent: AmorankSpider/0.1; +http://amorank.com/webcrawler.html
|
111
|
-
bot:
|
112
|
-
name: 'Amorank Spider'
|
113
|
-
category: 'Crawler'
|
114
|
-
url: 'http://amorank.com/webcrawler.html'
|
115
|
-
producer:
|
116
|
-
name: 'Amorank'
|
117
|
-
url: 'http://www.amorank.com'
|
118
|
-
-
|
119
|
-
user_agent: Curious George - www.analyticsseo.com/crawler
|
120
|
-
bot:
|
121
|
-
name: 'Analytics SEO Crawler'
|
122
|
-
category: 'Crawler'
|
123
|
-
url: 'http://www.analyticsseo.com/crawler'
|
124
|
-
producer:
|
125
|
-
name: 'Analytics SEO'
|
126
|
-
url: 'http://www.analyticsseo.com'
|
127
|
-
-
|
128
|
-
user_agent: Mozilla/5.0 (compatible; special_archiver/3.1.1 +http://www.archive.org/details/archive.org_bot)
|
129
|
-
bot:
|
130
|
-
name: 'archive.org bot'
|
131
|
-
category: 'Crawler'
|
132
|
-
url: 'http://www.archive.org/details/archive.org_bot'
|
133
|
-
producer:
|
134
|
-
name: 'The Internet Archive'
|
135
|
-
url: 'http://www.archive.org'
|
136
|
-
-
|
137
|
-
user_agent: Mozilla/5.0 (compatible; special_archiver/3.2.0 +http://www.loc.gov/webarchiving/notice_to_webmasters.html)
|
138
|
-
bot:
|
139
|
-
name: 'archive.org bot'
|
140
|
-
category: 'Crawler'
|
141
|
-
url: 'http://www.archive.org/details/archive.org_bot'
|
142
|
-
producer:
|
143
|
-
name: 'The Internet Archive'
|
144
|
-
url: 'http://www.archive.org'
|
145
|
-
-
|
146
|
-
user_agent: Mozilla/5.0 (compatible; archive.org_bot; Wayback Machine Live Record; +http://archive.org/details/archive.org_bot)
|
147
|
-
bot:
|
148
|
-
name: 'archive.org bot'
|
149
|
-
category: 'Crawler'
|
150
|
-
url: 'http://www.archive.org/details/archive.org_bot'
|
151
|
-
producer:
|
152
|
-
name: 'The Internet Archive'
|
153
|
-
url: 'http://www.archive.org'
|
154
|
-
-
|
155
|
-
user_agent: Mozilla/5.0 (compatible; archive.org_bot/3.3.0 +http://pandora.nla.gov.au/crawl.html)
|
156
|
-
bot:
|
157
|
-
name: 'archive.org bot'
|
158
|
-
category: 'Crawler'
|
159
|
-
url: 'http://www.archive.org/details/archive.org_bot'
|
160
|
-
producer:
|
161
|
-
name: 'The Internet Archive'
|
162
|
-
url: 'http://www.archive.org'
|
163
|
-
-
|
164
|
-
user_agent: Mozilla/5.0 (compatible; archive.org_bot; Archive-It; +http://archive-it.org/files/site-owners.html)
|
165
|
-
bot:
|
166
|
-
name: 'archive.org bot'
|
167
|
-
category: 'Crawler'
|
168
|
-
url: 'http://www.archive.org/details/archive.org_bot'
|
169
|
-
producer:
|
170
|
-
name: 'The Internet Archive'
|
171
|
-
url: 'http://www.archive.org'
|
172
|
-
-
|
173
|
-
user_agent: Mozilla/5.0 (compatible; archive.org_bot +http://www.archive.org/details/archive.org_bot)
|
174
|
-
bot:
|
175
|
-
name: 'archive.org bot'
|
176
|
-
category: 'Crawler'
|
177
|
-
url: 'http://www.archive.org/details/archive.org_bot'
|
178
|
-
producer:
|
179
|
-
name: 'The Internet Archive'
|
180
|
-
url: 'http://www.archive.org'
|
181
|
-
-
|
182
|
-
user_agent: Mozilla/5.0 (compatible; heritrix/3.1.2-SNAPSHOT-20131029-0036 +http://archive.org/details/archive.org_bot)
|
183
|
-
bot:
|
184
|
-
name: 'archive.org bot'
|
185
|
-
category: 'Crawler'
|
186
|
-
url: 'http://www.archive.org/details/archive.org_bot'
|
187
|
-
producer:
|
188
|
-
name: 'The Internet Archive'
|
189
|
-
url: 'http://www.archive.org'
|
190
|
-
-
|
191
|
-
user_agent: Mozilla/2.0 (compatible; Ask Jeeves/Teoma)
|
192
|
-
bot:
|
193
|
-
name: 'Ask Jeeves'
|
194
|
-
category: 'Search bot'
|
195
|
-
url: ''
|
196
|
-
producer:
|
197
|
-
name: 'Ask Jeeves Inc.'
|
198
|
-
url: 'http://www.ask.com'
|
199
|
-
-
|
200
|
-
user_agent: Backlink-Ceck.de (+http://www.backlink-check.de/bot.html)
|
201
|
-
bot:
|
202
|
-
name: 'Backlink-Ceck.de'
|
203
|
-
category: 'Crawler'
|
204
|
-
url: 'http://www.backlink-check.de/bot.html'
|
205
|
-
producer:
|
206
|
-
name: 'Mediagreen Medienservice'
|
207
|
-
url: 'http://www.backlink-check.de'
|
208
|
-
-
|
209
|
-
user_agent: BacklinkCrawler (http://www.backlinktest.com/crawler.html)
|
210
|
-
bot:
|
211
|
-
name: 'BacklinkCrawler'
|
212
|
-
category: 'Crawler'
|
213
|
-
url: 'http://www.backlinktest.com/crawler.html'
|
214
|
-
producer:
|
215
|
-
name: '2.0Promotion GbR'
|
216
|
-
url: 'http://www.backlinktest.com'
|
217
|
-
-
|
218
|
-
user_agent: Mozilla/5.0 (compatible; Baiduspider/2.0; +http://www.baidu.com/search
|
219
|
-
bot:
|
220
|
-
name: 'Baidu Spider'
|
221
|
-
category: 'Search bot'
|
222
|
-
url: 'http://www.baidu.com/search/spider.htm'
|
223
|
-
producer:
|
224
|
-
name: 'Baidu'
|
225
|
-
url: 'http://www.baidu.com'
|
226
|
-
-
|
227
|
-
user_agent: Mozilla/5.0 (Linux;u;Android 2.3.7;zh-cn;) AppleWebKit/533.1 (KHTML,like Gecko) Version/4.0 Mobile Safari/533.1 (compatible; +http://www.baidu.com/search/spider.html)
|
228
|
-
bot:
|
229
|
-
name: 'Baidu Spider'
|
230
|
-
category: 'Search bot'
|
231
|
-
url: 'http://www.baidu.com/search/spider.htm'
|
232
|
-
producer:
|
233
|
-
name: 'Baidu'
|
234
|
-
url: 'http://www.baidu.com'
|
235
|
-
-
|
236
|
-
user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1; zh-CN; rv:1.9.2.8;baidu Transcoder) Gecko/20100722 Firefox/3.6.8 ( .NET CLR 3.5.30729)
|
237
|
-
bot:
|
238
|
-
name: 'Baidu Spider'
|
239
|
-
category: 'Search bot'
|
240
|
-
url: 'http://www.baidu.com/search/spider.htm'
|
241
|
-
producer:
|
242
|
-
name: 'Baidu'
|
243
|
-
url: 'http://www.baidu.com'
|
244
|
-
-
|
245
|
-
user_agent: Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.0; baidu Transcoder;)
|
246
|
-
bot:
|
247
|
-
name: 'Baidu Spider'
|
248
|
-
category: 'Search bot'
|
249
|
-
url: 'http://www.baidu.com/search/spider.htm'
|
250
|
-
producer:
|
251
|
-
name: 'Baidu'
|
252
|
-
url: 'http://www.baidu.com'
|
253
|
-
-
|
254
|
-
user_agent: Baiduspider-image+(+http://www.baidu.com/search/spider.htm)
|
255
|
-
bot:
|
256
|
-
name: 'Baidu Spider'
|
257
|
-
category: 'Search bot'
|
258
|
-
url: 'http://www.baidu.com/search/spider.htm'
|
259
|
-
producer:
|
260
|
-
name: 'Baidu'
|
261
|
-
url: 'http://www.baidu.com'
|
262
|
-
-
|
263
|
-
user_agent: Baiduspider+(+http://www.baidu.com/search/spider.htm)
|
264
|
-
bot:
|
265
|
-
name: 'Baidu Spider'
|
266
|
-
category: 'Search bot'
|
267
|
-
url: 'http://www.baidu.com/search/spider.htm'
|
268
|
-
producer:
|
269
|
-
name: 'Baidu'
|
270
|
-
url: 'http://www.baidu.com'
|
271
|
-
-
|
272
|
-
user_agent: Mozilla/5.0 (compatible; Baiduspider/2.0; +http://www.baidu.com/search/spider.html)
|
273
|
-
bot:
|
274
|
-
name: 'Baidu Spider'
|
275
|
-
category: 'Search bot'
|
276
|
-
url: 'http://www.baidu.com/search/spider.htm'
|
277
|
-
producer:
|
278
|
-
name: 'Baidu'
|
279
|
-
url: 'http://www.baidu.com'
|
280
|
-
-
|
281
|
-
user_agent: Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/534+ (KHTML, like Gecko) BingPreview/1.0b
|
282
|
-
bot:
|
283
|
-
name: 'BingBot'
|
284
|
-
category: 'Search bot'
|
285
|
-
url: 'http://search.msn.com/msnbot.htmn'
|
286
|
-
producer:
|
287
|
-
name: 'Microsoft Corporation'
|
288
|
-
url: 'http://www.microsoft.com'
|
289
|
-
-
|
290
|
-
user_agent: Mozilla/5.0 (compatible; bingbot/2.0; +http://www.bing.com/bingbot.htm)
|
291
|
-
bot:
|
292
|
-
name: 'BingBot'
|
293
|
-
category: 'Search bot'
|
294
|
-
url: 'http://search.msn.com/msnbot.htmn'
|
295
|
-
producer:
|
296
|
-
name: 'Microsoft Corporation'
|
297
|
-
url: 'http://www.microsoft.com'
|
298
|
-
-
|
299
|
-
user_agent: msnbot-media/1.1 (+http://search.msn.com/msnbot.htm)
|
300
|
-
bot:
|
301
|
-
name: 'BingBot'
|
302
|
-
category: 'Search bot'
|
303
|
-
url: 'http://search.msn.com/msnbot.htmn'
|
304
|
-
producer:
|
305
|
-
name: 'Microsoft Corporation'
|
306
|
-
url: 'http://www.microsoft.com'
|
307
|
-
-
|
308
|
-
user_agent: MSNBot/Nutch-1.5.1
|
309
|
-
bot:
|
310
|
-
name: 'BingBot'
|
311
|
-
category: 'Search bot'
|
312
|
-
url: 'http://search.msn.com/msnbot.htmn'
|
313
|
-
producer:
|
314
|
-
name: 'Microsoft Corporation'
|
315
|
-
url: 'http://www.microsoft.com'
|
316
|
-
-
|
317
|
-
user_agent: msnbot/2.0b v1394720947.6703
|
318
|
-
bot:
|
319
|
-
name: 'BingBot'
|
320
|
-
category: 'Search bot'
|
321
|
-
url: 'http://search.msn.com/msnbot.htmn'
|
322
|
-
producer:
|
323
|
-
name: 'Microsoft Corporation'
|
324
|
-
url: 'http://www.microsoft.com'
|
325
|
-
-
|
326
|
-
user_agent: msnbot/1.1 (+http://search.msn.com/msnbot.htm)
|
327
|
-
bot:
|
328
|
-
name: 'BingBot'
|
329
|
-
category: 'Search bot'
|
330
|
-
url: 'http://search.msn.com/msnbot.htmn'
|
331
|
-
producer:
|
332
|
-
name: 'Microsoft Corporation'
|
333
|
-
url: 'http://www.microsoft.com'
|
334
|
-
-
|
335
|
-
user_agent: msnbot/2.0b (+http://search.msn.com/msnbot.htm)
|
336
|
-
bot:
|
337
|
-
name: 'BingBot'
|
338
|
-
category: 'Search bot'
|
339
|
-
url: 'http://search.msn.com/msnbot.htmn'
|
340
|
-
producer:
|
341
|
-
name: 'Microsoft Corporation'
|
342
|
-
url: 'http://www.microsoft.com'
|
343
|
-
-
|
344
|
-
user_agent: msnbot-NewsBlogs/2.0b (+http://search.msn.com/msnbot.htm)
|
345
|
-
bot:
|
346
|
-
name: 'BingBot'
|
347
|
-
category: 'Search bot'
|
348
|
-
url: 'http://search.msn.com/msnbot.htmn'
|
349
|
-
producer:
|
350
|
-
name: 'Microsoft Corporation'
|
351
|
-
url: 'http://www.microsoft.com'
|
352
|
-
-
|
353
|
-
user_agent: Mozilla/5.0 (compatible; Blekkobot; ScoutJet; +http://blekko.com/about/blekkobot)
|
354
|
-
bot:
|
355
|
-
name: 'Blekkobot'
|
356
|
-
category: 'Search bot'
|
357
|
-
url: 'http://blekko.com/about/blekkobot'
|
358
|
-
producer:
|
359
|
-
name: 'Blekko'
|
360
|
-
url: 'http://blekko.com'
|
361
|
-
-
|
362
|
-
user_agent: Mozilla/5.0 (compatible; BLEXBot/1.0; +http://webmeup-crawler.com/)
|
363
|
-
bot:
|
364
|
-
name: 'BLEXBot Crawler'
|
365
|
-
category: 'Crawler'
|
366
|
-
url: 'http://webmeup-crawler.com'
|
367
|
-
producer:
|
368
|
-
name: 'WebMeUp'
|
369
|
-
url: 'http://webmeup.com'
|
370
|
-
-
|
371
|
-
user_agent: Bloglovin/1.0 (http://www.bloglovin.com; 1 subscribers)
|
372
|
-
bot:
|
373
|
-
name: 'Bloglovin'
|
374
|
-
url: 'http://www.bloglovin.com'
|
375
|
-
category: 'Feed Fetcher'
|
376
|
-
producer:
|
377
|
-
name: ''
|
378
|
-
url: ''
|
379
|
-
-
|
380
|
-
user_agent: Mozilla/5.0 (compatible; BountiiBot/1.1; +http://bountii.com/contact.php)
|
381
|
-
bot:
|
382
|
-
name: 'Bountii Bot'
|
383
|
-
category: 'Search bot'
|
384
|
-
url: 'http://bountii.com/contact.php'
|
385
|
-
producer:
|
386
|
-
name: 'Bountii Inc.'
|
387
|
-
url: 'http://bountii.com'
|
388
|
-
-
|
389
|
-
user_agent: Mozilla/5.0 (Macintosh; Butterfly/1.0; +http://labs.topsy.com/butterfly/) Gecko/2009032608 Firefox/3.0.8
|
390
|
-
bot:
|
391
|
-
name: 'Butterfly Robot'
|
392
|
-
category: 'Search bot'
|
393
|
-
url: 'http://labs.topsy.com/butterfly'
|
394
|
-
producer:
|
395
|
-
name: 'Topsy Labs'
|
396
|
-
url: 'http://labs.topsy.com'
|
397
|
-
-
|
398
|
-
user_agent: Mozilla/5.0 (compatible; Butterfly/1.0; +http://labs.topsy.com/butterfly/) Gecko/2009032608 Firefox/3.0.8
|
399
|
-
bot:
|
400
|
-
name: 'Butterfly Robot'
|
401
|
-
category: 'Search bot'
|
402
|
-
url: 'http://labs.topsy.com/butterfly'
|
403
|
-
producer:
|
404
|
-
name: 'Topsy Labs'
|
405
|
-
url: 'http://labs.topsy.com'
|
406
|
-
-
|
407
|
-
user_agent: Browsershots
|
408
|
-
bot:
|
409
|
-
name: 'Browsershots'
|
410
|
-
category: 'Service Agent'
|
411
|
-
url: 'http://browsershots.org/faq'
|
412
|
-
producer:
|
413
|
-
name: 'Browsershots.org'
|
414
|
-
url: 'http://browsershots.org'
|
415
|
-
-
|
416
|
-
user_agent: Mozilla/5.0 (compatible; CareerBot/1.1; +http://www.career-x.de/bot.html)
|
417
|
-
bot:
|
418
|
-
name: 'CareerBot'
|
419
|
-
category: 'Crawler'
|
420
|
-
url: 'http://www.career-x.de/bot.html'
|
421
|
-
producer:
|
422
|
-
name: 'career-x GmbH'
|
423
|
-
url: 'http://www.career-x.de'
|
424
|
-
-
|
425
|
-
user_agent: CCBot/2.0 (http://commoncrawl.org/faq/)
|
426
|
-
bot:
|
427
|
-
name: 'ccBot crawler'
|
428
|
-
category: 'Crawler'
|
429
|
-
url: 'http://commoncrawl.org/faq/'
|
430
|
-
producer:
|
431
|
-
name: 'reddit inc.'
|
432
|
-
url: 'http://www.reddit.com'
|
433
|
-
-
|
434
|
-
user_agent: Cliqzbot/0.1 (+http://cliqz.com/company/cliqzbot)
|
435
|
-
bot:
|
436
|
-
name: 'Cliqzbot'
|
437
|
-
category: 'Crawler'
|
438
|
-
url: 'http://cliqz.com/company/cliqzbot'
|
439
|
-
producer:
|
440
|
-
name: '10betterpages GmbH'
|
441
|
-
url: 'http://cliqz.com'
|
442
|
-
-
|
443
|
-
user_agent: CommaFeed/1.0 (http://www.commafeed.com)
|
444
|
-
bot:
|
445
|
-
name: 'CommaFeed'
|
446
|
-
url: 'http://www.commafeed.com'
|
447
|
-
category: 'Feed Fetcher'
|
448
|
-
producer:
|
449
|
-
name: ''
|
450
|
-
url: ''
|
451
|
-
-
|
452
|
-
user_agent: Mozilla/5.0 (compatible; Dazoobot/0.1; +http://dazoo.fr)
|
453
|
-
bot:
|
454
|
-
name: 'Dazoobot'
|
455
|
-
category: 'Search bot'
|
456
|
-
url: ''
|
457
|
-
producer:
|
458
|
-
name: 'DAZOO.FR'
|
459
|
-
url: 'http://dazoo.fr'
|
460
|
-
-
|
461
|
-
user_agent: Mozilla/5.0 (compatible; discobot/1.0; +http://discoveryengine.com/discobot.html)
|
462
|
-
bot:
|
463
|
-
name: 'Discobot'
|
464
|
-
category: 'Search bot'
|
465
|
-
url: 'http://discoveryengine.com/discobot.html'
|
466
|
-
producer:
|
467
|
-
name: 'Discovery Engine'
|
468
|
-
url: 'http://discoveryengine.com'
|
469
|
-
-
|
470
|
-
user_agent: dotbot
|
471
|
-
bot:
|
472
|
-
name: 'DotBot'
|
473
|
-
category: 'Crawler'
|
474
|
-
url: 'http://www.opensiteexplorer.org/dotbot'
|
475
|
-
producer:
|
476
|
-
name: 'SEOmoz, Inc.'
|
477
|
-
url: 'http://moz.com/'
|
478
|
-
-
|
479
|
-
user_agent: Mozilla/5.0 (compatible; EasouSpider; +http://www.easou.com/search/spider.html)
|
480
|
-
bot:
|
481
|
-
name: 'Easou Spider'
|
482
|
-
category: 'Search bot'
|
483
|
-
url: 'http://www.easou.com/search/spider.html'
|
484
|
-
producer:
|
485
|
-
name: 'easou ICP'
|
486
|
-
url: 'http://www.easou.com'
|
487
|
-
-
|
488
|
-
user_agent: Mozilla/5.0 (iPhone; U; CPU iPhone OS 3_0 like Mac OS X; en-us; EasouSpider; +http://www.easou.com/search/spider.html)
|
489
|
-
bot:
|
490
|
-
name: 'Easou Spider'
|
491
|
-
category: 'Search bot'
|
492
|
-
url: 'http://www.easou.com/search/spider.html'
|
493
|
-
producer:
|
494
|
-
name: 'easou ICP'
|
495
|
-
url: 'http://www.easou.com'
|
496
|
-
-
|
497
|
-
user_agent: EMail Exractor
|
498
|
-
bot:
|
499
|
-
name: 'EMail Exractor'
|
500
|
-
category: 'Crawler'
|
501
|
-
url: ''
|
502
|
-
producer:
|
503
|
-
name: ''
|
504
|
-
url: ''
|
505
|
-
-
|
506
|
-
user_agent: Mozilla/5.0 (compatible; Exabot/3.0; +http://www.exabot.com/go/robot)
|
507
|
-
bot:
|
508
|
-
name: 'ExaBot'
|
509
|
-
category: 'Crawler'
|
510
|
-
url: 'http://www.exabot.com/go/robot'
|
511
|
-
producer:
|
512
|
-
name: 'Dassault Systèmes'
|
513
|
-
url: 'http://www.3ds.com'
|
514
|
-
-
|
515
|
-
user_agent: Mozilla/5.0 (compatible; Exabot/3.0 (BiggerBetter); +http://www.exabot.com/go/robot)
|
516
|
-
bot:
|
517
|
-
name: 'ExaBot'
|
518
|
-
category: 'Crawler'
|
519
|
-
url: 'http://www.exabot.com/go/robot'
|
520
|
-
producer:
|
521
|
-
name: 'Dassault Systèmes'
|
522
|
-
url: 'http://www.3ds.com'
|
523
|
-
-
|
524
|
-
user_agent: Mozilla/5.0 (compatible; Konqueror/3.5; Linux) KHTML/3.5.5 (like Gecko) (Exabot-Thumbnails)
|
525
|
-
bot:
|
526
|
-
name: 'ExaBot'
|
527
|
-
category: 'Crawler'
|
528
|
-
url: 'http://www.exabot.com/go/robot'
|
529
|
-
producer:
|
530
|
-
name: 'Dassault Systèmes'
|
531
|
-
url: 'http://www.3ds.com'
|
532
|
-
-
|
533
|
-
user_agent: ExactSeek Crawler (nutch 1.4)/Nutch-1.4 (ExactSeek Crawler; http://www.exactseek.com)
|
534
|
-
bot:
|
535
|
-
name: 'ExactSeek Crawler'
|
536
|
-
category: 'Search bot'
|
537
|
-
url: 'http://www.exactseek.com'
|
538
|
-
producer:
|
539
|
-
name: 'Jayde Online, Inc.'
|
540
|
-
url: 'http://www.jaydeonlineinc.com'
|
541
|
-
-
|
542
|
-
user_agent: Mozilla/5.0 (compatible; Ezooms/1.0; help@moz.com)
|
543
|
-
bot:
|
544
|
-
name: 'Ezooms'
|
545
|
-
category: 'Crawler'
|
546
|
-
url: ''
|
547
|
-
producer:
|
548
|
-
name: 'SEOmoz, Inc.'
|
549
|
-
url: 'http://moz.com/'
|
550
|
-
-
|
551
|
-
user_agent: facebookexternalhit/1.1 (+http://www.facebook.com/externalhit_uatext.php)
|
552
|
-
bot:
|
553
|
-
name: 'Facebook External Hit'
|
554
|
-
category: 'Social Media Agent'
|
555
|
-
url: 'https://www.facebook.com/externalhit_uatext.php'
|
556
|
-
producer:
|
557
|
-
name: 'Facebook'
|
558
|
-
url: 'http://www.facebook.com'
|
559
|
-
-
|
560
|
-
user_agent: facebookplatform/1.0 (+http://developers.facebook.com)
|
561
|
-
bot:
|
562
|
-
name: 'Facebook External Hit'
|
563
|
-
category: 'Social Media Agent'
|
564
|
-
url: 'https://www.facebook.com/externalhit_uatext.php'
|
565
|
-
producer:
|
566
|
-
name: 'Facebook'
|
567
|
-
url: 'http://www.facebook.com'
|
568
|
-
-
|
569
|
-
user_agent: Feedbin - 9 subscribers
|
570
|
-
bot:
|
571
|
-
name: 'Feedbin'
|
572
|
-
url: 'http://feedbin.com/'
|
573
|
-
category: 'Feed Fetcher'
|
574
|
-
producer:
|
575
|
-
name: ''
|
576
|
-
url: ''
|
577
|
-
-
|
578
|
-
user_agent: FeedBurner/1.0 (http://www.FeedBurner.com)
|
579
|
-
bot:
|
580
|
-
name: 'FeedBurner'
|
581
|
-
url: 'http://www.feedburner.com'
|
582
|
-
category: 'Feed Fetcher'
|
583
|
-
producer:
|
584
|
-
name: ''
|
585
|
-
url: ''
|
586
|
-
-
|
587
|
-
user_agent: Feedly/1.0 (+http://www.feedly.com/fetcher.html; like FeedFetcher-Google)
|
588
|
-
bot:
|
589
|
-
name: 'Feedly'
|
590
|
-
url: 'http://www.feedly.com'
|
591
|
-
category: 'Feed Fetcher'
|
592
|
-
producer:
|
593
|
-
name: ''
|
594
|
-
url: ''
|
595
|
-
-
|
596
|
-
user_agent: FeedlyBot/1.0 (http://feedly.com)
|
597
|
-
bot:
|
598
|
-
name: 'Feedly'
|
599
|
-
url: 'http://www.feedly.com'
|
600
|
-
category: 'Feed Fetcher'
|
601
|
-
producer:
|
602
|
-
name: ''
|
603
|
-
url: ''
|
604
|
-
-
|
605
|
-
user_agent: FeedlyApp/1.0 (http://www.feedly.com)
|
606
|
-
bot:
|
607
|
-
name: 'Feedly'
|
608
|
-
url: 'http://www.feedly.com'
|
609
|
-
category: 'Feed Fetcher'
|
610
|
-
producer:
|
611
|
-
name: ''
|
612
|
-
url: ''
|
613
|
-
-
|
614
|
-
user_agent: MetaFeedly/1.0 (http://www.feedly.com)
|
615
|
-
bot:
|
616
|
-
name: 'Feedly'
|
617
|
-
url: 'http://www.feedly.com'
|
618
|
-
category: 'Feed Fetcher'
|
619
|
-
producer:
|
620
|
-
name: ''
|
621
|
-
url: ''
|
622
|
-
-
|
623
|
-
user_agent: Feedspot http://www.feedspot.com
|
624
|
-
bot:
|
625
|
-
name: 'Feedspot'
|
626
|
-
url: 'http://www.feedspot.com'
|
627
|
-
category: 'Feed Fetcher'
|
628
|
-
producer:
|
629
|
-
name: ''
|
630
|
-
url: ''
|
631
|
-
-
|
632
|
-
user_agent: Fever/1.38 (Feed Parser; http://feedafever.com; Allow like Gecko)
|
633
|
-
bot:
|
634
|
-
name: 'Fever'
|
635
|
-
url: 'http://feedafever.com/'
|
636
|
-
category: 'Feed Fetcher'
|
637
|
-
producer:
|
638
|
-
name: ''
|
639
|
-
url: ''
|
640
|
-
-
|
641
|
-
user_agent: Mozilla/5.0 (compatible; Genieo/1.0 http://www.genieo.com/webfilter.html)
|
642
|
-
bot:
|
643
|
-
name: 'Genieo Web filter'
|
644
|
-
category: ''
|
645
|
-
url: 'http://www.genieo.com/webfilter.html'
|
646
|
-
producer:
|
647
|
-
name: 'Genieo'
|
648
|
-
url: 'http://www.genieo.com'
|
649
|
-
-
|
650
|
-
user_agent: DoCoMo/2.0 P900i(c100;TB;W24H11) (compatible; ichiro/mobile goo; +http://search.goo.ne.jp/option/use/sub4/sub4-1/)
|
651
|
-
bot:
|
652
|
-
name: 'Goo'
|
653
|
-
category: 'Search bot'
|
654
|
-
url: 'http://search.goo.ne.jp/option/use/sub4/sub4-1'
|
655
|
-
producer:
|
656
|
-
name: 'NTT Resonant'
|
657
|
-
url: 'http://goo.ne.jp'
|
658
|
-
-
|
659
|
-
user_agent: Googlebot/2.1 (http://www.googlebot.com/bot.html)
|
660
|
-
bot:
|
661
|
-
name: 'Googlebot'
|
662
|
-
category: 'Search bot'
|
663
|
-
url: 'http://www.google.com/bot.html'
|
664
|
-
producer:
|
665
|
-
name: 'Google Inc.'
|
666
|
-
url: 'http://www.google.com'
|
667
|
-
-
|
668
|
-
user_agent: Googlebot/Nutch-1.7
|
669
|
-
bot:
|
670
|
-
name: 'Googlebot'
|
671
|
-
category: 'Search bot'
|
672
|
-
url: 'http://www.google.com/bot.html'
|
673
|
-
producer:
|
674
|
-
name: 'Google Inc.'
|
675
|
-
url: 'http://www.google.com'
|
676
|
-
-
|
677
|
-
user_agent: Mozilla/5.0 AppleWebKit/537.36 (KHTML, like Gecko; compatible; Googlebot/2.1; +http://www.google.com/bot.html) Safari/537.36
|
678
|
-
bot:
|
679
|
-
name: 'Googlebot'
|
680
|
-
category: 'Search bot'
|
681
|
-
url: 'http://www.google.com/bot.html'
|
682
|
-
producer:
|
683
|
-
name: 'Google Inc.'
|
684
|
-
url: 'http://www.google.com'
|
685
|
-
-
|
686
|
-
user_agent: Mozilla/5.0 (compatible; Googlebot/2.1; +http://www.google.com/bot.html)
|
687
|
-
bot:
|
688
|
-
name: 'Googlebot'
|
689
|
-
category: 'Search bot'
|
690
|
-
url: 'http://www.google.com/bot.html'
|
691
|
-
producer:
|
692
|
-
name: 'Google Inc.'
|
693
|
-
url: 'http://www.google.com'
|
694
|
-
-
|
695
|
-
user_agent: Mozilla/5.0 (iPhone; CPU iPhone OS 6_0 like Mac OS X) AppleWebKit/536.26 (KHTML, like Gecko) Version/6.0 Mobile/10A5376e Safari/8536.25 (compatible; Googlebot-Mobile/2.1; +http://www.google.com/bot.html)
|
696
|
-
bot:
|
697
|
-
name: 'Googlebot'
|
698
|
-
category: 'Search bot'
|
699
|
-
url: 'http://www.google.com/bot.html'
|
700
|
-
producer:
|
701
|
-
name: 'Google Inc.'
|
702
|
-
url: 'http://www.google.com'
|
703
|
-
-
|
704
|
-
user_agent: Googlebot-Image/1.0
|
705
|
-
bot:
|
706
|
-
name: 'Googlebot'
|
707
|
-
category: 'Search bot'
|
708
|
-
url: 'http://www.google.com/bot.html'
|
709
|
-
producer:
|
710
|
-
name: 'Google Inc.'
|
711
|
-
url: 'http://www.google.com'
|
712
|
-
-
|
713
|
-
user_agent: Googlebot (gocrawl v0.4)
|
714
|
-
bot:
|
715
|
-
name: 'Googlebot'
|
716
|
-
category: 'Search bot'
|
717
|
-
url: 'http://www.google.com/bot.html'
|
718
|
-
producer:
|
719
|
-
name: 'Google Inc.'
|
720
|
-
url: 'http://www.google.com'
|
721
|
-
-
|
722
|
-
user_agent: Googlebot-News (2.3.3, ruby 1.9.3 (2013-11-22))
|
723
|
-
bot:
|
724
|
-
name: 'Googlebot'
|
725
|
-
category: 'Search bot'
|
726
|
-
url: 'http://www.google.com/bot.html'
|
727
|
-
producer:
|
728
|
-
name: 'Google Inc.'
|
729
|
-
url: 'http://www.google.com'
|
730
|
-
-
|
731
|
-
user_agent: DoCoMo/2.0 N905i(c100;TB;W24H16) (compatible; Googlebot-Mobile/2.1; +http://www.google.com/bot.html)
|
732
|
-
bot:
|
733
|
-
name: 'Googlebot'
|
734
|
-
category: 'Search bot'
|
735
|
-
url: 'http://www.google.com/bot.html'
|
736
|
-
producer:
|
737
|
-
name: 'Google Inc.'
|
738
|
-
url: 'http://www.google.com'
|
739
|
-
-
|
740
|
-
user_agent: SAMSUNG-SGH-E250/1.0 Profile/MIDP-2.0 Configuration/CLDC-1.1 UP.Browser/6.2.3.3.c.1.101 (GUI) MMP/2.0 (compatible; Googlebot-Mobile/2.1; +http://www.google.com/bot.html)
|
741
|
-
bot:
|
742
|
-
name: 'Googlebot'
|
743
|
-
category: 'Search bot'
|
744
|
-
url: 'http://www.google.com/bot.html'
|
745
|
-
producer:
|
746
|
-
name: 'Google Inc.'
|
747
|
-
url: 'http://www.google.com'
|
748
|
-
-
|
749
|
-
user_agent: Mozilla/5.0 (compatible) Feedfetcher-Google;(+http://www.google.com/feedfetcher.html)
|
750
|
-
bot:
|
751
|
-
name: 'Googlebot'
|
752
|
-
category: 'Search bot'
|
753
|
-
url: 'http://www.google.com/bot.html'
|
754
|
-
producer:
|
755
|
-
name: 'Google Inc.'
|
756
|
-
url: 'http://www.google.com'
|
757
|
-
-
|
758
|
-
user_agent: Feedfetcher-Google; (+http://www.google.com/feedfetcher.html; 2 subscribers; feed-id=17860707833818568603)
|
759
|
-
bot:
|
760
|
-
name: 'Googlebot'
|
761
|
-
category: 'Search bot'
|
762
|
-
url: 'http://www.google.com/bot.html'
|
763
|
-
producer:
|
764
|
-
name: 'Google Inc.'
|
765
|
-
url: 'http://www.google.com'
|
766
|
-
-
|
767
|
-
user_agent: Feedfetcher-Google; (+http://www.google.com/feedfetcher.html; 19 subscribers; feed-id=13965549748850348809)
|
768
|
-
bot:
|
769
|
-
name: 'Googlebot'
|
770
|
-
category: 'Search bot'
|
771
|
-
url: 'http://www.google.com/bot.html'
|
772
|
-
producer:
|
773
|
-
name: 'Google Inc.'
|
774
|
-
url: 'http://www.google.com'
|
775
|
-
-
|
776
|
-
user_agent: Feedfetcher-Google; (+http://www.google.com/feedfetcher.html; 375 subscribers; feed-id=15381863289700640853)
|
777
|
-
bot:
|
778
|
-
name: 'Googlebot'
|
779
|
-
category: 'Search bot'
|
780
|
-
url: 'http://www.google.com/bot.html'
|
781
|
-
producer:
|
782
|
-
name: 'Google Inc.'
|
783
|
-
url: 'http://www.google.com'
|
784
|
-
-
|
785
|
-
user_agent: Mozilla/5.0 (Windows NT 6.1; rv:6.0) Gecko/20110814 Firefox/6.0 Google (+https://developers.google.com/+/web/snippet/)
|
786
|
-
bot:
|
787
|
-
name: 'Googlebot'
|
788
|
-
category: 'Search bot'
|
789
|
-
url: 'http://www.google.com/bot.html'
|
790
|
-
producer:
|
791
|
-
name: 'Google Inc.'
|
792
|
-
url: 'http://www.google.com'
|
793
|
-
-
|
794
|
-
user_agent: GoogleProducer; (+http://goo.gl/7y4SX)
|
795
|
-
bot:
|
796
|
-
name: 'Googlebot'
|
797
|
-
category: 'Search bot'
|
798
|
-
url: 'http://www.google.com/bot.html'
|
799
|
-
producer:
|
800
|
-
name: 'Google Inc.'
|
801
|
-
url: 'http://www.google.com'
|
802
|
-
-
|
803
|
-
user_agent: Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko; Google Web Preview) Chrome/27.0.1453 Safari/537.36
|
804
|
-
bot:
|
805
|
-
name: 'Googlebot'
|
806
|
-
category: 'Search bot'
|
807
|
-
url: 'http://www.google.com/bot.html'
|
808
|
-
producer:
|
809
|
-
name: 'Google Inc.'
|
810
|
-
url: 'http://www.google.com'
|
811
|
-
-
|
812
|
-
user_agent: AdsBot-Google-Mobile (+http://www.google.com/mobile/adsbot.html) Mozilla (iPhone; U; CPU iPhone OS 3 0 like Mac OS X) AppleWebKit (KHTML, like Gecko) Mobile Safari
|
813
|
-
bot:
|
814
|
-
name: 'Googlebot'
|
815
|
-
category: 'Search bot'
|
816
|
-
url: 'http://www.google.com/bot.html'
|
817
|
-
producer:
|
818
|
-
name: 'Google Inc.'
|
819
|
-
url: 'http://www.google.com'
|
820
|
-
-
|
821
|
-
user_agent: AdsBot-Google (+http://www.google.com/adsbot.html)
|
822
|
-
bot:
|
823
|
-
name: 'Googlebot'
|
824
|
-
category: 'Search bot'
|
825
|
-
url: 'http://www.google.com/bot.html'
|
826
|
-
producer:
|
827
|
-
name: 'Google Inc.'
|
828
|
-
url: 'http://www.google.com'
|
829
|
-
-
|
830
|
-
user_agent: Mediapartners-Google
|
831
|
-
bot:
|
832
|
-
name: 'Googlebot'
|
833
|
-
category: 'Search bot'
|
834
|
-
url: 'http://www.google.com/bot.html'
|
835
|
-
producer:
|
836
|
-
name: 'Google Inc.'
|
837
|
-
url: 'http://www.google.com'
|
838
|
-
-
|
839
|
-
user_agent: Mozilla/5.0 (compatible; heritrix/1.14.4 +http://www.dla-marbach.de)
|
840
|
-
bot:
|
841
|
-
name: 'Heritrix'
|
842
|
-
category: 'Crawler'
|
843
|
-
url: 'https://webarchive.jira.com/wiki/display/Heritrix/Heritrix'
|
844
|
-
producer:
|
845
|
-
name: 'The Internet Archive'
|
846
|
-
url: 'http://www.archive.org'
|
847
|
-
-
|
848
|
-
user_agent: Mozilla/5.0 (compatible; worio bot heritrix/1.10.0 +http://worio.com)
|
849
|
-
bot:
|
850
|
-
name: 'Heritrix'
|
851
|
-
category: 'Crawler'
|
852
|
-
url: 'https://webarchive.jira.com/wiki/display/Heritrix/Heritrix'
|
853
|
-
producer:
|
854
|
-
name: 'The Internet Archive'
|
855
|
-
url: 'http://www.archive.org'
|
856
|
-
-
|
857
|
-
user_agent: Mozilla/5.0 (compatible; heritrix/3.1.1 +http://www.baidu.com)
|
858
|
-
bot:
|
859
|
-
name: 'Heritrix'
|
860
|
-
category: 'Crawler'
|
861
|
-
url: 'https://webarchive.jira.com/wiki/display/Heritrix/Heritrix'
|
862
|
-
producer:
|
863
|
-
name: 'The Internet Archive'
|
864
|
-
url: 'http://www.archive.org'
|
865
|
-
-
|
866
|
-
user_agent: flieder - neofonie heritrix/1.14.3 (+http://spider.neofonie.de)
|
867
|
-
bot:
|
868
|
-
name: 'Heritrix'
|
869
|
-
category: 'Crawler'
|
870
|
-
url: 'https://webarchive.jira.com/wiki/display/Heritrix/Heritrix'
|
871
|
-
producer:
|
872
|
-
name: 'The Internet Archive'
|
873
|
-
url: 'http://www.archive.org'
|
874
|
-
-
|
875
|
-
user_agent: mozilla/5.0 (compatible; heritrix/1.3.0 http://archive.crawler.org)
|
876
|
-
bot:
|
877
|
-
name: 'Heritrix'
|
878
|
-
category: 'Crawler'
|
879
|
-
url: 'https://webarchive.jira.com/wiki/display/Heritrix/Heritrix'
|
880
|
-
producer:
|
881
|
-
name: 'The Internet Archive'
|
882
|
-
url: 'http://www.archive.org'
|
883
|
-
-
|
884
|
-
user_agent: Mozilla/5.0 (compatible; heritrix/3.1.2-SNAPSHOT-20130207.001528 +http://webarchiv.cz/kontakty/)
|
885
|
-
bot:
|
886
|
-
name: 'Heritrix'
|
887
|
-
category: 'Crawler'
|
888
|
-
url: 'https://webarchive.jira.com/wiki/display/Heritrix/Heritrix'
|
889
|
-
producer:
|
890
|
-
name: 'The Internet Archive'
|
891
|
-
url: 'http://www.archive.org'
|
892
|
-
-
|
893
|
-
user_agent: Mozilla/5.0 (compatible; heritrix/1.14.4 +http://webarhive.nlc.gov.cn)
|
894
|
-
bot:
|
895
|
-
name: 'Heritrix'
|
896
|
-
category: 'Crawler'
|
897
|
-
url: 'https://webarchive.jira.com/wiki/display/Heritrix/Heritrix'
|
898
|
-
producer:
|
899
|
-
name: 'The Internet Archive'
|
900
|
-
url: 'http://www.archive.org'
|
901
|
-
-
|
902
|
-
user_agent: Mozilla/5.0 (compatible; heritrix/3.1.1 +http://www.run4dom.com)
|
903
|
-
bot:
|
904
|
-
name: 'Heritrix'
|
905
|
-
category: 'Crawler'
|
906
|
-
url: 'https://webarchive.jira.com/wiki/display/Heritrix/Heritrix'
|
907
|
-
producer:
|
908
|
-
name: 'The Internet Archive'
|
909
|
-
url: 'http://www.archive.org'
|
910
|
-
-
|
911
|
-
user_agent: HTTPMon/1.0b (http://www.httpmon.com)
|
912
|
-
bot:
|
913
|
-
name: 'HTTPMon'
|
914
|
-
category: 'Site Monitor'
|
915
|
-
url: 'http://www.httpmon.com'
|
916
|
-
producer:
|
917
|
-
name: 'towards GmbH'
|
918
|
-
url: 'http://www.towards.ch/'
|
919
|
-
-
|
920
|
-
user_agent: iisbot/1.0 (+http://www.iis.net/iisbot.html)
|
921
|
-
bot:
|
922
|
-
name: 'IIS Site Analysis'
|
923
|
-
category: 'crawler'
|
924
|
-
url: 'http://www.iis.net/iisbot.html'
|
925
|
-
producer:
|
926
|
-
name: 'Microsoft Corporation'
|
927
|
-
url: 'http://www.microsoft.com'
|
928
|
-
-
|
929
|
-
user_agent: kouio.com RSS reader
|
930
|
-
bot:
|
931
|
-
name: 'Kouio'
|
932
|
-
url: 'http://kouio.com/'
|
933
|
-
category: 'Feed Fetcher'
|
934
|
-
producer:
|
935
|
-
name: ''
|
936
|
-
url: ''
|
937
|
-
-
|
938
|
-
user_agent: kouio.com RSS reader - 6 subscribers
|
939
|
-
bot:
|
940
|
-
name: 'Kouio'
|
941
|
-
url: 'http://kouio.com/'
|
942
|
-
category: 'Feed Fetcher'
|
943
|
-
producer:
|
944
|
-
name: ''
|
945
|
-
url: ''
|
946
|
-
-
|
947
|
-
user_agent: Mozilla/5.0 (iPhone; U; CPU iPhone OS 4_1 like Mac OS X; en-us) AppleWebKit/532.9 (KHTML, like Gecko) Version/4.0.5 Mobile/8B117 Safari/6531.22.7 (compatible; linkdexbot-mobile/2.1; +http://www.linkdex.com/about/bots/)
|
948
|
-
bot:
|
949
|
-
name: 'Linkdex Bot'
|
950
|
-
category: 'Search bot'
|
951
|
-
url: 'http://www.linkdex.com/bots'
|
952
|
-
producer:
|
953
|
-
name: 'Mojeek Ltd.'
|
954
|
-
url: 'http://www.mojeek.com'
|
955
|
-
-
|
956
|
-
user_agent: Mozilla/5.0 (compatible; linkdexbot/2.0; +http://www.linkdex.com/about/bots/)
|
957
|
-
bot:
|
958
|
-
name: 'Linkdex Bot'
|
959
|
-
category: 'Search bot'
|
960
|
-
url: 'http://www.linkdex.com/bots'
|
961
|
-
producer:
|
962
|
-
name: 'Mojeek Ltd.'
|
963
|
-
url: 'http://www.mojeek.com'
|
964
|
-
-
|
965
|
-
user_agent: linkdex.com/v2.0 and linkdex.com/v2.1
|
966
|
-
bot:
|
967
|
-
name: 'Linkdex Bot'
|
968
|
-
category: 'Search bot'
|
969
|
-
url: 'http://www.linkdex.com/bots'
|
970
|
-
producer:
|
971
|
-
name: 'Mojeek Ltd.'
|
972
|
-
url: 'http://www.mojeek.com'
|
973
|
-
-
|
974
|
-
user_agent: LinkedInBot/1.0 (compatible; Mozilla/5.0; Jakarta Commons-HttpClient/3.1 +http://www.linkedin.com)
|
975
|
-
bot:
|
976
|
-
name: 'LinkedIn Bot'
|
977
|
-
category: 'Social Media Agent'
|
978
|
-
url: 'http://www.linkedin.com'
|
979
|
-
producer:
|
980
|
-
name: 'LinkedIn'
|
981
|
-
url: 'http://www.linkedin.com'
|
982
|
-
-
|
983
|
-
user_agent: Mozilla/5.0 (compatible; Linux x86_64; Mail.RU_Bot/2.0; +http://go.mail.ru/help/robots)
|
984
|
-
bot:
|
985
|
-
name: 'Mail.Ru Bot'
|
986
|
-
category: 'Search bot'
|
987
|
-
url: 'http://help.mail.ru/webmaster/indexing/robots/types_robots'
|
988
|
-
producer:
|
989
|
-
name: 'Mail.Ru Group'
|
990
|
-
url: 'http://corp.mail.ru'
|
991
|
-
-
|
992
|
-
user_agent: Mozilla/5.0 (compatible; Linux x86_64; Mail.RU_Bot/Fast/2.0; +http://go.mail.ru/help/robots)
|
993
|
-
bot:
|
994
|
-
name: 'Mail.Ru Bot'
|
995
|
-
category: 'Search bot'
|
996
|
-
url: 'http://help.mail.ru/webmaster/indexing/robots/types_robots'
|
997
|
-
producer:
|
998
|
-
name: 'Mail.Ru Group'
|
999
|
-
url: 'http://corp.mail.ru'
|
1000
|
-
-
|
1001
|
-
user_agent: magpie-crawler/1.1 (U; Linux amd64; en-GB; +http://www.brandwatch.net)
|
1002
|
-
bot:
|
1003
|
-
name: 'Magpie-Crawler'
|
1004
|
-
category: 'Social Media Agent'
|
1005
|
-
url: 'http://www.brandwatch.com/magpie-crawler/'
|
1006
|
-
producer:
|
1007
|
-
name: 'Brandwatch'
|
1008
|
-
url: 'http://www.brandwatch.com'
|
1009
|
-
-
|
1010
|
-
user_agent: MagpieRSS/0.72 (+http://magpierss.sf.net)
|
1011
|
-
bot:
|
1012
|
-
name: 'MagpieRSS'
|
1013
|
-
url: 'http://magpierss.sourceforge.net/'
|
1014
|
-
category: 'Feed Parser'
|
1015
|
-
producer:
|
1016
|
-
name: ''
|
1017
|
-
url: ''
|
1018
|
-
-
|
1019
|
-
user_agent: Mozilla/5.0 (compatible; meanpathbot/1.0; +http://www.meanpath.com/meanpathbot.html)
|
1020
|
-
bot:
|
1021
|
-
name: 'Meanpath Bot'
|
1022
|
-
category: 'Search bot'
|
1023
|
-
url: 'http://www.meanpath.com/meanpathbot.html'
|
1024
|
-
producer:
|
1025
|
-
name: 'Meanpath'
|
1026
|
-
url: 'http://www.meanpath.com'
|
1027
|
-
-
|
1028
|
-
user_agent: Mozilla/5.0 (compatible; MixrankBot; crawler@mixrank.com)
|
1029
|
-
bot:
|
1030
|
-
name: 'Mixrank Bot'
|
1031
|
-
category: 'Crawler'
|
1032
|
-
url: 'http://mixrank.com'
|
1033
|
-
producer:
|
1034
|
-
name: 'Online Media Group, Inc.'
|
1035
|
-
url: ''
|
1036
|
-
-
|
1037
|
-
user_agent: Mozilla/5.0 (compatible; MJ12bot/v1.4.4; http://www.majestic12.co.uk/bot.php?+)
|
1038
|
-
bot:
|
1039
|
-
name: 'MJ12 Bot'
|
1040
|
-
category: 'Search bot'
|
1041
|
-
url: 'http://majestic12.co.uk/bot.php'
|
1042
|
-
producer:
|
1043
|
-
name: 'Majestic-12'
|
1044
|
-
url: 'http://majestic12.co.uk'
|
1045
|
-
-
|
1046
|
-
user_agent: Mozilla/5.0 (compatible; MojeekBot/0.6; http://www.mojeek.com/bot.html)
|
1047
|
-
bot:
|
1048
|
-
name: 'MojeekBot'
|
1049
|
-
category: 'Search bot'
|
1050
|
-
url: 'http://www.mojeek.com/bot.html'
|
1051
|
-
producer:
|
1052
|
-
name: 'Mojeek Ltd.'
|
1053
|
-
url: 'http://www.mojeek.com'
|
1054
|
-
-
|
1055
|
-
user_agent: NalezenCzBot/1.0 (http://www.nalezen.cz/about-crawler)
|
1056
|
-
bot:
|
1057
|
-
name: 'NalezenCzBot'
|
1058
|
-
category: 'Crawler'
|
1059
|
-
url: 'http://www.nalezen.cz/about-crawler'
|
1060
|
-
producer:
|
1061
|
-
name: 'Jaroslav Kuboš'
|
1062
|
-
url: ''
|
1063
|
-
-
|
1064
|
-
user_agent: Mozilla/4.0 (compatible; Netcraft Web Server Survey)
|
1065
|
-
bot:
|
1066
|
-
name: 'Netcraft Survey Bot'
|
1067
|
-
category: 'Search bot'
|
1068
|
-
url: ''
|
1069
|
-
producer:
|
1070
|
-
name: 'Netcraft'
|
1071
|
-
url: 'http://www.netcraft.com'
|
1072
|
-
-
|
1073
|
-
user_agent: Netvibes (http://www.netvibes.com)
|
1074
|
-
bot:
|
1075
|
-
name: 'Netvibes'
|
1076
|
-
url: 'http://www.netvibes.com/'
|
1077
|
-
category: 'Feed Fetcher'
|
1078
|
-
producer:
|
1079
|
-
name: ''
|
1080
|
-
url: ''
|
1081
|
-
-
|
1082
|
-
user_agent: 'Netvibes (http://www.netvibes.com/; 8 subscribers; feedID: 2244192)'
|
1083
|
-
bot:
|
1084
|
-
name: 'Netvibes'
|
1085
|
-
url: 'http://www.netvibes.com/'
|
1086
|
-
category: 'Feed Fetcher'
|
1087
|
-
producer:
|
1088
|
-
name: ''
|
1089
|
-
url: ''
|
1090
|
-
-
|
1091
|
-
user_agent: NewsBlur Feed Fetcher - 7 subscribers - http://www.newsblur.com/site/1948420/analytics-piwik (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)
|
1092
|
-
bot:
|
1093
|
-
name: 'NewsBlur'
|
1094
|
-
url: 'http://www.newsblur.com'
|
1095
|
-
category: 'Feed Fetcher'
|
1096
|
-
producer:
|
1097
|
-
name: ''
|
1098
|
-
url: ''
|
1099
|
-
-
|
1100
|
-
user_agent: NewsBlur Feed Finder (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)
|
1101
|
-
bot:
|
1102
|
-
name: 'NewsBlur'
|
1103
|
-
url: 'http://www.newsblur.com'
|
1104
|
-
category: 'Feed Fetcher'
|
1105
|
-
producer:
|
1106
|
-
name: ''
|
1107
|
-
url: ''
|
1108
|
-
-
|
1109
|
-
user_agent: NewsBlur Page Fetcher - 7 subscribers - http://www.newsblur.com/site/3966817/analytics-piwik (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)
|
1110
|
-
bot:
|
1111
|
-
name: 'NewsBlur'
|
1112
|
-
url: 'http://www.newsblur.com'
|
1113
|
-
category: 'Feed Fetcher'
|
1114
|
-
producer:
|
1115
|
-
name: ''
|
1116
|
-
url: ''
|
1117
|
-
-
|
1118
|
-
user_agent: NewsBlur Favicon Fetcher - 7 subscribers - http://www.newsblur.com/site/1948420/analytics-piwik (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)
|
1119
|
-
bot:
|
1120
|
-
name: 'NewsBlur'
|
1121
|
-
url: 'http://www.newsblur.com'
|
1122
|
-
category: 'Feed Fetcher'
|
1123
|
-
producer:
|
1124
|
-
name: ''
|
1125
|
-
url: ''
|
1126
|
-
-
|
1127
|
-
user_agent: NewsGatorOnline/2.0 (http://www.newsgator.com; 2 subscribers)
|
1128
|
-
bot:
|
1129
|
-
name: NewsGator
|
1130
|
-
url: 'http://www.newsgator.com'
|
1131
|
-
category: 'Feed Fetcher'
|
1132
|
-
producer:
|
1133
|
-
name: ''
|
1134
|
-
url: ''
|
1135
|
-
-
|
1136
|
-
user_agent: nlcrawler/1.0 (+http://northernlight.com/)
|
1137
|
-
bot:
|
1138
|
-
name: 'NLCrawler'
|
1139
|
-
category: 'Crawler'
|
1140
|
-
url: ''
|
1141
|
-
producer:
|
1142
|
-
name: 'Northern Light'
|
1143
|
-
url: 'http://northernlight.com'
|
1144
|
-
-
|
1145
|
-
user_agent: omgilibot/0.3 +http://www.omgili.com/Crawler.html
|
1146
|
-
bot:
|
1147
|
-
name: 'Omgili bot'
|
1148
|
-
category: 'Search bot'
|
1149
|
-
url: 'http://www.omgili.com/Crawler.html'
|
1150
|
-
producer:
|
1151
|
-
name: 'Omgili'
|
1152
|
-
url: 'http://www.omgili.com'
|
1153
|
-
-
|
1154
|
-
user_agent: Mozilla/5.0 (compatible; OpenindexSpider; +http://www.openindex.io/en/webmasters/spider.html)
|
1155
|
-
bot:
|
1156
|
-
name: 'Openindex Spider'
|
1157
|
-
category: 'Search bot'
|
1158
|
-
url: 'http://www.openindex.io/en/webmasters/spider.html'
|
1159
|
-
producer:
|
1160
|
-
name: 'Openindex B.V.'
|
1161
|
-
url: 'http://www.openindex.io'
|
1162
|
-
-
|
1163
|
-
user_agent: Mozilla/5.0 (compatible; spbot/4.0.9; +http://OpenLinkProfiler.org/bot )
|
1164
|
-
bot:
|
1165
|
-
name: 'OpenLinkProfiler'
|
1166
|
-
category: 'Crawler'
|
1167
|
-
url: 'http://openlinkprofiler.org/bot'
|
1168
|
-
producer:
|
1169
|
-
name: 'Axandra GmbH'
|
1170
|
-
url: 'http://www.axandra.com'
|
1171
|
-
-
|
1172
|
-
user_agent: OpenWebSpider v0.1.4 (http://www.openwebspider.org/)
|
1173
|
-
bot:
|
1174
|
-
name: 'OpenWebSpider'
|
1175
|
-
category: 'Crawler'
|
1176
|
-
url: 'http://www.openwebspider.org'
|
1177
|
-
producer:
|
1178
|
-
name: 'OpenWebSpider Lab'
|
1179
|
-
url: 'http://lab.openwebspider.org'
|
1180
|
-
-
|
1181
|
-
user_agent: Mozilla/5.0 (compatible; PaperLiBot/2.1; http://support.paper.li/entries/20023257-what-is-paper-li)
|
1182
|
-
bot:
|
1183
|
-
name: 'PaperLiBot'
|
1184
|
-
category: 'Search bot'
|
1185
|
-
url: 'http://support.paper.li/entries/20023257-what-is-paper-li'
|
1186
|
-
producer:
|
1187
|
-
name: 'Smallrivers SA'
|
1188
|
-
url: 'http://www.paper.li'
|
1189
|
-
-
|
1190
|
-
user_agent: psbot/0.1 (+http://www.picsearch.com/bot.html)
|
1191
|
-
bot:
|
1192
|
-
name: 'Picsearch bot'
|
1193
|
-
category: 'Search bot'
|
1194
|
-
url: 'http://www.picsearch.com/bot.html'
|
1195
|
-
producer:
|
1196
|
-
name: 'Picsearch'
|
1197
|
-
url: 'http://www.picsearch.com'
|
1198
|
-
-
|
1199
|
-
user_agent: psbot-page (+http://www.picsearch.com/bot.html)
|
1200
|
-
bot:
|
1201
|
-
name: 'Picsearch bot'
|
1202
|
-
category: 'Search bot'
|
1203
|
-
url: 'http://www.picsearch.com/bot.html'
|
1204
|
-
producer:
|
1205
|
-
name: 'Picsearch'
|
1206
|
-
url: 'http://www.picsearch.com'
|
1207
|
-
-
|
1208
|
-
user_agent: Pingdom.com_bot_version_1.4_(http://www.pingdom.com/)
|
1209
|
-
bot:
|
1210
|
-
name: 'Pingdom Bot'
|
1211
|
-
category: 'Site Monitors'
|
1212
|
-
url: ''
|
1213
|
-
producer:
|
1214
|
-
name: 'Pingdom AB'
|
1215
|
-
url: 'https://www.pingdom.com'
|
1216
|
-
-
|
1217
|
-
user_agent: QuerySeekerSpider ( http://queryseeker.com/bot.html )
|
1218
|
-
bot:
|
1219
|
-
name: 'QuerySeekerSpider'
|
1220
|
-
category: 'Crawler'
|
1221
|
-
url: 'http://queryseeker.com/bot.html'
|
1222
|
-
producer:
|
1223
|
-
name: 'QueryEye Inc.'
|
1224
|
-
url: 'http://queryeye.com'
|
1225
|
-
-
|
1226
|
-
user_agent: Mozilla/5.0 (compatible; redditbot/1.0; +http://www.reddit.com/feedback)
|
1227
|
-
bot:
|
1228
|
-
name: 'Reddit Bot'
|
1229
|
-
category: 'Social Media Agent'
|
1230
|
-
url: 'http://www.reddit.com/feedback'
|
1231
|
-
producer:
|
1232
|
-
name: 'reddit inc.'
|
1233
|
-
url: 'http://www.reddit.com'
|
1234
|
-
-
|
1235
|
-
user_agent: Mozilla/5.0 (compatible; rogerBot/1.0; UrlCrawler; http://www.seomoz.org/dp/rogerbot)
|
1236
|
-
bot:
|
1237
|
-
name: 'Rogerbot'
|
1238
|
-
category: 'Crawler'
|
1239
|
-
url: 'http://moz.com/help/pro/what-is-rogerbot-'
|
1240
|
-
producer:
|
1241
|
-
name: 'SEOmoz, Inc.'
|
1242
|
-
url: 'http://moz.com/'
|
1243
|
-
-
|
1244
|
-
user_agent: rogerbot/1.0 (http://moz.com/help/pro/what-is-rogerbot-, rogerbot-crawler+shiny@moz.com)
|
1245
|
-
bot:
|
1246
|
-
name: 'Rogerbot'
|
1247
|
-
category: 'Crawler'
|
1248
|
-
url: 'http://moz.com/help/pro/what-is-rogerbot-'
|
1249
|
-
producer:
|
1250
|
-
name: 'SEOmoz, Inc.'
|
1251
|
-
url: 'http://moz.com/'
|
1252
|
-
-
|
1253
|
-
user_agent: rogerbot/1.0 (http://www.moz.com/dp/rogerbot, rogerbot-crawler@moz.com)
|
1254
|
-
bot:
|
1255
|
-
name: 'Rogerbot'
|
1256
|
-
category: 'Crawler'
|
1257
|
-
url: 'http://moz.com/help/pro/what-is-rogerbot-'
|
1258
|
-
producer:
|
1259
|
-
name: 'SEOmoz, Inc.'
|
1260
|
-
url: 'http://moz.com/'
|
1261
|
-
-
|
1262
|
-
user_agent: Screaming Frog SEO Spider/2.22
|
1263
|
-
bot:
|
1264
|
-
name: 'Screaming Frog SEO Spider'
|
1265
|
-
category: 'Crawler'
|
1266
|
-
url: 'http://www.screamingfrog.co.uk/seo-spider'
|
1267
|
-
producer:
|
1268
|
-
name: 'Screaming Frog Ltd'
|
1269
|
-
url: 'http://www.screamingfrog.co.uk'
|
1270
|
-
-
|
1271
|
-
user_agent: ScreenerBot Crawler Beta 2.0 (+http://www.ScreenerBot.com)
|
1272
|
-
bot:
|
1273
|
-
name: 'ScreenerBot'
|
1274
|
-
category: 'Crawler'
|
1275
|
-
url: 'http://www.screenerbot.com'
|
1276
|
-
producer:
|
1277
|
-
name: ''
|
1278
|
-
url: ''
|
1279
|
-
-
|
1280
|
-
user_agent: Mozilla/5.0 (compatible; SemrushBot/0.97; +http://www.semrush.com/bot.html)
|
1281
|
-
bot:
|
1282
|
-
name: 'Semrush Bot'
|
1283
|
-
category: 'Crawler'
|
1284
|
-
url: 'http://www.semrush.com/bot.html'
|
1285
|
-
producer:
|
1286
|
-
name: 'SEMrush'
|
1287
|
-
url: 'http://www.semrush.com'
|
1288
|
-
-
|
1289
|
-
user_agent: SensikaBot/x.33 (+http://sensika.com)
|
1290
|
-
bot:
|
1291
|
-
name: 'Sensika Bot'
|
1292
|
-
category: ''
|
1293
|
-
url: ''
|
1294
|
-
producer:
|
1295
|
-
name: 'Sensika'
|
1296
|
-
url: 'http://sensika.com'
|
1297
|
-
-
|
1298
|
-
user_agent: SEOENGWorldBot/1.0 (+http://www.seoengine.com/seoengbot.htm)
|
1299
|
-
bot:
|
1300
|
-
name: 'SEOENGBot'
|
1301
|
-
category: 'Crawler'
|
1302
|
-
url: 'http://www.seoengine.com/seoengbot.htm'
|
1303
|
-
producer:
|
1304
|
-
name: 'SEO Engine'
|
1305
|
-
url: 'http://www.seoengine.com'
|
1306
|
-
-
|
1307
|
-
user_agent: Mozilla/5.0 (compatible; SeznamBot/3.1-test1; +http://fulltext.sblog.cz/)
|
1308
|
-
bot:
|
1309
|
-
name: 'Seznam Bot'
|
1310
|
-
category: 'Search bot'
|
1311
|
-
url: 'http://www.mapy.cz/cz/seznambot.html'
|
1312
|
-
producer:
|
1313
|
-
name: 'Seznam.cz, a.s.'
|
1314
|
-
url: 'http://www.seznam.cz/'
|
1315
|
-
-
|
1316
|
-
user_agent: Mozilla/5.0 (compatible; SeznamBot/3.2-test1; +http://fulltext.sblog.cz/)
|
1317
|
-
bot:
|
1318
|
-
name: 'Seznam Bot'
|
1319
|
-
category: 'Search bot'
|
1320
|
-
url: 'http://www.mapy.cz/cz/seznambot.html'
|
1321
|
-
producer:
|
1322
|
-
name: 'Seznam.cz, a.s.'
|
1323
|
-
url: 'http://www.seznam.cz/'
|
1324
|
-
-
|
1325
|
-
user_agent: SeznamBot/3.0 (+http://fulltext.sblog.cz/)
|
1326
|
-
bot:
|
1327
|
-
name: 'Seznam Bot'
|
1328
|
-
category: 'Search bot'
|
1329
|
-
url: 'http://www.mapy.cz/cz/seznambot.html'
|
1330
|
-
producer:
|
1331
|
-
name: 'Seznam.cz, a.s.'
|
1332
|
-
url: 'http://www.seznam.cz/'
|
1333
|
-
-
|
1334
|
-
user_agent: Mozilla/5.0 (compatible; SeznamBot/3.2; +http://fulltext.sblog.cz/)
|
1335
|
-
bot:
|
1336
|
-
name: 'Seznam Bot'
|
1337
|
-
category: 'Search bot'
|
1338
|
-
url: 'http://www.mapy.cz/cz/seznambot.html'
|
1339
|
-
producer:
|
1340
|
-
name: 'Seznam.cz, a.s.'
|
1341
|
-
url: 'http://www.seznam.cz/'
|
1342
|
-
-
|
1343
|
-
user_agent: ShopWiki/1.0 ( +http://www.shopwiki.com/wiki/Help:Bot)
|
1344
|
-
bot:
|
1345
|
-
name: 'ShopWiki'
|
1346
|
-
category: 'Search tools'
|
1347
|
-
url: 'http://www.shopwiki.com/wiki/Help:Bot'
|
1348
|
-
producer:
|
1349
|
-
name: 'ShopWiki Corp.'
|
1350
|
-
url: 'http://www.shopwiki.com'
|
1351
|
-
-
|
1352
|
-
user_agent: SilverReader/1.0; http://silverreader.com
|
1353
|
-
bot:
|
1354
|
-
name: 'SilverReader'
|
1355
|
-
url: 'http://silverreader.com'
|
1356
|
-
category: 'Feed Fetcher'
|
1357
|
-
producer:
|
1358
|
-
name: ''
|
1359
|
-
url: ''
|
1360
|
-
-
|
1361
|
-
user_agent: SimplePie/1.3.1 (Feed Parser; http://simplepie.org; Allow like Gecko) Build/20121030175911
|
1362
|
-
bot:
|
1363
|
-
name: 'SimplePie'
|
1364
|
-
url: 'http://www.simplepie.org'
|
1365
|
-
category: 'Feed Parser'
|
1366
|
-
producer:
|
1367
|
-
name: ''
|
1368
|
-
url: ''
|
1369
|
-
-
|
1370
|
-
user_agent: freshrss/0.8-dev (Linux; http://freshrss.org) SimplePie/1.4-dev-FreshRSS
|
1371
|
-
bot:
|
1372
|
-
name: 'SimplePie'
|
1373
|
-
url: 'http://www.simplepie.org'
|
1374
|
-
category: 'Feed Parser'
|
1375
|
-
producer:
|
1376
|
-
name: ''
|
1377
|
-
url: ''
|
1378
|
-
-
|
1379
|
-
user_agent: SimplePie/1.2.1-dev (Feed Parser; http://simplepie.org; Allow like Gecko) Build/20130514092120
|
1380
|
-
bot:
|
1381
|
-
name: 'SimplePie'
|
1382
|
-
url: 'http://www.simplepie.org'
|
1383
|
-
category: 'Feed Parser'
|
1384
|
-
producer:
|
1385
|
-
name: ''
|
1386
|
-
url: ''
|
1387
|
-
-
|
1388
|
-
user_agent: Mozilla/5.0 (compatible; SISTRIX Crawler; http://crawler.sistrix.net/)
|
1389
|
-
bot:
|
1390
|
-
name: 'SISTRIX Crawler'
|
1391
|
-
category: 'Crawler'
|
1392
|
-
url: 'http://crawler.sistrix.net'
|
1393
|
-
producer:
|
1394
|
-
name: 'SISTRIX GmbH'
|
1395
|
-
url: 'http://www.sistrix.de'
|
1396
|
-
-
|
1397
|
-
user_agent: Sogou web spider/4.0(+http://www.sogou.com/docs/help/webmasters.htm#07)
|
1398
|
-
bot:
|
1399
|
-
name: 'Sogou Spider'
|
1400
|
-
category: 'Search bot'
|
1401
|
-
url: 'http://www.sogou.com/docs/help/webmasters.htm'
|
1402
|
-
producer:
|
1403
|
-
name: 'Sohu, Inc.'
|
1404
|
-
url: 'http://www.sogou.com'
|
1405
|
-
-
|
1406
|
-
user_agent: Sogou inst spider/4.0(+http://www.sogou.com/docs/help/webmasters.htm#07)
|
1407
|
-
bot:
|
1408
|
-
name: 'Sogou Spider'
|
1409
|
-
category: 'Search bot'
|
1410
|
-
url: 'http://www.sogou.com/docs/help/webmasters.htm'
|
1411
|
-
producer:
|
1412
|
-
name: 'Sohu, Inc.'
|
1413
|
-
url: 'http://www.sogou.com'
|
1414
|
-
-
|
1415
|
-
user_agent: Sogou Pic Spider/3.0(+http://www.sogou.com/docs/help/webmasters.htm#07)
|
1416
|
-
bot:
|
1417
|
-
name: 'Sogou Spider'
|
1418
|
-
category: 'Search bot'
|
1419
|
-
url: 'http://www.sogou.com/docs/help/webmasters.htm'
|
1420
|
-
producer:
|
1421
|
-
name: 'Sohu, Inc.'
|
1422
|
-
url: 'http://www.sogou.com'
|
1423
|
-
-
|
1424
|
-
user_agent: New-Sogou-Spider/1.0 (compatible; MSIE 5.5; Windows 98)
|
1425
|
-
bot:
|
1426
|
-
name: 'Sogou Spider'
|
1427
|
-
category: 'Search bot'
|
1428
|
-
url: 'http://www.sogou.com/docs/help/webmasters.htm'
|
1429
|
-
producer:
|
1430
|
-
name: 'Sohu, Inc.'
|
1431
|
-
url: 'http://www.sogou.com'
|
1432
|
-
-
|
1433
|
-
user_agent: Sosospider+(+http://help.soso.com/webspider.htm)
|
1434
|
-
bot:
|
1435
|
-
name: 'Soso Spider'
|
1436
|
-
category: 'Search bot'
|
1437
|
-
url: 'http://help.soso.com/webspider.htm'
|
1438
|
-
producer:
|
1439
|
-
name: 'Tencent Holdings'
|
1440
|
-
url: 'http://www.soso.com'
|
1441
|
-
-
|
1442
|
-
user_agent: 'Superfeedr bot/2.0 http://superfeedr.com - Make your feeds realtime: get in touch!'
|
1443
|
-
bot:
|
1444
|
-
name: 'Superfeedr Bot'
|
1445
|
-
category: 'Feed Fetcher'
|
1446
|
-
url: ''
|
1447
|
-
producer:
|
1448
|
-
name: 'Superfeedr'
|
1449
|
-
url: 'https://superfeedr.com/'
|
1450
|
-
-
|
1451
|
-
user_agent: Mozilla/5.0 (X11; U; Linux x86_64; en-US; rv:1.9.0.19; aggregator:Spinn3r (Spinn3r 3.1); http://spinn3r.com/robot) Gecko/2010040121 Firefox/3.0.19
|
1452
|
-
bot:
|
1453
|
-
name: 'Spinn3r'
|
1454
|
-
category: 'Crawler'
|
1455
|
-
url: 'http://spinn3r.com/robot'
|
1456
|
-
producer:
|
1457
|
-
name: 'Tailrank Inc'
|
1458
|
-
url: 'http://spinn3r.com'
|
1459
|
-
-
|
1460
|
-
user_agent: Mozilla/5.0 (compatible; SputnikBot/2.2)
|
1461
|
-
bot:
|
1462
|
-
name: 'Sputnik Bot'
|
1463
|
-
category: ''
|
1464
|
-
url: ''
|
1465
|
-
producer:
|
1466
|
-
name: ''
|
1467
|
-
url: ''
|
1468
|
-
-
|
1469
|
-
user_agent: Mozilla/5.0 (compatible; SputnikImageBot/2.2)
|
1470
|
-
bot:
|
1471
|
-
name: 'Sputnik Bot'
|
1472
|
-
category: ''
|
1473
|
-
url: ''
|
1474
|
-
producer:
|
1475
|
-
name: ''
|
1476
|
-
url: ''
|
1477
|
-
-
|
1478
|
-
user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1; en; rv:1.9.0.13) Gecko/2009073022 Firefox/3.5.2 (.NET CLR 3.5.30729) SurveyBot/2.3 (DomainTools)
|
1479
|
-
bot:
|
1480
|
-
name: 'Survey Bot'
|
1481
|
-
category: 'Search bot'
|
1482
|
-
url: 'http://www.domaintools.com/webmasters/surveybot.php'
|
1483
|
-
producer:
|
1484
|
-
name: 'Domain Tools'
|
1485
|
-
url: 'http://www.domaintools.com'
|
1486
|
-
-
|
1487
|
-
user_agent: TinEye-bot/0.02 (see http://www.tineye.com/crawler.html)
|
1488
|
-
bot:
|
1489
|
-
name: 'TinEye Crawler'
|
1490
|
-
category: 'Search bot'
|
1491
|
-
url: 'http://www.tineye.com/crawler.html'
|
1492
|
-
producer:
|
1493
|
-
name: 'Idée Inc.'
|
1494
|
-
url: 'http://ideeinc.com'
|
1495
|
-
-
|
1496
|
-
user_agent: 'Tiny Tiny RSS/1.10 (http://tt-rss.org/)'
|
1497
|
-
bot:
|
1498
|
-
name: 'Tiny Tiny RSS'
|
1499
|
-
url: 'http://tt-rss.org'
|
1500
|
-
category: 'Feed Fetcher'
|
1501
|
-
producer:
|
1502
|
-
name: ''
|
1503
|
-
url: ''
|
1504
|
-
-
|
1505
|
-
user_agent: 'Tiny Tiny RSS/1.11.4c63934 (http://tt-rss.org/)'
|
1506
|
-
bot:
|
1507
|
-
name: 'Tiny Tiny RSS'
|
1508
|
-
url: 'http://tt-rss.org'
|
1509
|
-
category: 'Feed Fetcher'
|
1510
|
-
producer:
|
1511
|
-
name: ''
|
1512
|
-
url: ''
|
1513
|
-
-
|
1514
|
-
user_agent: TurnitinBot/3.0 (http://www.turnitin.com/robot/crawlerinfo.html)
|
1515
|
-
bot:
|
1516
|
-
name: 'TurnitinBot'
|
1517
|
-
category: 'Crawler'
|
1518
|
-
url: 'http://www.turnitin.com/robot/crawlerinfo.html'
|
1519
|
-
producer:
|
1520
|
-
name: 'iParadigms, LLC.'
|
1521
|
-
url: 'http://www.turnitin.com'
|
1522
|
-
-
|
1523
|
-
user_agent: TweetedTimes Bot/1.0 (Mozilla/5.0 Compatible, +http://tweetedtimes.com)
|
1524
|
-
bot:
|
1525
|
-
name: 'TweetedTimes Bot'
|
1526
|
-
category: 'Crawler'
|
1527
|
-
url: 'http://tweetedtimes.com'
|
1528
|
-
producer:
|
1529
|
-
name: 'TweetedTimes'
|
1530
|
-
url: 'http://tweetedtimes.com/'
|
1531
|
-
-
|
1532
|
-
user_agent: Mozilla/5.0 (compatible; TweetedTimes Bot/1.0; +http://tweetedtimes.com)
|
1533
|
-
bot:
|
1534
|
-
name: 'TweetedTimes Bot'
|
1535
|
-
category: 'Crawler'
|
1536
|
-
url: 'http://tweetedtimes.com'
|
1537
|
-
producer:
|
1538
|
-
name: 'TweetedTimes'
|
1539
|
-
url: 'http://tweetedtimes.com/'
|
1540
|
-
-
|
1541
|
-
user_agent: Mozilla/5.0 (compatible; TweetmemeBot/3.0; +http://tweetmeme.com/)
|
1542
|
-
bot:
|
1543
|
-
name: 'Tweetmeme Bot'
|
1544
|
-
category: 'Crawler'
|
1545
|
-
url: 'http://tweetmeme.com/'
|
1546
|
-
producer:
|
1547
|
-
name: 'Mediasift'
|
1548
|
-
url: ''
|
1549
|
-
-
|
1550
|
-
user_agent: Twitterbot/1.0
|
1551
|
-
bot:
|
1552
|
-
name: 'Twitterbot'
|
1553
|
-
category: 'Social Media Agent'
|
1554
|
-
url: 'https://dev.twitter.com/docs/cards/getting-started'
|
1555
|
-
producer:
|
1556
|
-
name: 'Twitter'
|
1557
|
-
url: 'http://www.twitter.com'
|
1558
|
-
-
|
1559
|
-
user_agent: Mozilla/5.0+(compatible; UptimeRobot/2.0; http://www.uptimerobot.com/)
|
1560
|
-
bot:
|
1561
|
-
name: 'Uptime Robot'
|
1562
|
-
category: 'Site Monitor'
|
1563
|
-
url: ''
|
1564
|
-
producer:
|
1565
|
-
name: 'Uptime Robot'
|
1566
|
-
url: 'http://uptimerobot.com'
|
1567
|
-
-
|
1568
|
-
user_agent: Mozilla/5.0 (compatible; URLAppendBot/1.0; +http://www.profound.net/urlappendbot.html)
|
1569
|
-
bot:
|
1570
|
-
name: 'URLAppendBot'
|
1571
|
-
category: 'Crawler'
|
1572
|
-
url: 'http://www.profound.net/urlappendbot.html'
|
1573
|
-
producer:
|
1574
|
-
name: 'Profound Networks'
|
1575
|
-
url: 'http://www.profound.net'
|
1576
|
-
-
|
1577
|
-
user_agent: Mozilla/5.0 (compatible; VSMCrawler; http://www.visualsitemapper.com/crawler/)
|
1578
|
-
bot:
|
1579
|
-
name: 'Visual Site Mapper Crawler'
|
1580
|
-
category: 'Crawler'
|
1581
|
-
url: 'http://www.visualsitemapper.com/crawler'
|
1582
|
-
producer:
|
1583
|
-
name: 'Alentum Software Ltd.'
|
1584
|
-
url: 'http://www.alentum.com'
|
1585
|
-
-
|
1586
|
-
user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1;fr;rv:1.8.1) VoilaBotCollector BETA 0.1 (http://www.voila.com/)
|
1587
|
-
bot:
|
1588
|
-
name: 'Voila Bot'
|
1589
|
-
category: 'Search bot'
|
1590
|
-
url: 'http://www.voila.fr'
|
1591
|
-
producer:
|
1592
|
-
name: ''
|
1593
|
-
url: ''
|
1594
|
-
-
|
1595
|
-
user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1; fr; rv:1.8.1) VoilaBot BETA 1.2 (support.voilabot@orange-ftgroup.com)
|
1596
|
-
bot:
|
1597
|
-
name: 'Voila Bot'
|
1598
|
-
category: 'Search bot'
|
1599
|
-
url: 'http://www.voila.fr'
|
1600
|
-
producer:
|
1601
|
-
name: ''
|
1602
|
-
url: ''
|
1603
|
-
-
|
1604
|
-
user_agent: Jigsaw/2.3.0 W3C_CSS_Validator_JFouffa/2.0 (See <http://validator.w3.org/services>)
|
1605
|
-
bot:
|
1606
|
-
name: 'W3C CSS Validator'
|
1607
|
-
category: 'Validator'
|
1608
|
-
url: 'http://jigsaw.w3.org/css-validator'
|
1609
|
-
producer:
|
1610
|
-
name: 'W3C'
|
1611
|
-
url: 'http://www.w3.org'
|
1612
|
-
-
|
1613
|
-
user_agent: W3C_I18n-Checker/1.0 (http://validator.w3.org/services)
|
1614
|
-
bot:
|
1615
|
-
name: 'W3C I18N Checker'
|
1616
|
-
category: 'Validator'
|
1617
|
-
url: 'http://validator.w3.org/i18n-checker'
|
1618
|
-
producer:
|
1619
|
-
name: 'W3C'
|
1620
|
-
url: 'http://www.w3.org'
|
1621
|
-
-
|
1622
|
-
user_agent: W3C-checklink/4.0 [4.4] libwww-perl/5.803
|
1623
|
-
bot:
|
1624
|
-
name: 'W3C Link Checker'
|
1625
|
-
category: 'Validator'
|
1626
|
-
url: 'http://validator.w3.org/checklink'
|
1627
|
-
producer:
|
1628
|
-
name: 'W3C'
|
1629
|
-
url: 'http://www.w3.org'
|
1630
|
-
-
|
1631
|
-
user_agent: W3C-checklink/4.81 libwww-perl/5.836
|
1632
|
-
bot:
|
1633
|
-
name: 'W3C Link Checker'
|
1634
|
-
category: 'Validator'
|
1635
|
-
url: 'http://validator.w3.org/checklink'
|
1636
|
-
producer:
|
1637
|
-
name: 'W3C'
|
1638
|
-
url: 'http://www.w3.org'
|
1639
|
-
-
|
1640
|
-
user_agent: W3C_Validator/1.3 http://validator.w3.org/services
|
1641
|
-
bot:
|
1642
|
-
name: 'W3C Markup Validation Service'
|
1643
|
-
category: 'Validator'
|
1644
|
-
url: 'http://validator.w3.org/services'
|
1645
|
-
producer:
|
1646
|
-
name: 'W3C'
|
1647
|
-
url: 'http://www.w3.org'
|
1648
|
-
-
|
1649
|
-
user_agent: W3C_Validator/1.767
|
1650
|
-
bot:
|
1651
|
-
name: 'W3C Markup Validation Service'
|
1652
|
-
category: 'Validator'
|
1653
|
-
url: 'http://validator.w3.org/services'
|
1654
|
-
producer:
|
1655
|
-
name: 'W3C'
|
1656
|
-
url: 'http://www.w3.org'
|
1657
|
-
-
|
1658
|
-
user_agent: W3C-mobileOK/DDC-1.0 (see http://www.w3.org/2006/07/mobileok-ddc)
|
1659
|
-
bot:
|
1660
|
-
name: 'W3C MobileOK Checker'
|
1661
|
-
category: 'Validator'
|
1662
|
-
url: 'http://validator.w3.org/mobile'
|
1663
|
-
producer:
|
1664
|
-
name: 'W3C'
|
1665
|
-
url: 'http://www.w3.org'
|
1666
|
-
-
|
1667
|
-
user_agent: W3C_Unicorn/1.0 (http://validator.w3.org/services)
|
1668
|
-
bot:
|
1669
|
-
name: 'W3C Unified Validator'
|
1670
|
-
category: 'Validator'
|
1671
|
-
url: 'http://validator.w3.org/unicorn'
|
1672
|
-
producer:
|
1673
|
-
name: 'W3C'
|
1674
|
-
url: 'http://www.w3.org'
|
1675
|
-
-
|
1676
|
-
user_agent: WebbCrawler 1.0 ( http://badcheese.com/crawler.html )
|
1677
|
-
bot:
|
1678
|
-
name: 'WebbCrawler'
|
1679
|
-
category: 'Crawler'
|
1680
|
-
url: 'http://badcheese.com/crawler.html'
|
1681
|
-
producer:
|
1682
|
-
name: 'Steve Webb'
|
1683
|
-
url: 'http://badcheese.com'
|
1684
|
-
-
|
1685
|
-
user_agent: WeSEE:Search/0.1 (Alpha, http://www.wesee.com/en/support/bot/)
|
1686
|
-
bot:
|
1687
|
-
name: 'WeSEE:Search'
|
1688
|
-
category: 'Search bot'
|
1689
|
-
url: 'http://www.wesee.com/bot'
|
1690
|
-
producer:
|
1691
|
-
name: 'WeSEE Ltd'
|
1692
|
-
url: 'http://www.wesee.com'
|
1693
|
-
-
|
1694
|
-
user_agent: Wotbox/2.01 (+http://www.wotbox.com/bot/)
|
1695
|
-
bot:
|
1696
|
-
name: 'Wotbox'
|
1697
|
-
category: 'Search bot'
|
1698
|
-
url: 'http://www.wotbox.com/bot/'
|
1699
|
-
producer:
|
1700
|
-
name: 'Wotbox'
|
1701
|
-
url: 'http://www.wotbox.com'
|
1702
|
-
-
|
1703
|
-
user_agent: yacybot (freeworld/global; x86 Windows XP 5.1; java 1.7.0_21; GMT+04:00/ru) http://yacy.net/bot.html
|
1704
|
-
bot:
|
1705
|
-
name: 'YaCy'
|
1706
|
-
category: 'Search bot'
|
1707
|
-
url: 'http://yacy.net/bot.html'
|
1708
|
-
producer:
|
1709
|
-
name: 'YaCy'
|
1710
|
-
url: 'http://yacy.net'
|
1711
|
-
-
|
1712
|
-
user_agent: yacybot (freeworld/global; amd64 Linux 3.2.0-4-amd64; java 1.7.0_25; Europe/en) http://yacy.net/bot.html
|
1713
|
-
bot:
|
1714
|
-
name: 'YaCy'
|
1715
|
-
category: 'Search bot'
|
1716
|
-
url: 'http://yacy.net/bot.html'
|
1717
|
-
producer:
|
1718
|
-
name: 'YaCy'
|
1719
|
-
url: 'http://yacy.net'
|
1720
|
-
-
|
1721
|
-
user_agent: Mozilla/5.0 (compatible; Yahoo! Slurp/3.0; http://help.yahoo.com/help/us/ysearch/slurp) NOT Firefox/3.5
|
1722
|
-
bot:
|
1723
|
-
name: 'Yahoo! Slurp'
|
1724
|
-
category: 'Search bot'
|
1725
|
-
url: 'http://help.yahoo.com/ysearch/slurp'
|
1726
|
-
producer:
|
1727
|
-
name: 'Yahoo! Inc.'
|
1728
|
-
url: 'http://www.yahoo.com'
|
1729
|
-
-
|
1730
|
-
user_agent: Mozilla/5.0 (compatible; Yahoo! Slurp; http://help.yahoo.com/help/us/ysearch/slurp)
|
1731
|
-
bot:
|
1732
|
-
name: 'Yahoo! Slurp'
|
1733
|
-
category: 'Search bot'
|
1734
|
-
url: 'http://help.yahoo.com/ysearch/slurp'
|
1735
|
-
producer:
|
1736
|
-
name: 'Yahoo! Inc.'
|
1737
|
-
url: 'http://www.yahoo.com'
|
1738
|
-
-
|
1739
|
-
user_agent: Mozilla/5.0 (compatible; YandexImages/3.0; +http://yandex.com/bots)
|
1740
|
-
bot:
|
1741
|
-
name: 'Yandex Bot'
|
1742
|
-
category: 'Search bot'
|
1743
|
-
url: 'http://www.yandex.com/bots'
|
1744
|
-
producer:
|
1745
|
-
name: 'Yandex LLC'
|
1746
|
-
url: 'http://company.yandex.com'
|
1747
|
-
-
|
1748
|
-
user_agent: Mozilla/5.0 (compatible; YandexAntivirus/2.0; +http://yandex.com/bots)
|
1749
|
-
bot:
|
1750
|
-
name: 'Yandex Bot'
|
1751
|
-
category: 'Search bot'
|
1752
|
-
url: 'http://www.yandex.com/bots'
|
1753
|
-
producer:
|
1754
|
-
name: 'Yandex LLC'
|
1755
|
-
url: 'http://company.yandex.com'
|
1756
|
-
-
|
1757
|
-
user_agent: Mozilla/5.0 (compatible; YandexDirect/3.0; +http://yandex.com/bots)
|
1758
|
-
bot:
|
1759
|
-
name: 'Yandex Bot'
|
1760
|
-
category: 'Search bot'
|
1761
|
-
url: 'http://www.yandex.com/bots'
|
1762
|
-
producer:
|
1763
|
-
name: 'Yandex LLC'
|
1764
|
-
url: 'http://company.yandex.com'
|
1765
|
-
-
|
1766
|
-
user_agent: Mozilla/5.0 (compatible; YandexBot/3.0; +http://yandex.com/bots)
|
1767
|
-
bot:
|
1768
|
-
name: 'Yandex Bot'
|
1769
|
-
category: 'Search bot'
|
1770
|
-
url: 'http://www.yandex.com/bots'
|
1771
|
-
producer:
|
1772
|
-
name: 'Yandex LLC'
|
1773
|
-
url: 'http://company.yandex.com'
|
1774
|
-
-
|
1775
|
-
user_agent: Mozilla/5.0 (compatible; YandexBlogs/0.99; robot; B; +http://yandex.com/bots)
|
1776
|
-
bot:
|
1777
|
-
name: 'Yandex Bot'
|
1778
|
-
category: 'Search bot'
|
1779
|
-
url: 'http://www.yandex.com/bots'
|
1780
|
-
producer:
|
1781
|
-
name: 'Yandex LLC'
|
1782
|
-
url: 'http://company.yandex.com'
|
1783
|
-
-
|
1784
|
-
user_agent: Mozilla/5.0 (compatible; YandexMetrika/2.0; +http://yandex.com/bots)
|
1785
|
-
bot:
|
1786
|
-
name: 'Yandex Bot'
|
1787
|
-
category: 'Search bot'
|
1788
|
-
url: 'http://www.yandex.com/bots'
|
1789
|
-
producer:
|
1790
|
-
name: 'Yandex LLC'
|
1791
|
-
url: 'http://company.yandex.com'
|
1792
|
-
-
|
1793
|
-
user_agent: Mozilla/5.0 (compatible; YandexImageResizer/2.0; +http://yandex.com/bots)
|
1794
|
-
bot:
|
1795
|
-
name: 'Yandex Bot'
|
1796
|
-
category: 'Search bot'
|
1797
|
-
url: 'http://www.yandex.com/bots'
|
1798
|
-
producer:
|
1799
|
-
name: 'Yandex LLC'
|
1800
|
-
url: 'http://company.yandex.com'
|
1801
|
-
-
|
1802
|
-
user_agent: Mozilla/5.0 (compatible; YandexAntivirus/2.0; +http://yandex.com/bots)
|
1803
|
-
bot:
|
1804
|
-
name: 'Yandex Bot'
|
1805
|
-
category: 'Search bot'
|
1806
|
-
url: 'http://www.yandex.com/bots'
|
1807
|
-
producer:
|
1808
|
-
name: 'Yandex LLC'
|
1809
|
-
url: 'http://company.yandex.com'
|
1810
|
-
-
|
1811
|
-
user_agent: Mozilla/5.0 (compatible; YandexBlogs/0.99; robot; B; +http://yandex.com/bots)
|
1812
|
-
bot:
|
1813
|
-
name: 'Yandex Bot'
|
1814
|
-
category: 'Search bot'
|
1815
|
-
url: 'http://www.yandex.com/bots'
|
1816
|
-
producer:
|
1817
|
-
name: 'Yandex LLC'
|
1818
|
-
url: 'http://company.yandex.com'
|
1819
|
-
-
|
1820
|
-
user_agent: Mozilla/5.0 (compatible; YandexFavicons/1.0; +http://yandex.com/bots)
|
1821
|
-
bot:
|
1822
|
-
name: 'Yandex Bot'
|
1823
|
-
category: 'Search bot'
|
1824
|
-
url: 'http://www.yandex.com/bots'
|
1825
|
-
producer:
|
1826
|
-
name: 'Yandex LLC'
|
1827
|
-
url: 'http://company.yandex.com'
|
1828
|
-
-
|
1829
|
-
user_agent: Mozilla/5.0 (compatible; YandexNewslinks; +http://yandex.com/bots)
|
1830
|
-
bot:
|
1831
|
-
name: 'Yandex Bot'
|
1832
|
-
category: 'Search bot'
|
1833
|
-
url: 'http://www.yandex.com/bots'
|
1834
|
-
producer:
|
1835
|
-
name: 'Yandex LLC'
|
1836
|
-
url: 'http://company.yandex.com'
|
1837
|
-
-
|
1838
|
-
user_agent: Mozilla/5.0 (compatible; YandexNews/3.0; +http://yandex.com/bots)
|
1839
|
-
bot:
|
1840
|
-
name: 'Yandex Bot'
|
1841
|
-
category: 'Search bot'
|
1842
|
-
url: 'http://www.yandex.com/bots'
|
1843
|
-
producer:
|
1844
|
-
name: 'Yandex LLC'
|
1845
|
-
url: 'http://company.yandex.com'
|
1846
|
-
-
|
1847
|
-
user_agent: Mozilla/5.0 (compatible; Linux i686; Yandex.Gazeta Bot/1.0; +http://gazeta.yandex.ru)
|
1848
|
-
bot:
|
1849
|
-
name: 'Yandex Bot'
|
1850
|
-
category: 'Search bot'
|
1851
|
-
url: 'http://www.yandex.com/bots'
|
1852
|
-
producer:
|
1853
|
-
name: 'Yandex LLC'
|
1854
|
-
url: 'http://company.yandex.com'
|
1855
|
-
-
|
1856
|
-
user_agent: Yeti/1.1 (Naver Corp.; http://help.naver.com/robots/)
|
1857
|
-
bot:
|
1858
|
-
name: 'Yeti/Naverbot'
|
1859
|
-
category: 'Search bot'
|
1860
|
-
url: 'http://help.naver.com/robots/'
|
1861
|
-
producer:
|
1862
|
-
name: 'Naver'
|
1863
|
-
url: 'http://www.naver.com'
|
1864
|
-
-
|
1865
|
-
user_agent: Mozilla/5.0 (compatible; YoudaoBot/1.0; http://www.youdao.com/help/webmaster/spider/; )
|
1866
|
-
bot:
|
1867
|
-
name: 'Youdao Bot'
|
1868
|
-
category: 'Search bot'
|
1869
|
-
url: 'http://www.youdao.com/help/webmaster/spider'
|
1870
|
-
producer:
|
1871
|
-
name: 'NetEase, Inc.'
|
1872
|
-
url: 'http://corp.163.com'
|
1873
|
-
-
|
1874
|
-
user_agent: Mozilla/5.0 (compatible; YRSpider; +http://www.yunyun.com/SiteInfo.php?r=about)
|
1875
|
-
bot:
|
1876
|
-
name: 'Yunyun Bot'
|
1877
|
-
category: 'Search bot'
|
1878
|
-
url: 'http://www.yunyun.com/SiteInfo.php?r=about'
|
1879
|
-
producer:
|
1880
|
-
name: 'YunYun'
|
1881
|
-
url: 'http://www.yunyun.com'
|
1882
|
-
-
|
1883
|
-
user_agent: Mozilla/5.0 (compatible; YRSpider; +http://www.yunrang.com/yrspider.html)
|
1884
|
-
bot:
|
1885
|
-
name: 'Yunyun Bot'
|
1886
|
-
category: 'Search bot'
|
1887
|
-
url: 'http://www.yunyun.com/SiteInfo.php?r=about'
|
1888
|
-
producer:
|
1889
|
-
name: 'YunYun'
|
1890
|
-
url: 'http://www.yunyun.com'
|
1891
|
-
-
|
1892
|
-
user_agent: Mozilla/5.0 (compatible; YYSpider; +http://www.yunyun.com/spider.html)
|
1893
|
-
bot:
|
1894
|
-
name: 'Yunyun Bot'
|
1895
|
-
category: 'Search bot'
|
1896
|
-
url: 'http://www.yunyun.com/SiteInfo.php?r=about'
|
1897
|
-
producer:
|
1898
|
-
name: 'YunYun'
|
1899
|
-
url: 'http://www.yunyun.com'
|
1900
|
-
-
|
1901
|
-
user_agent: Zookabot/2.5;++http://zookabot.com
|
1902
|
-
bot:
|
1903
|
-
name: 'Zookabot'
|
1904
|
-
category: 'Crawler'
|
1905
|
-
url: 'http://zookabot.com'
|
1906
|
-
producer:
|
1907
|
-
name: 'Hwacha ApS'
|
1908
|
-
url: 'http://hwacha.dk'
|
1909
|
-
-
|
1910
|
-
user_agent: Mozilla/5.0 (compatible; ZumBot/1.0; http://help.zum.com/inquiry)
|
1911
|
-
bot:
|
1912
|
-
name: 'ZumBot'
|
1913
|
-
category: 'Search bot'
|
1914
|
-
url: 'http://help.zum.com/inquiry'
|
1915
|
-
producer:
|
1916
|
-
name: 'ZUM internet'
|
1917
|
-
url: 'http://www.zuminternet.com/'
|
1918
|
-
-
|
1919
|
-
user_agent: ZumBot/1.0 (ZUM Search; http://help.zum.com/inquiry)
|
1920
|
-
bot:
|
1921
|
-
name: 'ZumBot'
|
1922
|
-
category: 'Search bot'
|
1923
|
-
url: 'http://help.zum.com/inquiry'
|
1924
|
-
producer:
|
1925
|
-
name: 'ZUM internet'
|
1926
|
-
url: 'http://www.zuminternet.com/'
|
1927
|
-
-
|
1928
|
-
user_agent: Your Nutch Spider/Nutch-2.2.1
|
1929
|
-
bot:
|
1930
|
-
name: 'Nutch-based Bot'
|
1931
|
-
category: 'crawler'
|
1932
|
-
url: 'https://nutch.apache.org'
|
1933
|
-
producer:
|
1934
|
-
name: 'The Apache Software Foundation'
|
1935
|
-
url: 'http://www.apache.org/foundation/'
|
1936
|
-
-
|
1937
|
-
user_agent: Nutch12/Nutch-1.2
|
1938
|
-
bot:
|
1939
|
-
name: 'Nutch-based Bot'
|
1940
|
-
category: 'crawler'
|
1941
|
-
url: 'https://nutch.apache.org'
|
1942
|
-
producer:
|
1943
|
-
name: 'The Apache Software Foundation'
|
1944
|
-
url: 'http://www.apache.org/foundation/'
|
1945
|
-
-
|
1946
|
-
user_agent: spider/Nutch-1.5.1 (spider; http://www.xxx.com)
|
1947
|
-
bot:
|
1948
|
-
name: 'Nutch-based Bot'
|
1949
|
-
category: 'crawler'
|
1950
|
-
url: 'https://nutch.apache.org'
|
1951
|
-
producer:
|
1952
|
-
name: 'The Apache Software Foundation'
|
1953
|
-
url: 'http://www.apache.org/foundation/'
|
1954
|
-
-
|
1955
|
-
user_agent: MySpider/Nutch-2.2
|
1956
|
-
bot:
|
1957
|
-
name: 'Nutch-based Bot'
|
1958
|
-
category: 'crawler'
|
1959
|
-
url: 'https://nutch.apache.org'
|
1960
|
-
producer:
|
1961
|
-
name: 'The Apache Software Foundation'
|
1962
|
-
url: 'http://www.apache.org/foundation/'
|
1963
|
-
-
|
1964
|
-
user_agent: My Nutch Spider/Nutch-1.6
|
1965
|
-
bot:
|
1966
|
-
name: 'Nutch-based Bot'
|
1967
|
-
category: 'crawler'
|
1968
|
-
url: 'https://nutch.apache.org'
|
1969
|
-
producer:
|
1970
|
-
name: 'The Apache Software Foundation'
|
1971
|
-
url: 'http://www.apache.org/foundation/'
|
1972
|
-
-
|
1973
|
-
user_agent: NutchSpider/Nutch-1.4
|
1974
|
-
bot:
|
1975
|
-
name: 'Nutch-based Bot'
|
1976
|
-
category: 'crawler'
|
1977
|
-
url: 'https://nutch.apache.org'
|
1978
|
-
producer:
|
1979
|
-
name: 'The Apache Software Foundation'
|
1980
|
-
url: 'http://www.apache.org/foundation/'
|
1981
|
-
-
|
1982
|
-
user_agent: testnutch/Nutch-1.8
|
1983
|
-
bot:
|
1984
|
-
name: 'Nutch-based Bot'
|
1985
|
-
category: 'crawler'
|
1986
|
-
url: 'https://nutch.apache.org'
|
1987
|
-
producer:
|
1988
|
-
name: 'The Apache Software Foundation'
|
1989
|
-
url: 'http://www.apache.org/foundation/'
|
1990
|
-
-
|
1991
|
-
user_agent: Spider/Nutch-2.3-SNAPSHOT (Webcrawler)
|
1992
|
-
bot:
|
1993
|
-
name: 'Nutch-based Bot'
|
1994
|
-
category: 'crawler'
|
1995
|
-
url: 'https://nutch.apache.org'
|
1996
|
-
producer:
|
1997
|
-
name: 'The Apache Software Foundation'
|
1998
|
-
url: 'http://www.apache.org/foundation/'
|
1999
|
-
-
|
2000
|
-
user_agent: your sipder name/Nutch-1.7
|
2001
|
-
bot:
|
2002
|
-
name: 'Nutch-based Bot'
|
2003
|
-
category: 'crawler'
|
2004
|
-
url: 'https://nutch.apache.org'
|
2005
|
-
producer:
|
2006
|
-
name: 'The Apache Software Foundation'
|
2007
|
-
url: 'http://www.apache.org/foundation/'
|
2008
|
-
-
|
2009
|
-
user_agent: 5acd734a-1ed3-4a17-ad9d-0b09ae7bc2d2/Nutch-1.7
|
2010
|
-
bot:
|
2011
|
-
name: 'Nutch-based Bot'
|
2012
|
-
category: 'crawler'
|
2013
|
-
url: 'https://nutch.apache.org'
|
2014
|
-
producer:
|
2015
|
-
name: 'The Apache Software Foundation'
|
2016
|
-
url: 'http://www.apache.org/foundation/'
|
2017
|
-
-
|
2018
|
-
user_agent: Mozilla/5.0 (compatible; summers;)/Nutch-1.7
|
2019
|
-
bot:
|
2020
|
-
name: 'Nutch-based Bot'
|
2021
|
-
category: 'crawler'
|
2022
|
-
url: 'https://nutch.apache.org'
|
2023
|
-
producer:
|
2024
|
-
name: 'The Apache Software Foundation'
|
2025
|
-
url: 'http://www.apache.org/foundation/'
|
2026
|
-
-
|
2027
|
-
user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1; zh-CN; rv:1.9.2.8) Firefox/3.6.8/Nutch-1.7
|
2028
|
-
bot:
|
2029
|
-
name: 'Nutch-based Bot'
|
2030
|
-
category: 'crawler'
|
2031
|
-
url: 'https://nutch.apache.org'
|
2032
|
-
producer:
|
2033
|
-
name: 'The Apache Software Foundation'
|
2034
|
-
url: 'http://www.apache.org/foundation/'
|
2035
|
-
-
|
2036
|
-
user_agent: CB/Nutch-1.7
|
2037
|
-
bot:
|
2038
|
-
name: 'Nutch-based Bot'
|
2039
|
-
category: 'crawler'
|
2040
|
-
url: 'https://nutch.apache.org'
|
2041
|
-
producer:
|
2042
|
-
name: 'The Apache Software Foundation'
|
2043
|
-
url: 'http://www.apache.org/foundation/'
|
2044
|
-
-
|
2045
|
-
user_agent: NetLyzer FastProbe
|
2046
|
-
bot:
|
2047
|
-
name: 'NetLyzer FastProbe'
|
2048
|
-
-
|
2049
|
-
user_agent: StatusCake Error Detector Crawler V0.01
|
2050
|
-
bot:
|
2051
|
-
name: 'Generic Bot'
|
2052
|
-
-
|
2053
|
-
user_agent: niki-bot
|
2054
|
-
bot:
|
2055
|
-
name: 'Generic Bot'
|