device_detector 1.0.2 → 1.0.6
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +5 -5
- data/.rubocop.yml +49 -0
- data/.ruby-version +1 -0
- data/.travis.yml +5 -6
- data/CHANGELOG.md +11 -0
- data/README.md +8 -7
- data/Rakefile +7 -4
- data/device_detector.gemspec +1 -0
- data/lib/device_detector/bot.rb +2 -2
- data/lib/device_detector/browser.rb +364 -0
- data/lib/device_detector/client.rb +11 -2
- data/lib/device_detector/device.rb +1168 -22
- data/lib/device_detector/memory_cache.rb +5 -5
- data/lib/device_detector/metadata_extractor.rb +7 -8
- data/lib/device_detector/model_extractor.rb +3 -3
- data/lib/device_detector/name_extractor.rb +2 -2
- data/lib/device_detector/os.rb +148 -116
- data/lib/device_detector/parser.rb +22 -9
- data/lib/device_detector/version.rb +1 -1
- data/lib/device_detector/version_extractor.rb +10 -2
- data/lib/device_detector.rb +73 -40
- data/regexes/bots.yml +909 -59
- data/regexes/client/browser_engine.yml +14 -2
- data/regexes/client/browsers.yml +1356 -241
- data/regexes/client/feed_readers.yml +10 -10
- data/regexes/client/libraries.yml +75 -1
- data/regexes/client/mediaplayers.yml +39 -3
- data/regexes/client/mobile_apps.yml +524 -45
- data/regexes/client/pim.yml +55 -2
- data/regexes/device/cameras.yml +6 -6
- data/regexes/device/car_browsers.yml +23 -3
- data/regexes/device/consoles.yml +9 -3
- data/regexes/device/mobiles.yml +16903 -3199
- data/regexes/device/notebooks.yml +114 -0
- data/regexes/device/portable_media_player.yml +20 -3
- data/regexes/device/shell_tv.yml +117 -0
- data/regexes/device/televisions.yml +440 -35
- data/regexes/oss.yml +603 -165
- data/regexes/vendorfragments.yml +6 -2
- data/spec/device_detector/concrete_user_agent_spec.rb +38 -51
- data/spec/device_detector/detector_fixtures_spec.rb +36 -37
- data/spec/device_detector/device_spec.rb +52 -56
- data/spec/device_detector/memory_cache_spec.rb +19 -19
- data/spec/device_detector/model_extractor_spec.rb +3 -3
- data/spec/device_detector/version_extractor_spec.rb +5 -6
- data/spec/device_detector_spec.rb +26 -26
- data/spec/fixtures/client/browser.yml +2617 -555
- data/spec/fixtures/client/feed_reader.yml +34 -52
- data/spec/fixtures/client/library.yml +129 -38
- data/spec/fixtures/client/mediaplayer.yml +59 -28
- data/spec/fixtures/client/mobile_app.yml +589 -20
- data/spec/fixtures/client/pim.yml +92 -19
- data/spec/fixtures/detector/bots.yml +1749 -458
- data/spec/fixtures/detector/camera.yml +30 -24
- data/spec/fixtures/detector/car_browser.yml +199 -3
- data/spec/fixtures/detector/console.yml +107 -45
- data/spec/fixtures/detector/desktop.yml +3216 -758
- data/spec/fixtures/detector/feature_phone.yml +935 -181
- data/spec/fixtures/detector/feed_reader.yml +181 -193
- data/spec/fixtures/detector/mediaplayer.yml +157 -60
- data/spec/fixtures/detector/mobile_apps.yml +914 -136
- data/spec/fixtures/detector/peripheral.yml +271 -0
- data/spec/fixtures/detector/phablet.yml +5593 -1533
- data/spec/fixtures/detector/portable_media_player.yml +398 -32
- data/spec/fixtures/detector/smart_display.yml +183 -9
- data/spec/fixtures/detector/smart_speaker.yml +60 -0
- data/spec/fixtures/detector/smartphone-1.yml +3930 -4239
- data/spec/fixtures/detector/smartphone-10.yml +3985 -7366
- data/spec/fixtures/detector/smartphone-11.yml +5083 -3784
- data/spec/fixtures/detector/smartphone-12.yml +8989 -0
- data/spec/fixtures/detector/smartphone-13.yml +9412 -0
- data/spec/fixtures/detector/smartphone-14.yml +9477 -0
- data/spec/fixtures/detector/smartphone-15.yml +9281 -0
- data/spec/fixtures/detector/smartphone-16.yml +9678 -0
- data/spec/fixtures/detector/smartphone-17.yml +9965 -0
- data/spec/fixtures/detector/smartphone-18.yml +9806 -0
- data/spec/fixtures/detector/smartphone-19.yml +9965 -0
- data/spec/fixtures/detector/smartphone-2.yml +6670 -4375
- data/spec/fixtures/detector/smartphone-20.yml +9710 -0
- data/spec/fixtures/detector/smartphone-21.yml +8693 -0
- data/spec/fixtures/detector/smartphone-22.yml +10178 -0
- data/spec/fixtures/detector/smartphone-23.yml +9453 -0
- data/spec/fixtures/detector/smartphone-24.yml +9843 -0
- data/spec/fixtures/detector/smartphone-25.yml +9703 -0
- data/spec/fixtures/detector/smartphone-26.yml +10007 -0
- data/spec/fixtures/detector/smartphone-27.yml +4927 -0
- data/spec/fixtures/detector/smartphone-3.yml +4656 -4711
- data/spec/fixtures/detector/smartphone-4.yml +3518 -4479
- data/spec/fixtures/detector/smartphone-5.yml +3805 -4803
- data/spec/fixtures/detector/smartphone-6.yml +3745 -4693
- data/spec/fixtures/detector/smartphone-7.yml +3721 -4645
- data/spec/fixtures/detector/smartphone-8.yml +4564 -4699
- data/spec/fixtures/detector/smartphone-9.yml +3897 -4888
- data/spec/fixtures/detector/smartphone.yml +3154 -4141
- data/spec/fixtures/detector/tablet-1.yml +4742 -4576
- data/spec/fixtures/detector/tablet-2.yml +3803 -4731
- data/spec/fixtures/detector/tablet-3.yml +6210 -2309
- data/spec/fixtures/detector/tablet-4.yml +9062 -0
- data/spec/fixtures/detector/tablet-5.yml +9273 -0
- data/spec/fixtures/detector/tablet-6.yml +4588 -0
- data/spec/fixtures/detector/tablet.yml +3629 -4613
- data/spec/fixtures/detector/tv-1.yml +2501 -0
- data/spec/fixtures/detector/tv.yml +8856 -2064
- data/spec/fixtures/detector/unknown.yml +412 -587
- data/spec/fixtures/detector/wearable.yml +915 -0
- data/spec/fixtures/device/camera.yml +4 -3
- data/spec/fixtures/device/car_browser.yml +9 -2
- data/spec/fixtures/device/console.yml +15 -14
- data/spec/fixtures/device/notebook.yml +7 -0
- data/spec/fixtures/parser/oss.yml +1392 -21
- data/spec/fixtures/parser/vendorfragments.yml +57 -51
- metadata +70 -4
@@ -1,45 +1,51 @@
|
|
1
1
|
---
|
2
|
-
-
|
2
|
+
-
|
3
3
|
user_agent: 360spider-image
|
4
4
|
bot:
|
5
5
|
name: 360Spider
|
6
6
|
category: Search bot
|
7
|
-
url:
|
7
|
+
url: https://www.so.com/help/help_3_2.html
|
8
8
|
producer:
|
9
9
|
name: Online Media Group, Inc.
|
10
10
|
url: ""
|
11
|
-
-
|
11
|
+
-
|
12
12
|
user_agent: Mozilla/4.0 (compatible; MSIE 8.0; Windows NT 6.1; Trident/4.0; SLCC2; .NET CLR 2.0.50727; .NET CLR 3.5.30729; .NET CLR 3.0.30729; Media Center PC 6.0; MDDR; .NET4.0C; .NET4.0E; .NET CLR 1.1.4322; Tablet PC 2.0); 360Spider
|
13
13
|
bot:
|
14
14
|
name: 360Spider
|
15
15
|
category: Search bot
|
16
|
-
url:
|
16
|
+
url: https://www.so.com/help/help_3_2.html
|
17
17
|
producer:
|
18
18
|
name: Online Media Group, Inc.
|
19
19
|
url: ""
|
20
|
-
-
|
20
|
+
-
|
21
21
|
user_agent: Mozilla/5.0 (compatible; MSIE 9.0; Windows NT 6.1; Trident/5.0); 360Spider
|
22
22
|
bot:
|
23
23
|
name: 360Spider
|
24
24
|
category: Search bot
|
25
|
-
url:
|
25
|
+
url: https://www.so.com/help/help_3_2.html
|
26
26
|
producer:
|
27
27
|
name: Online Media Group, Inc.
|
28
28
|
url: ""
|
29
|
-
-
|
29
|
+
-
|
30
30
|
user_agent: Mozilla/5.0 (Windows NT 6.1) AppleWebKit/537.1 (KHTML, like Gecko) Chrome/21.0.1180.89 Safari/537.1; 360Spider
|
31
31
|
bot:
|
32
32
|
name: 360Spider
|
33
33
|
category: Search bot
|
34
|
-
url:
|
34
|
+
url: https://www.so.com/help/help_3_2.html
|
35
35
|
producer:
|
36
36
|
name: Online Media Group, Inc.
|
37
37
|
url: ""
|
38
|
-
-
|
38
|
+
-
|
39
39
|
user_agent: 'ADmantX Platform Semantic Analyzer - ADmantX Inc. - www.admantx.com - support@admantx.com'
|
40
40
|
bot:
|
41
41
|
name: ADMantX
|
42
|
-
-
|
42
|
+
-
|
43
|
+
user_agent: ias-va/3.1 (+https://www.admantx.com/service-fetcher.html)
|
44
|
+
bot:
|
45
|
+
name: ADmantX Service Fetcher
|
46
|
+
category: Service bot
|
47
|
+
url: https://www.admantx.com/service-fetcher.html
|
48
|
+
-
|
43
49
|
user_agent: Aboundex/0.3 (http://www.aboundex.com/crawler/)
|
44
50
|
bot:
|
45
51
|
name: Aboundexbot
|
@@ -48,7 +54,7 @@
|
|
48
54
|
producer:
|
49
55
|
name: Aboundex.com
|
50
56
|
url: http://www.aboundex.com
|
51
|
-
-
|
57
|
+
-
|
52
58
|
user_agent: Mozilla/5.0 (compatible; AcoonBot/4.11.1; +http://www.acoon.de/robot.asp)
|
53
59
|
bot:
|
54
60
|
name: Acoon
|
@@ -57,7 +63,7 @@
|
|
57
63
|
producer:
|
58
64
|
name: Acoon GmbH
|
59
65
|
url: http://www.acoon.de
|
60
|
-
-
|
66
|
+
-
|
61
67
|
user_agent: AddThis.com robot tech.support@clearspring.com
|
62
68
|
bot:
|
63
69
|
name: AddThis.com
|
@@ -66,25 +72,50 @@
|
|
66
72
|
producer:
|
67
73
|
name: Clearspring Technologies, Inc.
|
68
74
|
url: http://www.clearspring.com
|
69
|
-
-
|
75
|
+
-
|
70
76
|
user_agent: ia_archiver (+http://www.alexa.com/site/help/webmasters; crawler@alexa.com)
|
71
77
|
bot:
|
72
78
|
name: Alexa Crawler
|
73
79
|
category: Search bot
|
74
|
-
url: https://alexa.
|
80
|
+
url: https://support.alexa.com/hc/en-us/sections/200100794-Crawlers
|
75
81
|
producer:
|
76
82
|
name: Alexa Internet
|
77
|
-
url:
|
78
|
-
-
|
83
|
+
url: https://www.alexa.com
|
84
|
+
-
|
79
85
|
user_agent: Mozilla/5.0 (compatible; alexa site audit/1.0; http://www.alexa.com/help/webmasters; )
|
80
86
|
bot:
|
81
87
|
name: Alexa Site Audit
|
82
88
|
category: Site Monitor
|
83
|
-
url:
|
89
|
+
url: https://support.alexa.com/hc/en-us/articles/200450194
|
84
90
|
producer:
|
85
91
|
name: Alexa Internet
|
86
|
-
url:
|
87
|
-
-
|
92
|
+
url: https://www.alexa.com
|
93
|
+
-
|
94
|
+
user_agent: Mozilla/5.0 (Macintosh; Intel Mac OS X 10_10_1) AppleWebKit/600.2.5 (KHTML, like Gecko) Version/8.0.2 Safari/600.2.5 (Amazonbot/0.1; +https://developer.amazon.com/support/amazonbot)
|
95
|
+
bot:
|
96
|
+
name: Amazon Bot
|
97
|
+
category: Crawler
|
98
|
+
url: https://developer.amazon.com/support/amazonbot
|
99
|
+
producer:
|
100
|
+
name: Amazon.com, Inc.
|
101
|
+
url: https://www.amazon.com/
|
102
|
+
-
|
103
|
+
user_agent: Amazon Route 53 Health Check Service; ref:xxxxxxxx-xxxx-xxxxxxxxx-xxxxxxxxxxxx; report http://amzn.to/xxxxxxx
|
104
|
+
bot:
|
105
|
+
name: Amazon Route53 Health Check
|
106
|
+
category: Service Agent
|
107
|
+
producer:
|
108
|
+
name: Amazon Web Services
|
109
|
+
url: https://aws.amazon.com/
|
110
|
+
-
|
111
|
+
user_agent: Amazon-Route53-Health-Check-Service (ref b0eb04d5-cb5e-40e7-839b-558e52fc3f0d; report http://amzn.to/1vsZADi)
|
112
|
+
bot:
|
113
|
+
name: Amazon Route53 Health Check
|
114
|
+
category: Service Agent
|
115
|
+
producer:
|
116
|
+
name: Amazon Web Services
|
117
|
+
url: https://aws.amazon.com/
|
118
|
+
-
|
88
119
|
user_agent: AmorankSpider/0.1; +http://amorank.com/webcrawler.html
|
89
120
|
bot:
|
90
121
|
name: Amorank Spider
|
@@ -93,7 +124,7 @@
|
|
93
124
|
producer:
|
94
125
|
name: Amorank
|
95
126
|
url: http://www.amorank.com
|
96
|
-
-
|
127
|
+
-
|
97
128
|
user_agent: 'Curious George - www.analyticsseo.com/crawler'
|
98
129
|
bot:
|
99
130
|
name: Analytics SEO Crawler
|
@@ -102,7 +133,7 @@
|
|
102
133
|
producer:
|
103
134
|
name: Analytics SEO
|
104
135
|
url: http://www.analyticsseo.com
|
105
|
-
-
|
136
|
+
-
|
106
137
|
user_agent: ApacheBench/2.3
|
107
138
|
bot:
|
108
139
|
name: ApacheBench
|
@@ -110,35 +141,44 @@
|
|
110
141
|
url: https://httpd.apache.org/docs/2.4/programs/ab.html
|
111
142
|
producer:
|
112
143
|
name: The Apache Software Foundation
|
113
|
-
url:
|
114
|
-
-
|
144
|
+
url: https://www.apache.org/foundation/
|
145
|
+
-
|
115
146
|
user_agent: Mozilla/5.0 (Macintosh; Intel Mac OS X 10_10 _1) AppleWebKit/600.2.5 (KHTML, like Gecko) Version/8.0.2 Safari/600.2.5 (Applebot/0.1; +http://www.apple.com/go/applebot)
|
116
147
|
bot:
|
117
148
|
name: Applebot
|
118
149
|
category: Crawler
|
119
|
-
url:
|
150
|
+
url: https://support.apple.com/en-us/HT204683
|
120
151
|
producer:
|
121
152
|
name: Apple Inc
|
122
|
-
url:
|
123
|
-
-
|
153
|
+
url: https://www.apple.com
|
154
|
+
-
|
155
|
+
user_agent: AppSignalBot/1.0 (+https://appsignal.com)
|
156
|
+
bot:
|
157
|
+
name: AppSignalBot
|
158
|
+
category: Site Monitor
|
159
|
+
url: https://docs.appsignal.com/uptime-monitoring/
|
160
|
+
producer:
|
161
|
+
name: AppSignal
|
162
|
+
url: https://appsignal.com/
|
163
|
+
-
|
124
164
|
user_agent: Mozilla/5.0 (Macintosh; Intel Mac OS X 10_10_1) AppleWebKit/600.2.5 (KHTML, like Gecko) Version/8.0.2 Safari/600.2.5 (Applebot/0.1)
|
125
165
|
bot:
|
126
166
|
name: Applebot
|
127
167
|
category: Crawler
|
128
|
-
url:
|
168
|
+
url: https://support.apple.com/en-us/HT204683
|
129
169
|
producer:
|
130
170
|
name: Apple Inc
|
131
|
-
url:
|
132
|
-
-
|
171
|
+
url: https://www.apple.com
|
172
|
+
-
|
133
173
|
user_agent: Arachni/v1.5.1
|
134
174
|
bot:
|
135
175
|
name: Arachni
|
136
176
|
category: Security Checker
|
137
|
-
url:
|
177
|
+
url: https://www.arachni-scanner.com/
|
138
178
|
producer:
|
139
179
|
name: Sarosys LLC
|
140
|
-
url:
|
141
|
-
-
|
180
|
+
url: https://www.sarosys.com/
|
181
|
+
-
|
142
182
|
user_agent: Mozilla/2.0 (compatible; Ask Jeeves/Teoma)
|
143
183
|
bot:
|
144
184
|
name: Ask Jeeves
|
@@ -147,7 +187,43 @@
|
|
147
187
|
producer:
|
148
188
|
name: Ask Jeeves Inc.
|
149
189
|
url: http://www.ask.com
|
150
|
-
-
|
190
|
+
-
|
191
|
+
user_agent: Mozilla/5.0 (compatible;AspiegelBot)
|
192
|
+
bot:
|
193
|
+
name: AspiegelBot
|
194
|
+
category: Crawler
|
195
|
+
url: https://aspiegel.com/
|
196
|
+
producer:
|
197
|
+
name: Huawei
|
198
|
+
url: https://www.huawei.com/
|
199
|
+
-
|
200
|
+
user_agent: Mozilla/5.0 (Linux; Android 7.0;) AppleWebKit/537.36 (KHTML, like Gecko) Mobile Safari/537.36 (compatible; AspiegelBot)
|
201
|
+
bot:
|
202
|
+
name: AspiegelBot
|
203
|
+
category: Crawler
|
204
|
+
url: https://aspiegel.com/
|
205
|
+
producer:
|
206
|
+
name: Huawei
|
207
|
+
url: https://www.huawei.com/
|
208
|
+
-
|
209
|
+
user_agent: AwarioRssBot/1.0 (+https://awario.com/bots.html; bots@awario.com)
|
210
|
+
bot:
|
211
|
+
name: Awario
|
212
|
+
category: Feed Fetcher
|
213
|
+
url: https://awario.com/bots.html
|
214
|
+
producer:
|
215
|
+
name: Awario
|
216
|
+
url: https://awario.com/
|
217
|
+
-
|
218
|
+
user_agent: AwarioSmartBot/1.0 (+https://awario.com/bots.html; bots@awario.com)
|
219
|
+
bot:
|
220
|
+
name: Awario
|
221
|
+
category: Search bot
|
222
|
+
url: https://awario.com/bots.html
|
223
|
+
producer:
|
224
|
+
name: Awario
|
225
|
+
url: https://awario.com/
|
226
|
+
-
|
151
227
|
user_agent: Mozilla/5.0 (compatible; BLEXBot/1.0; +http://webmeup-crawler.com/)
|
152
228
|
bot:
|
153
229
|
name: BLEXBot Crawler
|
@@ -156,7 +232,7 @@
|
|
156
232
|
producer:
|
157
233
|
name: WebMeUp
|
158
234
|
url: http://webmeup.com
|
159
|
-
-
|
235
|
+
-
|
160
236
|
user_agent: BUbiNG (+http://law.di.unimi.it/BUbiNG.html)
|
161
237
|
bot:
|
162
238
|
name: BUbiNG
|
@@ -165,7 +241,7 @@
|
|
165
241
|
producer:
|
166
242
|
name: The Laboratory for Web Algorithmics (LAW)
|
167
243
|
url: 'http://law.di.unimi.it/software.php#buging'
|
168
|
-
-
|
244
|
+
-
|
169
245
|
user_agent: Backlink-Check.de (+http://www.backlink-check.de/bot.html)
|
170
246
|
bot:
|
171
247
|
name: Backlink-Check.de
|
@@ -174,7 +250,7 @@
|
|
174
250
|
producer:
|
175
251
|
name: Mediagreen Medienservice
|
176
252
|
url: http://www.backlink-check.de
|
177
|
-
-
|
253
|
+
-
|
178
254
|
user_agent: BacklinkCrawler (http://www.backlinktest.com/crawler.html)
|
179
255
|
bot:
|
180
256
|
name: BacklinkCrawler
|
@@ -183,7 +259,7 @@
|
|
183
259
|
producer:
|
184
260
|
name: 2.0Promotion GbR
|
185
261
|
url: http://www.backlinktest.com
|
186
|
-
-
|
262
|
+
-
|
187
263
|
user_agent: Baiduspider+(+http://www.baidu.com/search/spider.htm)
|
188
264
|
bot:
|
189
265
|
name: Baidu Spider
|
@@ -192,7 +268,7 @@
|
|
192
268
|
producer:
|
193
269
|
name: Baidu
|
194
270
|
url: http://www.baidu.com
|
195
|
-
-
|
271
|
+
-
|
196
272
|
user_agent: Baiduspider-image+(+http://www.baidu.com/search/spider.htm)
|
197
273
|
bot:
|
198
274
|
name: Baidu Spider
|
@@ -201,7 +277,7 @@
|
|
201
277
|
producer:
|
202
278
|
name: Baidu
|
203
279
|
url: http://www.baidu.com
|
204
|
-
-
|
280
|
+
-
|
205
281
|
user_agent: Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.0; baidu Transcoder;)
|
206
282
|
bot:
|
207
283
|
name: Baidu Spider
|
@@ -210,7 +286,7 @@
|
|
210
286
|
producer:
|
211
287
|
name: Baidu
|
212
288
|
url: http://www.baidu.com
|
213
|
-
-
|
289
|
+
-
|
214
290
|
user_agent: Mozilla/5.0 (compatible; Baiduspider/2.0; +http://www.baidu.com/search
|
215
291
|
bot:
|
216
292
|
name: Baidu Spider
|
@@ -219,7 +295,7 @@
|
|
219
295
|
producer:
|
220
296
|
name: Baidu
|
221
297
|
url: http://www.baidu.com
|
222
|
-
-
|
298
|
+
-
|
223
299
|
user_agent: Mozilla/5.0 (compatible; Baiduspider/2.0; +http://www.baidu.com/search/spider.html)
|
224
300
|
bot:
|
225
301
|
name: Baidu Spider
|
@@ -228,7 +304,7 @@
|
|
228
304
|
producer:
|
229
305
|
name: Baidu
|
230
306
|
url: http://www.baidu.com
|
231
|
-
-
|
307
|
+
-
|
232
308
|
user_agent: Mozilla/5.0 (Linux;u;Android 2.3.7;zh-cn;) AppleWebKit/533.1 (KHTML,like Gecko) Version/4.0 Mobile Safari/533.1 (compatible; +http://www.baidu.com/search/spider.html)
|
233
309
|
bot:
|
234
310
|
name: Baidu Spider
|
@@ -237,7 +313,7 @@
|
|
237
313
|
producer:
|
238
314
|
name: Baidu
|
239
315
|
url: http://www.baidu.com
|
240
|
-
-
|
316
|
+
-
|
241
317
|
user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1; zh-CN; rv:1.9.2.8;baidu Transcoder) Gecko/20100722 Firefox/3.6.8 ( .NET CLR 3.5.30729)
|
242
318
|
bot:
|
243
319
|
name: Baidu Spider
|
@@ -246,7 +322,13 @@
|
|
246
322
|
producer:
|
247
323
|
name: Baidu
|
248
324
|
url: http://www.baidu.com
|
249
|
-
-
|
325
|
+
-
|
326
|
+
user_agent: Barkrowler/0.9 (+http://www.exensa.com/crawl)
|
327
|
+
bot:
|
328
|
+
name: Barkrowler
|
329
|
+
category: Crawler
|
330
|
+
url: http://www.exensa.com/crawl
|
331
|
+
-
|
250
332
|
user_agent: Mozilla/5.0 (compatible; BazQux/2.4; +https://bazqux.com/fetcher; 2 subscribers)
|
251
333
|
bot:
|
252
334
|
name: BazQux Reader
|
@@ -255,7 +337,7 @@
|
|
255
337
|
producer:
|
256
338
|
name: ""
|
257
339
|
url: ""
|
258
|
-
-
|
340
|
+
-
|
259
341
|
user_agent: Mozilla/5.0 (compatible; bingbot/2.0; +http://www.bing.com/bingbot.htm)
|
260
342
|
bot:
|
261
343
|
name: BingBot
|
@@ -264,7 +346,7 @@
|
|
264
346
|
producer:
|
265
347
|
name: Microsoft Corporation
|
266
348
|
url: http://www.microsoft.com
|
267
|
-
-
|
349
|
+
-
|
268
350
|
user_agent: Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/534+ (KHTML, like Gecko) BingPreview/1.0b
|
269
351
|
bot:
|
270
352
|
name: BingBot
|
@@ -273,7 +355,7 @@
|
|
273
355
|
producer:
|
274
356
|
name: Microsoft Corporation
|
275
357
|
url: http://www.microsoft.com
|
276
|
-
-
|
358
|
+
-
|
277
359
|
user_agent: msnbot-media/1.1 (+http://search.msn.com/msnbot.htm)
|
278
360
|
bot:
|
279
361
|
name: BingBot
|
@@ -282,7 +364,7 @@
|
|
282
364
|
producer:
|
283
365
|
name: Microsoft Corporation
|
284
366
|
url: http://www.microsoft.com
|
285
|
-
-
|
367
|
+
-
|
286
368
|
user_agent: msnbot-NewsBlogs/2.0b (+http://search.msn.com/msnbot.htm)
|
287
369
|
bot:
|
288
370
|
name: BingBot
|
@@ -291,7 +373,7 @@
|
|
291
373
|
producer:
|
292
374
|
name: Microsoft Corporation
|
293
375
|
url: http://www.microsoft.com
|
294
|
-
-
|
376
|
+
-
|
295
377
|
user_agent: msnbot/1.1 (+http://search.msn.com/msnbot.htm)
|
296
378
|
bot:
|
297
379
|
name: BingBot
|
@@ -300,7 +382,7 @@
|
|
300
382
|
producer:
|
301
383
|
name: Microsoft Corporation
|
302
384
|
url: http://www.microsoft.com
|
303
|
-
-
|
385
|
+
-
|
304
386
|
user_agent: msnbot/2.0b (+http://search.msn.com/msnbot.htm)
|
305
387
|
bot:
|
306
388
|
name: BingBot
|
@@ -309,7 +391,7 @@
|
|
309
391
|
producer:
|
310
392
|
name: Microsoft Corporation
|
311
393
|
url: http://www.microsoft.com
|
312
|
-
-
|
394
|
+
-
|
313
395
|
user_agent: msnbot/2.0b v1394720947.6703
|
314
396
|
bot:
|
315
397
|
name: BingBot
|
@@ -318,7 +400,7 @@
|
|
318
400
|
producer:
|
319
401
|
name: Microsoft Corporation
|
320
402
|
url: http://www.microsoft.com
|
321
|
-
-
|
403
|
+
-
|
322
404
|
user_agent: MSNBot/Nutch-1.5.1
|
323
405
|
bot:
|
324
406
|
name: BingBot
|
@@ -327,7 +409,7 @@
|
|
327
409
|
producer:
|
328
410
|
name: Microsoft Corporation
|
329
411
|
url: http://www.microsoft.com
|
330
|
-
-
|
412
|
+
-
|
331
413
|
user_agent: bitlybot/3.0
|
332
414
|
bot:
|
333
415
|
name: BitlyBot
|
@@ -336,7 +418,7 @@
|
|
336
418
|
producer:
|
337
419
|
name: Bitly, Inc.
|
338
420
|
url: https://bitly.com
|
339
|
-
-
|
421
|
+
-
|
340
422
|
user_agent: Mozilla/5.0 (compatible; Blekkobot; ScoutJet; +http://blekko.com/about/blekkobot)
|
341
423
|
bot:
|
342
424
|
name: Blekkobot
|
@@ -345,7 +427,7 @@
|
|
345
427
|
producer:
|
346
428
|
name: Blekko
|
347
429
|
url: http://blekko.com
|
348
|
-
-
|
430
|
+
-
|
349
431
|
user_agent: Bloglovin/1.0 (http://www.bloglovin.com; 1 subscribers)
|
350
432
|
bot:
|
351
433
|
name: Bloglovin
|
@@ -354,7 +436,7 @@
|
|
354
436
|
producer:
|
355
437
|
name: ""
|
356
438
|
url: ""
|
357
|
-
-
|
439
|
+
-
|
358
440
|
user_agent: Blogtrottr/2.0
|
359
441
|
bot:
|
360
442
|
name: Blogtrottr
|
@@ -363,7 +445,24 @@
|
|
363
445
|
producer:
|
364
446
|
name: Blogtrottr Ltd
|
365
447
|
url: https://blogtrottr.com/
|
366
|
-
-
|
448
|
+
-
|
449
|
+
user_agent: BoardReader Favicon Fetcher /1.0 info@boardreader.com
|
450
|
+
bot:
|
451
|
+
name: BoardReader
|
452
|
+
category: Search bot
|
453
|
+
url: https://boardreader.com/
|
454
|
+
producer:
|
455
|
+
name: Effyis Inc
|
456
|
+
url: https://boardreader.com/
|
457
|
+
-
|
458
|
+
user_agent: BoardReader Blog Indexer(http://boardreader.com)
|
459
|
+
bot:
|
460
|
+
name: BoardReader Blog Indexer
|
461
|
+
category: Crawler
|
462
|
+
producer:
|
463
|
+
name: BoardReader
|
464
|
+
url: https://boardreader.com/
|
465
|
+
-
|
367
466
|
user_agent: Mozilla/5.0 (compatible; BountiiBot/1.1; +http://bountii.com/contact.php)
|
368
467
|
bot:
|
369
468
|
name: Bountii Bot
|
@@ -372,7 +471,16 @@
|
|
372
471
|
producer:
|
373
472
|
name: Bountii Inc.
|
374
473
|
url: http://bountii.com
|
375
|
-
-
|
474
|
+
-
|
475
|
+
user_agent: Mozilla/5.0 (Macintosh; Intel Mac OS X 10.10; rv:41.0) Gecko/20100101 Firefox/55.0 BrandVerity/1.0 (http://www.brandverity.com/why-is-brandverity-visiting-me)
|
476
|
+
bot:
|
477
|
+
name: BrandVerity
|
478
|
+
category: Crawler
|
479
|
+
url: https://www.brandverity.com/why-is-brandverity-visiting-me
|
480
|
+
producer:
|
481
|
+
name: BrandVerity, Inc.
|
482
|
+
url: https://www.brandverity.com/
|
483
|
+
-
|
376
484
|
user_agent: Browsershots
|
377
485
|
bot:
|
378
486
|
name: Browsershots
|
@@ -381,7 +489,16 @@
|
|
381
489
|
producer:
|
382
490
|
name: Browsershots.org
|
383
491
|
url: http://browsershots.org
|
384
|
-
-
|
492
|
+
-
|
493
|
+
user_agent: Buck/2.2; (+https://app.hypefactors.com/media-monitoring/about.html)
|
494
|
+
bot:
|
495
|
+
name: Buck
|
496
|
+
category: Search bot
|
497
|
+
url: https://hypefactors.com/
|
498
|
+
producer:
|
499
|
+
name: Hypefactors A/S
|
500
|
+
url: https://hypefactors.com/
|
501
|
+
-
|
385
502
|
user_agent: Mozilla/5.0 (compatible; Butterfly/1.0; +http://labs.topsy.com/butterfly/) Gecko/2009032608 Firefox/3.0.8
|
386
503
|
bot:
|
387
504
|
name: Butterfly Robot
|
@@ -390,7 +507,7 @@
|
|
390
507
|
producer:
|
391
508
|
name: Topsy Labs
|
392
509
|
url: http://labs.topsy.com
|
393
|
-
-
|
510
|
+
-
|
394
511
|
user_agent: Mozilla/5.0 (Macintosh; Butterfly/1.0; +http://labs.topsy.com/butterfly/) Gecko/2009032608 Firefox/3.0.8
|
395
512
|
bot:
|
396
513
|
name: Butterfly Robot
|
@@ -399,7 +516,25 @@
|
|
399
516
|
producer:
|
400
517
|
name: Topsy Labs
|
401
518
|
url: http://labs.topsy.com
|
402
|
-
-
|
519
|
+
-
|
520
|
+
user_agent: Mozilla/5.0 (Linux; Android 6.0; Nexus 5 Build/MRA58N) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/51.0.5668.1446 Mobile Safari/537.36; Bytespider;bytespider@bytedance.com
|
521
|
+
bot:
|
522
|
+
name: Bytespider
|
523
|
+
category: Search bot
|
524
|
+
url: https://bytedance.com/
|
525
|
+
producer:
|
526
|
+
name: ByteDance Ltd.
|
527
|
+
url: https://bytedance.com/
|
528
|
+
-
|
529
|
+
user_agent: CATExplorador/1.0beta (sistemes at domini dot cat; http://domini.cat/catexplorador.html)
|
530
|
+
bot:
|
531
|
+
name: CATExplorador
|
532
|
+
category: Search bot
|
533
|
+
url: https://fundacio.cat/ca/domini/
|
534
|
+
producer:
|
535
|
+
name: Fundació puntCAT
|
536
|
+
url: https://fundacio.cat/ca/domini/
|
537
|
+
-
|
403
538
|
user_agent: Mozilla/5.0 (compatible; CareerBot/1.1; +http://www.career-x.de/bot.html)
|
404
539
|
bot:
|
405
540
|
name: CareerBot
|
@@ -408,7 +543,7 @@
|
|
408
543
|
producer:
|
409
544
|
name: career-x GmbH
|
410
545
|
url: http://www.career-x.de
|
411
|
-
-
|
546
|
+
-
|
412
547
|
user_agent: Castro 2, Episode Duration Lookup
|
413
548
|
bot:
|
414
549
|
name: Castro 2
|
@@ -417,7 +552,7 @@
|
|
417
552
|
producer:
|
418
553
|
name: Supertop
|
419
554
|
url: http://supertop.co
|
420
|
-
-
|
555
|
+
-
|
421
556
|
user_agent: Cliqzbot/0.1 (+http://cliqz.com/company/cliqzbot)
|
422
557
|
bot:
|
423
558
|
name: Cliqzbot
|
@@ -426,7 +561,7 @@
|
|
426
561
|
producer:
|
427
562
|
name: 10betterpages GmbH
|
428
563
|
url: http://cliqz.com
|
429
|
-
-
|
564
|
+
-
|
430
565
|
user_agent: Mozilla/5.0 (compatible; Cloudflare-AMP/1.0; +https://amp.cloudflare.com/doc/fetcher.html) AppleWebKit/534.34
|
431
566
|
bot:
|
432
567
|
name: CloudFlare AMP Fetcher
|
@@ -435,7 +570,7 @@
|
|
435
570
|
producer:
|
436
571
|
name: CloudFlare
|
437
572
|
url: http://www.cloudflare.com
|
438
|
-
-
|
573
|
+
-
|
439
574
|
user_agent: Mozilla/5.0 (compatible; CloudFlare-AlwaysOnline/1.0; +http://www.cloudflare.com/always-online) AppleWebKit/534.34
|
440
575
|
bot:
|
441
576
|
name: CloudFlare Always Online
|
@@ -444,7 +579,7 @@
|
|
444
579
|
producer:
|
445
580
|
name: CloudFlare
|
446
581
|
url: http://www.cloudflare.com
|
447
|
-
-
|
582
|
+
-
|
448
583
|
user_agent: collectd/5.5.1
|
449
584
|
bot:
|
450
585
|
name: Collectd
|
@@ -453,7 +588,7 @@
|
|
453
588
|
producer:
|
454
589
|
name: Collectd
|
455
590
|
url: https://collectd.org/
|
456
|
-
-
|
591
|
+
-
|
457
592
|
user_agent: CommaFeed/1.0 (http://www.commafeed.com)
|
458
593
|
bot:
|
459
594
|
name: CommaFeed
|
@@ -462,16 +597,79 @@
|
|
462
597
|
producer:
|
463
598
|
name: ""
|
464
599
|
url: ""
|
465
|
-
-
|
600
|
+
-
|
601
|
+
user_agent: coccocbot-web/1.0 (+http://help.coccoc.com/searchengine)
|
602
|
+
bot:
|
603
|
+
name: Cốc Cốc Bot
|
604
|
+
url: https://help.coccoc.com/en/search-engine/coccoc-robots
|
605
|
+
category: Search bot
|
606
|
+
producer:
|
607
|
+
name: Cốc Cốc
|
608
|
+
url: https://coccoc.com/
|
609
|
+
-
|
466
610
|
user_agent: Mozilla/5.0 (compatible; coccoc/1.0; +http://help.coccoc.com/)
|
467
611
|
bot:
|
468
612
|
name: Cốc Cốc Bot
|
469
|
-
url:
|
613
|
+
url: https://help.coccoc.com/en/search-engine/coccoc-robots
|
614
|
+
category: Search bot
|
615
|
+
producer:
|
616
|
+
name: Cốc Cốc
|
617
|
+
url: https://coccoc.com/
|
618
|
+
-
|
619
|
+
user_agent: Mozilla/5.0 (compatible; coccocbot-ads/1.0; +http://help.coccoc.com/searchengine)
|
620
|
+
bot:
|
621
|
+
name: Cốc Cốc Bot
|
622
|
+
url: https://help.coccoc.com/en/search-engine/coccoc-robots
|
623
|
+
category: Search bot
|
624
|
+
producer:
|
625
|
+
name: Cốc Cốc
|
626
|
+
url: https://coccoc.com/
|
627
|
+
-
|
628
|
+
user_agent: Mozilla/5.0 (compatible; coccocbot-fast/1.0; +http://help.coccoc.com/searchengine)
|
629
|
+
bot:
|
630
|
+
name: Cốc Cốc Bot
|
631
|
+
url: https://help.coccoc.com/en/search-engine/coccoc-robots
|
632
|
+
category: Search bot
|
633
|
+
producer:
|
634
|
+
name: Cốc Cốc
|
635
|
+
url: https://coccoc.com/
|
636
|
+
-
|
637
|
+
user_agent: Mozilla/5.0 (compatible; coccocbot-image/1.0; +http://help.coccoc.com/searchengine)
|
638
|
+
bot:
|
639
|
+
name: Cốc Cốc Bot
|
640
|
+
url: https://help.coccoc.com/en/search-engine/coccoc-robots
|
641
|
+
category: Search bot
|
642
|
+
producer:
|
643
|
+
name: Cốc Cốc
|
644
|
+
url: https://coccoc.com/
|
645
|
+
-
|
646
|
+
user_agent: Mozilla/5.0 (compatible; coccocbot-shopping/1.0; +http://help.coccoc.com/searchengine)
|
647
|
+
bot:
|
648
|
+
name: Cốc Cốc Bot
|
649
|
+
url: https://help.coccoc.com/en/search-engine/coccoc-robots
|
650
|
+
category: Search bot
|
651
|
+
producer:
|
652
|
+
name: Cốc Cốc
|
653
|
+
url: https://coccoc.com/
|
654
|
+
-
|
655
|
+
user_agent: Mozilla/5.0 (compatible; coccocbot-web/1.0; +http://help.coccoc.com/searchengine)
|
656
|
+
bot:
|
657
|
+
name: Cốc Cốc Bot
|
658
|
+
url: https://help.coccoc.com/en/search-engine/coccoc-robots
|
659
|
+
category: Search bot
|
660
|
+
producer:
|
661
|
+
name: Cốc Cốc
|
662
|
+
url: https://coccoc.com/
|
663
|
+
-
|
664
|
+
user_agent: Mozilla/5.0 (compatible; coccocbot/1.0; +http://help.coccoc.com/searchengine)
|
665
|
+
bot:
|
666
|
+
name: Cốc Cốc Bot
|
667
|
+
url: https://help.coccoc.com/en/search-engine/coccoc-robots
|
470
668
|
category: Search bot
|
471
669
|
producer:
|
472
670
|
name: Cốc Cốc
|
473
|
-
url:
|
474
|
-
-
|
671
|
+
url: https://coccoc.com/
|
672
|
+
-
|
475
673
|
user_agent: Datadog Agent/5.10.1
|
476
674
|
bot:
|
477
675
|
name: Datadog Agent
|
@@ -480,7 +678,16 @@
|
|
480
678
|
producer:
|
481
679
|
name: Datadog
|
482
680
|
url: https://www.datadoghq.com/
|
483
|
-
-
|
681
|
+
-
|
682
|
+
user_agent: Mozilla/5.0 (X11; Datanyze; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/65.0.3325.181 Safari/537.36
|
683
|
+
bot:
|
684
|
+
name: Datanyze
|
685
|
+
url: ""
|
686
|
+
category: Crawler
|
687
|
+
producer:
|
688
|
+
name: Datanyze
|
689
|
+
url: https://www.datanyze.com
|
690
|
+
-
|
484
691
|
user_agent: Mozilla/5.0 (compatible; Dataprovider/6.92; +https://www.dataprovider.com/)
|
485
692
|
bot:
|
486
693
|
name: Dataprovider
|
@@ -489,7 +696,7 @@
|
|
489
696
|
producer:
|
490
697
|
name: Dataprovider B.V.
|
491
698
|
url: https://www.dataprovider.com/
|
492
|
-
-
|
699
|
+
-
|
493
700
|
user_agent: Mozilla/5.0 (compatible; MSIE or Firefox mutant; not on Windows server;) Daumoa/4.0;
|
494
701
|
bot:
|
495
702
|
name: Daum
|
@@ -498,7 +705,7 @@
|
|
498
705
|
producer:
|
499
706
|
name: Daum Communications Corp.
|
500
707
|
url: http://www.kakaocorp.com/main
|
501
|
-
-
|
708
|
+
-
|
502
709
|
user_agent: Mozilla/5.0 (compatible; MSIE or Firefox mutant;) Daum 4.1
|
503
710
|
bot:
|
504
711
|
name: Daum
|
@@ -507,7 +714,7 @@
|
|
507
714
|
producer:
|
508
715
|
name: Daum Communications Corp.
|
509
716
|
url: http://www.kakaocorp.com/main
|
510
|
-
-
|
717
|
+
-
|
511
718
|
user_agent: Mozilla/5.0 (compatible; Dazoobot/0.1; +http://dazoo.fr)
|
512
719
|
bot:
|
513
720
|
name: Dazoobot
|
@@ -516,7 +723,7 @@
|
|
516
723
|
producer:
|
517
724
|
name: DAZOO.FR
|
518
725
|
url: http://dazoo.fr
|
519
|
-
-
|
726
|
+
-
|
520
727
|
user_agent: Mozilla/5.0 (compatible; discobot/1.0; +http://discoveryengine.com/discobot.html)
|
521
728
|
bot:
|
522
729
|
name: Discobot
|
@@ -525,7 +732,7 @@
|
|
525
732
|
producer:
|
526
733
|
name: Discovery Engine
|
527
734
|
url: http://discoveryengine.com
|
528
|
-
-
|
735
|
+
-
|
529
736
|
user_agent: 'Domain Re-Animator Bot (http://domainreanimator.com) - support@domainreanimator.com'
|
530
737
|
bot:
|
531
738
|
name: Domain Re-Animator Bot
|
@@ -534,7 +741,7 @@
|
|
534
741
|
producer:
|
535
742
|
name: Domain Re-Animator, LLC
|
536
743
|
url: http://domainreanimator.com
|
537
|
-
-
|
744
|
+
-
|
538
745
|
user_agent: support@domainreanimator.com
|
539
746
|
bot:
|
540
747
|
name: Domain Re-Animator Bot
|
@@ -543,7 +750,13 @@
|
|
543
750
|
producer:
|
544
751
|
name: Domain Re-Animator, LLC
|
545
752
|
url: http://domainreanimator.com
|
546
|
-
-
|
753
|
+
-
|
754
|
+
user_agent: Mozilla/5.0 (compatible; Domains Project/1.1.0; +https://domainsproject.org)
|
755
|
+
bot:
|
756
|
+
name: Domains Project
|
757
|
+
category: Crawler
|
758
|
+
url: https://domainsproject.org
|
759
|
+
-
|
547
760
|
user_agent: dotbot
|
548
761
|
bot:
|
549
762
|
name: DotBot
|
@@ -552,7 +765,16 @@
|
|
552
765
|
producer:
|
553
766
|
name: SEOmoz, Inc.
|
554
767
|
url: http://moz.com/
|
555
|
-
-
|
768
|
+
-
|
769
|
+
user_agent: DuckDuckBot/1.0; (+http://duckduckgo.com/duckduckbot.html)
|
770
|
+
bot:
|
771
|
+
name: DuckDuckGo Bot
|
772
|
+
category: Search bot
|
773
|
+
url: https://duckduckgo.com/duckduckbot
|
774
|
+
producer:
|
775
|
+
name: DuckDuckGo
|
776
|
+
url: https://duckduckgo.com/
|
777
|
+
-
|
556
778
|
user_agent: Mozilla/5.0 (compatible; DuckDuckGo-Favicons-Bot/1.0; +http://duckduckgo.com)
|
557
779
|
bot:
|
558
780
|
name: DuckDuckGo Bot
|
@@ -561,7 +783,7 @@
|
|
561
783
|
producer:
|
562
784
|
name: DuckDuckGo
|
563
785
|
url: https://duckduckgo.com/
|
564
|
-
-
|
786
|
+
-
|
565
787
|
user_agent: EMail Exractor
|
566
788
|
bot:
|
567
789
|
name: EMail Exractor
|
@@ -570,7 +792,7 @@
|
|
570
792
|
producer:
|
571
793
|
name: ""
|
572
794
|
url: ""
|
573
|
-
-
|
795
|
+
-
|
574
796
|
user_agent: Mozilla/5.0 (compatible; EasouSpider; +http://www.easou.com/search/spider.html)
|
575
797
|
bot:
|
576
798
|
name: Easou Spider
|
@@ -579,7 +801,7 @@
|
|
579
801
|
producer:
|
580
802
|
name: easou ICP
|
581
803
|
url: http://www.easou.com
|
582
|
-
-
|
804
|
+
-
|
583
805
|
user_agent: Mozilla/5.0 (iPhone; U; CPU iPhone OS 3_0 like Mac OS X; en-us; EasouSpider; +http://www.easou.com/search/spider.html)
|
584
806
|
bot:
|
585
807
|
name: Easou Spider
|
@@ -588,7 +810,16 @@
|
|
588
810
|
producer:
|
589
811
|
name: easou ICP
|
590
812
|
url: http://www.easou.com
|
591
|
-
-
|
813
|
+
-
|
814
|
+
user_agent: Mozilla/5.0 (compatible; Embedly/0.2; +http://support.embed.ly/)
|
815
|
+
bot:
|
816
|
+
name: Embedly
|
817
|
+
category: Crawler
|
818
|
+
url: https://support.embed.ly/hc/en-us
|
819
|
+
producer:
|
820
|
+
name: A Medium, Corp.
|
821
|
+
url: https://medium.com/
|
822
|
+
-
|
592
823
|
user_agent: Mozilla/5.0 (compatible; Exabot/3.0 (BiggerBetter); +http://www.exabot.com/go/robot)
|
593
824
|
bot:
|
594
825
|
name: ExaBot
|
@@ -597,7 +828,7 @@
|
|
597
828
|
producer:
|
598
829
|
name: Dassault Systèmes
|
599
830
|
url: http://www.3ds.com
|
600
|
-
-
|
831
|
+
-
|
601
832
|
user_agent: Mozilla/5.0 (compatible; Exabot/3.0; +http://www.exabot.com/go/robot)
|
602
833
|
bot:
|
603
834
|
name: ExaBot
|
@@ -606,7 +837,7 @@
|
|
606
837
|
producer:
|
607
838
|
name: Dassault Systèmes
|
608
839
|
url: http://www.3ds.com
|
609
|
-
-
|
840
|
+
-
|
610
841
|
user_agent: Mozilla/5.0 (compatible; Konqueror/3.5; Linux) KHTML/3.5.5 (like Gecko) (Exabot-Thumbnails)
|
611
842
|
bot:
|
612
843
|
name: ExaBot
|
@@ -615,7 +846,7 @@
|
|
615
846
|
producer:
|
616
847
|
name: Dassault Systèmes
|
617
848
|
url: http://www.3ds.com
|
618
|
-
-
|
849
|
+
-
|
619
850
|
user_agent: ExactSeek Crawler (nutch 1.4)/Nutch-1.4 (ExactSeek Crawler; http://www.exactseek.com)
|
620
851
|
bot:
|
621
852
|
name: ExactSeek Crawler
|
@@ -624,7 +855,7 @@
|
|
624
855
|
producer:
|
625
856
|
name: Jayde Online, Inc.
|
626
857
|
url: http://www.jaydeonlineinc.com
|
627
|
-
-
|
858
|
+
-
|
628
859
|
user_agent: Mozilla/5.0 (compatible; Ezooms/1.0; help@moz.com)
|
629
860
|
bot:
|
630
861
|
name: Ezooms
|
@@ -633,7 +864,7 @@
|
|
633
864
|
producer:
|
634
865
|
name: SEOmoz, Inc.
|
635
866
|
url: http://moz.com/
|
636
|
-
-
|
867
|
+
-
|
637
868
|
user_agent: facebookexternalhit/1.1 (+http://www.facebook.com/externalhit_uatext.php)
|
638
869
|
bot:
|
639
870
|
name: Facebook External Hit
|
@@ -642,7 +873,16 @@
|
|
642
873
|
producer:
|
643
874
|
name: Facebook
|
644
875
|
url: http://www.facebook.com
|
645
|
-
-
|
876
|
+
-
|
877
|
+
user_agent: facebookexternalua
|
878
|
+
bot:
|
879
|
+
name: Facebook External Hit
|
880
|
+
category: Social Media Agent
|
881
|
+
url: https://www.facebook.com/externalhit_uatext.php
|
882
|
+
producer:
|
883
|
+
name: Facebook
|
884
|
+
url: http://www.facebook.com
|
885
|
+
-
|
646
886
|
user_agent: facebookplatform/1.0 (+http://developers.facebook.com)
|
647
887
|
bot:
|
648
888
|
name: Facebook External Hit
|
@@ -651,7 +891,7 @@
|
|
651
891
|
producer:
|
652
892
|
name: Facebook
|
653
893
|
url: http://www.facebook.com
|
654
|
-
-
|
894
|
+
-
|
655
895
|
user_agent: Feed Wrangler/1.0 (3 subscribers; feed-id=248559; http://feedwrangler.net; Allow like Gecko)
|
656
896
|
bot:
|
657
897
|
name: Feed Wrangler
|
@@ -660,7 +900,7 @@
|
|
660
900
|
producer:
|
661
901
|
name: 'David Smith & Developing Perspective, LLC'
|
662
902
|
url: https://david-smith.org
|
663
|
-
-
|
903
|
+
-
|
664
904
|
user_agent: FeedBurner/1.0 (http://www.FeedBurner.com)
|
665
905
|
bot:
|
666
906
|
name: FeedBurner
|
@@ -669,7 +909,7 @@
|
|
669
909
|
producer:
|
670
910
|
name: ""
|
671
911
|
url: ""
|
672
|
-
-
|
912
|
+
-
|
673
913
|
user_agent: 'Feedbin - 9 subscribers'
|
674
914
|
bot:
|
675
915
|
name: Feedbin
|
@@ -678,7 +918,7 @@
|
|
678
918
|
producer:
|
679
919
|
name: ""
|
680
920
|
url: ""
|
681
|
-
-
|
921
|
+
-
|
682
922
|
user_agent: Feedly/1.0 (+http://www.feedly.com/fetcher.html; like FeedFetcher-Google)
|
683
923
|
bot:
|
684
924
|
name: Feedly
|
@@ -687,7 +927,7 @@
|
|
687
927
|
producer:
|
688
928
|
name: ""
|
689
929
|
url: ""
|
690
|
-
-
|
930
|
+
-
|
691
931
|
user_agent: FeedlyApp/1.0 (http://www.feedly.com)
|
692
932
|
bot:
|
693
933
|
name: Feedly
|
@@ -696,7 +936,7 @@
|
|
696
936
|
producer:
|
697
937
|
name: ""
|
698
938
|
url: ""
|
699
|
-
-
|
939
|
+
-
|
700
940
|
user_agent: FeedlyBot/1.0 (http://feedly.com)
|
701
941
|
bot:
|
702
942
|
name: Feedly
|
@@ -705,7 +945,7 @@
|
|
705
945
|
producer:
|
706
946
|
name: ""
|
707
947
|
url: ""
|
708
|
-
-
|
948
|
+
-
|
709
949
|
user_agent: MetaFeedly/1.0 (http://www.feedly.com)
|
710
950
|
bot:
|
711
951
|
name: Feedly
|
@@ -714,7 +954,7 @@
|
|
714
954
|
producer:
|
715
955
|
name: ""
|
716
956
|
url: ""
|
717
|
-
-
|
957
|
+
-
|
718
958
|
user_agent: Feedspot http://www.feedspot.com
|
719
959
|
bot:
|
720
960
|
name: Feedspot
|
@@ -723,7 +963,7 @@
|
|
723
963
|
producer:
|
724
964
|
name: ""
|
725
965
|
url: ""
|
726
|
-
-
|
966
|
+
-
|
727
967
|
user_agent: Fever/1.38 (Feed Parser; http://feedafever.com; Allow like Gecko)
|
728
968
|
bot:
|
729
969
|
name: Fever
|
@@ -732,13 +972,13 @@
|
|
732
972
|
producer:
|
733
973
|
name: ""
|
734
974
|
url: ""
|
735
|
-
-
|
975
|
+
-
|
736
976
|
user_agent: Mozilla/5.0 (compatible; Findxbot/1.0; +http://www.findxbot.com)
|
737
977
|
bot:
|
738
978
|
name: Findxbot
|
739
979
|
category: Crawler
|
740
980
|
url: http://www.findxbot.com
|
741
|
-
-
|
981
|
+
-
|
742
982
|
user_agent: Mozilla/5.0 (compatible; FlipboardProxy/1.2; +http://flipboard.com/browserproxy)
|
743
983
|
bot:
|
744
984
|
name: Flipboard
|
@@ -747,7 +987,7 @@
|
|
747
987
|
producer:
|
748
988
|
name: Flipboard
|
749
989
|
url: http://flipboard.com/
|
750
|
-
-
|
990
|
+
-
|
751
991
|
user_agent: Mozilla/5.0 (compatible; FlipboardRSS/1.2; +http://flipboard.com/browserproxy)
|
752
992
|
bot:
|
753
993
|
name: Flipboard
|
@@ -756,39 +996,76 @@
|
|
756
996
|
producer:
|
757
997
|
name: Flipboard
|
758
998
|
url: http://flipboard.com/
|
759
|
-
-
|
999
|
+
-
|
1000
|
+
user_agent: freshrss/0.8-dev (Linux; http://freshrss.org) SimplePie/1.4-dev-FreshRSS
|
1001
|
+
bot:
|
1002
|
+
name: FreshRSS
|
1003
|
+
category: Feed Fetcher
|
1004
|
+
url: https://freshrss.org/
|
1005
|
+
-
|
1006
|
+
user_agent: FreshRSS/1.12.0 (Linux; https://freshrss.org)
|
1007
|
+
bot:
|
1008
|
+
name: FreshRSS
|
1009
|
+
category: Feed Fetcher
|
1010
|
+
url: https://freshrss.org/
|
1011
|
+
-
|
1012
|
+
user_agent: Mozilla/5.0 (X11; Linux x86_64; GTmetrix https://gtmetrix.com/) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/75.0.3770.100 Safari/537.36
|
1013
|
+
bot:
|
1014
|
+
name: GTmetrix
|
1015
|
+
category: Crawler
|
1016
|
+
url: https://gtmetrix.com/
|
1017
|
+
producer:
|
1018
|
+
name: Carbon60 Operating Co. Ltd.
|
1019
|
+
url: https://www.carbon60.com/
|
1020
|
+
-
|
1021
|
+
user_agent: 7Siters/1.07 (+https://7ooo.ru/siters/)
|
1022
|
+
bot:
|
1023
|
+
name: Generic Bot
|
1024
|
+
-
|
760
1025
|
user_agent: COMODO SSL Checker
|
761
1026
|
bot:
|
762
1027
|
name: Generic Bot
|
763
|
-
-
|
1028
|
+
-
|
764
1029
|
user_agent: help@dataminr.com
|
765
1030
|
bot:
|
766
1031
|
name: Generic Bot
|
767
|
-
-
|
1032
|
+
-
|
768
1033
|
user_agent: 'HybridBot (hybrid.ru/about. If our bot caused problems please contact us. Contact email: m.lyashkov@targetix.net)'
|
769
1034
|
bot:
|
770
1035
|
name: Generic Bot
|
771
|
-
-
|
1036
|
+
-
|
1037
|
+
user_agent: 'Mozilla/5.0 (compatible; +centuryb.o.t9[at]gmail.com)'
|
1038
|
+
bot:
|
1039
|
+
name: Generic Bot
|
1040
|
+
-
|
772
1041
|
user_agent: Mozilla/5.0 (compatible; +http://tweetedtimes.com)
|
773
1042
|
bot:
|
774
1043
|
name: Generic Bot
|
775
|
-
-
|
1044
|
+
-
|
776
1045
|
user_agent: Mozilla/5.0 (compatible; Shareaholicbot/2.0; +http://www.shareaholic.com/bot)
|
777
1046
|
bot:
|
778
1047
|
name: Generic Bot
|
779
|
-
-
|
1048
|
+
-
|
780
1049
|
user_agent: Mozilla/5.0 (compatible; TrendsmapResolver/0.1)
|
781
1050
|
bot:
|
782
1051
|
name: Generic Bot
|
783
|
-
-
|
1052
|
+
-
|
784
1053
|
user_agent: niki-bot
|
785
1054
|
bot:
|
786
1055
|
name: Generic Bot
|
787
|
-
-
|
1056
|
+
-
|
788
1057
|
user_agent: PHPCrawl
|
789
1058
|
bot:
|
790
1059
|
name: Generic Bot
|
791
|
-
-
|
1060
|
+
-
|
1061
|
+
user_agent: robots
|
1062
|
+
bot:
|
1063
|
+
name: Generic Bot
|
1064
|
+
-
|
1065
|
+
user_agent: SeopultContentAnalyzer/1.0
|
1066
|
+
bot:
|
1067
|
+
name: Generic Bot
|
1068
|
+
-
|
792
1069
|
user_agent: Mozilla/5.0 (compatible; Genieo/1.0 http://www.genieo.com/webfilter.html)
|
793
1070
|
bot:
|
794
1071
|
name: Genieo Web filter
|
@@ -797,7 +1074,7 @@
|
|
797
1074
|
producer:
|
798
1075
|
name: Genieo
|
799
1076
|
url: http://www.genieo.com
|
800
|
-
-
|
1077
|
+
-
|
801
1078
|
user_agent: GigablastOpenSource/1.0
|
802
1079
|
bot:
|
803
1080
|
name: Gigablast
|
@@ -806,7 +1083,7 @@
|
|
806
1083
|
producer:
|
807
1084
|
name: Matt Wells
|
808
1085
|
url: http://www.gigablast.com/faq.html
|
809
|
-
-
|
1086
|
+
-
|
810
1087
|
user_agent: Mozilla/5.0 (compatible; Gluten Free Crawler/1.0; +http://glutenfreepleasure.com/)
|
811
1088
|
bot:
|
812
1089
|
name: Gluten Free Crawler
|
@@ -815,7 +1092,7 @@
|
|
815
1092
|
producer:
|
816
1093
|
name: ""
|
817
1094
|
url: ""
|
818
|
-
-
|
1095
|
+
-
|
819
1096
|
user_agent: Mozilla/5.0 (Windows NT 5.1; rv:11.0) Gecko Firefox/11.0 (via ggpht.com GoogleImageProxy)
|
820
1097
|
bot:
|
821
1098
|
name: Gmail Image Proxy
|
@@ -824,7 +1101,7 @@
|
|
824
1101
|
producer:
|
825
1102
|
name: Google Inc.
|
826
1103
|
url: http://www.google.com
|
827
|
-
-
|
1104
|
+
-
|
828
1105
|
user_agent: DoCoMo/2.0 P900i(c100;TB;W24H11) (compatible; ichiro/mobile goo; +http://search.goo.ne.jp/option/use/sub4/sub4-1/)
|
829
1106
|
bot:
|
830
1107
|
name: Goo
|
@@ -833,7 +1110,12 @@
|
|
833
1110
|
producer:
|
834
1111
|
name: NTT Resonant
|
835
1112
|
url: http://goo.ne.jp
|
836
|
-
-
|
1113
|
+
-
|
1114
|
+
user_agent: Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/49.0.2623.75 Safari/537.36 Google Favicon
|
1115
|
+
bot:
|
1116
|
+
name: Google Favicon
|
1117
|
+
category: Crawler
|
1118
|
+
-
|
837
1119
|
user_agent: Mozilla/5.0 (iPhone; U; CPU iPhone OS 4_0_1 like Mac OS X; en-us) AppleWebKit/537.4 (KHTML, like Gecko; Google Page Speed Insights) Version/4.0.5 Mobile/8A306 Safari/6531.22.7
|
838
1120
|
bot:
|
839
1121
|
name: Google PageSpeed Insights
|
@@ -842,7 +1124,7 @@
|
|
842
1124
|
producer:
|
843
1125
|
name: Google Inc.
|
844
1126
|
url: http://www.google.com
|
845
|
-
-
|
1127
|
+
-
|
846
1128
|
user_agent: Mozilla/5.0 (Windows NT 5.1) AppleWebKit/535.1 (KHTML, like Gecko) Chrome/14.0.835.202 Safari/535.1 google_partner_monitoring FWSzVTDDBz14547302713138T
|
847
1129
|
bot:
|
848
1130
|
name: Google Partner Monitoring
|
@@ -851,7 +1133,7 @@
|
|
851
1133
|
producer:
|
852
1134
|
name: Google Inc.
|
853
1135
|
url: http://www.google.com
|
854
|
-
-
|
1136
|
+
-
|
855
1137
|
user_agent: Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko; Google Search Console) Chrome/41.0.2272.118 Safari/537.36
|
856
1138
|
bot:
|
857
1139
|
name: Google Search Console
|
@@ -860,7 +1142,7 @@
|
|
860
1142
|
producer:
|
861
1143
|
name: Google Inc.
|
862
1144
|
url: http://www.google.com
|
863
|
-
-
|
1145
|
+
-
|
864
1146
|
user_agent: Google-Structured-Data-Testing-Tool +https://search.google.com/structured-data/testing-tool)
|
865
1147
|
bot:
|
866
1148
|
name: Google Structured Data Testing Tool
|
@@ -869,7 +1151,7 @@
|
|
869
1151
|
producer:
|
870
1152
|
name: Google Inc.
|
871
1153
|
url: http://www.google.com
|
872
|
-
-
|
1154
|
+
-
|
873
1155
|
user_agent: AdsBot-Google (+http://www.google.com/adsbot.html)
|
874
1156
|
bot:
|
875
1157
|
name: Googlebot
|
@@ -878,7 +1160,7 @@
|
|
878
1160
|
producer:
|
879
1161
|
name: Google Inc.
|
880
1162
|
url: http://www.google.com
|
881
|
-
-
|
1163
|
+
-
|
882
1164
|
user_agent: AdsBot-Google-Mobile (+http://www.google.com/mobile/adsbot.html) Mozilla (iPhone; U; CPU iPhone OS 3 0 like Mac OS X) AppleWebKit (KHTML, like Gecko) Mobile Safari
|
883
1165
|
bot:
|
884
1166
|
name: Googlebot
|
@@ -887,7 +1169,7 @@
|
|
887
1169
|
producer:
|
888
1170
|
name: Google Inc.
|
889
1171
|
url: http://www.google.com
|
890
|
-
-
|
1172
|
+
-
|
891
1173
|
user_agent: APIs-Google (+https://developers.google.com/webmasters/APIs-Google.html)
|
892
1174
|
bot:
|
893
1175
|
name: Googlebot
|
@@ -896,7 +1178,7 @@
|
|
896
1178
|
producer:
|
897
1179
|
name: Google Inc.
|
898
1180
|
url: http://www.google.com
|
899
|
-
-
|
1181
|
+
-
|
900
1182
|
user_agent: DoCoMo/2.0 N905i(c100;TB;W24H16) (compatible; Googlebot-Mobile/2.1; +http://www.google.com/bot.html)
|
901
1183
|
bot:
|
902
1184
|
name: Googlebot
|
@@ -905,7 +1187,7 @@
|
|
905
1187
|
producer:
|
906
1188
|
name: Google Inc.
|
907
1189
|
url: http://www.google.com
|
908
|
-
-
|
1190
|
+
-
|
909
1191
|
user_agent: Feedfetcher-Google; (+http://www.google.com/feedfetcher.html; 19 subscribers; feed-id=13965549748850348809)
|
910
1192
|
bot:
|
911
1193
|
name: Googlebot
|
@@ -914,7 +1196,7 @@
|
|
914
1196
|
producer:
|
915
1197
|
name: Google Inc.
|
916
1198
|
url: http://www.google.com
|
917
|
-
-
|
1199
|
+
-
|
918
1200
|
user_agent: Feedfetcher-Google; (+http://www.google.com/feedfetcher.html; 2 subscribers; feed-id=17860707833818568603)
|
919
1201
|
bot:
|
920
1202
|
name: Googlebot
|
@@ -923,7 +1205,7 @@
|
|
923
1205
|
producer:
|
924
1206
|
name: Google Inc.
|
925
1207
|
url: http://www.google.com
|
926
|
-
-
|
1208
|
+
-
|
927
1209
|
user_agent: Feedfetcher-Google; (+http://www.google.com/feedfetcher.html; 375 subscribers; feed-id=15381863289700640853)
|
928
1210
|
bot:
|
929
1211
|
name: Googlebot
|
@@ -932,7 +1214,7 @@
|
|
932
1214
|
producer:
|
933
1215
|
name: Google Inc.
|
934
1216
|
url: http://www.google.com
|
935
|
-
-
|
1217
|
+
-
|
936
1218
|
user_agent: Google-AdWords-Express
|
937
1219
|
bot:
|
938
1220
|
name: Googlebot
|
@@ -941,7 +1223,7 @@
|
|
941
1223
|
producer:
|
942
1224
|
name: Google Inc.
|
943
1225
|
url: http://www.google.com
|
944
|
-
-
|
1226
|
+
-
|
945
1227
|
user_agent: Google-Adwords-Instant (+http://www.google.com/adsbot.html)
|
946
1228
|
bot:
|
947
1229
|
name: Googlebot
|
@@ -950,7 +1232,7 @@
|
|
950
1232
|
producer:
|
951
1233
|
name: Google Inc.
|
952
1234
|
url: http://www.google.com
|
953
|
-
-
|
1235
|
+
-
|
954
1236
|
user_agent: Google-speakr
|
955
1237
|
bot:
|
956
1238
|
name: Googlebot
|
@@ -959,7 +1241,7 @@
|
|
959
1241
|
producer:
|
960
1242
|
name: Google Inc.
|
961
1243
|
url: http://www.google.com
|
962
|
-
-
|
1244
|
+
-
|
963
1245
|
user_agent: Googlebot (gocrawl v0.4)
|
964
1246
|
bot:
|
965
1247
|
name: Googlebot
|
@@ -968,7 +1250,7 @@
|
|
968
1250
|
producer:
|
969
1251
|
name: Google Inc.
|
970
1252
|
url: http://www.google.com
|
971
|
-
-
|
1253
|
+
-
|
972
1254
|
user_agent: Googlebot-Image/1.0
|
973
1255
|
bot:
|
974
1256
|
name: Googlebot
|
@@ -977,7 +1259,7 @@
|
|
977
1259
|
producer:
|
978
1260
|
name: Google Inc.
|
979
1261
|
url: http://www.google.com
|
980
|
-
-
|
1262
|
+
-
|
981
1263
|
user_agent: Googlebot-News (2.3.3, ruby 1.9.3 (2013-11-22))
|
982
1264
|
bot:
|
983
1265
|
name: Googlebot
|
@@ -986,7 +1268,7 @@
|
|
986
1268
|
producer:
|
987
1269
|
name: Google Inc.
|
988
1270
|
url: http://www.google.com
|
989
|
-
-
|
1271
|
+
-
|
990
1272
|
user_agent: Googlebot-Video/1.0
|
991
1273
|
bot:
|
992
1274
|
name: Googlebot
|
@@ -995,7 +1277,7 @@
|
|
995
1277
|
producer:
|
996
1278
|
name: Google Inc.
|
997
1279
|
url: http://www.google.com
|
998
|
-
-
|
1280
|
+
-
|
999
1281
|
user_agent: Googlebot/2.1 (http://www.googlebot.com/bot.html)
|
1000
1282
|
bot:
|
1001
1283
|
name: Googlebot
|
@@ -1004,7 +1286,7 @@
|
|
1004
1286
|
producer:
|
1005
1287
|
name: Google Inc.
|
1006
1288
|
url: http://www.google.com
|
1007
|
-
-
|
1289
|
+
-
|
1008
1290
|
user_agent: Googlebot/Nutch-1.7
|
1009
1291
|
bot:
|
1010
1292
|
name: Googlebot
|
@@ -1013,7 +1295,7 @@
|
|
1013
1295
|
producer:
|
1014
1296
|
name: Google Inc.
|
1015
1297
|
url: http://www.google.com
|
1016
|
-
-
|
1298
|
+
-
|
1017
1299
|
user_agent: GoogleProducer; (+http://goo.gl/7y4SX)
|
1018
1300
|
bot:
|
1019
1301
|
name: Googlebot
|
@@ -1022,7 +1304,7 @@
|
|
1022
1304
|
producer:
|
1023
1305
|
name: Google Inc.
|
1024
1306
|
url: http://www.google.com
|
1025
|
-
-
|
1307
|
+
-
|
1026
1308
|
user_agent: Mediapartners-Google
|
1027
1309
|
bot:
|
1028
1310
|
name: Googlebot
|
@@ -1031,7 +1313,7 @@
|
|
1031
1313
|
producer:
|
1032
1314
|
name: Google Inc.
|
1033
1315
|
url: http://www.google.com
|
1034
|
-
-
|
1316
|
+
-
|
1035
1317
|
user_agent: Mozilla/5.0 (compatible) Feedfetcher-Google;(+http://www.google.com/feedfetcher.html)
|
1036
1318
|
bot:
|
1037
1319
|
name: Googlebot
|
@@ -1040,7 +1322,16 @@
|
|
1040
1322
|
producer:
|
1041
1323
|
name: Google Inc.
|
1042
1324
|
url: http://www.google.com
|
1043
|
-
-
|
1325
|
+
-
|
1326
|
+
user_agent: Mozilla/5.0 (compatible; Google-Youtube-Links)
|
1327
|
+
bot:
|
1328
|
+
name: Googlebot
|
1329
|
+
category: Search bot
|
1330
|
+
url: http://www.google.com/bot.html
|
1331
|
+
producer:
|
1332
|
+
name: Google Inc.
|
1333
|
+
url: http://www.google.com
|
1334
|
+
-
|
1044
1335
|
user_agent: Mozilla/5.0 (compatible; Googlebot/2.1; +http://www.google.com/bot.html)
|
1045
1336
|
bot:
|
1046
1337
|
name: Googlebot
|
@@ -1049,7 +1340,7 @@
|
|
1049
1340
|
producer:
|
1050
1341
|
name: Google Inc.
|
1051
1342
|
url: http://www.google.com
|
1052
|
-
-
|
1343
|
+
-
|
1053
1344
|
user_agent: Mozilla/5.0 (en-US) AppleWebKit/537.36 (KHTML, like Gecko; Google-Assess) Chrome/34.0.1847.116 Safari/537.36
|
1054
1345
|
bot:
|
1055
1346
|
name: Googlebot
|
@@ -1058,7 +1349,7 @@
|
|
1058
1349
|
producer:
|
1059
1350
|
name: Google Inc.
|
1060
1351
|
url: http://www.google.com
|
1061
|
-
-
|
1352
|
+
-
|
1062
1353
|
user_agent: Mozilla/5.0 (en-us) AppleWebKit/537.36(KHTML, like Gecko; Google-Adwords-DisplayAds-WebRender;) Chrome/41.0.2272.118Safari/537.36
|
1063
1354
|
bot:
|
1064
1355
|
name: Googlebot
|
@@ -1067,7 +1358,7 @@
|
|
1067
1358
|
producer:
|
1068
1359
|
name: Google Inc.
|
1069
1360
|
url: http://www.google.com
|
1070
|
-
-
|
1361
|
+
-
|
1071
1362
|
user_agent: Mozilla/5.0 (iPhone; CPU iPhone OS 6_0 like Mac OS X) AppleWebKit/536.26 (KHTML, like Gecko) Version/6.0 Mobile/10A5376e Safari/8536.25 (compatible; Googlebot-Mobile/2.1; +http://www.google.com/bot.html)
|
1072
1363
|
bot:
|
1073
1364
|
name: Googlebot
|
@@ -1076,7 +1367,7 @@
|
|
1076
1367
|
producer:
|
1077
1368
|
name: Google Inc.
|
1078
1369
|
url: http://www.google.com
|
1079
|
-
-
|
1370
|
+
-
|
1080
1371
|
user_agent: Mozilla/5.0 (Linux; Android 4.0.4; Galaxy Nexus Build/IMM76B) AppleWebKit/537.36 (KHTML, like Gecko; Google-Publisher-Plugin) Chrome/27.0.1453 Mobile Safari/537.36
|
1081
1372
|
bot:
|
1082
1373
|
name: Googlebot
|
@@ -1085,7 +1376,16 @@
|
|
1085
1376
|
producer:
|
1086
1377
|
name: Google Inc.
|
1087
1378
|
url: http://www.google.com
|
1088
|
-
-
|
1379
|
+
-
|
1380
|
+
user_agent: Mozilla/5.0 (Linux; Android 6.0.1; Nexus 5X Build/MMB29P) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/41.0.2272.96 Mobile Safari/537.36 (compatible; Google-AMPHTML)
|
1381
|
+
bot:
|
1382
|
+
name: Googlebot
|
1383
|
+
category: Search bot
|
1384
|
+
url: http://www.google.com/bot.html
|
1385
|
+
producer:
|
1386
|
+
name: Google Inc.
|
1387
|
+
url: http://www.google.com
|
1388
|
+
-
|
1089
1389
|
user_agent: Mozilla/5.0 (Linux; Android 6.0.1; Nexus 5X Build/MMB29P) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/41.0.2272.96 Mobile Safari/537.36 (compatible; Google-Read-Aloud; +https://support.google.com/webmasters/answer/1061943)
|
1090
1390
|
bot:
|
1091
1391
|
name: Googlebot
|
@@ -1094,7 +1394,16 @@
|
|
1094
1394
|
producer:
|
1095
1395
|
name: Google Inc.
|
1096
1396
|
url: http://www.google.com
|
1097
|
-
-
|
1397
|
+
-
|
1398
|
+
user_agent: Mozilla/5.0 (Linux; Android 8.0; Pixel 2 Build/OPD3.170816.012; DuplexWeb-Google/1.0) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/74.0.3729.131 Mobile Safari/537.36
|
1399
|
+
bot:
|
1400
|
+
name: Googlebot
|
1401
|
+
category: Search bot
|
1402
|
+
url: http://www.google.com/bot.html
|
1403
|
+
producer:
|
1404
|
+
name: Google Inc.
|
1405
|
+
url: http://www.google.com
|
1406
|
+
-
|
1098
1407
|
user_agent: Mozilla/5.0 (Windows NT 6.1; rv:6.0) Gecko/20110814 Firefox/6.0 Google (+https://developers.google.com/+/web/snippet/)
|
1099
1408
|
bot:
|
1100
1409
|
name: Googlebot
|
@@ -1103,7 +1412,16 @@
|
|
1103
1412
|
producer:
|
1104
1413
|
name: Google Inc.
|
1105
1414
|
url: http://www.google.com
|
1106
|
-
-
|
1415
|
+
-
|
1416
|
+
user_agent: Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/27.0.1453 Safari/537.36 (compatible; Google-HotelAdsVerifier/2.0)
|
1417
|
+
bot:
|
1418
|
+
name: Googlebot
|
1419
|
+
category: Search bot
|
1420
|
+
url: http://www.google.com/bot.html
|
1421
|
+
producer:
|
1422
|
+
name: Google Inc.
|
1423
|
+
url: http://www.google.com
|
1424
|
+
-
|
1107
1425
|
user_agent: Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko; Google Web Preview) Chrome/27.0.1453 Safari/537.36
|
1108
1426
|
bot:
|
1109
1427
|
name: Googlebot
|
@@ -1112,7 +1430,7 @@
|
|
1112
1430
|
producer:
|
1113
1431
|
name: Google Inc.
|
1114
1432
|
url: http://www.google.com
|
1115
|
-
-
|
1433
|
+
-
|
1116
1434
|
user_agent: Mozilla/5.0 AppleWebKit/537.36 (KHTML, like Gecko) Chrome/41.0.2272.118 Safari/537.36 (compatible; Google-Shopping-Quality +http://www.google.com/merchants/tos/extend/DE/tos.html)
|
1117
1435
|
bot:
|
1118
1436
|
name: Googlebot
|
@@ -1121,7 +1439,7 @@
|
|
1121
1439
|
producer:
|
1122
1440
|
name: Google Inc.
|
1123
1441
|
url: http://www.google.com
|
1124
|
-
-
|
1442
|
+
-
|
1125
1443
|
user_agent: Mozilla/5.0 AppleWebKit/537.36 (KHTML, like Gecko; compatible; Googlebot/2.1; +http://www.google.com/bot.html) Safari/537.36
|
1126
1444
|
bot:
|
1127
1445
|
name: Googlebot
|
@@ -1130,7 +1448,7 @@
|
|
1130
1448
|
producer:
|
1131
1449
|
name: Google Inc.
|
1132
1450
|
url: http://www.google.com
|
1133
|
-
-
|
1451
|
+
-
|
1134
1452
|
user_agent: SAMSUNG-SGH-E250/1.0 Profile/MIDP-2.0 Configuration/CLDC-1.1 UP.Browser/6.2.3.3.c.1.101 (GUI) MMP/2.0 (compatible; Googlebot-Mobile/2.1; +http://www.google.com/bot.html)
|
1135
1453
|
bot:
|
1136
1454
|
name: Googlebot
|
@@ -1139,7 +1457,13 @@
|
|
1139
1457
|
producer:
|
1140
1458
|
name: Google Inc.
|
1141
1459
|
url: http://www.google.com
|
1142
|
-
-
|
1460
|
+
-
|
1461
|
+
user_agent: Grammarly/1.0 (http://www.grammarly.com)
|
1462
|
+
bot:
|
1463
|
+
name: Grammarly
|
1464
|
+
category: Service bot
|
1465
|
+
url: https://www.grammarly.com
|
1466
|
+
-
|
1143
1467
|
user_agent: Mozilla/5.0 (compatible; GrapeshotCrawler/2.0; +https://www.grapeshot.com/crawler/)
|
1144
1468
|
bot:
|
1145
1469
|
name: Grapeshot
|
@@ -1148,7 +1472,7 @@
|
|
1148
1472
|
producer:
|
1149
1473
|
name: Grapeshot
|
1150
1474
|
url: https://www.grapeshot.com
|
1151
|
-
-
|
1475
|
+
-
|
1152
1476
|
user_agent: Mozilla/5.0 (iPhone; CPU iPhone OS 8_3 like Mac OS X) AppleWebKit/600.1.4 (KHTML, like Gecko) Version/8.0 Mobile/12F70 Safari/600.1. 4 (compatible; GrapeshotCrawler/2.0; +https://www.grapeshot.com/crawler/)
|
1153
1477
|
bot:
|
1154
1478
|
name: Grapeshot
|
@@ -1157,7 +1481,7 @@
|
|
1157
1481
|
producer:
|
1158
1482
|
name: Grapeshot
|
1159
1483
|
url: https://www.grapeshot.com
|
1160
|
-
-
|
1484
|
+
-
|
1161
1485
|
user_agent: HTTPMon/1.0b (http://www.httpmon.com)
|
1162
1486
|
bot:
|
1163
1487
|
name: HTTPMon
|
@@ -1166,7 +1490,7 @@
|
|
1166
1490
|
producer:
|
1167
1491
|
name: towards GmbH
|
1168
1492
|
url: http://www.towards.ch/
|
1169
|
-
-
|
1493
|
+
-
|
1170
1494
|
user_agent: 'flieder - neofonie heritrix/1.14.3 (+http://spider.neofonie.de)'
|
1171
1495
|
bot:
|
1172
1496
|
name: Heritrix
|
@@ -1174,8 +1498,8 @@
|
|
1174
1498
|
url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
|
1175
1499
|
producer:
|
1176
1500
|
name: The Internet Archive
|
1177
|
-
url:
|
1178
|
-
-
|
1501
|
+
url: https://archive.org
|
1502
|
+
-
|
1179
1503
|
user_agent: Mozilla/5.0 (compatible; heritrix/1.14.4 +http://webarhive.nlc.gov.cn)
|
1180
1504
|
bot:
|
1181
1505
|
name: Heritrix
|
@@ -1183,8 +1507,8 @@
|
|
1183
1507
|
url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
|
1184
1508
|
producer:
|
1185
1509
|
name: The Internet Archive
|
1186
|
-
url:
|
1187
|
-
-
|
1510
|
+
url: https://archive.org
|
1511
|
+
-
|
1188
1512
|
user_agent: Mozilla/5.0 (compatible; heritrix/1.14.4 +http://www.dla-marbach.de)
|
1189
1513
|
bot:
|
1190
1514
|
name: Heritrix
|
@@ -1192,8 +1516,8 @@
|
|
1192
1516
|
url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
|
1193
1517
|
producer:
|
1194
1518
|
name: The Internet Archive
|
1195
|
-
url:
|
1196
|
-
-
|
1519
|
+
url: https://archive.org
|
1520
|
+
-
|
1197
1521
|
user_agent: mozilla/5.0 (compatible; heritrix/1.3.0 http://archive.crawler.org)
|
1198
1522
|
bot:
|
1199
1523
|
name: Heritrix
|
@@ -1201,8 +1525,8 @@
|
|
1201
1525
|
url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
|
1202
1526
|
producer:
|
1203
1527
|
name: The Internet Archive
|
1204
|
-
url:
|
1205
|
-
-
|
1528
|
+
url: https://archive.org
|
1529
|
+
-
|
1206
1530
|
user_agent: Mozilla/5.0 (compatible; heritrix/3.1.1 +http://www.baidu.com)
|
1207
1531
|
bot:
|
1208
1532
|
name: Heritrix
|
@@ -1210,8 +1534,8 @@
|
|
1210
1534
|
url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
|
1211
1535
|
producer:
|
1212
1536
|
name: The Internet Archive
|
1213
|
-
url:
|
1214
|
-
-
|
1537
|
+
url: https://archive.org
|
1538
|
+
-
|
1215
1539
|
user_agent: Mozilla/5.0 (compatible; heritrix/3.1.1 +http://www.run4dom.com)
|
1216
1540
|
bot:
|
1217
1541
|
name: Heritrix
|
@@ -1219,8 +1543,8 @@
|
|
1219
1543
|
url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
|
1220
1544
|
producer:
|
1221
1545
|
name: The Internet Archive
|
1222
|
-
url:
|
1223
|
-
-
|
1546
|
+
url: https://archive.org
|
1547
|
+
-
|
1224
1548
|
user_agent: Mozilla/5.0 (compatible; heritrix/3.1.2-SNAPSHOT-20130207.001528 +http://webarchiv.cz/kontakty/)
|
1225
1549
|
bot:
|
1226
1550
|
name: Heritrix
|
@@ -1228,8 +1552,8 @@
|
|
1228
1552
|
url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
|
1229
1553
|
producer:
|
1230
1554
|
name: The Internet Archive
|
1231
|
-
url:
|
1232
|
-
-
|
1555
|
+
url: https://archive.org
|
1556
|
+
-
|
1233
1557
|
user_agent: Mozilla/5.0 (compatible; worio bot heritrix/1.10.0 +http://worio.com)
|
1234
1558
|
bot:
|
1235
1559
|
name: Heritrix
|
@@ -1237,8 +1561,8 @@
|
|
1237
1561
|
url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
|
1238
1562
|
producer:
|
1239
1563
|
name: The Internet Archive
|
1240
|
-
url:
|
1241
|
-
-
|
1564
|
+
url: https://archive.org
|
1565
|
+
-
|
1242
1566
|
user_agent: Heurekabot-Feed/1.0 (+https://sluzby.heureka.cz/napoveda/heurekabot/)
|
1243
1567
|
bot:
|
1244
1568
|
name: Heureka Feed
|
@@ -1247,16 +1571,16 @@
|
|
1247
1571
|
producer:
|
1248
1572
|
name: Heureka.cz, a.s.
|
1249
1573
|
url: https://www.heureka.cz/
|
1250
|
-
-
|
1574
|
+
-
|
1251
1575
|
user_agent: HubPages V0.2.2 (http://hubpages.com/help/crawlingpolicy)
|
1252
1576
|
bot:
|
1253
1577
|
name: HubPages
|
1254
1578
|
category: Crawler
|
1255
|
-
url:
|
1579
|
+
url: https://hubpages.com/help/crawlingpolicy
|
1256
1580
|
producer:
|
1257
|
-
name: HubPages
|
1258
|
-
url:
|
1259
|
-
-
|
1581
|
+
name: HubPages, Inc.
|
1582
|
+
url: https://discover.hubpages.com/
|
1583
|
+
-
|
1260
1584
|
user_agent: HubSpot Website Grader (web-crawlers@hubspot.com)
|
1261
1585
|
bot:
|
1262
1586
|
name: HubSpot
|
@@ -1264,7 +1588,7 @@
|
|
1264
1588
|
producer:
|
1265
1589
|
name: HubSpot Inc.
|
1266
1590
|
url: https://www.hubspot.com
|
1267
|
-
-
|
1591
|
+
-
|
1268
1592
|
user_agent: ICC-Crawler/2.0 (Mozilla-compatible; ; http://www.nict.go.jp/en/univ-com/plan/crawl.html)
|
1269
1593
|
bot:
|
1270
1594
|
name: ICC-Crawler
|
@@ -1273,7 +1597,16 @@
|
|
1273
1597
|
producer:
|
1274
1598
|
name: ""
|
1275
1599
|
url: ""
|
1276
|
-
-
|
1600
|
+
-
|
1601
|
+
user_agent: IDG/IT (http://spaziodati.eu/)
|
1602
|
+
bot:
|
1603
|
+
name: IDG/IT
|
1604
|
+
category: Search bot
|
1605
|
+
url: https://spaziodati.eu/
|
1606
|
+
producer:
|
1607
|
+
name: SpazioDati S.r.l.
|
1608
|
+
url: https://spaziodati.eu/
|
1609
|
+
-
|
1277
1610
|
user_agent: iisbot/1.0 (+http://www.iis.net/iisbot.html)
|
1278
1611
|
bot:
|
1279
1612
|
name: IIS Site Analysis
|
@@ -1282,7 +1615,7 @@
|
|
1282
1615
|
producer:
|
1283
1616
|
name: Microsoft Corporation
|
1284
1617
|
url: http://www.microsoft.com
|
1285
|
-
-
|
1618
|
+
-
|
1286
1619
|
user_agent: IP-Guide.com Crawler/1.0 (https://ip-guide.com)
|
1287
1620
|
bot:
|
1288
1621
|
name: IP-Guide Crawler
|
@@ -1291,15 +1624,24 @@
|
|
1291
1624
|
producer:
|
1292
1625
|
name: ""
|
1293
1626
|
url: https://ip-guide.com
|
1294
|
-
-
|
1627
|
+
-
|
1295
1628
|
user_agent: Mozilla/5.0 (compatible; ips-agent)
|
1296
1629
|
bot:
|
1297
1630
|
name: IPS Agent
|
1298
|
-
category:
|
1631
|
+
category: Crawler
|
1299
1632
|
producer:
|
1300
1633
|
name: VeriSign, Inc
|
1301
1634
|
url: http://www.verisign.com/
|
1302
|
-
-
|
1635
|
+
-
|
1636
|
+
user_agent: Kaspersky Lab CFR link resolver cfradmins@kaspersky.com
|
1637
|
+
bot:
|
1638
|
+
name: Kaspersky
|
1639
|
+
category: Security Checker
|
1640
|
+
url: https://www.kaspersky.com/
|
1641
|
+
producer:
|
1642
|
+
name: AO Kaspersky Lab
|
1643
|
+
url: https://www.kaspersky.com/
|
1644
|
+
-
|
1303
1645
|
user_agent: kouio.com RSS reader
|
1304
1646
|
bot:
|
1305
1647
|
name: Kouio
|
@@ -1308,7 +1650,7 @@
|
|
1308
1650
|
producer:
|
1309
1651
|
name: ""
|
1310
1652
|
url: ""
|
1311
|
-
-
|
1653
|
+
-
|
1312
1654
|
user_agent: 'kouio.com RSS reader - 6 subscribers'
|
1313
1655
|
bot:
|
1314
1656
|
name: Kouio
|
@@ -1317,7 +1659,16 @@
|
|
1317
1659
|
producer:
|
1318
1660
|
name: ""
|
1319
1661
|
url: ""
|
1320
|
-
-
|
1662
|
+
-
|
1663
|
+
user_agent: LCC (+http://corpora.informatik.uni-leipzig.de/crawler_faq.html)
|
1664
|
+
bot:
|
1665
|
+
name: LCC
|
1666
|
+
category: Search bot
|
1667
|
+
url: https://corpora.uni-leipzig.de/crawler_faq.html
|
1668
|
+
producer:
|
1669
|
+
name: Universität Leipzig
|
1670
|
+
url: https://www.uni-leipzig.de/
|
1671
|
+
-
|
1321
1672
|
user_agent: 'ltx71 - (http://ltx71.com/)'
|
1322
1673
|
bot:
|
1323
1674
|
name: LTX71
|
@@ -1325,7 +1676,7 @@
|
|
1325
1676
|
producer:
|
1326
1677
|
name: ""
|
1327
1678
|
url: ""
|
1328
|
-
-
|
1679
|
+
-
|
1329
1680
|
user_agent: larbin_2.6.3 larbin2.6.3@unspecified.mail
|
1330
1681
|
bot:
|
1331
1682
|
name: Larbin web crawler
|
@@ -1334,7 +1685,7 @@
|
|
1334
1685
|
producer:
|
1335
1686
|
name: ""
|
1336
1687
|
url: ""
|
1337
|
-
-
|
1688
|
+
-
|
1338
1689
|
user_agent: "Mozilla/5.0 (compatible; Let's Encrypt validation server; +https://www.letsencrypt.org)"
|
1339
1690
|
bot:
|
1340
1691
|
name: "Let's Encrypt Validation"
|
@@ -1343,7 +1694,7 @@
|
|
1343
1694
|
producer:
|
1344
1695
|
name: "Let's Encrypt"
|
1345
1696
|
url: https://letsencrypt.org
|
1346
|
-
-
|
1697
|
+
-
|
1347
1698
|
user_agent: Mozilla/5.0 (Linux; Android 6.0.1; Nexus 5 Build/MRA58N) AppleWebKit/537.36(KHTML, like Gecko) Chrome/61.0.3116.0 Mobile Safari/537.36 Chrome-Lighthouse
|
1348
1699
|
bot:
|
1349
1700
|
name: Lighthouse
|
@@ -1352,7 +1703,7 @@
|
|
1352
1703
|
producer:
|
1353
1704
|
name: Lighthouse
|
1354
1705
|
url: https://developers.google.com/web/tools/lighthouse
|
1355
|
-
-
|
1706
|
+
-
|
1356
1707
|
user_agent: linkdex.com/v2.0 and linkdex.com/v2.1
|
1357
1708
|
bot:
|
1358
1709
|
name: Linkdex Bot
|
@@ -1361,7 +1712,7 @@
|
|
1361
1712
|
producer:
|
1362
1713
|
name: Mojeek Ltd.
|
1363
1714
|
url: http://www.mojeek.com
|
1364
|
-
-
|
1715
|
+
-
|
1365
1716
|
user_agent: Mozilla/5.0 (compatible; linkdexbot/2.0; +http://www.linkdex.com/about/bots/)
|
1366
1717
|
bot:
|
1367
1718
|
name: Linkdex Bot
|
@@ -1370,7 +1721,7 @@
|
|
1370
1721
|
producer:
|
1371
1722
|
name: Mojeek Ltd.
|
1372
1723
|
url: http://www.mojeek.com
|
1373
|
-
-
|
1724
|
+
-
|
1374
1725
|
user_agent: Mozilla/5.0 (iPhone; U; CPU iPhone OS 4_1 like Mac OS X; en-us) AppleWebKit/532.9 (KHTML, like Gecko) Version/4.0.5 Mobile/8B117 Safari/6531.22.7 (compatible; linkdexbot-mobile/2.1; +http://www.linkdex.com/about/bots/)
|
1375
1726
|
bot:
|
1376
1727
|
name: Linkdex Bot
|
@@ -1379,7 +1730,7 @@
|
|
1379
1730
|
producer:
|
1380
1731
|
name: Mojeek Ltd.
|
1381
1732
|
url: http://www.mojeek.com
|
1382
|
-
-
|
1733
|
+
-
|
1383
1734
|
user_agent: LinkedInBot/1.0 (compatible; Mozilla/5.0; Jakarta Commons-HttpClient/3.1 +http://www.linkedin.com)
|
1384
1735
|
bot:
|
1385
1736
|
name: LinkedIn Bot
|
@@ -1388,7 +1739,7 @@
|
|
1388
1739
|
producer:
|
1389
1740
|
name: LinkedIn
|
1390
1741
|
url: http://www.linkedin.com
|
1391
|
-
-
|
1742
|
+
-
|
1392
1743
|
user_agent: Mozilla/5.0 (compatible; MJ12bot/v1.4.4; http://www.majestic12.co.uk/bot.php?+)
|
1393
1744
|
bot:
|
1394
1745
|
name: MJ12 Bot
|
@@ -1397,7 +1748,7 @@
|
|
1397
1748
|
producer:
|
1398
1749
|
name: Majestic-12
|
1399
1750
|
url: http://majestic12.co.uk
|
1400
|
-
-
|
1751
|
+
-
|
1401
1752
|
user_agent: magpie-crawler/1.1 (U; Linux amd64; en-GB; +http://www.brandwatch.net)
|
1402
1753
|
bot:
|
1403
1754
|
name: Magpie-Crawler
|
@@ -1406,7 +1757,7 @@
|
|
1406
1757
|
producer:
|
1407
1758
|
name: Brandwatch
|
1408
1759
|
url: http://www.brandwatch.com
|
1409
|
-
-
|
1760
|
+
-
|
1410
1761
|
user_agent: MagpieRSS/0.72 (+http://magpierss.sf.net)
|
1411
1762
|
bot:
|
1412
1763
|
name: MagpieRSS
|
@@ -1415,7 +1766,7 @@
|
|
1415
1766
|
producer:
|
1416
1767
|
name: ""
|
1417
1768
|
url: ""
|
1418
|
-
-
|
1769
|
+
-
|
1419
1770
|
user_agent: Mozilla/5.0 (compatible; Linux x86_64; Mail.RU_Bot/2.0; +http://go.mail.ru/help/robots)
|
1420
1771
|
bot:
|
1421
1772
|
name: Mail.Ru Bot
|
@@ -1424,7 +1775,7 @@
|
|
1424
1775
|
producer:
|
1425
1776
|
name: Mail.Ru Group
|
1426
1777
|
url: http://corp.mail.ru
|
1427
|
-
-
|
1778
|
+
-
|
1428
1779
|
user_agent: Mozilla/5.0 (compatible; Linux x86_64; Mail.RU_Bot/Fast/2.0; +http://go.mail.ru/help/robots)
|
1429
1780
|
bot:
|
1430
1781
|
name: Mail.Ru Bot
|
@@ -1433,17 +1784,17 @@
|
|
1433
1784
|
producer:
|
1434
1785
|
name: Mail.Ru Group
|
1435
1786
|
url: http://corp.mail.ru
|
1436
|
-
-
|
1787
|
+
-
|
1437
1788
|
user_agent: http.rb/2.2.2 (Mastodon/1.6.1; +https://mathtod.online/)
|
1438
1789
|
bot:
|
1439
1790
|
name: Mastodon Bot
|
1440
1791
|
category: Social Media Agent
|
1441
|
-
-
|
1792
|
+
-
|
1442
1793
|
user_agent: http.rb/3.2.0 (Mastodon/2.4.3; +https://uwu.social/)
|
1443
1794
|
bot:
|
1444
1795
|
name: Mastodon Bot
|
1445
1796
|
category: Social Media Agent
|
1446
|
-
-
|
1797
|
+
-
|
1447
1798
|
user_agent: Mozilla/5.0 (compatible; meanpathbot/1.0; +http://www.meanpath.com/meanpathbot.html)
|
1448
1799
|
bot:
|
1449
1800
|
name: Meanpath Bot
|
@@ -1452,13 +1803,13 @@
|
|
1452
1803
|
producer:
|
1453
1804
|
name: Meanpath
|
1454
1805
|
url: http://www.meanpath.com
|
1455
|
-
-
|
1806
|
+
-
|
1456
1807
|
user_agent: MetaInspector/5.4.0 (+https://github.com/jaimeiniesta/metainspector)
|
1457
1808
|
bot:
|
1458
1809
|
name: MetaInspector
|
1459
1810
|
category: Crawler
|
1460
1811
|
url: https://github.com/jaimeiniesta/metainspector
|
1461
|
-
-
|
1812
|
+
-
|
1462
1813
|
user_agent: Mozilla/5.0 (compatible; MetaJobBot; http://www.metajob.de/crawler)
|
1463
1814
|
bot:
|
1464
1815
|
name: MetaJobBot
|
@@ -1467,7 +1818,7 @@
|
|
1467
1818
|
producer:
|
1468
1819
|
name: MetaJob
|
1469
1820
|
url: http://www.metajob.at
|
1470
|
-
-
|
1821
|
+
-
|
1471
1822
|
user_agent: Mozilla/5.0 (compatible; MixrankBot; crawler@mixrank.com)
|
1472
1823
|
bot:
|
1473
1824
|
name: Mixrank Bot
|
@@ -1476,7 +1827,7 @@
|
|
1476
1827
|
producer:
|
1477
1828
|
name: Online Media Group, Inc.
|
1478
1829
|
url: ""
|
1479
|
-
-
|
1830
|
+
-
|
1480
1831
|
user_agent: Mnogosearch-3.1.21
|
1481
1832
|
bot:
|
1482
1833
|
name: Mnogosearch
|
@@ -1485,7 +1836,7 @@
|
|
1485
1836
|
producer:
|
1486
1837
|
name: Lavtech.Com Corp.
|
1487
1838
|
url: ""
|
1488
|
-
-
|
1839
|
+
-
|
1489
1840
|
user_agent: Mozilla/5.0 (compatible; MojeekBot/0.6; http://www.mojeek.com/bot.html)
|
1490
1841
|
bot:
|
1491
1842
|
name: MojeekBot
|
@@ -1494,7 +1845,7 @@
|
|
1494
1845
|
producer:
|
1495
1846
|
name: Mojeek Ltd.
|
1496
1847
|
url: http://www.mojeek.com
|
1497
|
-
-
|
1848
|
+
-
|
1498
1849
|
user_agent: 'Mozilla/5.0 (compatible; www.monitor.us - free monitoring service; http://www.monitor.us)'
|
1499
1850
|
bot:
|
1500
1851
|
name: Monitor.Us
|
@@ -1503,7 +1854,7 @@
|
|
1503
1854
|
producer:
|
1504
1855
|
name: Monitor.Us
|
1505
1856
|
url: http://www.monitor.us
|
1506
|
-
-
|
1857
|
+
-
|
1507
1858
|
user_agent: munin/2.0.30-1 (libwww-perl/6.15)
|
1508
1859
|
bot:
|
1509
1860
|
name: Munin
|
@@ -1512,7 +1863,7 @@
|
|
1512
1863
|
producer:
|
1513
1864
|
name: Munin
|
1514
1865
|
url: http://munin-monitoring.org/
|
1515
|
-
-
|
1866
|
+
-
|
1516
1867
|
user_agent: munin/http_loadtime
|
1517
1868
|
bot:
|
1518
1869
|
name: Munin
|
@@ -1521,7 +1872,7 @@
|
|
1521
1872
|
producer:
|
1522
1873
|
name: Munin
|
1523
1874
|
url: http://munin-monitoring.org/
|
1524
|
-
-
|
1875
|
+
-
|
1525
1876
|
user_agent: nlcrawler/1.0 (+http://northernlight.com/)
|
1526
1877
|
bot:
|
1527
1878
|
name: NLCrawler
|
@@ -1530,7 +1881,7 @@
|
|
1530
1881
|
producer:
|
1531
1882
|
name: Northern Light
|
1532
1883
|
url: http://northernlight.com
|
1533
|
-
-
|
1884
|
+
-
|
1534
1885
|
user_agent: check_http/v1.5 (nagios-plugins 1.5)
|
1535
1886
|
bot:
|
1536
1887
|
name: Nagios check_http
|
@@ -1539,7 +1890,7 @@
|
|
1539
1890
|
producer:
|
1540
1891
|
name: Nagios Plugins Development Team
|
1541
1892
|
url: https://nagios.org
|
1542
|
-
-
|
1893
|
+
-
|
1543
1894
|
user_agent: NalezenCzBot/1.0 (http://www.nalezen.cz/about-crawler)
|
1544
1895
|
bot:
|
1545
1896
|
name: NalezenCzBot
|
@@ -1548,11 +1899,11 @@
|
|
1548
1899
|
producer:
|
1549
1900
|
name: Jaroslav Kuboš
|
1550
1901
|
url: ""
|
1551
|
-
-
|
1902
|
+
-
|
1552
1903
|
user_agent: NetLyzer FastProbe
|
1553
1904
|
bot:
|
1554
1905
|
name: NetLyzer FastProbe
|
1555
|
-
-
|
1906
|
+
-
|
1556
1907
|
user_agent: Mozilla/4.0 (compatible; Netcraft Web Server Survey)
|
1557
1908
|
bot:
|
1558
1909
|
name: Netcraft Survey Bot
|
@@ -1561,7 +1912,7 @@
|
|
1561
1912
|
producer:
|
1562
1913
|
name: Netcraft
|
1563
1914
|
url: http://www.netcraft.com
|
1564
|
-
-
|
1915
|
+
-
|
1565
1916
|
user_agent: Mozilla/5.0 (compatible; NetcraftSurveyAgent/1.0; +info@netcraft.com)
|
1566
1917
|
bot:
|
1567
1918
|
name: Netcraft Survey Bot
|
@@ -1570,7 +1921,7 @@
|
|
1570
1921
|
producer:
|
1571
1922
|
name: Netcraft
|
1572
1923
|
url: http://www.netcraft.com
|
1573
|
-
-
|
1924
|
+
-
|
1574
1925
|
user_agent: 'Netcraft SSL Server Survey - contact info@netcraft.com'
|
1575
1926
|
bot:
|
1576
1927
|
name: Netcraft Survey Bot
|
@@ -1579,7 +1930,7 @@
|
|
1579
1930
|
producer:
|
1580
1931
|
name: Netcraft
|
1581
1932
|
url: http://www.netcraft.com
|
1582
|
-
-
|
1933
|
+
-
|
1583
1934
|
user_agent: Netvibes (http://www.netvibes.com)
|
1584
1935
|
bot:
|
1585
1936
|
name: Netvibes
|
@@ -1588,7 +1939,7 @@
|
|
1588
1939
|
producer:
|
1589
1940
|
name: ""
|
1590
1941
|
url: ""
|
1591
|
-
-
|
1942
|
+
-
|
1592
1943
|
user_agent: 'Netvibes (http://www.netvibes.com/; 8 subscribers; feedID: 2244192)'
|
1593
1944
|
bot:
|
1594
1945
|
name: Netvibes
|
@@ -1597,7 +1948,7 @@
|
|
1597
1948
|
producer:
|
1598
1949
|
name: ""
|
1599
1950
|
url: ""
|
1600
|
-
-
|
1951
|
+
-
|
1601
1952
|
user_agent: 'NewsBlur Favicon Fetcher - 7 subscribers - http://www.newsblur.com/site/1948420/analytics-piwik (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)'
|
1602
1953
|
bot:
|
1603
1954
|
name: NewsBlur
|
@@ -1606,7 +1957,7 @@
|
|
1606
1957
|
producer:
|
1607
1958
|
name: ""
|
1608
1959
|
url: ""
|
1609
|
-
-
|
1960
|
+
-
|
1610
1961
|
user_agent: 'NewsBlur Feed Fetcher - 7 subscribers - http://www.newsblur.com/site/1948420/analytics-piwik (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)'
|
1611
1962
|
bot:
|
1612
1963
|
name: NewsBlur
|
@@ -1615,7 +1966,7 @@
|
|
1615
1966
|
producer:
|
1616
1967
|
name: ""
|
1617
1968
|
url: ""
|
1618
|
-
-
|
1969
|
+
-
|
1619
1970
|
user_agent: NewsBlur Feed Finder (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)
|
1620
1971
|
bot:
|
1621
1972
|
name: NewsBlur
|
@@ -1624,7 +1975,7 @@
|
|
1624
1975
|
producer:
|
1625
1976
|
name: ""
|
1626
1977
|
url: ""
|
1627
|
-
-
|
1978
|
+
-
|
1628
1979
|
user_agent: 'NewsBlur Page Fetcher - 7 subscribers - http://www.newsblur.com/site/3966817/analytics-piwik (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)'
|
1629
1980
|
bot:
|
1630
1981
|
name: NewsBlur
|
@@ -1633,7 +1984,7 @@
|
|
1633
1984
|
producer:
|
1634
1985
|
name: ""
|
1635
1986
|
url: ""
|
1636
|
-
-
|
1987
|
+
-
|
1637
1988
|
user_agent: NewsGatorOnline/2.0 (http://www.newsgator.com; 2 subscribers)
|
1638
1989
|
bot:
|
1639
1990
|
name: NewsGator
|
@@ -1642,7 +1993,7 @@
|
|
1642
1993
|
producer:
|
1643
1994
|
name: ""
|
1644
1995
|
url: ""
|
1645
|
-
-
|
1996
|
+
-
|
1646
1997
|
user_agent: Mozilla/5.0 (compatible; Nmap Scripting Engine; https://nmap.org/book/nse.html)
|
1647
1998
|
bot:
|
1648
1999
|
name: Nmap
|
@@ -1651,7 +2002,7 @@
|
|
1651
2002
|
producer:
|
1652
2003
|
name: Nmap
|
1653
2004
|
url: https://nmap.org/
|
1654
|
-
-
|
2005
|
+
-
|
1655
2006
|
user_agent: 5acd734a-1ed3-4a17-ad9d-0b09ae7bc2d2/Nutch-1.7
|
1656
2007
|
bot:
|
1657
2008
|
name: Nutch-based Bot
|
@@ -1659,8 +2010,8 @@
|
|
1659
2010
|
url: https://nutch.apache.org
|
1660
2011
|
producer:
|
1661
2012
|
name: The Apache Software Foundation
|
1662
|
-
url:
|
1663
|
-
-
|
2013
|
+
url: https://www.apache.org/foundation/
|
2014
|
+
-
|
1664
2015
|
user_agent: CB/Nutch-1.7
|
1665
2016
|
bot:
|
1666
2017
|
name: Nutch-based Bot
|
@@ -1668,8 +2019,8 @@
|
|
1668
2019
|
url: https://nutch.apache.org
|
1669
2020
|
producer:
|
1670
2021
|
name: The Apache Software Foundation
|
1671
|
-
url:
|
1672
|
-
-
|
2022
|
+
url: https://www.apache.org/foundation/
|
2023
|
+
-
|
1673
2024
|
user_agent: Mozilla/5.0 (compatible; summers;)/Nutch-1.7
|
1674
2025
|
bot:
|
1675
2026
|
name: Nutch-based Bot
|
@@ -1677,8 +2028,8 @@
|
|
1677
2028
|
url: https://nutch.apache.org
|
1678
2029
|
producer:
|
1679
2030
|
name: The Apache Software Foundation
|
1680
|
-
url:
|
1681
|
-
-
|
2031
|
+
url: https://www.apache.org/foundation/
|
2032
|
+
-
|
1682
2033
|
user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1; zh-CN; rv:1.9.2.8) Firefox/3.6.8/Nutch-1.7
|
1683
2034
|
bot:
|
1684
2035
|
name: Nutch-based Bot
|
@@ -1686,8 +2037,8 @@
|
|
1686
2037
|
url: https://nutch.apache.org
|
1687
2038
|
producer:
|
1688
2039
|
name: The Apache Software Foundation
|
1689
|
-
url:
|
1690
|
-
-
|
2040
|
+
url: https://www.apache.org/foundation/
|
2041
|
+
-
|
1691
2042
|
user_agent: My Nutch Spider/Nutch-1.6
|
1692
2043
|
bot:
|
1693
2044
|
name: Nutch-based Bot
|
@@ -1695,8 +2046,8 @@
|
|
1695
2046
|
url: https://nutch.apache.org
|
1696
2047
|
producer:
|
1697
2048
|
name: The Apache Software Foundation
|
1698
|
-
url:
|
1699
|
-
-
|
2049
|
+
url: https://www.apache.org/foundation/
|
2050
|
+
-
|
1700
2051
|
user_agent: MySpider/Nutch-2.2
|
1701
2052
|
bot:
|
1702
2053
|
name: Nutch-based Bot
|
@@ -1704,8 +2055,8 @@
|
|
1704
2055
|
url: https://nutch.apache.org
|
1705
2056
|
producer:
|
1706
2057
|
name: The Apache Software Foundation
|
1707
|
-
url:
|
1708
|
-
-
|
2058
|
+
url: https://www.apache.org/foundation/
|
2059
|
+
-
|
1709
2060
|
user_agent: Nutch12/Nutch-1.2
|
1710
2061
|
bot:
|
1711
2062
|
name: Nutch-based Bot
|
@@ -1713,8 +2064,8 @@
|
|
1713
2064
|
url: https://nutch.apache.org
|
1714
2065
|
producer:
|
1715
2066
|
name: The Apache Software Foundation
|
1716
|
-
url:
|
1717
|
-
-
|
2067
|
+
url: https://www.apache.org/foundation/
|
2068
|
+
-
|
1718
2069
|
user_agent: NutchSpider/Nutch-1.4
|
1719
2070
|
bot:
|
1720
2071
|
name: Nutch-based Bot
|
@@ -1722,8 +2073,8 @@
|
|
1722
2073
|
url: https://nutch.apache.org
|
1723
2074
|
producer:
|
1724
2075
|
name: The Apache Software Foundation
|
1725
|
-
url:
|
1726
|
-
-
|
2076
|
+
url: https://www.apache.org/foundation/
|
2077
|
+
-
|
1727
2078
|
user_agent: spider/Nutch-1.5.1 (spider; http://www.xxx.com)
|
1728
2079
|
bot:
|
1729
2080
|
name: Nutch-based Bot
|
@@ -1731,8 +2082,8 @@
|
|
1731
2082
|
url: https://nutch.apache.org
|
1732
2083
|
producer:
|
1733
2084
|
name: The Apache Software Foundation
|
1734
|
-
url:
|
1735
|
-
-
|
2085
|
+
url: https://www.apache.org/foundation/
|
2086
|
+
-
|
1736
2087
|
user_agent: Spider/Nutch-2.3-SNAPSHOT (Webcrawler)
|
1737
2088
|
bot:
|
1738
2089
|
name: Nutch-based Bot
|
@@ -1740,8 +2091,8 @@
|
|
1740
2091
|
url: https://nutch.apache.org
|
1741
2092
|
producer:
|
1742
2093
|
name: The Apache Software Foundation
|
1743
|
-
url:
|
1744
|
-
-
|
2094
|
+
url: https://www.apache.org/foundation/
|
2095
|
+
-
|
1745
2096
|
user_agent: testnutch/Nutch-1.8
|
1746
2097
|
bot:
|
1747
2098
|
name: Nutch-based Bot
|
@@ -1749,8 +2100,8 @@
|
|
1749
2100
|
url: https://nutch.apache.org
|
1750
2101
|
producer:
|
1751
2102
|
name: The Apache Software Foundation
|
1752
|
-
url:
|
1753
|
-
-
|
2103
|
+
url: https://www.apache.org/foundation/
|
2104
|
+
-
|
1754
2105
|
user_agent: Your Nutch Spider/Nutch-2.2.1
|
1755
2106
|
bot:
|
1756
2107
|
name: Nutch-based Bot
|
@@ -1758,8 +2109,8 @@
|
|
1758
2109
|
url: https://nutch.apache.org
|
1759
2110
|
producer:
|
1760
2111
|
name: The Apache Software Foundation
|
1761
|
-
url:
|
1762
|
-
-
|
2112
|
+
url: https://www.apache.org/foundation/
|
2113
|
+
-
|
1763
2114
|
user_agent: your sipder name/Nutch-1.7
|
1764
2115
|
bot:
|
1765
2116
|
name: Nutch-based Bot
|
@@ -1767,12 +2118,20 @@
|
|
1767
2118
|
url: https://nutch.apache.org
|
1768
2119
|
producer:
|
1769
2120
|
name: The Apache Software Foundation
|
1770
|
-
url:
|
1771
|
-
-
|
2121
|
+
url: https://www.apache.org/foundation/
|
2122
|
+
-
|
2123
|
+
user_agent: Nuzzel
|
2124
|
+
bot:
|
2125
|
+
name: Nuzzel
|
2126
|
+
category: Crawler
|
2127
|
+
producer:
|
2128
|
+
name: Nuzzel
|
2129
|
+
url: https://www.nuzzel.com/
|
2130
|
+
-
|
1772
2131
|
user_agent: Octopus 1.0.2
|
1773
2132
|
bot:
|
1774
2133
|
name: Octopus
|
1775
|
-
-
|
2134
|
+
-
|
1776
2135
|
user_agent: omgili/0.5 +http://omgili.com
|
1777
2136
|
bot:
|
1778
2137
|
name: Omgili bot
|
@@ -1781,7 +2140,7 @@
|
|
1781
2140
|
producer:
|
1782
2141
|
name: Omgili
|
1783
2142
|
url: http://www.omgili.com
|
1784
|
-
-
|
2143
|
+
-
|
1785
2144
|
user_agent: omgilibot/0.3 +http://www.omgili.com/Crawler.html
|
1786
2145
|
bot:
|
1787
2146
|
name: Omgili bot
|
@@ -1790,7 +2149,7 @@
|
|
1790
2149
|
producer:
|
1791
2150
|
name: Omgili
|
1792
2151
|
url: http://www.omgili.com
|
1793
|
-
-
|
2152
|
+
-
|
1794
2153
|
user_agent: Mozilla/5.0 (compatible; spbot/4.0.9; +http://OpenLinkProfiler.org/bot )
|
1795
2154
|
bot:
|
1796
2155
|
name: OpenLinkProfiler
|
@@ -1799,7 +2158,7 @@
|
|
1799
2158
|
producer:
|
1800
2159
|
name: Axandra GmbH
|
1801
2160
|
url: http://www.axandra.com
|
1802
|
-
-
|
2161
|
+
-
|
1803
2162
|
user_agent: OpenWebSpider v0.1.4 (http://www.openwebspider.org/)
|
1804
2163
|
bot:
|
1805
2164
|
name: OpenWebSpider
|
@@ -1808,7 +2167,7 @@
|
|
1808
2167
|
producer:
|
1809
2168
|
name: OpenWebSpider Lab
|
1810
2169
|
url: http://lab.openwebspider.org
|
1811
|
-
-
|
2170
|
+
-
|
1812
2171
|
user_agent: Mozilla/5.0 (compatible; OpenindexSpider; +http://www.openindex.io/en/webmasters/spider.html)
|
1813
2172
|
bot:
|
1814
2173
|
name: Openindex Spider
|
@@ -1817,7 +2176,7 @@
|
|
1817
2176
|
producer:
|
1818
2177
|
name: Openindex B.V.
|
1819
2178
|
url: http://www.openindex.io
|
1820
|
-
-
|
2179
|
+
-
|
1821
2180
|
user_agent: Mozilla/5.0 (compatible; OrangeBot-Collector/2.0; support.orangebot@orange.com)
|
1822
2181
|
bot:
|
1823
2182
|
name: Orange Bot
|
@@ -1826,7 +2185,7 @@
|
|
1826
2185
|
producer:
|
1827
2186
|
name: Orange
|
1828
2187
|
url: http://www.orange.fr
|
1829
|
-
-
|
2188
|
+
-
|
1830
2189
|
user_agent: Mozilla/5.0 (compatible; OrangeBot/2.0; support.orangebot@orange.com)
|
1831
2190
|
bot:
|
1832
2191
|
name: Orange Bot
|
@@ -1835,7 +2194,7 @@
|
|
1835
2194
|
producer:
|
1836
2195
|
name: Orange
|
1837
2196
|
url: http://www.orange.fr
|
1838
|
-
-
|
2197
|
+
-
|
1839
2198
|
user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1; fr; rv:1.8.1) VoilaBot BETA 1.2 (support.voilabot@orange-ftgroup.com)
|
1840
2199
|
bot:
|
1841
2200
|
name: Orange Bot
|
@@ -1844,7 +2203,7 @@
|
|
1844
2203
|
producer:
|
1845
2204
|
name: Orange
|
1846
2205
|
url: http://www.orange.fr
|
1847
|
-
-
|
2206
|
+
-
|
1848
2207
|
user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1;fr;rv:1.8.1) VoilaBotCollector BETA 0.1 (http://www.voila.com/)
|
1849
2208
|
bot:
|
1850
2209
|
name: Orange Bot
|
@@ -1853,7 +2212,7 @@
|
|
1853
2212
|
producer:
|
1854
2213
|
name: Orange
|
1855
2214
|
url: http://www.orange.fr
|
1856
|
-
-
|
2215
|
+
-
|
1857
2216
|
user_agent: Mozilla/5.0 (Java) outbrain
|
1858
2217
|
bot:
|
1859
2218
|
name: Outbrain
|
@@ -1862,7 +2221,7 @@
|
|
1862
2221
|
producer:
|
1863
2222
|
name: Outbrain
|
1864
2223
|
url: http://www.outbrain.com/
|
1865
|
-
-
|
2224
|
+
-
|
1866
2225
|
user_agent: Mozilla/5.0 (compatible; phpservermon/3.1.1; +http://www.phpservermonitor.org)
|
1867
2226
|
bot:
|
1868
2227
|
name: PHP Server Monitor
|
@@ -1871,7 +2230,16 @@
|
|
1871
2230
|
producer:
|
1872
2231
|
name: PHP Server Monitor
|
1873
2232
|
url: http://www.phpservermonitor.org/
|
1874
|
-
-
|
2233
|
+
-
|
2234
|
+
user_agent: Mozilla/5.0 (compatible; PRTG Network Monitor (www.paessler.com); Windows)
|
2235
|
+
bot:
|
2236
|
+
name: PRTG Network Monitor
|
2237
|
+
category: Network Monitor
|
2238
|
+
url: https://www.paessler.com/prtg
|
2239
|
+
producer:
|
2240
|
+
name: Paessler AG
|
2241
|
+
url: https://www.paessler.com
|
2242
|
+
-
|
1875
2243
|
user_agent: Mozilla/5.0 (compatible; PaperLiBot/2.1; http://support.paper.li/entries/20023257-what-is-paper-li)
|
1876
2244
|
bot:
|
1877
2245
|
name: PaperLiBot
|
@@ -1880,13 +2248,19 @@
|
|
1880
2248
|
producer:
|
1881
2249
|
name: Smallrivers SA
|
1882
2250
|
url: http://www.paper.li
|
1883
|
-
-
|
2251
|
+
-
|
2252
|
+
user_agent: Mozilla/5.0 (Linux; Android 7.0;) AppleWebKit/537.36 (KHTML, like Gecko) Mobile Safari/537.36 (compatible; PetalBot;+https://aspiegel.com/petalbot)
|
2253
|
+
bot:
|
2254
|
+
name: Petal Bot
|
2255
|
+
category: Crawler
|
2256
|
+
url: https://aspiegel.com/petalbot
|
2257
|
+
-
|
1884
2258
|
user_agent: phantomas/1.11.0 (PhantomJS/1.9.8; linux x64)
|
1885
2259
|
bot:
|
1886
2260
|
name: Phantomas
|
1887
2261
|
category: Site Monitor
|
1888
2262
|
url: https://github.com/macbre/phantomas
|
1889
|
-
-
|
2263
|
+
-
|
1890
2264
|
user_agent: psbot-page (+http://www.picsearch.com/bot.html)
|
1891
2265
|
bot:
|
1892
2266
|
name: Picsearch bot
|
@@ -1895,7 +2269,7 @@
|
|
1895
2269
|
producer:
|
1896
2270
|
name: Picsearch
|
1897
2271
|
url: http://www.picsearch.com
|
1898
|
-
-
|
2272
|
+
-
|
1899
2273
|
user_agent: psbot/0.1 (+http://www.picsearch.com/bot.html)
|
1900
2274
|
bot:
|
1901
2275
|
name: Picsearch bot
|
@@ -1904,7 +2278,7 @@
|
|
1904
2278
|
producer:
|
1905
2279
|
name: Picsearch
|
1906
2280
|
url: http://www.picsearch.com
|
1907
|
-
-
|
2281
|
+
-
|
1908
2282
|
user_agent: Pingdom.com_bot_version_1.4_(http://www.pingdom.com/)
|
1909
2283
|
bot:
|
1910
2284
|
name: Pingdom Bot
|
@@ -1913,16 +2287,34 @@
|
|
1913
2287
|
producer:
|
1914
2288
|
name: Pingdom AB
|
1915
2289
|
url: https://www.pingdom.com
|
1916
|
-
-
|
2290
|
+
-
|
2291
|
+
user_agent: Mozilla/5.0 (compatible; Pinterestbot/1.0; http://www.pinterest.com/bot.html)
|
2292
|
+
bot:
|
2293
|
+
name: Pinterest
|
2294
|
+
url: https://help.pinterest.com/en/business/article/pinterest-crawler
|
2295
|
+
category: Crawler
|
2296
|
+
producer:
|
2297
|
+
name: Pinterest
|
2298
|
+
url: https://www.pinterest.com/
|
2299
|
+
-
|
1917
2300
|
user_agent: Pinterest/0.2 (+http://www.pinterest.com/)
|
1918
2301
|
bot:
|
1919
2302
|
name: Pinterest
|
1920
|
-
url:
|
2303
|
+
url: https://help.pinterest.com/en/business/article/pinterest-crawler
|
2304
|
+
category: Crawler
|
2305
|
+
producer:
|
2306
|
+
name: Pinterest
|
2307
|
+
url: https://www.pinterest.com/
|
2308
|
+
-
|
2309
|
+
user_agent: Mozilla/5.0 (Linux; Android 6.0.1; Nexus 5X Build/MMB29P) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/41.0.2272.96 Mobile Safari/537.36 (compatible; Pinterestbot/1.0; https://www.pinterest.com/bot.html)
|
2310
|
+
bot:
|
2311
|
+
name: Pinterest
|
2312
|
+
url: https://help.pinterest.com/en/business/article/pinterest-crawler
|
1921
2313
|
category: Crawler
|
1922
2314
|
producer:
|
1923
2315
|
name: Pinterest
|
1924
|
-
url:
|
1925
|
-
-
|
2316
|
+
url: https://www.pinterest.com/
|
2317
|
+
-
|
1926
2318
|
user_agent: PocketParser/2.0 (+https://getpocket.com/pocketparser_ua)
|
1927
2319
|
bot:
|
1928
2320
|
name: PocketParser
|
@@ -1931,7 +2323,7 @@
|
|
1931
2323
|
producer:
|
1932
2324
|
name: Pocket
|
1933
2325
|
url: https://getpocket.com/
|
1934
|
-
-
|
2326
|
+
-
|
1935
2327
|
user_agent: PritTorrent/1.0
|
1936
2328
|
bot:
|
1937
2329
|
name: PritTorrent
|
@@ -1940,7 +2332,7 @@
|
|
1940
2332
|
producer:
|
1941
2333
|
name: Bitlove
|
1942
2334
|
url: http://bitlove.org/
|
1943
|
-
-
|
2335
|
+
-
|
1944
2336
|
user_agent: QuerySeekerSpider ( http://queryseeker.com/bot.html )
|
1945
2337
|
bot:
|
1946
2338
|
name: QuerySeekerSpider
|
@@ -1949,7 +2341,7 @@
|
|
1949
2341
|
producer:
|
1950
2342
|
name: QueryEye Inc.
|
1951
2343
|
url: http://queryeye.com
|
1952
|
-
-
|
2344
|
+
-
|
1953
2345
|
user_agent: Quora Link Preview/1.0 (http://www.quora.com)
|
1954
2346
|
bot:
|
1955
2347
|
name: Quora Link Preview
|
@@ -1958,7 +2350,7 @@
|
|
1958
2350
|
producer:
|
1959
2351
|
name: Quora
|
1960
2352
|
url: http://www.quora.com
|
1961
|
-
-
|
2353
|
+
-
|
1962
2354
|
user_agent: 'Mozilla/5.0 (compatible; Qwantify/2.2w; +https://www.qwant.com/)/*'
|
1963
2355
|
bot:
|
1964
2356
|
name: Qwantify
|
@@ -1967,7 +2359,7 @@
|
|
1967
2359
|
producer:
|
1968
2360
|
name: Qwant Corporation
|
1969
2361
|
url: https://www.qwant.com/
|
1970
|
-
-
|
2362
|
+
-
|
1971
2363
|
user_agent: ROI Hunter; https://api-dev.roihunter.com
|
1972
2364
|
bot:
|
1973
2365
|
name: ROI Hunter
|
@@ -1976,13 +2368,17 @@
|
|
1976
2368
|
producer:
|
1977
2369
|
name: Roihunter a.s.
|
1978
2370
|
url: http://roihunter.com/
|
1979
|
-
-
|
2371
|
+
-
|
2372
|
+
user_agent: RSSRadio (Push Notification Scanner;support@dorada.co.uk)
|
2373
|
+
bot:
|
2374
|
+
name: RSSRadio Bot
|
2375
|
+
-
|
1980
2376
|
user_agent: Rainmeter WebParser plugin
|
1981
2377
|
bot:
|
1982
2378
|
name: Rainmeter
|
1983
2379
|
category: Crawler
|
1984
2380
|
url: https://www.rainmeter.net
|
1985
|
-
-
|
2381
|
+
-
|
1986
2382
|
user_agent: RamblerMail/6.0 (incompatible; ImageProxy/6.0)
|
1987
2383
|
bot:
|
1988
2384
|
name: RamblerMail Image Proxy
|
@@ -1991,7 +2387,7 @@
|
|
1991
2387
|
producer:
|
1992
2388
|
name: 'Rambler&Co'
|
1993
2389
|
url: https://rambler-co.ru/
|
1994
|
-
-
|
2390
|
+
-
|
1995
2391
|
user_agent: Mozilla/5.0 (compatible; redditbot/1.0; +http://www.reddit.com/feedback)
|
1996
2392
|
bot:
|
1997
2393
|
name: Reddit Bot
|
@@ -2000,7 +2396,12 @@
|
|
2000
2396
|
producer:
|
2001
2397
|
name: reddit inc.
|
2002
2398
|
url: http://www.reddit.com
|
2003
|
-
-
|
2399
|
+
-
|
2400
|
+
user_agent: Robozilla/1.0
|
2401
|
+
bot:
|
2402
|
+
name: Robozilla
|
2403
|
+
category: Crawler
|
2404
|
+
-
|
2004
2405
|
user_agent: Mozilla/5.0 (compatible; rogerBot/1.0; UrlCrawler; http://www.seomoz.org/dp/rogerbot)
|
2005
2406
|
bot:
|
2006
2407
|
name: Rogerbot
|
@@ -2009,7 +2410,7 @@
|
|
2009
2410
|
producer:
|
2010
2411
|
name: SEOmoz, Inc.
|
2011
2412
|
url: http://moz.com/
|
2012
|
-
-
|
2413
|
+
-
|
2013
2414
|
user_agent: rogerbot/1.0 (http://moz.com/help/pro/what-is-rogerbot-, rogerbot-crawler+shiny@moz.com)
|
2014
2415
|
bot:
|
2015
2416
|
name: Rogerbot
|
@@ -2018,7 +2419,7 @@
|
|
2018
2419
|
producer:
|
2019
2420
|
name: SEOmoz, Inc.
|
2020
2421
|
url: http://moz.com/
|
2021
|
-
-
|
2422
|
+
-
|
2022
2423
|
user_agent: rogerbot/1.0 (http://www.moz.com/dp/rogerbot, rogerbot-crawler@moz.com)
|
2023
2424
|
bot:
|
2024
2425
|
name: Rogerbot
|
@@ -2027,7 +2428,7 @@
|
|
2027
2428
|
producer:
|
2028
2429
|
name: SEOmoz, Inc.
|
2029
2430
|
url: http://moz.com/
|
2030
|
-
-
|
2431
|
+
-
|
2031
2432
|
user_agent: SEOENGWorldBot/1.0 (+http://www.seoengine.com/seoengbot.htm)
|
2032
2433
|
bot:
|
2033
2434
|
name: SEOENGBot
|
@@ -2036,7 +2437,7 @@
|
|
2036
2437
|
producer:
|
2037
2438
|
name: SEO Engine
|
2038
2439
|
url: http://www.seoengine.com
|
2039
|
-
-
|
2440
|
+
-
|
2040
2441
|
user_agent: Mozilla/5.0 (compatible; SEOkicks-Robot; +http://www.seokicks.de/robot.html)
|
2041
2442
|
bot:
|
2042
2443
|
name: SEOkicks-Robot
|
@@ -2045,7 +2446,7 @@
|
|
2045
2446
|
producer:
|
2046
2447
|
name: SEOkicks
|
2047
2448
|
url: https://www.seokicks.de/
|
2048
|
-
-
|
2449
|
+
-
|
2049
2450
|
user_agent: Mozilla/5.0 (compatible; SISTRIX Crawler; http://crawler.sistrix.net/)
|
2050
2451
|
bot:
|
2051
2452
|
name: SISTRIX Crawler
|
@@ -2054,7 +2455,43 @@
|
|
2054
2455
|
producer:
|
2055
2456
|
name: SISTRIX GmbH
|
2056
2457
|
url: http://www.sistrix.de
|
2057
|
-
-
|
2458
|
+
-
|
2459
|
+
user_agent: Mozilla/5.0 (compatible; Optimizer)
|
2460
|
+
bot:
|
2461
|
+
name: SISTRIX Optimizer
|
2462
|
+
category: Crawler
|
2463
|
+
url: https://optimizer.sistrix.com
|
2464
|
+
producer:
|
2465
|
+
name: SISTRIX GmbH
|
2466
|
+
url: http://www.sistrix.de
|
2467
|
+
-
|
2468
|
+
user_agent: Mozilla/5.0 (compatible; SISTRIX Optimizer)
|
2469
|
+
bot:
|
2470
|
+
name: SISTRIX Optimizer
|
2471
|
+
category: Crawler
|
2472
|
+
url: https://optimizer.sistrix.com
|
2473
|
+
producer:
|
2474
|
+
name: SISTRIX GmbH
|
2475
|
+
url: http://www.sistrix.de
|
2476
|
+
-
|
2477
|
+
user_agent: Mozilla/5.0 (compatible; SISTRIX Optimizer; Uptime; +https://www.sistrix.com/faq/uptime)
|
2478
|
+
bot:
|
2479
|
+
name: SISTRIX Optimizer
|
2480
|
+
category: Crawler
|
2481
|
+
url: https://optimizer.sistrix.com
|
2482
|
+
producer:
|
2483
|
+
name: SISTRIX GmbH
|
2484
|
+
url: http://www.sistrix.de
|
2485
|
+
-
|
2486
|
+
user_agent: Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/68.0.3440.75 Safari/537.36 (compatible; SMTBot/1.0; +http://www.similartech.com/smtbot)
|
2487
|
+
bot:
|
2488
|
+
name: SMTBot
|
2489
|
+
category: Search bot
|
2490
|
+
url: https://www.similartech.com/smtbot
|
2491
|
+
producer:
|
2492
|
+
name: SimilarTech Ltd.
|
2493
|
+
url: https://www.similartech.com/
|
2494
|
+
-
|
2058
2495
|
user_agent: SSL Labs (https://www.ssllabs.com/about/assessment.html)
|
2059
2496
|
bot:
|
2060
2497
|
name: SSL Labs
|
@@ -2063,7 +2500,7 @@
|
|
2063
2500
|
producer:
|
2064
2501
|
name: SSL Labs
|
2065
2502
|
url: https://www.ssllabs.com/about/assessment.html
|
2066
|
-
-
|
2503
|
+
-
|
2067
2504
|
user_agent: SafeDNSBot (https://www.safedns.com/searchbot)
|
2068
2505
|
bot:
|
2069
2506
|
name: SafeDNSBot
|
@@ -2072,13 +2509,13 @@
|
|
2072
2509
|
producer:
|
2073
2510
|
name: SafeDNS, Inc.
|
2074
2511
|
url: https://www.safedns.com/
|
2075
|
-
-
|
2512
|
+
-
|
2076
2513
|
user_agent: Scrapy/1.0.3.post6+g2d688cd (+http://scrapy.org)
|
2077
2514
|
bot:
|
2078
2515
|
name: Scrapy
|
2079
2516
|
category: Crawler
|
2080
2517
|
url: http://scrapy.org
|
2081
|
-
-
|
2518
|
+
-
|
2082
2519
|
user_agent: Screaming Frog SEO Spider/2.22
|
2083
2520
|
bot:
|
2084
2521
|
name: Screaming Frog SEO Spider
|
@@ -2087,7 +2524,7 @@
|
|
2087
2524
|
producer:
|
2088
2525
|
name: Screaming Frog Ltd
|
2089
2526
|
url: http://www.screamingfrog.co.uk
|
2090
|
-
-
|
2527
|
+
-
|
2091
2528
|
user_agent: ScreenerBot Crawler Beta 2.0 (+http://www.ScreenerBot.com)
|
2092
2529
|
bot:
|
2093
2530
|
name: ScreenerBot
|
@@ -2096,7 +2533,13 @@
|
|
2096
2533
|
producer:
|
2097
2534
|
name: ""
|
2098
2535
|
url: ""
|
2099
|
-
-
|
2536
|
+
-
|
2537
|
+
user_agent: Mozilla/5.0 (compatible) SemanticScholarBot (+https://www.semanticscholar.org/crawler)
|
2538
|
+
bot:
|
2539
|
+
name: Semantic Scholar Bot
|
2540
|
+
category: Crawler
|
2541
|
+
url: https://www.semanticscholar.org/crawler
|
2542
|
+
-
|
2100
2543
|
user_agent: Mozilla/5.0 (compatible; SemrushBot/0.97; +http://www.semrush.com/bot.html)
|
2101
2544
|
bot:
|
2102
2545
|
name: Semrush Bot
|
@@ -2105,7 +2548,7 @@
|
|
2105
2548
|
producer:
|
2106
2549
|
name: SEMrush
|
2107
2550
|
url: http://www.semrush.com
|
2108
|
-
-
|
2551
|
+
-
|
2109
2552
|
user_agent: SensikaBot/x.33 (+http://sensika.com)
|
2110
2553
|
bot:
|
2111
2554
|
name: Sensika Bot
|
@@ -2114,28 +2557,36 @@
|
|
2114
2557
|
producer:
|
2115
2558
|
name: Sensika
|
2116
2559
|
url: http://sensika.com
|
2117
|
-
-
|
2560
|
+
-
|
2118
2561
|
user_agent: sentry/8.6.0 (https://getsentry.com)
|
2119
2562
|
bot:
|
2120
2563
|
name: Sentry Bot
|
2121
2564
|
producer:
|
2122
2565
|
name: Sentry
|
2123
2566
|
url: https://sentry.io
|
2124
|
-
-
|
2567
|
+
-
|
2568
|
+
user_agent: Seobility
|
2569
|
+
bot:
|
2570
|
+
name: Seobility
|
2571
|
+
category: Crawler
|
2572
|
+
url: 'https://www.seobility.net/en/faq/?category=crawling#!aboutourbot'
|
2573
|
+
-
|
2125
2574
|
user_agent: Mozilla/5.0 (compatible; seoscanners.net/1; +spider@seoscanners.net)
|
2126
2575
|
bot:
|
2127
2576
|
name: Seoscanners.net
|
2128
2577
|
category: Crawler
|
2129
2578
|
url: ""
|
2130
|
-
-
|
2579
|
+
-
|
2580
|
+
user_agent: SerendeputyBot/0.8.6 (http://serendeputy.com/about/serendeputy-bot)
|
2581
|
+
bot:
|
2582
|
+
name: Serendeputy Bot
|
2583
|
+
category: Crawler
|
2584
|
+
url: https://serendeputy.com/about/serendeputy-bot
|
2585
|
+
-
|
2131
2586
|
user_agent: Server Density Service Monitoring v2
|
2132
2587
|
bot:
|
2133
2588
|
name: Server Density
|
2134
|
-
-
|
2135
|
-
user_agent: RSSRadio (Push Notification Scanner;support@dorada.co.uk)
|
2136
|
-
bot:
|
2137
|
-
name: RSSRadio Bot
|
2138
|
-
-
|
2589
|
+
-
|
2139
2590
|
user_agent: Mozilla/5.0 (compatible; SeznamBot/3.1-test1; +http://fulltext.sblog.cz/)
|
2140
2591
|
bot:
|
2141
2592
|
name: Seznam Bot
|
@@ -2144,7 +2595,7 @@
|
|
2144
2595
|
producer:
|
2145
2596
|
name: Seznam.cz, a.s.
|
2146
2597
|
url: http://www.seznam.cz/
|
2147
|
-
-
|
2598
|
+
-
|
2148
2599
|
user_agent: Mozilla/5.0 (compatible; SeznamBot/3.2-test1; +http://fulltext.sblog.cz/)
|
2149
2600
|
bot:
|
2150
2601
|
name: Seznam Bot
|
@@ -2153,7 +2604,7 @@
|
|
2153
2604
|
producer:
|
2154
2605
|
name: Seznam.cz, a.s.
|
2155
2606
|
url: http://www.seznam.cz/
|
2156
|
-
-
|
2607
|
+
-
|
2157
2608
|
user_agent: Mozilla/5.0 (compatible; SeznamBot/3.2; +http://fulltext.sblog.cz/)
|
2158
2609
|
bot:
|
2159
2610
|
name: Seznam Bot
|
@@ -2162,7 +2613,7 @@
|
|
2162
2613
|
producer:
|
2163
2614
|
name: Seznam.cz, a.s.
|
2164
2615
|
url: http://www.seznam.cz/
|
2165
|
-
-
|
2616
|
+
-
|
2166
2617
|
user_agent: SeznamBot/3.0 (+http://fulltext.sblog.cz/)
|
2167
2618
|
bot:
|
2168
2619
|
name: Seznam Bot
|
@@ -2171,7 +2622,7 @@
|
|
2171
2622
|
producer:
|
2172
2623
|
name: Seznam.cz, a.s.
|
2173
2624
|
url: http://www.seznam.cz/
|
2174
|
-
-
|
2625
|
+
-
|
2175
2626
|
user_agent: Mozilla/5.0 SeznamEmailProxy/2.0.174
|
2176
2627
|
bot:
|
2177
2628
|
name: Seznam Email Proxy
|
@@ -2180,7 +2631,7 @@
|
|
2180
2631
|
producer:
|
2181
2632
|
name: Seznam.cz, a.s.
|
2182
2633
|
url: http://www.seznam.cz/
|
2183
|
-
-
|
2634
|
+
-
|
2184
2635
|
user_agent: Seznam-Zbozi-robot/3.0
|
2185
2636
|
bot:
|
2186
2637
|
name: Seznam Zbozi.cz
|
@@ -2189,7 +2640,7 @@
|
|
2189
2640
|
producer:
|
2190
2641
|
name: Seznam.cz, a.s.
|
2191
2642
|
url: https://www.zbozi.cz/
|
2192
|
-
-
|
2643
|
+
-
|
2193
2644
|
user_agent: Mozilla/5.0 (ShopAlike; LadenZeile) FeedBot
|
2194
2645
|
bot:
|
2195
2646
|
name: ShopAlike
|
@@ -2198,7 +2649,7 @@
|
|
2198
2649
|
producer:
|
2199
2650
|
name: Visual Meta
|
2200
2651
|
url: https://www.shopalike.cz/
|
2201
|
-
-
|
2652
|
+
-
|
2202
2653
|
user_agent: ShopWiki/1.0 ( +http://www.shopwiki.com/wiki/Help:Bot)
|
2203
2654
|
bot:
|
2204
2655
|
name: ShopWiki
|
@@ -2207,7 +2658,16 @@
|
|
2207
2658
|
producer:
|
2208
2659
|
name: ShopWiki Corp.
|
2209
2660
|
url: http://www.shopwiki.com
|
2210
|
-
-
|
2661
|
+
-
|
2662
|
+
user_agent: shopify-partner-homepage-scraper
|
2663
|
+
bot:
|
2664
|
+
name: Shopify Partner
|
2665
|
+
category: Crawler
|
2666
|
+
url: https://www.shopify.com/partners
|
2667
|
+
producer:
|
2668
|
+
name: Shopify
|
2669
|
+
url: https://www.shopify.com/
|
2670
|
+
-
|
2211
2671
|
user_agent: SilverReader/1.0; http://silverreader.com
|
2212
2672
|
bot:
|
2213
2673
|
name: SilverReader
|
@@ -2216,16 +2676,7 @@
|
|
2216
2676
|
producer:
|
2217
2677
|
name: ""
|
2218
2678
|
url: ""
|
2219
|
-
-
|
2220
|
-
user_agent: freshrss/0.8-dev (Linux; http://freshrss.org) SimplePie/1.4-dev-FreshRSS
|
2221
|
-
bot:
|
2222
|
-
name: SimplePie
|
2223
|
-
url: http://www.simplepie.org
|
2224
|
-
category: Feed Parser
|
2225
|
-
producer:
|
2226
|
-
name: ""
|
2227
|
-
url: ""
|
2228
|
-
-
|
2679
|
+
-
|
2229
2680
|
user_agent: SimplePie/1.2.1-dev (Feed Parser; http://simplepie.org; Allow like Gecko) Build/20130514092120
|
2230
2681
|
bot:
|
2231
2682
|
name: SimplePie
|
@@ -2234,7 +2685,7 @@
|
|
2234
2685
|
producer:
|
2235
2686
|
name: ""
|
2236
2687
|
url: ""
|
2237
|
-
-
|
2688
|
+
-
|
2238
2689
|
user_agent: SimplePie/1.3.1 (Feed Parser; http://simplepie.org; Allow like Gecko) Build/20121030175911
|
2239
2690
|
bot:
|
2240
2691
|
name: SimplePie
|
@@ -2243,7 +2694,7 @@
|
|
2243
2694
|
producer:
|
2244
2695
|
name: ""
|
2245
2696
|
url: ""
|
2246
|
-
-
|
2697
|
+
-
|
2247
2698
|
user_agent: Site24x7
|
2248
2699
|
bot:
|
2249
2700
|
name: Site24x7 Website Monitoring
|
@@ -2252,13 +2703,31 @@
|
|
2252
2703
|
producer:
|
2253
2704
|
name: Site24x7
|
2254
2705
|
url: https://www.site24x7.com
|
2255
|
-
-
|
2706
|
+
-
|
2256
2707
|
user_agent: SiteSucker for macOS/2.10.5
|
2257
2708
|
bot:
|
2258
2709
|
name: SiteSucker
|
2259
2710
|
category: Crawler
|
2260
2711
|
url: http://ricks-apps.com/osx/sitesucker/
|
2261
|
-
-
|
2712
|
+
-
|
2713
|
+
user_agent: Mozilla/4.0 (compatible; MSIE 7.0; Windows NT 5.0) Match by Siteimprove.com
|
2714
|
+
bot:
|
2715
|
+
name: Siteimprove
|
2716
|
+
category: Search bot
|
2717
|
+
url: https://siteimprove.com/
|
2718
|
+
producer:
|
2719
|
+
name: Siteimprove GmbH
|
2720
|
+
url: https://siteimprove.com/
|
2721
|
+
-
|
2722
|
+
user_agent: Mozilla/5.0 (compatible; MSIE 10.0; Windows NT 6.1; Trident/6.0) LinkCheck by Siteimprove.com
|
2723
|
+
bot:
|
2724
|
+
name: Siteimprove
|
2725
|
+
category: Search bot
|
2726
|
+
url: https://siteimprove.com/
|
2727
|
+
producer:
|
2728
|
+
name: Siteimprove GmbH
|
2729
|
+
url: https://siteimprove.com/
|
2730
|
+
-
|
2262
2731
|
user_agent: sixy.ch/1.0
|
2263
2732
|
bot:
|
2264
2733
|
name: Sixy.ch
|
@@ -2267,7 +2736,7 @@
|
|
2267
2736
|
producer:
|
2268
2737
|
name: Manuel Kasper
|
2269
2738
|
url: https://neon1.net/
|
2270
|
-
-
|
2739
|
+
-
|
2271
2740
|
user_agent: Mozilla/5.0 (Windows NT 6.1; WOW64) SkypeUriPreview Preview/0.5
|
2272
2741
|
bot:
|
2273
2742
|
name: Skype URI Preview
|
@@ -2276,7 +2745,7 @@
|
|
2276
2745
|
producer:
|
2277
2746
|
name: Skype Communications S.à.r.l.
|
2278
2747
|
url: https://www.skype.com
|
2279
|
-
-
|
2748
|
+
-
|
2280
2749
|
user_agent: Slackbot-LinkExpanding 1.0 (+https://api.slack.com/robots)
|
2281
2750
|
bot:
|
2282
2751
|
name: Slackbot
|
@@ -2285,7 +2754,7 @@
|
|
2285
2754
|
producer:
|
2286
2755
|
name: Slack Technologies
|
2287
2756
|
url: http://slack.com
|
2288
|
-
-
|
2757
|
+
-
|
2289
2758
|
user_agent: 'AppEngine-Google; (+http://code.google.com/appengine; appid: s~snapchat-proxy)'
|
2290
2759
|
bot:
|
2291
2760
|
name: Snapchat Proxy
|
@@ -2294,7 +2763,7 @@
|
|
2294
2763
|
producer:
|
2295
2764
|
name: Snapchat Inc.
|
2296
2765
|
url: https://www.snapchat.com
|
2297
|
-
-
|
2766
|
+
-
|
2298
2767
|
user_agent: New-Sogou-Spider/1.0 (compatible; MSIE 5.5; Windows 98)
|
2299
2768
|
bot:
|
2300
2769
|
name: Sogou Spider
|
@@ -2303,7 +2772,7 @@
|
|
2303
2772
|
producer:
|
2304
2773
|
name: Sohu, Inc.
|
2305
2774
|
url: http://www.sogou.com
|
2306
|
-
-
|
2775
|
+
-
|
2307
2776
|
user_agent: Sogou inst spider/4.0(+http://www.sogou.com/docs/help/webmasters.htm
|
2308
2777
|
bot:
|
2309
2778
|
name: Sogou Spider
|
@@ -2312,7 +2781,7 @@
|
|
2312
2781
|
producer:
|
2313
2782
|
name: Sohu, Inc.
|
2314
2783
|
url: http://www.sogou.com
|
2315
|
-
-
|
2784
|
+
-
|
2316
2785
|
user_agent: Sogou Pic Spider/3.0(+http://www.sogou.com/docs/help/webmasters.htm
|
2317
2786
|
bot:
|
2318
2787
|
name: Sogou Spider
|
@@ -2321,7 +2790,7 @@
|
|
2321
2790
|
producer:
|
2322
2791
|
name: Sohu, Inc.
|
2323
2792
|
url: http://www.sogou.com
|
2324
|
-
-
|
2793
|
+
-
|
2325
2794
|
user_agent: Sogou web spider/4.0(+http://www.sogou.com/docs/help/webmasters.htm
|
2326
2795
|
bot:
|
2327
2796
|
name: Sogou Spider
|
@@ -2330,7 +2799,7 @@
|
|
2330
2799
|
producer:
|
2331
2800
|
name: Sohu, Inc.
|
2332
2801
|
url: http://www.sogou.com
|
2333
|
-
-
|
2802
|
+
-
|
2334
2803
|
user_agent: Sosospider+(+http://help.soso.com/webspider.htm)
|
2335
2804
|
bot:
|
2336
2805
|
name: Soso Spider
|
@@ -2339,13 +2808,13 @@
|
|
2339
2808
|
producer:
|
2340
2809
|
name: Tencent Holdings
|
2341
2810
|
url: http://www.soso.com
|
2342
|
-
-
|
2811
|
+
-
|
2343
2812
|
user_agent: Mozilla/5.0 (Macintosh; Intel Mac OS X 10_11_6) AppleWebKit/537.36 (KHTML, like Gecko) Sparkler/0.2.0-SNAPSHOT
|
2344
2813
|
bot:
|
2345
2814
|
name: Sparkler
|
2346
2815
|
category: Crawler
|
2347
2816
|
url: https://github.com/USCDataScience/sparkler
|
2348
|
-
-
|
2817
|
+
-
|
2349
2818
|
user_agent: Mozilla/5.0 (X11; U; Linux x86_64; en-US; rv:1.9.0.19; aggregator:Spinn3r (Spinn3r 3.1); http://spinn3r.com/robot) Gecko/2010040121 Firefox/3.0.19
|
2350
2819
|
bot:
|
2351
2820
|
name: Spinn3r
|
@@ -2354,25 +2823,35 @@
|
|
2354
2823
|
producer:
|
2355
2824
|
name: Tailrank Inc
|
2356
2825
|
url: http://spinn3r.com
|
2357
|
-
-
|
2826
|
+
-
|
2827
|
+
user_agent: Spotify/1.0
|
2828
|
+
bot:
|
2829
|
+
name: Spotify
|
2830
|
+
producer:
|
2831
|
+
name: Spotify
|
2832
|
+
url: https://www.spotify.com
|
2833
|
+
-
|
2358
2834
|
user_agent: Mozilla/5.0 (compatible; SputnikBot/2.2)
|
2359
2835
|
bot:
|
2360
2836
|
name: Sputnik Bot
|
2361
|
-
category: ""
|
2837
|
+
category: "Crawler"
|
2362
2838
|
url: ""
|
2363
|
-
|
2364
|
-
name: ""
|
2365
|
-
url: ""
|
2366
|
-
-
|
2839
|
+
-
|
2367
2840
|
user_agent: Mozilla/5.0 (compatible; SputnikImageBot/2.2)
|
2368
2841
|
bot:
|
2369
|
-
name: Sputnik Bot
|
2370
|
-
category: ""
|
2842
|
+
name: Sputnik Image Bot
|
2843
|
+
category: "Crawler"
|
2371
2844
|
url: ""
|
2845
|
+
-
|
2846
|
+
user_agent: Mozilla/5.0 (Macintosh; Intel Mac OS X 10_8_5) AppleWebKit/536.30.1 (KHTML, like Gecko) (compatible; Startpagina-Linkchecker/1.0; +https://www.startpagina.nl/linkchecker)
|
2847
|
+
bot:
|
2848
|
+
name: Startpagina Linkchecker
|
2849
|
+
category: Search bot
|
2850
|
+
url: https://www.startpagina.nl/linkchecker
|
2372
2851
|
producer:
|
2373
|
-
name:
|
2374
|
-
url:
|
2375
|
-
-
|
2852
|
+
name: Startpagina B.V.
|
2853
|
+
url: https://www.startpagina.nl/
|
2854
|
+
-
|
2376
2855
|
user_agent: Mozilla/5.0 (Windows NT 6.2; WOW64) AppleWebKit/537.4 (KHTML, like Gecko) Chrome/98 Safari/537.4 (StatusCake)
|
2377
2856
|
bot:
|
2378
2857
|
name: StatusCake
|
@@ -2381,7 +2860,7 @@
|
|
2381
2860
|
producer:
|
2382
2861
|
name: StatusCake
|
2383
2862
|
url: https://www.statuscake.com
|
2384
|
-
-
|
2863
|
+
-
|
2385
2864
|
user_agent: 'Superfeedr bot/2.0 http://superfeedr.com - Make your feeds realtime: get in touch!'
|
2386
2865
|
bot:
|
2387
2866
|
name: Superfeedr Bot
|
@@ -2390,7 +2869,7 @@
|
|
2390
2869
|
producer:
|
2391
2870
|
name: Superfeedr
|
2392
2871
|
url: https://superfeedr.com/
|
2393
|
-
-
|
2872
|
+
-
|
2394
2873
|
user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1; en; rv:1.9.0.13) Gecko/2009073022 Firefox/3.5.2 (.NET CLR 3.5.30729) SurveyBot/2.3 (DomainTools)
|
2395
2874
|
bot:
|
2396
2875
|
name: Survey Bot
|
@@ -2399,7 +2878,7 @@
|
|
2399
2878
|
producer:
|
2400
2879
|
name: Domain Tools
|
2401
2880
|
url: http://www.domaintools.com
|
2402
|
-
-
|
2881
|
+
-
|
2403
2882
|
user_agent: TLSProbe/1.0 (+https://scan.trustnet.venafi.com/)
|
2404
2883
|
bot:
|
2405
2884
|
name: TLSProbe
|
@@ -2408,18 +2887,23 @@
|
|
2408
2887
|
producer:
|
2409
2888
|
name: Venafi TrustNet
|
2410
2889
|
url: https://www.venafi.com
|
2411
|
-
-
|
2890
|
+
-
|
2412
2891
|
user_agent: Tarmot Gezgin/1.0 (compatible; TarmotGezgin/1.1; +http://www.tarmot.com/gezgin)
|
2413
2892
|
bot:
|
2414
2893
|
name: Tarmot Gezgin
|
2415
2894
|
url: http://www.tarmot.com/gezgin/
|
2416
2895
|
category: Search bot
|
2417
|
-
-
|
2896
|
+
-
|
2418
2897
|
user_agent: TelegramBot (like TwitterBot)
|
2419
2898
|
bot:
|
2420
2899
|
name: TelegramBot
|
2421
2900
|
url: https://telegram.org/blog/bot-revolution
|
2422
|
-
-
|
2901
|
+
-
|
2902
|
+
user_agent: The Knowledge AI
|
2903
|
+
bot:
|
2904
|
+
name: The Knowledge AI
|
2905
|
+
category: Crawler
|
2906
|
+
-
|
2423
2907
|
user_agent: TinEye-bot/0.02 (see http://www.tineye.com/crawler.html)
|
2424
2908
|
bot:
|
2425
2909
|
name: TinEye Crawler
|
@@ -2428,7 +2912,7 @@
|
|
2428
2912
|
producer:
|
2429
2913
|
name: Idée Inc.
|
2430
2914
|
url: http://ideeinc.com
|
2431
|
-
-
|
2915
|
+
-
|
2432
2916
|
user_agent: Tiny Tiny RSS/1.10 (http://tt-rss.org/)
|
2433
2917
|
bot:
|
2434
2918
|
name: Tiny Tiny RSS
|
@@ -2437,7 +2921,7 @@
|
|
2437
2921
|
producer:
|
2438
2922
|
name: ""
|
2439
2923
|
url: ""
|
2440
|
-
-
|
2924
|
+
-
|
2441
2925
|
user_agent: Tiny Tiny RSS/1.11.4c63934 (http://tt-rss.org/)
|
2442
2926
|
bot:
|
2443
2927
|
name: Tiny Tiny RSS
|
@@ -2446,7 +2930,16 @@
|
|
2446
2930
|
producer:
|
2447
2931
|
name: ""
|
2448
2932
|
url: ""
|
2449
|
-
-
|
2933
|
+
-
|
2934
|
+
user_agent: Mozilla/5.0 (compatible; tracemyfile/1.0)
|
2935
|
+
bot:
|
2936
|
+
name: TraceMyFile
|
2937
|
+
category: Search bot
|
2938
|
+
url: https://www.tracemyfile.com/
|
2939
|
+
producer:
|
2940
|
+
name: Idee Inc.
|
2941
|
+
url: http://ideeinc.com/
|
2942
|
+
-
|
2450
2943
|
user_agent: Mozilla/5.0 (Windows; U; Windows NT 6.0; en-GB; rv:1.0; trendictionbot0.5.0; trendiction search; http://www.trendiction.de/bot; please let us know of any problems; web at trendiction.com) Gecko/20071127 Firefox/3.0.0.11
|
2451
2944
|
bot:
|
2452
2945
|
name: Trendiction Bot
|
@@ -2455,7 +2948,7 @@
|
|
2455
2948
|
producer:
|
2456
2949
|
name: Talkwalker Inc.
|
2457
2950
|
url: http://www.talkwalker.com
|
2458
|
-
-
|
2951
|
+
-
|
2459
2952
|
user_agent: TurnitinBot/3.0 (http://www.turnitin.com/robot/crawlerinfo.html)
|
2460
2953
|
bot:
|
2461
2954
|
name: TurnitinBot
|
@@ -2464,7 +2957,7 @@
|
|
2464
2957
|
producer:
|
2465
2958
|
name: iParadigms, LLC.
|
2466
2959
|
url: http://www.turnitin.com
|
2467
|
-
-
|
2960
|
+
-
|
2468
2961
|
user_agent: Mozilla/5.0 (compatible; TweetedTimes Bot/1.0; +http://tweetedtimes.com)
|
2469
2962
|
bot:
|
2470
2963
|
name: TweetedTimes Bot
|
@@ -2473,7 +2966,7 @@
|
|
2473
2966
|
producer:
|
2474
2967
|
name: TweetedTimes
|
2475
2968
|
url: http://tweetedtimes.com/
|
2476
|
-
-
|
2969
|
+
-
|
2477
2970
|
user_agent: TweetedTimes Bot/1.0 (Mozilla/5.0 Compatible, +http://tweetedtimes.com)
|
2478
2971
|
bot:
|
2479
2972
|
name: TweetedTimes Bot
|
@@ -2482,7 +2975,7 @@
|
|
2482
2975
|
producer:
|
2483
2976
|
name: TweetedTimes
|
2484
2977
|
url: http://tweetedtimes.com/
|
2485
|
-
-
|
2978
|
+
-
|
2486
2979
|
user_agent: Mozilla/5.0 (compatible; TweetmemeBot/3.0; +http://tweetmeme.com/)
|
2487
2980
|
bot:
|
2488
2981
|
name: Tweetmeme Bot
|
@@ -2491,7 +2984,15 @@
|
|
2491
2984
|
producer:
|
2492
2985
|
name: Mediasift
|
2493
2986
|
url: ""
|
2494
|
-
-
|
2987
|
+
-
|
2988
|
+
user_agent: Mozilla/5.0 (compatible; Twingly Recon; twingly.com)
|
2989
|
+
bot:
|
2990
|
+
name: Twingly Recon
|
2991
|
+
category: Crawler
|
2992
|
+
producer:
|
2993
|
+
name: Twingly
|
2994
|
+
url: https://www.twingly.com
|
2995
|
+
-
|
2495
2996
|
user_agent: Twitterbot/1.0
|
2496
2997
|
bot:
|
2497
2998
|
name: Twitterbot
|
@@ -2500,7 +3001,7 @@
|
|
2500
3001
|
producer:
|
2501
3002
|
name: Twitter
|
2502
3003
|
url: http://www.twitter.com
|
2503
|
-
-
|
3004
|
+
-
|
2504
3005
|
user_agent: Mozilla/5.0 (compatible; URLAppendBot/1.0; +http://www.profound.net/urlappendbot.html)
|
2505
3006
|
bot:
|
2506
3007
|
name: URLAppendBot
|
@@ -2509,7 +3010,7 @@
|
|
2509
3010
|
producer:
|
2510
3011
|
name: Profound Networks
|
2511
3012
|
url: http://www.profound.net
|
2512
|
-
-
|
3013
|
+
-
|
2513
3014
|
user_agent: 'Mozilla/5.0 (Windows NT 10.0) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/55.0.2883.87 Safari/537.36 (via secureurl.fwdcdn.com - mail.ukr.net proxy)'
|
2514
3015
|
bot:
|
2515
3016
|
name: UkrNet Mail Proxy
|
@@ -2518,7 +3019,7 @@
|
|
2518
3019
|
producer:
|
2519
3020
|
name: UkrNet Ltd
|
2520
3021
|
url: https://www.ukr.net/
|
2521
|
-
-
|
3022
|
+
-
|
2522
3023
|
user_agent: UniversalFeedParser/5.2.1 +https://code.google.com/p/feedparser/
|
2523
3024
|
bot:
|
2524
3025
|
name: UniversalFeedParser
|
@@ -2527,7 +3028,7 @@
|
|
2527
3028
|
producer:
|
2528
3029
|
name: Kurt McKee
|
2529
3030
|
url: https://github.com/kurtmckee
|
2530
|
-
-
|
3031
|
+
-
|
2531
3032
|
user_agent: Mozilla/5.0+(compatible; UptimeRobot/2.0; http://www.uptimerobot.com/)
|
2532
3033
|
bot:
|
2533
3034
|
name: Uptime Robot
|
@@ -2536,7 +3037,7 @@
|
|
2536
3037
|
producer:
|
2537
3038
|
name: Uptime Robot
|
2538
3039
|
url: http://uptimerobot.com
|
2539
|
-
-
|
3040
|
+
-
|
2540
3041
|
user_agent: Mozilla/5.0 (compatible; Uptimebot/1.0; +http://www.uptime.com/uptimebot)
|
2541
3042
|
bot:
|
2542
3043
|
name: Uptimebot
|
@@ -2545,7 +3046,7 @@
|
|
2545
3046
|
producer:
|
2546
3047
|
name: Uptime
|
2547
3048
|
url: https://uptime.com
|
2548
|
-
-
|
3049
|
+
-
|
2549
3050
|
user_agent: Mozilla/5.0 (compatible; vkShare; +http://vk.com/dev/Share)
|
2550
3051
|
bot:
|
2551
3052
|
name: VK Share Button
|
@@ -2554,7 +3055,7 @@
|
|
2554
3055
|
producer:
|
2555
3056
|
name: VK
|
2556
3057
|
url: http://vk.com/
|
2557
|
-
-
|
3058
|
+
-
|
2558
3059
|
user_agent: 'Mozilla/4.0 (compatible; Vagabondo/4.0; http://webagent.wise-guys.nl/; http://www.wise-guys.nl/)'
|
2559
3060
|
bot:
|
2560
3061
|
name: Vagabondo
|
@@ -2563,7 +3064,19 @@
|
|
2563
3064
|
producer:
|
2564
3065
|
name: WiseGuys
|
2565
3066
|
url: http://www.wise-guys.nl/
|
2566
|
-
-
|
3067
|
+
-
|
3068
|
+
user_agent: Mozilla/5.0 (compatible; VelenPublicWebCrawler/1.0; +https://velen.io)
|
3069
|
+
bot:
|
3070
|
+
name: Velen Public Web Crawler
|
3071
|
+
category: Crawler
|
3072
|
+
url: https://hunter.io/robot
|
3073
|
+
-
|
3074
|
+
user_agent: Vercelbot (+https://vercel.com)
|
3075
|
+
bot:
|
3076
|
+
name: Vercel Bot
|
3077
|
+
category: Service bot
|
3078
|
+
url: https://vercel.com
|
3079
|
+
-
|
2567
3080
|
user_agent: Mozilla/5.0 (compatible; VSMCrawler; http://www.visualsitemapper.com/crawler/)
|
2568
3081
|
bot:
|
2569
3082
|
name: Visual Site Mapper Crawler
|
@@ -2572,7 +3085,7 @@
|
|
2572
3085
|
producer:
|
2573
3086
|
name: Alentum Software Ltd.
|
2574
3087
|
url: http://www.alentum.com
|
2575
|
-
-
|
3088
|
+
-
|
2576
3089
|
user_agent: 'Jigsaw/2.3.0 W3C_CSS_Validator_JFouffa/2.0 (See <http://validator.w3.org/services>)'
|
2577
3090
|
bot:
|
2578
3091
|
name: W3C CSS Validator
|
@@ -2581,7 +3094,7 @@
|
|
2581
3094
|
producer:
|
2582
3095
|
name: W3C
|
2583
3096
|
url: http://www.w3.org
|
2584
|
-
-
|
3097
|
+
-
|
2585
3098
|
user_agent: W3C_I18n-Checker/1.0 (http://validator.w3.org/services)
|
2586
3099
|
bot:
|
2587
3100
|
name: W3C I18N Checker
|
@@ -2590,7 +3103,7 @@
|
|
2590
3103
|
producer:
|
2591
3104
|
name: W3C
|
2592
3105
|
url: http://www.w3.org
|
2593
|
-
-
|
3106
|
+
-
|
2594
3107
|
user_agent: 'W3C-checklink/4.0 [4.4] libwww-perl/5.803'
|
2595
3108
|
bot:
|
2596
3109
|
name: W3C Link Checker
|
@@ -2599,7 +3112,7 @@
|
|
2599
3112
|
producer:
|
2600
3113
|
name: W3C
|
2601
3114
|
url: http://www.w3.org
|
2602
|
-
-
|
3115
|
+
-
|
2603
3116
|
user_agent: W3C-checklink/4.81 libwww-perl/5.836
|
2604
3117
|
bot:
|
2605
3118
|
name: W3C Link Checker
|
@@ -2608,7 +3121,7 @@
|
|
2608
3121
|
producer:
|
2609
3122
|
name: W3C
|
2610
3123
|
url: http://www.w3.org
|
2611
|
-
-
|
3124
|
+
-
|
2612
3125
|
user_agent: Validator.nu/LV http://validator.w3.org/services
|
2613
3126
|
bot:
|
2614
3127
|
name: W3C Markup Validation Service
|
@@ -2617,7 +3130,7 @@
|
|
2617
3130
|
producer:
|
2618
3131
|
name: W3C
|
2619
3132
|
url: http://www.w3.org
|
2620
|
-
-
|
3133
|
+
-
|
2621
3134
|
user_agent: W3C_Validator/1.3 http://validator.w3.org/services
|
2622
3135
|
bot:
|
2623
3136
|
name: W3C Markup Validation Service
|
@@ -2626,7 +3139,7 @@
|
|
2626
3139
|
producer:
|
2627
3140
|
name: W3C
|
2628
3141
|
url: http://www.w3.org
|
2629
|
-
-
|
3142
|
+
-
|
2630
3143
|
user_agent: W3C_Validator/1.767
|
2631
3144
|
bot:
|
2632
3145
|
name: W3C Markup Validation Service
|
@@ -2635,7 +3148,7 @@
|
|
2635
3148
|
producer:
|
2636
3149
|
name: W3C
|
2637
3150
|
url: http://www.w3.org
|
2638
|
-
-
|
3151
|
+
-
|
2639
3152
|
user_agent: W3C-mobileOK/DDC-1.0 (see http://www.w3.org/2006/07/mobileok-ddc)
|
2640
3153
|
bot:
|
2641
3154
|
name: W3C MobileOK Checker
|
@@ -2644,7 +3157,7 @@
|
|
2644
3157
|
producer:
|
2645
3158
|
name: W3C
|
2646
3159
|
url: http://www.w3.org
|
2647
|
-
-
|
3160
|
+
-
|
2648
3161
|
user_agent: W3C_Unicorn/1.0 (http://validator.w3.org/services)
|
2649
3162
|
bot:
|
2650
3163
|
name: W3C Unified Validator
|
@@ -2653,7 +3166,7 @@
|
|
2653
3166
|
producer:
|
2654
3167
|
name: W3C
|
2655
3168
|
url: http://www.w3.org
|
2656
|
-
-
|
3169
|
+
-
|
2657
3170
|
user_agent: Mozilla/5.0 (compatible; Wappalyzer; +https://github.com/AliasIO/Wappalyzer)
|
2658
3171
|
bot:
|
2659
3172
|
name: Wappalyzer
|
@@ -2661,7 +3174,7 @@
|
|
2661
3174
|
producer:
|
2662
3175
|
name: AliasIO
|
2663
3176
|
url: https://github.com/AliasIO
|
2664
|
-
-
|
3177
|
+
-
|
2665
3178
|
user_agent: WeSEE:Search/0.1 (Alpha, http://www.wesee.com/en/support/bot/)
|
2666
3179
|
bot:
|
2667
3180
|
name: WeSEE:Search
|
@@ -2670,13 +3183,13 @@
|
|
2670
3183
|
producer:
|
2671
3184
|
name: WeSEE Ltd
|
2672
3185
|
url: http://www.wesee.com
|
2673
|
-
-
|
3186
|
+
-
|
2674
3187
|
user_agent: Mozilla/5.0 (Linux; Android 6.0.1; Moto G (4) Build/MPJ24.139-64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/65.0.3325.146 Mobile Safari/537.36 PTST/180829.190838
|
2675
3188
|
bot:
|
2676
3189
|
name: WebPageTest
|
2677
3190
|
category: Site Monitor
|
2678
3191
|
url: https://www.webpagetest.org
|
2679
|
-
-
|
3192
|
+
-
|
2680
3193
|
user_agent: websitepulse checker/1.1 (compatible; MSIE 5.5; Netscape 4.75; Linux)
|
2681
3194
|
bot:
|
2682
3195
|
name: WebSitePulse
|
@@ -2685,7 +3198,7 @@
|
|
2685
3198
|
producer:
|
2686
3199
|
name: WebSitePulse
|
2687
3200
|
url: http://www.websitepulse.com/
|
2688
|
-
-
|
3201
|
+
-
|
2689
3202
|
user_agent: WebbCrawler 1.0 ( http://badcheese.com/crawler.html )
|
2690
3203
|
bot:
|
2691
3204
|
name: WebbCrawler
|
@@ -2694,16 +3207,52 @@
|
|
2694
3207
|
producer:
|
2695
3208
|
name: Steve Webb
|
2696
3209
|
url: http://badcheese.com
|
2697
|
-
-
|
2698
|
-
user_agent:
|
3210
|
+
-
|
3211
|
+
user_agent: weborama-fetcher (+http://www.weborama.com)
|
2699
3212
|
bot:
|
2700
|
-
name:
|
2701
|
-
category:
|
3213
|
+
name: Weborama
|
3214
|
+
category: Search bot
|
3215
|
+
url: https://weborama.com/
|
3216
|
+
producer:
|
3217
|
+
name: Weborama SA
|
3218
|
+
url: https://weborama.com/
|
3219
|
+
-
|
3220
|
+
user_agent: WikiDo/1.1 (http://wikido.com; crawler@wikido.com)
|
3221
|
+
bot:
|
3222
|
+
name: WikiDo
|
3223
|
+
category: Search bot
|
3224
|
+
url: https://www.wikido.com/
|
3225
|
+
producer:
|
3226
|
+
name: Fotolitografie Fiorentine di Becchi Antonio s.n.c.
|
3227
|
+
url: https://www.wikido.com/
|
3228
|
+
-
|
3229
|
+
user_agent: Mozilla/5.0 (compatible; woorankreview/2.0; +https://www.woorank.com/)
|
3230
|
+
bot:
|
3231
|
+
name: WooRank
|
3232
|
+
category: Search bot
|
3233
|
+
url: https://www.woorank.com/
|
3234
|
+
producer:
|
3235
|
+
name: WooRank sprl
|
3236
|
+
url: https://www.woorank.com/
|
3237
|
+
-
|
3238
|
+
user_agent: Mozilla/5.0 (iPhone; CPU iPhone OS 11_0 like Mac OS X) AppleWebKit/604.1.38 (KHTML, like Gecko) Version/11.0 Mobile/15A372 Safari/604.1 (compatible; woorankreview/2.0; +https://www.woorank.com/)
|
3239
|
+
bot:
|
3240
|
+
name: WooRank
|
3241
|
+
category: Search bot
|
3242
|
+
url: https://www.woorank.com/
|
3243
|
+
producer:
|
3244
|
+
name: WooRank sprl
|
3245
|
+
url: https://www.woorank.com/
|
3246
|
+
-
|
3247
|
+
user_agent: WordPress/4.7.2; https://example.com
|
3248
|
+
bot:
|
3249
|
+
name: WordPress
|
3250
|
+
category: Service Agent
|
2702
3251
|
url: https://wordpress.org/
|
2703
3252
|
producer:
|
2704
3253
|
name: Wordpress.org
|
2705
3254
|
url: https://wordpress.org/
|
2706
|
-
-
|
3255
|
+
-
|
2707
3256
|
user_agent: Wotbox/2.01 (+http://www.wotbox.com/bot/)
|
2708
3257
|
bot:
|
2709
3258
|
name: Wotbox
|
@@ -2712,7 +3261,16 @@
|
|
2712
3261
|
producer:
|
2713
3262
|
name: Wotbox
|
2714
3263
|
url: http://www.wotbox.com
|
2715
|
-
-
|
3264
|
+
-
|
3265
|
+
user_agent: XenForo/2.x (https://www.example.com)
|
3266
|
+
bot:
|
3267
|
+
name: XenForo
|
3268
|
+
category: Service Agent
|
3269
|
+
url: https://xenforo.com/
|
3270
|
+
producer:
|
3271
|
+
name: XenForo Ltd.
|
3272
|
+
url: https://xenforo.com/
|
3273
|
+
-
|
2716
3274
|
user_agent: yacybot (freeworld/global; amd64 Linux 3.2.0-4-amd64; java 1.7.0_25; Europe/en) http://yacy.net/bot.html
|
2717
3275
|
bot:
|
2718
3276
|
name: YaCy
|
@@ -2721,7 +3279,7 @@
|
|
2721
3279
|
producer:
|
2722
3280
|
name: YaCy
|
2723
3281
|
url: http://yacy.net
|
2724
|
-
-
|
3282
|
+
-
|
2725
3283
|
user_agent: yacybot (freeworld/global; x86 Windows XP 5.1; java 1.7.0_21; GMT+04:00/ru) http://yacy.net/bot.html
|
2726
3284
|
bot:
|
2727
3285
|
name: YaCy
|
@@ -2730,7 +3288,7 @@
|
|
2730
3288
|
producer:
|
2731
3289
|
name: YaCy
|
2732
3290
|
url: http://yacy.net
|
2733
|
-
-
|
3291
|
+
-
|
2734
3292
|
user_agent: Mozilla/5.0 (compatible; Yahoo Ad monitoring; https://help.yahoo.com/kb/yahoo-ad-monitoring-SLN24857.html)
|
2735
3293
|
bot:
|
2736
3294
|
name: Yahoo Gemini
|
@@ -2739,7 +3297,16 @@
|
|
2739
3297
|
producer:
|
2740
3298
|
name: Yahoo! Inc.
|
2741
3299
|
url: http://www.yahoo.com
|
2742
|
-
-
|
3300
|
+
-
|
3301
|
+
user_agent: Y!J-BRW/1.0 (https://www.yahoo-help.jp/app/answers/detail/p/595/a_id/42716)
|
3302
|
+
bot:
|
3303
|
+
name: Yahoo! Japan BRW
|
3304
|
+
category: Crawler
|
3305
|
+
url: https://www.yahoo-help.jp/app/answers/detail/p/595/a_id/42716/~/ウェブページにアクセスするシステムのユーザーエージェントについて
|
3306
|
+
producer:
|
3307
|
+
name: Yahoo! Japan Corp.
|
3308
|
+
url: https://www.yahoo.co.jp/
|
3309
|
+
-
|
2743
3310
|
user_agent: Mozilla/5.0 (compatible; Yahoo Link Preview; https://help.yahoo.com/kb/mail/yahoo-link-preview-SLN23615.html)
|
2744
3311
|
bot:
|
2745
3312
|
name: Yahoo! Link Preview
|
@@ -2748,7 +3315,7 @@
|
|
2748
3315
|
producer:
|
2749
3316
|
name: Yahoo! Inc.
|
2750
3317
|
url: http://www.yahoo.com
|
2751
|
-
-
|
3318
|
+
-
|
2752
3319
|
user_agent: Yahoo:LinkExpander:Slingstone
|
2753
3320
|
bot:
|
2754
3321
|
name: Yahoo! Link Preview
|
@@ -2757,7 +3324,7 @@
|
|
2757
3324
|
producer:
|
2758
3325
|
name: Yahoo! Inc.
|
2759
3326
|
url: http://www.yahoo.com
|
2760
|
-
-
|
3327
|
+
-
|
2761
3328
|
user_agent: Mozilla/5.0 (compatible; Yahoo! Slurp/3.0; http://help.yahoo.com/help/us/ysearch/slurp) NOT Firefox/3.5
|
2762
3329
|
bot:
|
2763
3330
|
name: Yahoo! Slurp
|
@@ -2766,7 +3333,7 @@
|
|
2766
3333
|
producer:
|
2767
3334
|
name: Yahoo! Inc.
|
2768
3335
|
url: http://www.yahoo.com
|
2769
|
-
-
|
3336
|
+
-
|
2770
3337
|
user_agent: Mozilla/5.0 (compatible; Yahoo! Slurp; http://help.yahoo.com/help/us/ysearch/slurp)
|
2771
3338
|
bot:
|
2772
3339
|
name: Yahoo! Slurp
|
@@ -2775,7 +3342,7 @@
|
|
2775
3342
|
producer:
|
2776
3343
|
name: Yahoo! Inc.
|
2777
3344
|
url: http://www.yahoo.com
|
2778
|
-
-
|
3345
|
+
-
|
2779
3346
|
user_agent: Mozilla/5.0 (compatible; Linux i686; Yandex.Gazeta Bot/1.0; +http://gazeta.yandex.ru)
|
2780
3347
|
bot:
|
2781
3348
|
name: Yandex Bot
|
@@ -2784,7 +3351,7 @@
|
|
2784
3351
|
producer:
|
2785
3352
|
name: Yandex LLC
|
2786
3353
|
url: http://company.yandex.com
|
2787
|
-
-
|
3354
|
+
-
|
2788
3355
|
user_agent: Mozilla/5.0 (compatible; YaDirectFetcher/1.0; +http://yandex.com/bots)
|
2789
3356
|
bot:
|
2790
3357
|
name: Yandex Bot
|
@@ -2793,7 +3360,7 @@
|
|
2793
3360
|
producer:
|
2794
3361
|
name: Yandex LLC
|
2795
3362
|
url: http://company.yandex.com
|
2796
|
-
-
|
3363
|
+
-
|
2797
3364
|
user_agent: Mozilla/5.0 (compatible; YandexAntivirus/2.0; +http://yandex.com/bots)
|
2798
3365
|
bot:
|
2799
3366
|
name: Yandex Bot
|
@@ -2802,7 +3369,7 @@
|
|
2802
3369
|
producer:
|
2803
3370
|
name: Yandex LLC
|
2804
3371
|
url: http://company.yandex.com
|
2805
|
-
-
|
3372
|
+
-
|
2806
3373
|
user_agent: Mozilla/5.0 (compatible; YandexAntivirus/2.0; +http://yandex.com/bots)
|
2807
3374
|
bot:
|
2808
3375
|
name: Yandex Bot
|
@@ -2811,7 +3378,7 @@
|
|
2811
3378
|
producer:
|
2812
3379
|
name: Yandex LLC
|
2813
3380
|
url: http://company.yandex.com
|
2814
|
-
-
|
3381
|
+
-
|
2815
3382
|
user_agent: Mozilla/5.0 (compatible; YandexBlogs/0.99; robot; B; +http://yandex.com/bots)
|
2816
3383
|
bot:
|
2817
3384
|
name: Yandex Bot
|
@@ -2820,7 +3387,7 @@
|
|
2820
3387
|
producer:
|
2821
3388
|
name: Yandex LLC
|
2822
3389
|
url: http://company.yandex.com
|
2823
|
-
-
|
3390
|
+
-
|
2824
3391
|
user_agent: Mozilla/5.0 (compatible; YandexBlogs/0.99; robot; B; +http://yandex.com/bots)
|
2825
3392
|
bot:
|
2826
3393
|
name: Yandex Bot
|
@@ -2829,7 +3396,7 @@
|
|
2829
3396
|
producer:
|
2830
3397
|
name: Yandex LLC
|
2831
3398
|
url: http://company.yandex.com
|
2832
|
-
-
|
3399
|
+
-
|
2833
3400
|
user_agent: Mozilla/5.0 (compatible; YandexBot/3.0; +http://yandex.com/bots)
|
2834
3401
|
bot:
|
2835
3402
|
name: Yandex Bot
|
@@ -2838,7 +3405,7 @@
|
|
2838
3405
|
producer:
|
2839
3406
|
name: Yandex LLC
|
2840
3407
|
url: http://company.yandex.com
|
2841
|
-
-
|
3408
|
+
-
|
2842
3409
|
user_agent: Mozilla/5.0 (compatible; YandexDirect/3.0; +http://yandex.com/bots)
|
2843
3410
|
bot:
|
2844
3411
|
name: Yandex Bot
|
@@ -2847,7 +3414,7 @@
|
|
2847
3414
|
producer:
|
2848
3415
|
name: Yandex LLC
|
2849
3416
|
url: http://company.yandex.com
|
2850
|
-
-
|
3417
|
+
-
|
2851
3418
|
user_agent: Mozilla/5.0 (compatible; YandexFavicons/1.0; +http://yandex.com/bots)
|
2852
3419
|
bot:
|
2853
3420
|
name: Yandex Bot
|
@@ -2856,7 +3423,7 @@
|
|
2856
3423
|
producer:
|
2857
3424
|
name: Yandex LLC
|
2858
3425
|
url: http://company.yandex.com
|
2859
|
-
-
|
3426
|
+
-
|
2860
3427
|
user_agent: Mozilla/5.0 (compatible; YandexImageResizer/2.0; +http://yandex.com/bots)
|
2861
3428
|
bot:
|
2862
3429
|
name: Yandex Bot
|
@@ -2865,7 +3432,7 @@
|
|
2865
3432
|
producer:
|
2866
3433
|
name: Yandex LLC
|
2867
3434
|
url: http://company.yandex.com
|
2868
|
-
-
|
3435
|
+
-
|
2869
3436
|
user_agent: Mozilla/5.0 (compatible; YandexImages/3.0; +http://yandex.com/bots)
|
2870
3437
|
bot:
|
2871
3438
|
name: Yandex Bot
|
@@ -2874,7 +3441,7 @@
|
|
2874
3441
|
producer:
|
2875
3442
|
name: Yandex LLC
|
2876
3443
|
url: http://company.yandex.com
|
2877
|
-
-
|
3444
|
+
-
|
2878
3445
|
user_agent: Mozilla/5.0 (compatible; YandexMetrika/2.0; +http://yandex.com/bots)
|
2879
3446
|
bot:
|
2880
3447
|
name: Yandex Bot
|
@@ -2883,7 +3450,16 @@
|
|
2883
3450
|
producer:
|
2884
3451
|
name: Yandex LLC
|
2885
3452
|
url: http://company.yandex.com
|
2886
|
-
-
|
3453
|
+
-
|
3454
|
+
user_agent: Mozilla/5.0 (compatible; YandexMobileScreenShotBot/1.0; +http://yandex.com/bots)
|
3455
|
+
bot:
|
3456
|
+
name: Yandex Bot
|
3457
|
+
category: Search bot
|
3458
|
+
url: http://www.yandex.com/bots
|
3459
|
+
producer:
|
3460
|
+
name: Yandex LLC
|
3461
|
+
url: http://company.yandex.com
|
3462
|
+
-
|
2887
3463
|
user_agent: Mozilla/5.0 (compatible; YandexNews/3.0; +http://yandex.com/bots)
|
2888
3464
|
bot:
|
2889
3465
|
name: Yandex Bot
|
@@ -2892,7 +3468,7 @@
|
|
2892
3468
|
producer:
|
2893
3469
|
name: Yandex LLC
|
2894
3470
|
url: http://company.yandex.com
|
2895
|
-
-
|
3471
|
+
-
|
2896
3472
|
user_agent: Mozilla/5.0 (compatible; YandexNewslinks; +http://yandex.com/bots)
|
2897
3473
|
bot:
|
2898
3474
|
name: Yandex Bot
|
@@ -2901,7 +3477,70 @@
|
|
2901
3477
|
producer:
|
2902
3478
|
name: Yandex LLC
|
2903
3479
|
url: http://company.yandex.com
|
2904
|
-
-
|
3480
|
+
-
|
3481
|
+
user_agent: Mozilla/5.0 (compatible; YandexOntoDB/1.0; +http://yandex.com/bots)
|
3482
|
+
bot:
|
3483
|
+
name: Yandex Bot
|
3484
|
+
category: Search bot
|
3485
|
+
url: http://www.yandex.com/bots
|
3486
|
+
producer:
|
3487
|
+
name: Yandex LLC
|
3488
|
+
url: http://company.yandex.com
|
3489
|
+
-
|
3490
|
+
user_agent: Mozilla/5.0 (compatible; YandexOntoDBAPI/1.0; +http://yandex.com/bots)
|
3491
|
+
bot:
|
3492
|
+
name: Yandex Bot
|
3493
|
+
category: Search bot
|
3494
|
+
url: http://www.yandex.com/bots
|
3495
|
+
producer:
|
3496
|
+
name: Yandex LLC
|
3497
|
+
url: http://company.yandex.com
|
3498
|
+
-
|
3499
|
+
user_agent: Mozilla/5.0 (compatible; YandexPartner/3.0; +http://yandex.com/bots)
|
3500
|
+
bot:
|
3501
|
+
name: Yandex Bot
|
3502
|
+
category: Search bot
|
3503
|
+
url: http://www.yandex.com/bots
|
3504
|
+
producer:
|
3505
|
+
name: Yandex LLC
|
3506
|
+
url: http://company.yandex.com
|
3507
|
+
-
|
3508
|
+
user_agent: Mozilla/5.0 (compatible; YandexRCA/1.0; +http://yandex.com/bots)
|
3509
|
+
bot:
|
3510
|
+
name: Yandex Bot
|
3511
|
+
category: Search bot
|
3512
|
+
url: http://www.yandex.com/bots
|
3513
|
+
producer:
|
3514
|
+
name: Yandex LLC
|
3515
|
+
url: http://company.yandex.com
|
3516
|
+
-
|
3517
|
+
user_agent: Mozilla/5.0 (compatible; YandexSearchShop/1.0; +http://yandex.com/bots)
|
3518
|
+
bot:
|
3519
|
+
name: Yandex Bot
|
3520
|
+
category: Search bot
|
3521
|
+
url: http://www.yandex.com/bots
|
3522
|
+
producer:
|
3523
|
+
name: Yandex LLC
|
3524
|
+
url: http://company.yandex.com
|
3525
|
+
-
|
3526
|
+
user_agent: Mozilla/5.0 (compatible; YandexTracker/1.0; +http://yandex.com/bots)
|
3527
|
+
bot:
|
3528
|
+
name: Yandex Bot
|
3529
|
+
category: Search bot
|
3530
|
+
url: http://www.yandex.com/bots
|
3531
|
+
producer:
|
3532
|
+
name: Yandex LLC
|
3533
|
+
url: http://company.yandex.com
|
3534
|
+
-
|
3535
|
+
user_agent: Mozilla/5.0 (compatible; YandexTurbo/1.0; +http://yandex.com/bots)
|
3536
|
+
bot:
|
3537
|
+
name: Yandex Bot
|
3538
|
+
category: Search bot
|
3539
|
+
url: http://www.yandex.com/bots
|
3540
|
+
producer:
|
3541
|
+
name: Yandex LLC
|
3542
|
+
url: http://company.yandex.com
|
3543
|
+
-
|
2905
3544
|
user_agent: Mozilla/5.0 (compatible; YandexVerticals/1.0; http://yandex.com/bots)
|
2906
3545
|
bot:
|
2907
3546
|
name: Yandex Bot
|
@@ -2910,7 +3549,16 @@
|
|
2910
3549
|
producer:
|
2911
3550
|
name: Yandex LLC
|
2912
3551
|
url: http://company.yandex.com
|
2913
|
-
-
|
3552
|
+
-
|
3553
|
+
user_agent: Mozilla/5.0 (compatible; NaverJapan/1.0; +http://corp.naver.jp/)
|
3554
|
+
bot:
|
3555
|
+
name: Yeti/Naverbot
|
3556
|
+
category: Search bot
|
3557
|
+
url: http://help.naver.com/robots/
|
3558
|
+
producer:
|
3559
|
+
name: Naver
|
3560
|
+
url: http://www.naver.com
|
3561
|
+
-
|
2914
3562
|
user_agent: Yeti/1.1 (Naver Corp.; http://help.naver.com/robots/)
|
2915
3563
|
bot:
|
2916
3564
|
name: Yeti/Naverbot
|
@@ -2919,7 +3567,7 @@
|
|
2919
3567
|
producer:
|
2920
3568
|
name: Naver
|
2921
3569
|
url: http://www.naver.com
|
2922
|
-
-
|
3570
|
+
-
|
2923
3571
|
user_agent: Mozilla/5.0 (compatible; YoudaoBot/1.0; http://www.youdao.com/help/webmaster/spider/; )
|
2924
3572
|
bot:
|
2925
3573
|
name: Youdao Bot
|
@@ -2928,13 +3576,13 @@
|
|
2928
3576
|
producer:
|
2929
3577
|
name: NetEase, Inc.
|
2930
3578
|
url: http://corp.163.com
|
2931
|
-
-
|
3579
|
+
-
|
2932
3580
|
user_agent: YOURLS v1.5.1 +http://yourls.org/ (running on http://fhort.com)
|
2933
3581
|
bot:
|
2934
3582
|
name: Yourls
|
2935
3583
|
category: Crawler
|
2936
3584
|
url: http://yourls.org
|
2937
|
-
-
|
3585
|
+
-
|
2938
3586
|
user_agent: Mozilla/5.0 (compatible; YRSpider; +http://www.yunrang.com/yrspider.html)
|
2939
3587
|
bot:
|
2940
3588
|
name: Yunyun Bot
|
@@ -2943,7 +3591,7 @@
|
|
2943
3591
|
producer:
|
2944
3592
|
name: YunYun
|
2945
3593
|
url: http://www.yunyun.com
|
2946
|
-
-
|
3594
|
+
-
|
2947
3595
|
user_agent: Mozilla/5.0 (compatible; YRSpider; +http://www.yunyun.com/SiteInfo.php?r=about)
|
2948
3596
|
bot:
|
2949
3597
|
name: Yunyun Bot
|
@@ -2952,7 +3600,7 @@
|
|
2952
3600
|
producer:
|
2953
3601
|
name: YunYun
|
2954
3602
|
url: http://www.yunyun.com
|
2955
|
-
-
|
3603
|
+
-
|
2956
3604
|
user_agent: Mozilla/5.0 (compatible; YYSpider; +http://www.yunyun.com/spider.html)
|
2957
3605
|
bot:
|
2958
3606
|
name: Yunyun Bot
|
@@ -2961,12 +3609,21 @@
|
|
2961
3609
|
producer:
|
2962
3610
|
name: YunYun
|
2963
3611
|
url: http://www.yunyun.com
|
2964
|
-
-
|
3612
|
+
-
|
2965
3613
|
user_agent: Zao/0.1 (http://www.kototol.org/zao)
|
2966
3614
|
bot:
|
2967
3615
|
name: Zao
|
2968
3616
|
category: Crawler
|
2969
|
-
-
|
3617
|
+
-
|
3618
|
+
user_agent: zelist.ro feed parser (+http://www.zelist.ro)
|
3619
|
+
bot:
|
3620
|
+
name: Ze List
|
3621
|
+
url: https://www.zelist.ro/
|
3622
|
+
category: Feed Fetcher
|
3623
|
+
producer:
|
3624
|
+
name: Treeworks SRL
|
3625
|
+
url: https://www.tree.ro/
|
3626
|
+
-
|
2970
3627
|
user_agent: Zookabot/2.5;++http://zookabot.com
|
2971
3628
|
bot:
|
2972
3629
|
name: Zookabot
|
@@ -2975,7 +3632,7 @@
|
|
2975
3632
|
producer:
|
2976
3633
|
name: Hwacha ApS
|
2977
3634
|
url: http://hwacha.dk
|
2978
|
-
-
|
3635
|
+
-
|
2979
3636
|
user_agent: Mozilla/5.0 (compatible; ZumBot/1.0; http://help.zum.com/inquiry)
|
2980
3637
|
bot:
|
2981
3638
|
name: ZumBot
|
@@ -2984,7 +3641,7 @@
|
|
2984
3641
|
producer:
|
2985
3642
|
name: ZUM internet
|
2986
3643
|
url: http://www.zuminternet.com/
|
2987
|
-
-
|
3644
|
+
-
|
2988
3645
|
user_agent: ZumBot/1.0 (ZUM Search; http://help.zum.com/inquiry)
|
2989
3646
|
bot:
|
2990
3647
|
name: ZumBot
|
@@ -2993,106 +3650,106 @@
|
|
2993
3650
|
producer:
|
2994
3651
|
name: ZUM internet
|
2995
3652
|
url: http://www.zuminternet.com/
|
2996
|
-
-
|
3653
|
+
-
|
2997
3654
|
user_agent: AhrefsBot.Feeds v0.1; http://ahrefs.com/
|
2998
3655
|
bot:
|
2999
3656
|
name: aHrefs Bot
|
3000
3657
|
category: Crawler
|
3001
|
-
url:
|
3658
|
+
url: https://ahrefs.com/robot
|
3002
3659
|
producer:
|
3003
3660
|
name: Ahrefs Pte Ltd
|
3004
|
-
url:
|
3005
|
-
-
|
3661
|
+
url: https://ahrefs.com/robot
|
3662
|
+
-
|
3006
3663
|
user_agent: Mozilla/5.0 (compatible; AhrefsBot/3.1; +http://ahrefs.com/robot/
|
3007
3664
|
bot:
|
3008
3665
|
name: aHrefs Bot
|
3009
3666
|
category: Crawler
|
3010
|
-
url:
|
3667
|
+
url: https://ahrefs.com/robot
|
3011
3668
|
producer:
|
3012
3669
|
name: Ahrefs Pte Ltd
|
3013
|
-
url:
|
3014
|
-
-
|
3670
|
+
url: https://ahrefs.com/robot
|
3671
|
+
-
|
3015
3672
|
user_agent: Mozilla/5.0 (compatible; AhrefsBot/5.0; +http://ahrefs.com/robot/)
|
3016
3673
|
bot:
|
3017
3674
|
name: aHrefs Bot
|
3018
3675
|
category: Crawler
|
3019
|
-
url:
|
3676
|
+
url: https://ahrefs.com/robot
|
3020
3677
|
producer:
|
3021
3678
|
name: Ahrefs Pte Ltd
|
3022
|
-
url:
|
3023
|
-
-
|
3679
|
+
url: https://ahrefs.com/robot
|
3680
|
+
-
|
3024
3681
|
user_agent: 'Mozilla/5.0 (compatible; AhrefsBot/5.0; +http://ahrefs.com/robot/) AppEngine-Google; (+http://code.google.com/appengine; appid: s~proxyfile1-hrd)'
|
3025
3682
|
bot:
|
3026
3683
|
name: aHrefs Bot
|
3027
3684
|
category: Crawler
|
3028
|
-
url:
|
3685
|
+
url: https://ahrefs.com/robot
|
3029
3686
|
producer:
|
3030
3687
|
name: Ahrefs Pte Ltd
|
3031
|
-
url:
|
3032
|
-
-
|
3688
|
+
url: https://ahrefs.com/robot
|
3689
|
+
-
|
3033
3690
|
user_agent: Mozilla/5.0 (compatible; archive.org_bot +http://www.archive.org/details/archive.org_bot)
|
3034
3691
|
bot:
|
3035
3692
|
name: archive.org bot
|
3036
3693
|
category: Crawler
|
3037
|
-
url:
|
3694
|
+
url: https://archive.org/details/archive.org_bot
|
3038
3695
|
producer:
|
3039
3696
|
name: The Internet Archive
|
3040
|
-
url:
|
3041
|
-
-
|
3697
|
+
url: https://archive.org
|
3698
|
+
-
|
3042
3699
|
user_agent: Mozilla/5.0 (compatible; archive.org_bot/3.3.0 +http://pandora.nla.gov.au/crawl.html)
|
3043
3700
|
bot:
|
3044
3701
|
name: archive.org bot
|
3045
3702
|
category: Crawler
|
3046
|
-
url:
|
3703
|
+
url: https://archive.org/details/archive.org_bot
|
3047
3704
|
producer:
|
3048
3705
|
name: The Internet Archive
|
3049
|
-
url:
|
3050
|
-
-
|
3706
|
+
url: https://archive.org
|
3707
|
+
-
|
3051
3708
|
user_agent: Mozilla/5.0 (compatible; archive.org_bot; Archive-It; +http://archive-it.org/files/site-owners.html)
|
3052
3709
|
bot:
|
3053
3710
|
name: archive.org bot
|
3054
3711
|
category: Crawler
|
3055
|
-
url:
|
3712
|
+
url: https://archive.org/details/archive.org_bot
|
3056
3713
|
producer:
|
3057
3714
|
name: The Internet Archive
|
3058
|
-
url:
|
3059
|
-
-
|
3715
|
+
url: https://archive.org
|
3716
|
+
-
|
3060
3717
|
user_agent: Mozilla/5.0 (compatible; archive.org_bot; Wayback Machine Live Record; +http://archive.org/details/archive.org_bot)
|
3061
3718
|
bot:
|
3062
3719
|
name: archive.org bot
|
3063
3720
|
category: Crawler
|
3064
|
-
url:
|
3721
|
+
url: https://archive.org/details/archive.org_bot
|
3065
3722
|
producer:
|
3066
3723
|
name: The Internet Archive
|
3067
|
-
url:
|
3068
|
-
-
|
3724
|
+
url: https://archive.org
|
3725
|
+
-
|
3069
3726
|
user_agent: Mozilla/5.0 (compatible; heritrix/3.1.2-SNAPSHOT-20131029-0036 +http://archive.org/details/archive.org_bot)
|
3070
3727
|
bot:
|
3071
3728
|
name: archive.org bot
|
3072
3729
|
category: Crawler
|
3073
|
-
url:
|
3730
|
+
url: https://archive.org/details/archive.org_bot
|
3074
3731
|
producer:
|
3075
3732
|
name: The Internet Archive
|
3076
|
-
url:
|
3077
|
-
-
|
3733
|
+
url: https://archive.org
|
3734
|
+
-
|
3078
3735
|
user_agent: Mozilla/5.0 (compatible; special_archiver/3.1.1 +http://www.archive.org/details/archive.org_bot)
|
3079
3736
|
bot:
|
3080
3737
|
name: archive.org bot
|
3081
3738
|
category: Crawler
|
3082
|
-
url:
|
3739
|
+
url: https://archive.org/details/archive.org_bot
|
3083
3740
|
producer:
|
3084
3741
|
name: The Internet Archive
|
3085
|
-
url:
|
3086
|
-
-
|
3742
|
+
url: https://archive.org
|
3743
|
+
-
|
3087
3744
|
user_agent: Mozilla/5.0 (compatible; special_archiver/3.2.0 +http://www.loc.gov/webarchiving/notice_to_webmasters.html)
|
3088
3745
|
bot:
|
3089
3746
|
name: archive.org bot
|
3090
3747
|
category: Crawler
|
3091
|
-
url:
|
3748
|
+
url: https://archive.org/details/archive.org_bot
|
3092
3749
|
producer:
|
3093
3750
|
name: The Internet Archive
|
3094
|
-
url:
|
3095
|
-
-
|
3751
|
+
url: https://archive.org
|
3752
|
+
-
|
3096
3753
|
user_agent: CCBot/2.0 (http://commoncrawl.org/faq/)
|
3097
3754
|
bot:
|
3098
3755
|
name: ccBot crawler
|
@@ -3101,7 +3758,24 @@
|
|
3101
3758
|
producer:
|
3102
3759
|
name: reddit inc.
|
3103
3760
|
url: http://www.reddit.com
|
3104
|
-
-
|
3761
|
+
-
|
3762
|
+
user_agent: Mozilla/5.0 eCairn-Grabber/1.0 (+http://ecairn.com/grabber)
|
3763
|
+
bot:
|
3764
|
+
name: eCairn-Grabber
|
3765
|
+
category: Crawler
|
3766
|
+
producer:
|
3767
|
+
name: eCairn
|
3768
|
+
url: https://ecairn.com
|
3769
|
+
-
|
3770
|
+
user_agent: eZ Publish Link Validator
|
3771
|
+
bot:
|
3772
|
+
name: eZ Publish Link Validator
|
3773
|
+
category: Crawler
|
3774
|
+
url: https://ez.no/
|
3775
|
+
producer:
|
3776
|
+
name: eZ Systems AS
|
3777
|
+
url: https://ez.no/
|
3778
|
+
-
|
3105
3779
|
user_agent: Mozilla/5.0 (compatible; evc-batch/2.0)
|
3106
3780
|
bot:
|
3107
3781
|
name: evc-batch
|
@@ -3110,7 +3784,13 @@
|
|
3110
3784
|
producer:
|
3111
3785
|
name: eVenture Capital Partners II, LLC
|
3112
3786
|
url: http://www.eventures.vc/
|
3113
|
-
-
|
3787
|
+
-
|
3788
|
+
user_agent: Mozilla/5.0 (compatible; inoreader.com; 2 subscribers)
|
3789
|
+
bot:
|
3790
|
+
name: inoreader
|
3791
|
+
category: Feed Reader
|
3792
|
+
url: https://www.inoreader.com
|
3793
|
+
-
|
3114
3794
|
user_agent: masscan/1.0 (https://github.com/robertdavidgraham/masscan)
|
3115
3795
|
bot:
|
3116
3796
|
name: masscan
|
@@ -3119,7 +3799,21 @@
|
|
3119
3799
|
producer:
|
3120
3800
|
name: Robert Graham
|
3121
3801
|
url: https://github.com/robertdavidgraham
|
3122
|
-
-
|
3802
|
+
-
|
3803
|
+
user_agent: 'Mozilla/5.0/Firefox/42.0 - nbertaupete95(at)gmail.com'
|
3804
|
+
bot:
|
3805
|
+
name: nbertaupete95
|
3806
|
+
category: Crawler
|
3807
|
+
-
|
3808
|
+
user_agent: Mozilla/5.0 (compatible; oBot/2.3.1; http://www.xforce-security.com/crawler/)
|
3809
|
+
bot:
|
3810
|
+
name: oBot
|
3811
|
+
category: Search bot
|
3812
|
+
url: https://www.xforce-security.com/crawler/
|
3813
|
+
producer:
|
3814
|
+
name: 'IBM Germany Research & Development GmbH'
|
3815
|
+
url: https://exchange.xforce.ibmcloud.com/
|
3816
|
+
-
|
3123
3817
|
user_agent: 'sqlmap/1.1.8.2#dev (http://sqlmap.org)'
|
3124
3818
|
bot:
|
3125
3819
|
name: sqlmap
|
@@ -3128,16 +3822,613 @@
|
|
3128
3822
|
producer:
|
3129
3823
|
name: sqlmap
|
3130
3824
|
url: http://sqlmap.org/
|
3131
|
-
-
|
3132
|
-
user_agent: Mozilla/5.0
|
3825
|
+
-
|
3826
|
+
user_agent: Mozilla/5.0 (compatible; theoldreader.com; 1 subscribers; feed-id=aaa)
|
3827
|
+
bot:
|
3828
|
+
name: theoldreader
|
3829
|
+
category: Feed Reader
|
3830
|
+
url: https://theoldreader.com
|
3831
|
+
-
|
3832
|
+
user_agent: Sprinklr 2.0
|
3133
3833
|
bot:
|
3134
|
-
name:
|
3834
|
+
name: Sprinklr
|
3835
|
+
category: Crawler
|
3836
|
+
url: ""
|
3837
|
+
producer:
|
3838
|
+
name: Sprinklr, Inc.
|
3839
|
+
url: https://www.sprinklr.com/
|
3840
|
+
-
|
3841
|
+
user_agent: Mozilla/5.0 (X11; Linux x86_64)AppleWebKit/537.36 (KHTML, like Gecko; Google-Ads-Qualify)Chrome/85.0.4183.140 Safari/537.36
|
3842
|
+
bot:
|
3843
|
+
name: Googlebot
|
3844
|
+
category: Search bot
|
3845
|
+
url: http://www.google.com/bot.html
|
3846
|
+
producer:
|
3847
|
+
name: Google Inc.
|
3848
|
+
url: http://www.google.com
|
3849
|
+
-
|
3850
|
+
user_agent: Mozilla/5.0 (Windows NT 10.0; Win64; x64; BDCbot/1.0; +http://bigweb.bigdatacorp.com.br/faq.aspx) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/69.0.3497.100 Safari/537.36
|
3851
|
+
bot:
|
3852
|
+
name: BDCbot
|
3853
|
+
category: Crawler
|
3854
|
+
url: https://bigweb.bigdatacorp.com.br/pages/faq.aspx
|
3855
|
+
producer:
|
3856
|
+
name: BIG Data Solucoes Em Tecnologia de Informatica LTDA
|
3857
|
+
url: https://bigdatacorp.com.br/
|
3858
|
+
-
|
3859
|
+
user_agent: Mozilla/5.0 (Macintosh; Intel Mac OS X 10_13_6) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/67.0.3396.99 Safari/537.36 CloudflareDiagnostics/1.0
|
3860
|
+
bot:
|
3861
|
+
name: Cloudflare Diagnostics
|
3862
|
+
category: Site Monitor
|
3863
|
+
url: https://www.cloudflare.com/
|
3864
|
+
producer:
|
3865
|
+
name: Cloudflare
|
3866
|
+
url: https://www.cloudflare.com
|
3867
|
+
-
|
3868
|
+
user_agent: Mozilla/5.0 (iPhone; CPU iPhone OS 12_0 like Mac OS X) adbeat.com/policy AppleWebKit/605.1.15 (KHTML, like Gecko) CriOS/69.0.3497.105 Mobile/15E148 Safari/605.1
|
3869
|
+
bot:
|
3870
|
+
name: Adbeat
|
3871
|
+
category: Crawler
|
3872
|
+
url: https://www.adbeat.com/operation_policy
|
3873
|
+
producer:
|
3874
|
+
name: PPC Labs LLC
|
3875
|
+
url: https://www.adbeat.com/
|
3876
|
+
-
|
3877
|
+
user_agent: Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko; compatible; BW/1.1; bit.ly/2W6Px8S) Chrome/84.0.4147.105 Safari/537.36
|
3878
|
+
bot:
|
3879
|
+
name: BuiltWith
|
3880
|
+
category: Crawler
|
3881
|
+
url: https://builtwith.com/biup
|
3882
|
+
producer:
|
3883
|
+
name: BuiltWith Pty Ltd
|
3884
|
+
url: https://builtwith.com/
|
3885
|
+
-
|
3886
|
+
user_agent: Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/60.0.3112.113 Safari/537.36 (+https://whatis.contentkingapp.com)
|
3887
|
+
bot:
|
3888
|
+
name: ContentKing
|
3889
|
+
category: Site Monitor
|
3890
|
+
url: https://whatis.contentkingapp.com/
|
3891
|
+
producer:
|
3892
|
+
name: ContentKing BV
|
3893
|
+
url: https://www.contentkingapp.com/
|
3894
|
+
-
|
3895
|
+
user_agent: Mozilla/5.0 (Windows NT 6.1; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/84.0.4147.89 Safari/537.36 MicroAdBot/1.1 (https://www.microad.co.jp/contact/)
|
3896
|
+
bot:
|
3897
|
+
name: MicroAdBot
|
3898
|
+
category: Crawler
|
3899
|
+
url: https://www.microad.co.jp/
|
3900
|
+
producer:
|
3901
|
+
name: MicroAd, Inc.
|
3902
|
+
url: https://www.microad.co.jp/
|
3903
|
+
-
|
3904
|
+
user_agent: Mozilla/5.0 (compatible; PingAdmin.Ru/1.2; +http://pingadmin.ru/free_test/)
|
3905
|
+
bot:
|
3906
|
+
name: PingAdmin.Ru
|
3907
|
+
category: Site Monitor
|
3908
|
+
url: https://ping-admin.ru/
|
3909
|
+
-
|
3910
|
+
user_agent: Mozilla/5.0 (compatible; WebDataStats/1.0 ; +https://webdatastats.com/policy.html)
|
3911
|
+
bot:
|
3912
|
+
name: WebDataStats
|
3913
|
+
category: Crawler
|
3914
|
+
url: https://webdatastats.com/policy.html
|
3915
|
+
producer:
|
3916
|
+
name: WebTehRazrabotka LLC
|
3917
|
+
url: https://webdatastats.com/
|
3918
|
+
-
|
3919
|
+
user_agent: Mozilla/5.0 (compatible; parse.ly scraper/0.14; +http://parsely.com)
|
3920
|
+
bot:
|
3921
|
+
name: parse.ly
|
3922
|
+
category: Crawler
|
3923
|
+
url: https://www.parse.ly/help/integration/crawler
|
3924
|
+
producer:
|
3925
|
+
name: Parsely, Inc.
|
3926
|
+
url: https://www.parse.ly/
|
3927
|
+
-
|
3928
|
+
user_agent: Mozilla/5.0 (compatible; Nimbostratus-Bot/v1.3.2; http://cloudsystemnetworks.com)
|
3929
|
+
bot:
|
3930
|
+
name: Nimbostratus Bot
|
3931
|
+
category: Site Monitor
|
3932
|
+
url: http://cloudsystemnetworks.com
|
3933
|
+
-
|
3934
|
+
user_agent: Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.9.2.17) Gecko/20110515 HeartRails_Capture/1.0.4 (+http://capture.heartrails.com/) Namoroka/3.6.17
|
3935
|
+
bot:
|
3936
|
+
name: Heart Rails Capture
|
3937
|
+
category: Service Agent
|
3938
|
+
url: http://capture.heartrails.com
|
3939
|
+
-
|
3940
|
+
user_agent: Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/43.0.2357.134 Safari/537.36 http://notifyninja.com/monitoring
|
3941
|
+
bot:
|
3942
|
+
name: Notify Ninja
|
3943
|
+
category: Site Monitor
|
3944
|
+
url: http://notifyninja.com
|
3945
|
+
-
|
3946
|
+
user_agent: Mozilla/5.0 (Macintosh; Intel Mac OS X 10_14_6) Project-Resonance (http://project-resonance.com/) (KHTML, like Gecko) Chrome/83.0.4103.61 Safari/537.36
|
3947
|
+
bot:
|
3948
|
+
name: Project Resonance
|
3949
|
+
category: Crawler
|
3950
|
+
url: http://project-resonance.com
|
3951
|
+
-
|
3952
|
+
user_agent: Mozilla/5.0 (compatible; DataXu/1.0; +http://dataxu.com)
|
3953
|
+
bot:
|
3954
|
+
name: DataXu
|
3955
|
+
category: Service Agent
|
3956
|
+
url: https://advertising.roku.com/dataxu
|
3957
|
+
producer:
|
3958
|
+
name: Roku, Inc.
|
3959
|
+
url: https://roku.com
|
3960
|
+
-
|
3961
|
+
user_agent: Mozilla/5.0 (Unknown; Linux x86_64) AppleWebKit/534.34 (KHTML, like Gecko) PingdomTMS/0.8.5 Safari/534.34
|
3962
|
+
bot:
|
3963
|
+
name: Pingdom Bot
|
3964
|
+
category: Site Monitor
|
3965
|
+
url: ""
|
3966
|
+
producer:
|
3967
|
+
name: Pingdom AB
|
3968
|
+
url: https://www.pingdom.com
|
3969
|
+
-
|
3970
|
+
user_agent: Mozilla/5.0 (compatible; Cocolyzebot/1.0; https://cocolyze.com/bot)
|
3971
|
+
bot:
|
3972
|
+
name: Cocolyzebot
|
3973
|
+
category: Crawler
|
3974
|
+
url: https://cocolyze.com/en/cocolyzebot
|
3975
|
+
producer:
|
3976
|
+
name: VSI INNOVATION SAS
|
3977
|
+
url: https://vsi-innovation.com/
|
3978
|
+
-
|
3979
|
+
user_agent: veryhip (http://veryhip.com/)
|
3980
|
+
bot:
|
3981
|
+
name: VeryHip
|
3982
|
+
category: Crawler
|
3983
|
+
url: https://veryhip.com/
|
3984
|
+
producer:
|
3985
|
+
name: VeryHip
|
3986
|
+
url: https://veryhip.com/
|
3987
|
+
-
|
3988
|
+
user_agent: Mozilla/5.0 (compatible; LinkpadBot/2.3; +http://linkpad.org/robot/)
|
3989
|
+
bot:
|
3990
|
+
name: LinkpadBot
|
3991
|
+
category: Crawler
|
3992
|
+
url: https://www.linkpad.org/
|
3993
|
+
producer:
|
3994
|
+
name: Solomono LLC
|
3995
|
+
url: https://www.linkpad.org/
|
3996
|
+
-
|
3997
|
+
user_agent: Mozilla/4.0 (compatible; MuscatFerret/1.7; http://www.webtop.com/)
|
3998
|
+
bot:
|
3999
|
+
name: MuscatFerret
|
4000
|
+
category: Crawler
|
4001
|
+
url: http://www.webtop.com/
|
4002
|
+
-
|
4003
|
+
user_agent: Quora-Bot/1.0 (http://www.quora.com)
|
4004
|
+
bot:
|
4005
|
+
name: Quora Bot
|
4006
|
+
category: Crawler
|
4007
|
+
url: ""
|
4008
|
+
producer:
|
4009
|
+
name: Quora
|
4010
|
+
url: https://www.quora.com/
|
4011
|
+
-
|
4012
|
+
user_agent: PageThing.com
|
4013
|
+
bot:
|
4014
|
+
name: PageThing
|
4015
|
+
category: Crawler
|
4016
|
+
url: https://www.pagething.com/
|
4017
|
+
producer:
|
4018
|
+
name: SPECIALNOISE LTD
|
4019
|
+
url: https://www.specialnoise.com/
|
4020
|
+
-
|
4021
|
+
user_agent: ArchiveBox/0.5.3 (+https://github.com/ArchiveBox/ArchiveBox/)
|
4022
|
+
bot:
|
4023
|
+
name: ArchiveBox
|
4024
|
+
url: https://archivebox.io/
|
4025
|
+
category: Crawler
|
4026
|
+
producer:
|
4027
|
+
name: ""
|
4028
|
+
url: ""
|
4029
|
+
-
|
4030
|
+
user_agent: Choosito/1.0 +http://www.choosito.com/
|
4031
|
+
bot:
|
4032
|
+
name: Choosito
|
4033
|
+
url: https://www.choosito.com/
|
4034
|
+
category: Crawler
|
4035
|
+
producer:
|
4036
|
+
name: Choosito! Inc.
|
4037
|
+
url: https://www.choosito.com/
|
4038
|
+
-
|
4039
|
+
user_agent: datagnionbot (+http://www.datagnion.com/bot.html)
|
4040
|
+
bot:
|
4041
|
+
name: datagnionbot
|
4042
|
+
url: https://www.datagnion.com/bot.html
|
4043
|
+
category: Crawler
|
4044
|
+
producer:
|
4045
|
+
name: DATAGNION GMBH
|
4046
|
+
url: https://www.datagnion.com/
|
4047
|
+
-
|
4048
|
+
user_agent: InterNaetBoten/0.99 (http://www.xn--internt-bxa.nu)
|
4049
|
+
bot:
|
4050
|
+
name: Generic Bot
|
4051
|
+
-
|
4052
|
+
user_agent: EasyBib AutoCite (http://autocite-info.citation-api.com/)
|
4053
|
+
bot:
|
4054
|
+
name: Generic Bot
|
4055
|
+
-
|
4056
|
+
user_agent: Bidtellect/0.0.643.0
|
4057
|
+
bot:
|
4058
|
+
name: Generic Bot
|
4059
|
+
-
|
4060
|
+
user_agent: Mozilla/5.0 (compatible; meg/0.2; +https://github.com/tomnomnom/meg)
|
4061
|
+
bot:
|
4062
|
+
name: Generic Bot
|
4063
|
+
-
|
4064
|
+
user_agent: Mozilla/5.0 (X11; Ubuntu; Linux x86_64; rv:66.0) WhatCMS/1.0
|
4065
|
+
bot:
|
4066
|
+
name: WhatCMS
|
4067
|
+
url: https://whatcms.org/
|
4068
|
+
category: Crawler
|
4069
|
+
producer:
|
4070
|
+
name: "Nineteen Ten LLC"
|
4071
|
+
url: "https://whatcms.org/"
|
4072
|
+
-
|
4073
|
+
user_agent: httpx - Open-source project (github.com/projectdiscovery/httpx)
|
4074
|
+
bot:
|
4075
|
+
name: httpx
|
4076
|
+
url: https://github.com/projectdiscovery/httpx
|
4077
|
+
category: Crawler
|
4078
|
+
producer:
|
4079
|
+
name: ""
|
4080
|
+
url: ""
|
4081
|
+
-
|
4082
|
+
user_agent: 'Expanse indexes the network perimeters of our customers. If you have any questions or concerns, please reach out to: scaninfo@expanseinc.com'
|
4083
|
+
bot:
|
4084
|
+
name: Expanse
|
3135
4085
|
category: Security Checker
|
3136
|
-
url: https://
|
3137
|
-
|
3138
|
-
|
4086
|
+
url: https://expanse.co/
|
4087
|
+
producer:
|
4088
|
+
name: Expanse Inc.
|
4089
|
+
url: https://expanse.co/
|
4090
|
+
-
|
4091
|
+
user_agent: 'HuaweiWebCatBot/6.0) (To acquire the allowed html pages as reliable information of URL categorization in the automatic process for Huawei Web Categorization.; https://isecurity.huawei.com/; sec at huawei dot com)'
|
3139
4092
|
bot:
|
3140
|
-
name:
|
4093
|
+
name: HuaweiWebCatBot
|
4094
|
+
category: Crawler
|
4095
|
+
url: https://isecurity.huawei.com
|
3141
4096
|
producer:
|
3142
|
-
name:
|
3143
|
-
url: https://
|
4097
|
+
name: Huawei Technologies Co., Ltd.
|
4098
|
+
url: https://huawei.com
|
4099
|
+
-
|
4100
|
+
user_agent: Mozilla/5.0 (compatible; SputnikFaviconBot/1.2; +http://corp.sputnik.ru/webmaster)
|
4101
|
+
bot:
|
4102
|
+
name: Sputnik Favicon Bot
|
4103
|
+
url: ""
|
4104
|
+
category: Crawler
|
4105
|
+
-
|
4106
|
+
user_agent: Hatena-Favicon2 (http://www.hatena.ne.jp/faq/)
|
4107
|
+
bot:
|
4108
|
+
name: Hatena Favicon
|
4109
|
+
category: Crawler
|
4110
|
+
url: https://www.hatena.ne.jp/faq/
|
4111
|
+
producer:
|
4112
|
+
name: Hatena Co., Ltd.
|
4113
|
+
url: https://www.hatena.ne.jp
|
4114
|
+
-
|
4115
|
+
user_agent: Mozilla/5.0 (compatible; RyowlEngine/1.0; +https://ryowl.org)
|
4116
|
+
bot:
|
4117
|
+
name: Ryowl
|
4118
|
+
category: Crawler
|
4119
|
+
url: https://ryowl.org
|
4120
|
+
-
|
4121
|
+
user_agent: Mozilla/5.0 (compatible; OdklBot/1.0 like Linux; klass@odnoklassniki.ru)
|
4122
|
+
bot:
|
4123
|
+
name: Odnoklassniki Bot
|
4124
|
+
category: Crawler
|
4125
|
+
url: https://odnoklassniki.ru
|
4126
|
+
-
|
4127
|
+
user_agent: Mediatoolkitbot (complaints@mediatoolkit.com)
|
4128
|
+
bot:
|
4129
|
+
name: Mediatoolkit Bot
|
4130
|
+
category: Crawler
|
4131
|
+
url: https://mediatoolkit.com
|
4132
|
+
-
|
4133
|
+
user_agent: ZoominfoBot (zoominfobot at zoominfo dot com)
|
4134
|
+
bot:
|
4135
|
+
name: ZoominfoBot
|
4136
|
+
category: Crawler
|
4137
|
+
url: https://www.zoominfo.com
|
4138
|
+
-
|
4139
|
+
user_agent: Mozilla/5.0 (compatible; WeViKaBot/1.0; +http://www.wevika.de/)
|
4140
|
+
bot:
|
4141
|
+
name: WeViKaBot
|
4142
|
+
category: Crawler
|
4143
|
+
url: http://www.wevika.de
|
4144
|
+
-
|
4145
|
+
user_agent: Mozilla/5.0 (compatible; SEOkicks; +https://www.seokicks.de/robot.html)
|
4146
|
+
bot:
|
4147
|
+
name: SEOkicks
|
4148
|
+
category: Crawler
|
4149
|
+
url: https://www.seokicks.de/robot.html
|
4150
|
+
-
|
4151
|
+
user_agent: Mozilla/5.0 (compatible; Plukkie/1.6; http://www.botje.com/plukkie.htm)
|
4152
|
+
bot:
|
4153
|
+
name: Plukkie
|
4154
|
+
category: Crawler
|
4155
|
+
url: http://www.botje.com/plukkie.htm
|
4156
|
+
-
|
4157
|
+
user_agent: Mozilla/5.0 (compatible; proximic; https://www.comscore.com/Web-Crawler)
|
4158
|
+
bot:
|
4159
|
+
name: Comscore
|
4160
|
+
category: Crawler
|
4161
|
+
url: https://www.comscore.com/Web-Crawler
|
4162
|
+
-
|
4163
|
+
user_agent: Mozilla/5.0 (compatible; SurdotlyBot/1.0; +http://sur.ly/bot.html)
|
4164
|
+
bot:
|
4165
|
+
name: SurdotlyBot
|
4166
|
+
category: Crawler
|
4167
|
+
url: http://sur.ly/bot.html
|
4168
|
+
-
|
4169
|
+
user_agent: Mozilla/5.0 (compatible; Gowikibot/1.0; +http://www.gowikibot.com)
|
4170
|
+
bot:
|
4171
|
+
name: Gowikibot
|
4172
|
+
category: Crawler
|
4173
|
+
url: http:/www.gowikibot.com
|
4174
|
+
-
|
4175
|
+
user_agent: Mozilla/5.0 (compatible; SabsimBot/3.0; +https://sabsim.com)
|
4176
|
+
bot:
|
4177
|
+
name: SabsimBot
|
4178
|
+
category: Crawler
|
4179
|
+
url: https://sabsim.com
|
4180
|
+
-
|
4181
|
+
user_agent: Mozilla/5.0 (compatible; LumtelBot/1.0; +http://lumtel.com)
|
4182
|
+
bot:
|
4183
|
+
name: LumtelBot
|
4184
|
+
category: Crawler
|
4185
|
+
url: https://umtel.com
|
4186
|
+
-
|
4187
|
+
user_agent: Mozilla/5.0+(compatible;+PiplBot;+http://www.pipl.com/bot/)
|
4188
|
+
bot:
|
4189
|
+
name: PiplBot
|
4190
|
+
category: Crawler
|
4191
|
+
url: http://www.pipl.com/bot
|
4192
|
+
-
|
4193
|
+
user_agent: Mozilla/5.0 (compatible; woobot/2.0; +https://www.woorank.com/bot)
|
4194
|
+
bot:
|
4195
|
+
name: WooRank
|
4196
|
+
category: Crawler
|
4197
|
+
url: https://www.woorank.com/bot
|
4198
|
+
-
|
4199
|
+
user_agent: YahooMailProxy; https://help.yahoo.com/kb/yahoo-mail-proxy-SLN28749.html
|
4200
|
+
bot:
|
4201
|
+
name: Yahoo! Mail Proxy
|
4202
|
+
category: Service Agent
|
4203
|
+
url: https://help.yahoo.com/kb/yahoo-mail-proxy-SLN28749.html
|
4204
|
+
producer:
|
4205
|
+
name: Yahoo! Inc.
|
4206
|
+
url: http://www.yahoo.com
|
4207
|
+
-
|
4208
|
+
user_agent: 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko; compatible; Cookiebot/1.0; http://cookiebot.com/) Chrome/79.0.3945.117 Safari/537.36'
|
4209
|
+
bot:
|
4210
|
+
name: Cookiebot
|
4211
|
+
category: Crawler
|
4212
|
+
url: https://support.cookiebot.com/hc/en-us/articles/360014264140-Scanner-User-Agent
|
4213
|
+
producer:
|
4214
|
+
name: Cybot A/S
|
4215
|
+
url: https://www.cybot.com/
|
4216
|
+
-
|
4217
|
+
user_agent: NetSystemsResearch studies the availability of various services across the internet. Our website is netsystemsresearch.com
|
4218
|
+
bot:
|
4219
|
+
name: NetSystemsResearch
|
4220
|
+
category: Security Checker
|
4221
|
+
url: https://www.netsystemsresearch.com/
|
4222
|
+
producer:
|
4223
|
+
name: NET SYSTEMS RESEARCH LLC
|
4224
|
+
url: https://www.netsystemsresearch.com/
|
4225
|
+
-
|
4226
|
+
user_agent: 'Mozilla/5.0 (compatible; CensysInspect/1.1; https://about.censys.io/)'
|
4227
|
+
bot:
|
4228
|
+
name: CensysInspect
|
4229
|
+
category: Security Checker
|
4230
|
+
url: https://about.censys.io/
|
4231
|
+
producer:
|
4232
|
+
name: Censys, Inc.
|
4233
|
+
url: https://censys.io/
|
4234
|
+
-
|
4235
|
+
user_agent: https://gdnplus.com:Gather Analyze Provide.
|
4236
|
+
bot:
|
4237
|
+
name: GDNP
|
4238
|
+
category: Crawler
|
4239
|
+
url: https://gdnplus.com/
|
4240
|
+
producer:
|
4241
|
+
name: Global Digital Network Plus, LLC
|
4242
|
+
url: https://gdnplus.com/
|
4243
|
+
-
|
4244
|
+
user_agent: WellKnownBot/0.1 (https://well-known.dev)
|
4245
|
+
bot:
|
4246
|
+
name: WellKnownBot
|
4247
|
+
category: Crawler
|
4248
|
+
url: https://well-known.dev
|
4249
|
+
-
|
4250
|
+
user_agent: Mozilla/5.0 (compatible; Adsbot/3.1; https://seostar.co/robot/)
|
4251
|
+
bot:
|
4252
|
+
name: Adsbot
|
4253
|
+
category: Crawler
|
4254
|
+
url: https://seostar.co/robot/
|
4255
|
+
-
|
4256
|
+
user_agent: MTRobot/0.2 (Metrics Tools Analytics Crawler; https://metrics-tools.de/robot.html; crawler@metrics-tools.de)
|
4257
|
+
bot:
|
4258
|
+
name: MTRobot
|
4259
|
+
category: Crawler
|
4260
|
+
url: https://metrics-tools.de/robot.html
|
4261
|
+
producer:
|
4262
|
+
name: Metrics Tools
|
4263
|
+
url: https://metrics-tools.de/
|
4264
|
+
-
|
4265
|
+
user_agent: My User Agent 1.0
|
4266
|
+
bot:
|
4267
|
+
name: Generic Bot
|
4268
|
+
-
|
4269
|
+
user_agent: serpstatbot/1.0 (advanced backlink tracking bot; curl/7.58.0; http://serpstatbot.com/; abuse@serpstatbot.com)
|
4270
|
+
bot:
|
4271
|
+
name: serpstatbot
|
4272
|
+
category: Crawler
|
4273
|
+
url: http://serpstatbot.com/
|
4274
|
+
producer:
|
4275
|
+
name: Netpeak Ltd
|
4276
|
+
url: https://netpeak.net/
|
4277
|
+
-
|
4278
|
+
user_agent: colly - https://github.com/gocolly/colly/v2
|
4279
|
+
bot:
|
4280
|
+
name: colly
|
4281
|
+
category: Crawler
|
4282
|
+
url: https://github.com/gocolly/colly/
|
4283
|
+
-
|
4284
|
+
user_agent: l9tcpid/v1.0.0
|
4285
|
+
bot:
|
4286
|
+
name: l9tcpid
|
4287
|
+
category: Security Checker
|
4288
|
+
url: https://github.com/LeakIX/l9tcpid
|
4289
|
+
-
|
4290
|
+
user_agent: Mozilla/5.0 (compatible; MegaIndex.ru/2.0; +http://megaindex.com/crawler)
|
4291
|
+
bot:
|
4292
|
+
name: MegaIndex
|
4293
|
+
category: Crawler
|
4294
|
+
url: https://megaindex.com/crawler
|
4295
|
+
-
|
4296
|
+
user_agent: Mozilla/5.0 (compatible; Seekport Crawler; http://seekport.com/)
|
4297
|
+
bot:
|
4298
|
+
name: Seekport
|
4299
|
+
category: Crawler
|
4300
|
+
url: http://www.seekport.com/
|
4301
|
+
producer:
|
4302
|
+
name: SISTRIX GmbH
|
4303
|
+
url: https://www.sistrix.de/
|
4304
|
+
-
|
4305
|
+
user_agent: Mozilla/5.0 (compatible; seolyt/1.1; +https://seolyt.com)
|
4306
|
+
bot:
|
4307
|
+
name: seolyt
|
4308
|
+
category: Crawler
|
4309
|
+
url: https://seolyt.com/
|
4310
|
+
-
|
4311
|
+
user_agent: Mozilla/5.0 (compatible; YaK/1.0; http://linkfluence.com/; bot@linkfluence.com)
|
4312
|
+
bot:
|
4313
|
+
name: YaK
|
4314
|
+
category: Crawler
|
4315
|
+
url: https://www.linkfluence.com/
|
4316
|
+
producer:
|
4317
|
+
name: Linkfluence SAS
|
4318
|
+
url: https://www.linkfluence.com/
|
4319
|
+
-
|
4320
|
+
user_agent: Mozilla/5.0 (Windows NT 6.1; Win64; x64; +http://www.komodia.com/newwiki/index.php/URL_server_crawler) KomodiaBot/1.0
|
4321
|
+
bot:
|
4322
|
+
name: KomodiaBot
|
4323
|
+
category: Crawler
|
4324
|
+
url: http://www.komodia.com/newwiki/index.php/URL_server_crawler
|
4325
|
+
producer:
|
4326
|
+
name: Komodia Inc.
|
4327
|
+
url: https://www.komodia.com/
|
4328
|
+
-
|
4329
|
+
user_agent: Mozilla/5.0 (Windows NT 6.3; WOW64; Trident/7.0; rv:11.0; Catchpoint) like Gecko
|
4330
|
+
bot:
|
4331
|
+
name: Catchpoint
|
4332
|
+
category: Site Monitor
|
4333
|
+
url: https://www.catchpoint.com/
|
4334
|
+
producer:
|
4335
|
+
name: Catchpoint Systems
|
4336
|
+
url: https://www.catchpoint.com/
|
4337
|
+
-
|
4338
|
+
user_agent: Better Uptime Bot Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/74.0.3729.169 Safari/537.36
|
4339
|
+
bot:
|
4340
|
+
name: Better Uptime Bot
|
4341
|
+
category: Site Monitor
|
4342
|
+
url: https://betteruptime.com/faq
|
4343
|
+
producer:
|
4344
|
+
name: Better Uptime
|
4345
|
+
url: https://betteruptime.com/
|
4346
|
+
-
|
4347
|
+
user_agent: gobuster/3.1.0
|
4348
|
+
bot:
|
4349
|
+
name: Gobuster
|
4350
|
+
url: https://github.com/OJ/gobuster
|
4351
|
+
-
|
4352
|
+
user_agent: k6/0.31.1 (https://k6.io/)
|
4353
|
+
bot:
|
4354
|
+
name: K6
|
4355
|
+
url: https://k6.io/
|
4356
|
+
-
|
4357
|
+
user_agent: Mozilla/5.0 (compatible; Neevabot/1.0; https://neeva.com/neevabot)
|
4358
|
+
bot:
|
4359
|
+
name: Neevabot
|
4360
|
+
category: Search bot
|
4361
|
+
url: https://neeva.com/neevabot
|
4362
|
+
producer:
|
4363
|
+
name: Neeva Inc.
|
4364
|
+
url: https://neeva.com/
|
4365
|
+
-
|
4366
|
+
user_agent: LinkPreview/1.5 (http://linkpreview.net)
|
4367
|
+
bot:
|
4368
|
+
name: LinkPreview
|
4369
|
+
category: Service Agent
|
4370
|
+
url: https://www.linkpreview.net/
|
4371
|
+
-
|
4372
|
+
user_agent: Mozilla/5.0 (compatible; JungleKeyThumbnail/1.1; +http://www.junglekey.fr/)
|
4373
|
+
bot:
|
4374
|
+
name: JungleKeyThumbnail
|
4375
|
+
category: Crawler
|
4376
|
+
url: https://junglekey.com/
|
4377
|
+
-
|
4378
|
+
user_agent: rocketmonitor 1.0
|
4379
|
+
bot:
|
4380
|
+
name: RocketMonitorBot
|
4381
|
+
category: Site Monitor
|
4382
|
+
url: https://www.radiomast.io/docs/stream-monitoring/technical_details.html
|
4383
|
+
producer:
|
4384
|
+
name: Radio Mast, Inc.
|
4385
|
+
url: https://www.radiomast.io/
|
4386
|
+
-
|
4387
|
+
user_agent: RocketMonitorBot/1.0 ( https://www.radiomast.io)
|
4388
|
+
bot:
|
4389
|
+
name: RocketMonitorBot
|
4390
|
+
category: Site Monitor
|
4391
|
+
url: https://www.radiomast.io/docs/stream-monitoring/technical_details.html
|
4392
|
+
producer:
|
4393
|
+
name: Radio Mast, Inc.
|
4394
|
+
url: https://www.radiomast.io/
|
4395
|
+
-
|
4396
|
+
user_agent: SitemapParser-VIPnytt/1.1 ( https://github.com/VIPnytt/SitemapParser/blob/master/README.md)
|
4397
|
+
bot:
|
4398
|
+
name: SitemapParser-VIPnytt
|
4399
|
+
category: Crawler
|
4400
|
+
url: https://github.com/VIPnytt/SitemapParser/
|
4401
|
+
-
|
4402
|
+
user_agent: Turnitin (https://bit.ly/2UvnfoQ)
|
4403
|
+
bot:
|
4404
|
+
name: Turnitin
|
4405
|
+
category: Crawler
|
4406
|
+
url: https://turnitin.com/robot/crawlerinfo.html
|
4407
|
+
-
|
4408
|
+
user_agent: Mozilla/5.0 (Linux; Android 8.0; Pixel 2 Build/OPD3.170816.012; Storebot-Google/1.0) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/81.0.4044.138 Mobile Safari/537.36
|
4409
|
+
bot:
|
4410
|
+
name: Google StoreBot
|
4411
|
+
category: Crawler
|
4412
|
+
-
|
4413
|
+
user_agent: Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/77.0.3865.56 Safari/537.36 DMBrowser/2.1 (UV)
|
4414
|
+
bot:
|
4415
|
+
name: Dotcom Monitor
|
4416
|
+
category: Site Monitor
|
4417
|
+
url: https://www.dotcom-monitor.com
|
4418
|
+
-
|
4419
|
+
user_agent: Mozilla/5.0 (Windows NT 6.2; WOW64; rv:29.0) Gecko/20100101 /29.0 DMBrowser-BV
|
4420
|
+
bot:
|
4421
|
+
name: Dotcom Monitor
|
4422
|
+
category: Site Monitor
|
4423
|
+
url: https://www.dotcom-monitor.com
|
4424
|
+
-
|
4425
|
+
user_agent: Mozilla/5.0 (compatible; ThinkChaos/0.3.0; +In_the_test_phase,_if_the_ThinkChaos_brings_you_trouble,_please_add_disallow_to_the_robots.txt._Thank_you.)
|
4426
|
+
bot:
|
4427
|
+
name: ThinkChaos
|
4428
|
+
category: Crawler
|
4429
|
+
-
|
4430
|
+
user_agent: Mozilla/5.0 (compatible; DataForSeoBot/1.0; +https://dataforseo.com/dataforseo-bot)
|
4431
|
+
bot:
|
4432
|
+
name: DataForSeoBot
|
4433
|
+
category: Crawler
|
4434
|
+
url: https://dataforseo.com/dataforseo-bot
|