device_detector 1.0.5 → 1.0.6
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/README.md +7 -6
- data/lib/device_detector/browser.rb +364 -0
- data/lib/device_detector/client.rb +8 -0
- data/lib/device_detector/device.rb +1124 -4
- data/lib/device_detector/os.rb +36 -11
- data/lib/device_detector/version.rb +1 -1
- data/lib/device_detector/version_extractor.rb +9 -0
- data/lib/device_detector.rb +57 -13
- data/regexes/bots.yml +551 -58
- data/regexes/client/browser_engine.yml +7 -1
- data/regexes/client/browsers.yml +594 -71
- data/regexes/client/feed_readers.yml +4 -10
- data/regexes/client/libraries.yml +47 -2
- data/regexes/client/mediaplayers.yml +25 -1
- data/regexes/client/mobile_apps.yml +447 -77
- data/regexes/client/pim.yml +49 -1
- data/regexes/device/cameras.yml +5 -5
- data/regexes/device/car_browsers.yml +16 -0
- data/regexes/device/consoles.yml +6 -0
- data/regexes/device/mobiles.yml +12905 -4561
- data/regexes/device/portable_media_player.yml +20 -3
- data/regexes/device/shell_tv.yml +117 -0
- data/regexes/device/televisions.yml +426 -35
- data/regexes/oss.yml +567 -139
- data/spec/device_detector/concrete_user_agent_spec.rb +30 -42
- data/spec/device_detector/detector_fixtures_spec.rb +9 -5
- data/spec/device_detector/device_spec.rb +26 -10
- data/spec/fixtures/client/browser.yml +1463 -391
- data/spec/fixtures/client/feed_reader.yml +0 -12
- data/spec/fixtures/client/library.yml +91 -37
- data/spec/fixtures/client/mediaplayer.yml +30 -0
- data/spec/fixtures/client/mobile_app.yml +498 -45
- data/spec/fixtures/client/pim.yml +60 -0
- data/spec/fixtures/detector/bots.yml +1189 -568
- data/spec/fixtures/detector/camera.yml +12 -26
- data/spec/fixtures/detector/car_browser.yml +151 -15
- data/spec/fixtures/detector/console.yml +70 -48
- data/spec/fixtures/detector/desktop.yml +2041 -916
- data/spec/fixtures/detector/feature_phone.yml +895 -189
- data/spec/fixtures/detector/feed_reader.yml +50 -77
- data/spec/fixtures/detector/mediaplayer.yml +79 -26
- data/spec/fixtures/detector/mobile_apps.yml +726 -72
- data/spec/fixtures/detector/peripheral.yml +271 -0
- data/spec/fixtures/detector/phablet.yml +3635 -1596
- data/spec/fixtures/detector/portable_media_player.yml +355 -46
- data/spec/fixtures/detector/smart_display.yml +183 -9
- data/spec/fixtures/detector/smart_speaker.yml +13 -8
- data/spec/fixtures/detector/smartphone-1.yml +4002 -4286
- data/spec/fixtures/detector/smartphone-10.yml +3771 -4763
- data/spec/fixtures/detector/smartphone-11.yml +3615 -4692
- data/spec/fixtures/detector/smartphone-12.yml +3856 -4764
- data/spec/fixtures/detector/smartphone-13.yml +4213 -4713
- data/spec/fixtures/detector/smartphone-14.yml +4039 -4497
- data/spec/fixtures/detector/smartphone-15.yml +5642 -2956
- data/spec/fixtures/detector/smartphone-16.yml +4739 -5082
- data/spec/fixtures/detector/smartphone-17.yml +4832 -4275
- data/spec/fixtures/detector/smartphone-18.yml +9806 -0
- data/spec/fixtures/detector/smartphone-19.yml +9965 -0
- data/spec/fixtures/detector/smartphone-2.yml +4842 -2589
- data/spec/fixtures/detector/smartphone-20.yml +9710 -0
- data/spec/fixtures/detector/smartphone-21.yml +8693 -0
- data/spec/fixtures/detector/smartphone-22.yml +10178 -0
- data/spec/fixtures/detector/smartphone-23.yml +9453 -0
- data/spec/fixtures/detector/smartphone-24.yml +9843 -0
- data/spec/fixtures/detector/smartphone-25.yml +9703 -0
- data/spec/fixtures/detector/smartphone-26.yml +10007 -0
- data/spec/fixtures/detector/smartphone-27.yml +4927 -0
- data/spec/fixtures/detector/smartphone-3.yml +4387 -4427
- data/spec/fixtures/detector/smartphone-4.yml +3597 -4582
- data/spec/fixtures/detector/smartphone-5.yml +4066 -5022
- data/spec/fixtures/detector/smartphone-6.yml +3455 -4621
- data/spec/fixtures/detector/smartphone-7.yml +3574 -4574
- data/spec/fixtures/detector/smartphone-8.yml +4617 -4704
- data/spec/fixtures/detector/smartphone-9.yml +4080 -5035
- data/spec/fixtures/detector/smartphone.yml +3244 -4234
- data/spec/fixtures/detector/tablet-1.yml +4652 -4492
- data/spec/fixtures/detector/tablet-2.yml +3515 -4434
- data/spec/fixtures/detector/tablet-3.yml +3418 -4351
- data/spec/fixtures/detector/tablet-4.yml +5149 -3200
- data/spec/fixtures/detector/tablet-5.yml +9273 -0
- data/spec/fixtures/detector/tablet-6.yml +4588 -0
- data/spec/fixtures/detector/tablet.yml +1621 -2613
- data/spec/fixtures/detector/tv-1.yml +2501 -0
- data/spec/fixtures/detector/tv.yml +7826 -3114
- data/spec/fixtures/detector/unknown.yml +370 -531
- data/spec/fixtures/detector/wearable.yml +863 -9
- data/spec/fixtures/parser/oss.yml +1350 -21
- data/spec/fixtures/parser/vendorfragments.yml +53 -53
- metadata +35 -5
@@ -1,45 +1,51 @@
|
|
1
1
|
---
|
2
|
-
-
|
2
|
+
-
|
3
3
|
user_agent: 360spider-image
|
4
4
|
bot:
|
5
5
|
name: 360Spider
|
6
6
|
category: Search bot
|
7
|
-
url:
|
7
|
+
url: https://www.so.com/help/help_3_2.html
|
8
8
|
producer:
|
9
9
|
name: Online Media Group, Inc.
|
10
10
|
url: ""
|
11
|
-
-
|
11
|
+
-
|
12
12
|
user_agent: Mozilla/4.0 (compatible; MSIE 8.0; Windows NT 6.1; Trident/4.0; SLCC2; .NET CLR 2.0.50727; .NET CLR 3.5.30729; .NET CLR 3.0.30729; Media Center PC 6.0; MDDR; .NET4.0C; .NET4.0E; .NET CLR 1.1.4322; Tablet PC 2.0); 360Spider
|
13
13
|
bot:
|
14
14
|
name: 360Spider
|
15
15
|
category: Search bot
|
16
|
-
url:
|
16
|
+
url: https://www.so.com/help/help_3_2.html
|
17
17
|
producer:
|
18
18
|
name: Online Media Group, Inc.
|
19
19
|
url: ""
|
20
|
-
-
|
20
|
+
-
|
21
21
|
user_agent: Mozilla/5.0 (compatible; MSIE 9.0; Windows NT 6.1; Trident/5.0); 360Spider
|
22
22
|
bot:
|
23
23
|
name: 360Spider
|
24
24
|
category: Search bot
|
25
|
-
url:
|
25
|
+
url: https://www.so.com/help/help_3_2.html
|
26
26
|
producer:
|
27
27
|
name: Online Media Group, Inc.
|
28
28
|
url: ""
|
29
|
-
-
|
29
|
+
-
|
30
30
|
user_agent: Mozilla/5.0 (Windows NT 6.1) AppleWebKit/537.1 (KHTML, like Gecko) Chrome/21.0.1180.89 Safari/537.1; 360Spider
|
31
31
|
bot:
|
32
32
|
name: 360Spider
|
33
33
|
category: Search bot
|
34
|
-
url:
|
34
|
+
url: https://www.so.com/help/help_3_2.html
|
35
35
|
producer:
|
36
36
|
name: Online Media Group, Inc.
|
37
37
|
url: ""
|
38
|
-
-
|
38
|
+
-
|
39
39
|
user_agent: 'ADmantX Platform Semantic Analyzer - ADmantX Inc. - www.admantx.com - support@admantx.com'
|
40
40
|
bot:
|
41
41
|
name: ADMantX
|
42
|
-
-
|
42
|
+
-
|
43
|
+
user_agent: ias-va/3.1 (+https://www.admantx.com/service-fetcher.html)
|
44
|
+
bot:
|
45
|
+
name: ADmantX Service Fetcher
|
46
|
+
category: Service bot
|
47
|
+
url: https://www.admantx.com/service-fetcher.html
|
48
|
+
-
|
43
49
|
user_agent: Aboundex/0.3 (http://www.aboundex.com/crawler/)
|
44
50
|
bot:
|
45
51
|
name: Aboundexbot
|
@@ -48,7 +54,7 @@
|
|
48
54
|
producer:
|
49
55
|
name: Aboundex.com
|
50
56
|
url: http://www.aboundex.com
|
51
|
-
-
|
57
|
+
-
|
52
58
|
user_agent: Mozilla/5.0 (compatible; AcoonBot/4.11.1; +http://www.acoon.de/robot.asp)
|
53
59
|
bot:
|
54
60
|
name: Acoon
|
@@ -57,7 +63,7 @@
|
|
57
63
|
producer:
|
58
64
|
name: Acoon GmbH
|
59
65
|
url: http://www.acoon.de
|
60
|
-
-
|
66
|
+
-
|
61
67
|
user_agent: AddThis.com robot tech.support@clearspring.com
|
62
68
|
bot:
|
63
69
|
name: AddThis.com
|
@@ -66,25 +72,34 @@
|
|
66
72
|
producer:
|
67
73
|
name: Clearspring Technologies, Inc.
|
68
74
|
url: http://www.clearspring.com
|
69
|
-
-
|
75
|
+
-
|
70
76
|
user_agent: ia_archiver (+http://www.alexa.com/site/help/webmasters; crawler@alexa.com)
|
71
77
|
bot:
|
72
78
|
name: Alexa Crawler
|
73
79
|
category: Search bot
|
74
|
-
url: https://alexa.
|
80
|
+
url: https://support.alexa.com/hc/en-us/sections/200100794-Crawlers
|
75
81
|
producer:
|
76
82
|
name: Alexa Internet
|
77
|
-
url:
|
78
|
-
-
|
83
|
+
url: https://www.alexa.com
|
84
|
+
-
|
79
85
|
user_agent: Mozilla/5.0 (compatible; alexa site audit/1.0; http://www.alexa.com/help/webmasters; )
|
80
86
|
bot:
|
81
87
|
name: Alexa Site Audit
|
82
88
|
category: Site Monitor
|
83
|
-
url:
|
89
|
+
url: https://support.alexa.com/hc/en-us/articles/200450194
|
84
90
|
producer:
|
85
91
|
name: Alexa Internet
|
86
|
-
url:
|
87
|
-
-
|
92
|
+
url: https://www.alexa.com
|
93
|
+
-
|
94
|
+
user_agent: Mozilla/5.0 (Macintosh; Intel Mac OS X 10_10_1) AppleWebKit/600.2.5 (KHTML, like Gecko) Version/8.0.2 Safari/600.2.5 (Amazonbot/0.1; +https://developer.amazon.com/support/amazonbot)
|
95
|
+
bot:
|
96
|
+
name: Amazon Bot
|
97
|
+
category: Crawler
|
98
|
+
url: https://developer.amazon.com/support/amazonbot
|
99
|
+
producer:
|
100
|
+
name: Amazon.com, Inc.
|
101
|
+
url: https://www.amazon.com/
|
102
|
+
-
|
88
103
|
user_agent: Amazon Route 53 Health Check Service; ref:xxxxxxxx-xxxx-xxxxxxxxx-xxxxxxxxxxxx; report http://amzn.to/xxxxxxx
|
89
104
|
bot:
|
90
105
|
name: Amazon Route53 Health Check
|
@@ -92,7 +107,7 @@
|
|
92
107
|
producer:
|
93
108
|
name: Amazon Web Services
|
94
109
|
url: https://aws.amazon.com/
|
95
|
-
-
|
110
|
+
-
|
96
111
|
user_agent: Amazon-Route53-Health-Check-Service (ref b0eb04d5-cb5e-40e7-839b-558e52fc3f0d; report http://amzn.to/1vsZADi)
|
97
112
|
bot:
|
98
113
|
name: Amazon Route53 Health Check
|
@@ -100,7 +115,7 @@
|
|
100
115
|
producer:
|
101
116
|
name: Amazon Web Services
|
102
117
|
url: https://aws.amazon.com/
|
103
|
-
-
|
118
|
+
-
|
104
119
|
user_agent: AmorankSpider/0.1; +http://amorank.com/webcrawler.html
|
105
120
|
bot:
|
106
121
|
name: Amorank Spider
|
@@ -109,7 +124,7 @@
|
|
109
124
|
producer:
|
110
125
|
name: Amorank
|
111
126
|
url: http://www.amorank.com
|
112
|
-
-
|
127
|
+
-
|
113
128
|
user_agent: 'Curious George - www.analyticsseo.com/crawler'
|
114
129
|
bot:
|
115
130
|
name: Analytics SEO Crawler
|
@@ -118,7 +133,7 @@
|
|
118
133
|
producer:
|
119
134
|
name: Analytics SEO
|
120
135
|
url: http://www.analyticsseo.com
|
121
|
-
-
|
136
|
+
-
|
122
137
|
user_agent: ApacheBench/2.3
|
123
138
|
bot:
|
124
139
|
name: ApacheBench
|
@@ -126,35 +141,44 @@
|
|
126
141
|
url: https://httpd.apache.org/docs/2.4/programs/ab.html
|
127
142
|
producer:
|
128
143
|
name: The Apache Software Foundation
|
129
|
-
url:
|
130
|
-
-
|
144
|
+
url: https://www.apache.org/foundation/
|
145
|
+
-
|
131
146
|
user_agent: Mozilla/5.0 (Macintosh; Intel Mac OS X 10_10 _1) AppleWebKit/600.2.5 (KHTML, like Gecko) Version/8.0.2 Safari/600.2.5 (Applebot/0.1; +http://www.apple.com/go/applebot)
|
132
147
|
bot:
|
133
148
|
name: Applebot
|
134
149
|
category: Crawler
|
135
|
-
url:
|
150
|
+
url: https://support.apple.com/en-us/HT204683
|
136
151
|
producer:
|
137
152
|
name: Apple Inc
|
138
|
-
url:
|
139
|
-
-
|
153
|
+
url: https://www.apple.com
|
154
|
+
-
|
155
|
+
user_agent: AppSignalBot/1.0 (+https://appsignal.com)
|
156
|
+
bot:
|
157
|
+
name: AppSignalBot
|
158
|
+
category: Site Monitor
|
159
|
+
url: https://docs.appsignal.com/uptime-monitoring/
|
160
|
+
producer:
|
161
|
+
name: AppSignal
|
162
|
+
url: https://appsignal.com/
|
163
|
+
-
|
140
164
|
user_agent: Mozilla/5.0 (Macintosh; Intel Mac OS X 10_10_1) AppleWebKit/600.2.5 (KHTML, like Gecko) Version/8.0.2 Safari/600.2.5 (Applebot/0.1)
|
141
165
|
bot:
|
142
166
|
name: Applebot
|
143
167
|
category: Crawler
|
144
|
-
url:
|
168
|
+
url: https://support.apple.com/en-us/HT204683
|
145
169
|
producer:
|
146
170
|
name: Apple Inc
|
147
|
-
url:
|
148
|
-
-
|
171
|
+
url: https://www.apple.com
|
172
|
+
-
|
149
173
|
user_agent: Arachni/v1.5.1
|
150
174
|
bot:
|
151
175
|
name: Arachni
|
152
176
|
category: Security Checker
|
153
|
-
url:
|
177
|
+
url: https://www.arachni-scanner.com/
|
154
178
|
producer:
|
155
179
|
name: Sarosys LLC
|
156
|
-
url:
|
157
|
-
-
|
180
|
+
url: https://www.sarosys.com/
|
181
|
+
-
|
158
182
|
user_agent: Mozilla/2.0 (compatible; Ask Jeeves/Teoma)
|
159
183
|
bot:
|
160
184
|
name: Ask Jeeves
|
@@ -163,7 +187,7 @@
|
|
163
187
|
producer:
|
164
188
|
name: Ask Jeeves Inc.
|
165
189
|
url: http://www.ask.com
|
166
|
-
-
|
190
|
+
-
|
167
191
|
user_agent: Mozilla/5.0 (compatible;AspiegelBot)
|
168
192
|
bot:
|
169
193
|
name: AspiegelBot
|
@@ -172,7 +196,7 @@
|
|
172
196
|
producer:
|
173
197
|
name: Huawei
|
174
198
|
url: https://www.huawei.com/
|
175
|
-
-
|
199
|
+
-
|
176
200
|
user_agent: Mozilla/5.0 (Linux; Android 7.0;) AppleWebKit/537.36 (KHTML, like Gecko) Mobile Safari/537.36 (compatible; AspiegelBot)
|
177
201
|
bot:
|
178
202
|
name: AspiegelBot
|
@@ -181,7 +205,7 @@
|
|
181
205
|
producer:
|
182
206
|
name: Huawei
|
183
207
|
url: https://www.huawei.com/
|
184
|
-
-
|
208
|
+
-
|
185
209
|
user_agent: AwarioRssBot/1.0 (+https://awario.com/bots.html; bots@awario.com)
|
186
210
|
bot:
|
187
211
|
name: Awario
|
@@ -190,7 +214,7 @@
|
|
190
214
|
producer:
|
191
215
|
name: Awario
|
192
216
|
url: https://awario.com/
|
193
|
-
-
|
217
|
+
-
|
194
218
|
user_agent: AwarioSmartBot/1.0 (+https://awario.com/bots.html; bots@awario.com)
|
195
219
|
bot:
|
196
220
|
name: Awario
|
@@ -199,7 +223,7 @@
|
|
199
223
|
producer:
|
200
224
|
name: Awario
|
201
225
|
url: https://awario.com/
|
202
|
-
-
|
226
|
+
-
|
203
227
|
user_agent: Mozilla/5.0 (compatible; BLEXBot/1.0; +http://webmeup-crawler.com/)
|
204
228
|
bot:
|
205
229
|
name: BLEXBot Crawler
|
@@ -208,7 +232,7 @@
|
|
208
232
|
producer:
|
209
233
|
name: WebMeUp
|
210
234
|
url: http://webmeup.com
|
211
|
-
-
|
235
|
+
-
|
212
236
|
user_agent: BUbiNG (+http://law.di.unimi.it/BUbiNG.html)
|
213
237
|
bot:
|
214
238
|
name: BUbiNG
|
@@ -217,7 +241,7 @@
|
|
217
241
|
producer:
|
218
242
|
name: The Laboratory for Web Algorithmics (LAW)
|
219
243
|
url: 'http://law.di.unimi.it/software.php#buging'
|
220
|
-
-
|
244
|
+
-
|
221
245
|
user_agent: Backlink-Check.de (+http://www.backlink-check.de/bot.html)
|
222
246
|
bot:
|
223
247
|
name: Backlink-Check.de
|
@@ -226,7 +250,7 @@
|
|
226
250
|
producer:
|
227
251
|
name: Mediagreen Medienservice
|
228
252
|
url: http://www.backlink-check.de
|
229
|
-
-
|
253
|
+
-
|
230
254
|
user_agent: BacklinkCrawler (http://www.backlinktest.com/crawler.html)
|
231
255
|
bot:
|
232
256
|
name: BacklinkCrawler
|
@@ -235,7 +259,7 @@
|
|
235
259
|
producer:
|
236
260
|
name: 2.0Promotion GbR
|
237
261
|
url: http://www.backlinktest.com
|
238
|
-
-
|
262
|
+
-
|
239
263
|
user_agent: Baiduspider+(+http://www.baidu.com/search/spider.htm)
|
240
264
|
bot:
|
241
265
|
name: Baidu Spider
|
@@ -244,7 +268,7 @@
|
|
244
268
|
producer:
|
245
269
|
name: Baidu
|
246
270
|
url: http://www.baidu.com
|
247
|
-
-
|
271
|
+
-
|
248
272
|
user_agent: Baiduspider-image+(+http://www.baidu.com/search/spider.htm)
|
249
273
|
bot:
|
250
274
|
name: Baidu Spider
|
@@ -253,7 +277,7 @@
|
|
253
277
|
producer:
|
254
278
|
name: Baidu
|
255
279
|
url: http://www.baidu.com
|
256
|
-
-
|
280
|
+
-
|
257
281
|
user_agent: Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.0; baidu Transcoder;)
|
258
282
|
bot:
|
259
283
|
name: Baidu Spider
|
@@ -262,7 +286,7 @@
|
|
262
286
|
producer:
|
263
287
|
name: Baidu
|
264
288
|
url: http://www.baidu.com
|
265
|
-
-
|
289
|
+
-
|
266
290
|
user_agent: Mozilla/5.0 (compatible; Baiduspider/2.0; +http://www.baidu.com/search
|
267
291
|
bot:
|
268
292
|
name: Baidu Spider
|
@@ -271,7 +295,7 @@
|
|
271
295
|
producer:
|
272
296
|
name: Baidu
|
273
297
|
url: http://www.baidu.com
|
274
|
-
-
|
298
|
+
-
|
275
299
|
user_agent: Mozilla/5.0 (compatible; Baiduspider/2.0; +http://www.baidu.com/search/spider.html)
|
276
300
|
bot:
|
277
301
|
name: Baidu Spider
|
@@ -280,7 +304,7 @@
|
|
280
304
|
producer:
|
281
305
|
name: Baidu
|
282
306
|
url: http://www.baidu.com
|
283
|
-
-
|
307
|
+
-
|
284
308
|
user_agent: Mozilla/5.0 (Linux;u;Android 2.3.7;zh-cn;) AppleWebKit/533.1 (KHTML,like Gecko) Version/4.0 Mobile Safari/533.1 (compatible; +http://www.baidu.com/search/spider.html)
|
285
309
|
bot:
|
286
310
|
name: Baidu Spider
|
@@ -289,7 +313,7 @@
|
|
289
313
|
producer:
|
290
314
|
name: Baidu
|
291
315
|
url: http://www.baidu.com
|
292
|
-
-
|
316
|
+
-
|
293
317
|
user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1; zh-CN; rv:1.9.2.8;baidu Transcoder) Gecko/20100722 Firefox/3.6.8 ( .NET CLR 3.5.30729)
|
294
318
|
bot:
|
295
319
|
name: Baidu Spider
|
@@ -298,7 +322,13 @@
|
|
298
322
|
producer:
|
299
323
|
name: Baidu
|
300
324
|
url: http://www.baidu.com
|
301
|
-
-
|
325
|
+
-
|
326
|
+
user_agent: Barkrowler/0.9 (+http://www.exensa.com/crawl)
|
327
|
+
bot:
|
328
|
+
name: Barkrowler
|
329
|
+
category: Crawler
|
330
|
+
url: http://www.exensa.com/crawl
|
331
|
+
-
|
302
332
|
user_agent: Mozilla/5.0 (compatible; BazQux/2.4; +https://bazqux.com/fetcher; 2 subscribers)
|
303
333
|
bot:
|
304
334
|
name: BazQux Reader
|
@@ -307,7 +337,7 @@
|
|
307
337
|
producer:
|
308
338
|
name: ""
|
309
339
|
url: ""
|
310
|
-
-
|
340
|
+
-
|
311
341
|
user_agent: Mozilla/5.0 (compatible; bingbot/2.0; +http://www.bing.com/bingbot.htm)
|
312
342
|
bot:
|
313
343
|
name: BingBot
|
@@ -316,7 +346,7 @@
|
|
316
346
|
producer:
|
317
347
|
name: Microsoft Corporation
|
318
348
|
url: http://www.microsoft.com
|
319
|
-
-
|
349
|
+
-
|
320
350
|
user_agent: Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/534+ (KHTML, like Gecko) BingPreview/1.0b
|
321
351
|
bot:
|
322
352
|
name: BingBot
|
@@ -325,7 +355,7 @@
|
|
325
355
|
producer:
|
326
356
|
name: Microsoft Corporation
|
327
357
|
url: http://www.microsoft.com
|
328
|
-
-
|
358
|
+
-
|
329
359
|
user_agent: msnbot-media/1.1 (+http://search.msn.com/msnbot.htm)
|
330
360
|
bot:
|
331
361
|
name: BingBot
|
@@ -334,7 +364,7 @@
|
|
334
364
|
producer:
|
335
365
|
name: Microsoft Corporation
|
336
366
|
url: http://www.microsoft.com
|
337
|
-
-
|
367
|
+
-
|
338
368
|
user_agent: msnbot-NewsBlogs/2.0b (+http://search.msn.com/msnbot.htm)
|
339
369
|
bot:
|
340
370
|
name: BingBot
|
@@ -343,7 +373,7 @@
|
|
343
373
|
producer:
|
344
374
|
name: Microsoft Corporation
|
345
375
|
url: http://www.microsoft.com
|
346
|
-
-
|
376
|
+
-
|
347
377
|
user_agent: msnbot/1.1 (+http://search.msn.com/msnbot.htm)
|
348
378
|
bot:
|
349
379
|
name: BingBot
|
@@ -352,7 +382,7 @@
|
|
352
382
|
producer:
|
353
383
|
name: Microsoft Corporation
|
354
384
|
url: http://www.microsoft.com
|
355
|
-
-
|
385
|
+
-
|
356
386
|
user_agent: msnbot/2.0b (+http://search.msn.com/msnbot.htm)
|
357
387
|
bot:
|
358
388
|
name: BingBot
|
@@ -361,7 +391,7 @@
|
|
361
391
|
producer:
|
362
392
|
name: Microsoft Corporation
|
363
393
|
url: http://www.microsoft.com
|
364
|
-
-
|
394
|
+
-
|
365
395
|
user_agent: msnbot/2.0b v1394720947.6703
|
366
396
|
bot:
|
367
397
|
name: BingBot
|
@@ -370,7 +400,7 @@
|
|
370
400
|
producer:
|
371
401
|
name: Microsoft Corporation
|
372
402
|
url: http://www.microsoft.com
|
373
|
-
-
|
403
|
+
-
|
374
404
|
user_agent: MSNBot/Nutch-1.5.1
|
375
405
|
bot:
|
376
406
|
name: BingBot
|
@@ -379,7 +409,7 @@
|
|
379
409
|
producer:
|
380
410
|
name: Microsoft Corporation
|
381
411
|
url: http://www.microsoft.com
|
382
|
-
-
|
412
|
+
-
|
383
413
|
user_agent: bitlybot/3.0
|
384
414
|
bot:
|
385
415
|
name: BitlyBot
|
@@ -388,7 +418,7 @@
|
|
388
418
|
producer:
|
389
419
|
name: Bitly, Inc.
|
390
420
|
url: https://bitly.com
|
391
|
-
-
|
421
|
+
-
|
392
422
|
user_agent: Mozilla/5.0 (compatible; Blekkobot; ScoutJet; +http://blekko.com/about/blekkobot)
|
393
423
|
bot:
|
394
424
|
name: Blekkobot
|
@@ -397,7 +427,7 @@
|
|
397
427
|
producer:
|
398
428
|
name: Blekko
|
399
429
|
url: http://blekko.com
|
400
|
-
-
|
430
|
+
-
|
401
431
|
user_agent: Bloglovin/1.0 (http://www.bloglovin.com; 1 subscribers)
|
402
432
|
bot:
|
403
433
|
name: Bloglovin
|
@@ -406,7 +436,7 @@
|
|
406
436
|
producer:
|
407
437
|
name: ""
|
408
438
|
url: ""
|
409
|
-
-
|
439
|
+
-
|
410
440
|
user_agent: Blogtrottr/2.0
|
411
441
|
bot:
|
412
442
|
name: Blogtrottr
|
@@ -415,24 +445,24 @@
|
|
415
445
|
producer:
|
416
446
|
name: Blogtrottr Ltd
|
417
447
|
url: https://blogtrottr.com/
|
418
|
-
-
|
448
|
+
-
|
419
449
|
user_agent: BoardReader Favicon Fetcher /1.0 info@boardreader.com
|
420
450
|
bot:
|
421
451
|
name: BoardReader
|
422
452
|
category: Search bot
|
423
|
-
url:
|
453
|
+
url: https://boardreader.com/
|
424
454
|
producer:
|
425
455
|
name: Effyis Inc
|
426
|
-
url:
|
427
|
-
-
|
456
|
+
url: https://boardreader.com/
|
457
|
+
-
|
428
458
|
user_agent: BoardReader Blog Indexer(http://boardreader.com)
|
429
459
|
bot:
|
430
460
|
name: BoardReader Blog Indexer
|
431
461
|
category: Crawler
|
432
462
|
producer:
|
433
463
|
name: BoardReader
|
434
|
-
url:
|
435
|
-
-
|
464
|
+
url: https://boardreader.com/
|
465
|
+
-
|
436
466
|
user_agent: Mozilla/5.0 (compatible; BountiiBot/1.1; +http://bountii.com/contact.php)
|
437
467
|
bot:
|
438
468
|
name: Bountii Bot
|
@@ -441,7 +471,7 @@
|
|
441
471
|
producer:
|
442
472
|
name: Bountii Inc.
|
443
473
|
url: http://bountii.com
|
444
|
-
-
|
474
|
+
-
|
445
475
|
user_agent: Mozilla/5.0 (Macintosh; Intel Mac OS X 10.10; rv:41.0) Gecko/20100101 Firefox/55.0 BrandVerity/1.0 (http://www.brandverity.com/why-is-brandverity-visiting-me)
|
446
476
|
bot:
|
447
477
|
name: BrandVerity
|
@@ -450,7 +480,7 @@
|
|
450
480
|
producer:
|
451
481
|
name: BrandVerity, Inc.
|
452
482
|
url: https://www.brandverity.com/
|
453
|
-
-
|
483
|
+
-
|
454
484
|
user_agent: Browsershots
|
455
485
|
bot:
|
456
486
|
name: Browsershots
|
@@ -459,7 +489,7 @@
|
|
459
489
|
producer:
|
460
490
|
name: Browsershots.org
|
461
491
|
url: http://browsershots.org
|
462
|
-
-
|
492
|
+
-
|
463
493
|
user_agent: Buck/2.2; (+https://app.hypefactors.com/media-monitoring/about.html)
|
464
494
|
bot:
|
465
495
|
name: Buck
|
@@ -468,7 +498,7 @@
|
|
468
498
|
producer:
|
469
499
|
name: Hypefactors A/S
|
470
500
|
url: https://hypefactors.com/
|
471
|
-
-
|
501
|
+
-
|
472
502
|
user_agent: Mozilla/5.0 (compatible; Butterfly/1.0; +http://labs.topsy.com/butterfly/) Gecko/2009032608 Firefox/3.0.8
|
473
503
|
bot:
|
474
504
|
name: Butterfly Robot
|
@@ -477,7 +507,7 @@
|
|
477
507
|
producer:
|
478
508
|
name: Topsy Labs
|
479
509
|
url: http://labs.topsy.com
|
480
|
-
-
|
510
|
+
-
|
481
511
|
user_agent: Mozilla/5.0 (Macintosh; Butterfly/1.0; +http://labs.topsy.com/butterfly/) Gecko/2009032608 Firefox/3.0.8
|
482
512
|
bot:
|
483
513
|
name: Butterfly Robot
|
@@ -486,7 +516,7 @@
|
|
486
516
|
producer:
|
487
517
|
name: Topsy Labs
|
488
518
|
url: http://labs.topsy.com
|
489
|
-
-
|
519
|
+
-
|
490
520
|
user_agent: Mozilla/5.0 (Linux; Android 6.0; Nexus 5 Build/MRA58N) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/51.0.5668.1446 Mobile Safari/537.36; Bytespider;bytespider@bytedance.com
|
491
521
|
bot:
|
492
522
|
name: Bytespider
|
@@ -495,7 +525,7 @@
|
|
495
525
|
producer:
|
496
526
|
name: ByteDance Ltd.
|
497
527
|
url: https://bytedance.com/
|
498
|
-
-
|
528
|
+
-
|
499
529
|
user_agent: CATExplorador/1.0beta (sistemes at domini dot cat; http://domini.cat/catexplorador.html)
|
500
530
|
bot:
|
501
531
|
name: CATExplorador
|
@@ -504,7 +534,7 @@
|
|
504
534
|
producer:
|
505
535
|
name: Fundació puntCAT
|
506
536
|
url: https://fundacio.cat/ca/domini/
|
507
|
-
-
|
537
|
+
-
|
508
538
|
user_agent: Mozilla/5.0 (compatible; CareerBot/1.1; +http://www.career-x.de/bot.html)
|
509
539
|
bot:
|
510
540
|
name: CareerBot
|
@@ -513,7 +543,7 @@
|
|
513
543
|
producer:
|
514
544
|
name: career-x GmbH
|
515
545
|
url: http://www.career-x.de
|
516
|
-
-
|
546
|
+
-
|
517
547
|
user_agent: Castro 2, Episode Duration Lookup
|
518
548
|
bot:
|
519
549
|
name: Castro 2
|
@@ -522,7 +552,7 @@
|
|
522
552
|
producer:
|
523
553
|
name: Supertop
|
524
554
|
url: http://supertop.co
|
525
|
-
-
|
555
|
+
-
|
526
556
|
user_agent: Cliqzbot/0.1 (+http://cliqz.com/company/cliqzbot)
|
527
557
|
bot:
|
528
558
|
name: Cliqzbot
|
@@ -531,7 +561,7 @@
|
|
531
561
|
producer:
|
532
562
|
name: 10betterpages GmbH
|
533
563
|
url: http://cliqz.com
|
534
|
-
-
|
564
|
+
-
|
535
565
|
user_agent: Mozilla/5.0 (compatible; Cloudflare-AMP/1.0; +https://amp.cloudflare.com/doc/fetcher.html) AppleWebKit/534.34
|
536
566
|
bot:
|
537
567
|
name: CloudFlare AMP Fetcher
|
@@ -540,7 +570,7 @@
|
|
540
570
|
producer:
|
541
571
|
name: CloudFlare
|
542
572
|
url: http://www.cloudflare.com
|
543
|
-
-
|
573
|
+
-
|
544
574
|
user_agent: Mozilla/5.0 (compatible; CloudFlare-AlwaysOnline/1.0; +http://www.cloudflare.com/always-online) AppleWebKit/534.34
|
545
575
|
bot:
|
546
576
|
name: CloudFlare Always Online
|
@@ -549,7 +579,7 @@
|
|
549
579
|
producer:
|
550
580
|
name: CloudFlare
|
551
581
|
url: http://www.cloudflare.com
|
552
|
-
-
|
582
|
+
-
|
553
583
|
user_agent: collectd/5.5.1
|
554
584
|
bot:
|
555
585
|
name: Collectd
|
@@ -558,7 +588,7 @@
|
|
558
588
|
producer:
|
559
589
|
name: Collectd
|
560
590
|
url: https://collectd.org/
|
561
|
-
-
|
591
|
+
-
|
562
592
|
user_agent: CommaFeed/1.0 (http://www.commafeed.com)
|
563
593
|
bot:
|
564
594
|
name: CommaFeed
|
@@ -567,79 +597,79 @@
|
|
567
597
|
producer:
|
568
598
|
name: ""
|
569
599
|
url: ""
|
570
|
-
-
|
600
|
+
-
|
571
601
|
user_agent: coccocbot-web/1.0 (+http://help.coccoc.com/searchengine)
|
572
602
|
bot:
|
573
603
|
name: Cốc Cốc Bot
|
574
|
-
category: Search bot
|
575
604
|
url: https://help.coccoc.com/en/search-engine/coccoc-robots
|
605
|
+
category: Search bot
|
576
606
|
producer:
|
577
607
|
name: Cốc Cốc
|
578
608
|
url: https://coccoc.com/
|
579
|
-
-
|
609
|
+
-
|
580
610
|
user_agent: Mozilla/5.0 (compatible; coccoc/1.0; +http://help.coccoc.com/)
|
581
611
|
bot:
|
582
612
|
name: Cốc Cốc Bot
|
583
|
-
category: Search bot
|
584
613
|
url: https://help.coccoc.com/en/search-engine/coccoc-robots
|
614
|
+
category: Search bot
|
585
615
|
producer:
|
586
616
|
name: Cốc Cốc
|
587
617
|
url: https://coccoc.com/
|
588
|
-
-
|
618
|
+
-
|
589
619
|
user_agent: Mozilla/5.0 (compatible; coccocbot-ads/1.0; +http://help.coccoc.com/searchengine)
|
590
620
|
bot:
|
591
621
|
name: Cốc Cốc Bot
|
592
|
-
category: Search bot
|
593
622
|
url: https://help.coccoc.com/en/search-engine/coccoc-robots
|
623
|
+
category: Search bot
|
594
624
|
producer:
|
595
625
|
name: Cốc Cốc
|
596
626
|
url: https://coccoc.com/
|
597
|
-
-
|
627
|
+
-
|
598
628
|
user_agent: Mozilla/5.0 (compatible; coccocbot-fast/1.0; +http://help.coccoc.com/searchengine)
|
599
629
|
bot:
|
600
630
|
name: Cốc Cốc Bot
|
601
|
-
category: Search bot
|
602
631
|
url: https://help.coccoc.com/en/search-engine/coccoc-robots
|
632
|
+
category: Search bot
|
603
633
|
producer:
|
604
634
|
name: Cốc Cốc
|
605
635
|
url: https://coccoc.com/
|
606
|
-
-
|
636
|
+
-
|
607
637
|
user_agent: Mozilla/5.0 (compatible; coccocbot-image/1.0; +http://help.coccoc.com/searchengine)
|
608
638
|
bot:
|
609
639
|
name: Cốc Cốc Bot
|
610
|
-
category: Search bot
|
611
640
|
url: https://help.coccoc.com/en/search-engine/coccoc-robots
|
641
|
+
category: Search bot
|
612
642
|
producer:
|
613
643
|
name: Cốc Cốc
|
614
644
|
url: https://coccoc.com/
|
615
|
-
-
|
645
|
+
-
|
616
646
|
user_agent: Mozilla/5.0 (compatible; coccocbot-shopping/1.0; +http://help.coccoc.com/searchengine)
|
617
647
|
bot:
|
618
648
|
name: Cốc Cốc Bot
|
619
|
-
category: Search bot
|
620
649
|
url: https://help.coccoc.com/en/search-engine/coccoc-robots
|
650
|
+
category: Search bot
|
621
651
|
producer:
|
622
652
|
name: Cốc Cốc
|
623
653
|
url: https://coccoc.com/
|
624
|
-
-
|
654
|
+
-
|
625
655
|
user_agent: Mozilla/5.0 (compatible; coccocbot-web/1.0; +http://help.coccoc.com/searchengine)
|
626
656
|
bot:
|
627
657
|
name: Cốc Cốc Bot
|
628
|
-
category: Search bot
|
629
658
|
url: https://help.coccoc.com/en/search-engine/coccoc-robots
|
659
|
+
category: Search bot
|
630
660
|
producer:
|
631
661
|
name: Cốc Cốc
|
632
662
|
url: https://coccoc.com/
|
633
|
-
-
|
663
|
+
-
|
634
664
|
user_agent: Mozilla/5.0 (compatible; coccocbot/1.0; +http://help.coccoc.com/searchengine)
|
635
665
|
bot:
|
636
666
|
name: Cốc Cốc Bot
|
637
|
-
category: Search bot
|
638
667
|
url: https://help.coccoc.com/en/search-engine/coccoc-robots
|
668
|
+
category: Search bot
|
639
669
|
producer:
|
640
670
|
name: Cốc Cốc
|
641
671
|
url: https://coccoc.com/
|
642
|
-
-
|
672
|
+
-
|
643
673
|
user_agent: Datadog Agent/5.10.1
|
644
674
|
bot:
|
645
675
|
name: Datadog Agent
|
@@ -648,7 +678,7 @@
|
|
648
678
|
producer:
|
649
679
|
name: Datadog
|
650
680
|
url: https://www.datadoghq.com/
|
651
|
-
-
|
681
|
+
-
|
652
682
|
user_agent: Mozilla/5.0 (X11; Datanyze; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/65.0.3325.181 Safari/537.36
|
653
683
|
bot:
|
654
684
|
name: Datanyze
|
@@ -657,7 +687,7 @@
|
|
657
687
|
producer:
|
658
688
|
name: Datanyze
|
659
689
|
url: https://www.datanyze.com
|
660
|
-
-
|
690
|
+
-
|
661
691
|
user_agent: Mozilla/5.0 (compatible; Dataprovider/6.92; +https://www.dataprovider.com/)
|
662
692
|
bot:
|
663
693
|
name: Dataprovider
|
@@ -666,7 +696,7 @@
|
|
666
696
|
producer:
|
667
697
|
name: Dataprovider B.V.
|
668
698
|
url: https://www.dataprovider.com/
|
669
|
-
-
|
699
|
+
-
|
670
700
|
user_agent: Mozilla/5.0 (compatible; MSIE or Firefox mutant; not on Windows server;) Daumoa/4.0;
|
671
701
|
bot:
|
672
702
|
name: Daum
|
@@ -675,7 +705,7 @@
|
|
675
705
|
producer:
|
676
706
|
name: Daum Communications Corp.
|
677
707
|
url: http://www.kakaocorp.com/main
|
678
|
-
-
|
708
|
+
-
|
679
709
|
user_agent: Mozilla/5.0 (compatible; MSIE or Firefox mutant;) Daum 4.1
|
680
710
|
bot:
|
681
711
|
name: Daum
|
@@ -684,7 +714,7 @@
|
|
684
714
|
producer:
|
685
715
|
name: Daum Communications Corp.
|
686
716
|
url: http://www.kakaocorp.com/main
|
687
|
-
-
|
717
|
+
-
|
688
718
|
user_agent: Mozilla/5.0 (compatible; Dazoobot/0.1; +http://dazoo.fr)
|
689
719
|
bot:
|
690
720
|
name: Dazoobot
|
@@ -693,7 +723,7 @@
|
|
693
723
|
producer:
|
694
724
|
name: DAZOO.FR
|
695
725
|
url: http://dazoo.fr
|
696
|
-
-
|
726
|
+
-
|
697
727
|
user_agent: Mozilla/5.0 (compatible; discobot/1.0; +http://discoveryengine.com/discobot.html)
|
698
728
|
bot:
|
699
729
|
name: Discobot
|
@@ -702,7 +732,7 @@
|
|
702
732
|
producer:
|
703
733
|
name: Discovery Engine
|
704
734
|
url: http://discoveryengine.com
|
705
|
-
-
|
735
|
+
-
|
706
736
|
user_agent: 'Domain Re-Animator Bot (http://domainreanimator.com) - support@domainreanimator.com'
|
707
737
|
bot:
|
708
738
|
name: Domain Re-Animator Bot
|
@@ -711,7 +741,7 @@
|
|
711
741
|
producer:
|
712
742
|
name: Domain Re-Animator, LLC
|
713
743
|
url: http://domainreanimator.com
|
714
|
-
-
|
744
|
+
-
|
715
745
|
user_agent: support@domainreanimator.com
|
716
746
|
bot:
|
717
747
|
name: Domain Re-Animator Bot
|
@@ -720,7 +750,13 @@
|
|
720
750
|
producer:
|
721
751
|
name: Domain Re-Animator, LLC
|
722
752
|
url: http://domainreanimator.com
|
723
|
-
-
|
753
|
+
-
|
754
|
+
user_agent: Mozilla/5.0 (compatible; Domains Project/1.1.0; +https://domainsproject.org)
|
755
|
+
bot:
|
756
|
+
name: Domains Project
|
757
|
+
category: Crawler
|
758
|
+
url: https://domainsproject.org
|
759
|
+
-
|
724
760
|
user_agent: dotbot
|
725
761
|
bot:
|
726
762
|
name: DotBot
|
@@ -729,7 +765,7 @@
|
|
729
765
|
producer:
|
730
766
|
name: SEOmoz, Inc.
|
731
767
|
url: http://moz.com/
|
732
|
-
-
|
768
|
+
-
|
733
769
|
user_agent: DuckDuckBot/1.0; (+http://duckduckgo.com/duckduckbot.html)
|
734
770
|
bot:
|
735
771
|
name: DuckDuckGo Bot
|
@@ -738,7 +774,7 @@
|
|
738
774
|
producer:
|
739
775
|
name: DuckDuckGo
|
740
776
|
url: https://duckduckgo.com/
|
741
|
-
-
|
777
|
+
-
|
742
778
|
user_agent: Mozilla/5.0 (compatible; DuckDuckGo-Favicons-Bot/1.0; +http://duckduckgo.com)
|
743
779
|
bot:
|
744
780
|
name: DuckDuckGo Bot
|
@@ -747,7 +783,7 @@
|
|
747
783
|
producer:
|
748
784
|
name: DuckDuckGo
|
749
785
|
url: https://duckduckgo.com/
|
750
|
-
-
|
786
|
+
-
|
751
787
|
user_agent: EMail Exractor
|
752
788
|
bot:
|
753
789
|
name: EMail Exractor
|
@@ -756,7 +792,7 @@
|
|
756
792
|
producer:
|
757
793
|
name: ""
|
758
794
|
url: ""
|
759
|
-
-
|
795
|
+
-
|
760
796
|
user_agent: Mozilla/5.0 (compatible; EasouSpider; +http://www.easou.com/search/spider.html)
|
761
797
|
bot:
|
762
798
|
name: Easou Spider
|
@@ -765,7 +801,7 @@
|
|
765
801
|
producer:
|
766
802
|
name: easou ICP
|
767
803
|
url: http://www.easou.com
|
768
|
-
-
|
804
|
+
-
|
769
805
|
user_agent: Mozilla/5.0 (iPhone; U; CPU iPhone OS 3_0 like Mac OS X; en-us; EasouSpider; +http://www.easou.com/search/spider.html)
|
770
806
|
bot:
|
771
807
|
name: Easou Spider
|
@@ -774,7 +810,7 @@
|
|
774
810
|
producer:
|
775
811
|
name: easou ICP
|
776
812
|
url: http://www.easou.com
|
777
|
-
-
|
813
|
+
-
|
778
814
|
user_agent: Mozilla/5.0 (compatible; Embedly/0.2; +http://support.embed.ly/)
|
779
815
|
bot:
|
780
816
|
name: Embedly
|
@@ -783,7 +819,7 @@
|
|
783
819
|
producer:
|
784
820
|
name: A Medium, Corp.
|
785
821
|
url: https://medium.com/
|
786
|
-
-
|
822
|
+
-
|
787
823
|
user_agent: Mozilla/5.0 (compatible; Exabot/3.0 (BiggerBetter); +http://www.exabot.com/go/robot)
|
788
824
|
bot:
|
789
825
|
name: ExaBot
|
@@ -792,7 +828,7 @@
|
|
792
828
|
producer:
|
793
829
|
name: Dassault Systèmes
|
794
830
|
url: http://www.3ds.com
|
795
|
-
-
|
831
|
+
-
|
796
832
|
user_agent: Mozilla/5.0 (compatible; Exabot/3.0; +http://www.exabot.com/go/robot)
|
797
833
|
bot:
|
798
834
|
name: ExaBot
|
@@ -801,7 +837,7 @@
|
|
801
837
|
producer:
|
802
838
|
name: Dassault Systèmes
|
803
839
|
url: http://www.3ds.com
|
804
|
-
-
|
840
|
+
-
|
805
841
|
user_agent: Mozilla/5.0 (compatible; Konqueror/3.5; Linux) KHTML/3.5.5 (like Gecko) (Exabot-Thumbnails)
|
806
842
|
bot:
|
807
843
|
name: ExaBot
|
@@ -810,7 +846,7 @@
|
|
810
846
|
producer:
|
811
847
|
name: Dassault Systèmes
|
812
848
|
url: http://www.3ds.com
|
813
|
-
-
|
849
|
+
-
|
814
850
|
user_agent: ExactSeek Crawler (nutch 1.4)/Nutch-1.4 (ExactSeek Crawler; http://www.exactseek.com)
|
815
851
|
bot:
|
816
852
|
name: ExactSeek Crawler
|
@@ -819,7 +855,7 @@
|
|
819
855
|
producer:
|
820
856
|
name: Jayde Online, Inc.
|
821
857
|
url: http://www.jaydeonlineinc.com
|
822
|
-
-
|
858
|
+
-
|
823
859
|
user_agent: Mozilla/5.0 (compatible; Ezooms/1.0; help@moz.com)
|
824
860
|
bot:
|
825
861
|
name: Ezooms
|
@@ -828,7 +864,7 @@
|
|
828
864
|
producer:
|
829
865
|
name: SEOmoz, Inc.
|
830
866
|
url: http://moz.com/
|
831
|
-
-
|
867
|
+
-
|
832
868
|
user_agent: facebookexternalhit/1.1 (+http://www.facebook.com/externalhit_uatext.php)
|
833
869
|
bot:
|
834
870
|
name: Facebook External Hit
|
@@ -837,7 +873,7 @@
|
|
837
873
|
producer:
|
838
874
|
name: Facebook
|
839
875
|
url: http://www.facebook.com
|
840
|
-
-
|
876
|
+
-
|
841
877
|
user_agent: facebookexternalua
|
842
878
|
bot:
|
843
879
|
name: Facebook External Hit
|
@@ -846,7 +882,7 @@
|
|
846
882
|
producer:
|
847
883
|
name: Facebook
|
848
884
|
url: http://www.facebook.com
|
849
|
-
-
|
885
|
+
-
|
850
886
|
user_agent: facebookplatform/1.0 (+http://developers.facebook.com)
|
851
887
|
bot:
|
852
888
|
name: Facebook External Hit
|
@@ -855,7 +891,7 @@
|
|
855
891
|
producer:
|
856
892
|
name: Facebook
|
857
893
|
url: http://www.facebook.com
|
858
|
-
-
|
894
|
+
-
|
859
895
|
user_agent: Feed Wrangler/1.0 (3 subscribers; feed-id=248559; http://feedwrangler.net; Allow like Gecko)
|
860
896
|
bot:
|
861
897
|
name: Feed Wrangler
|
@@ -864,7 +900,7 @@
|
|
864
900
|
producer:
|
865
901
|
name: 'David Smith & Developing Perspective, LLC'
|
866
902
|
url: https://david-smith.org
|
867
|
-
-
|
903
|
+
-
|
868
904
|
user_agent: FeedBurner/1.0 (http://www.FeedBurner.com)
|
869
905
|
bot:
|
870
906
|
name: FeedBurner
|
@@ -873,7 +909,7 @@
|
|
873
909
|
producer:
|
874
910
|
name: ""
|
875
911
|
url: ""
|
876
|
-
-
|
912
|
+
-
|
877
913
|
user_agent: 'Feedbin - 9 subscribers'
|
878
914
|
bot:
|
879
915
|
name: Feedbin
|
@@ -882,7 +918,7 @@
|
|
882
918
|
producer:
|
883
919
|
name: ""
|
884
920
|
url: ""
|
885
|
-
-
|
921
|
+
-
|
886
922
|
user_agent: Feedly/1.0 (+http://www.feedly.com/fetcher.html; like FeedFetcher-Google)
|
887
923
|
bot:
|
888
924
|
name: Feedly
|
@@ -891,7 +927,7 @@
|
|
891
927
|
producer:
|
892
928
|
name: ""
|
893
929
|
url: ""
|
894
|
-
-
|
930
|
+
-
|
895
931
|
user_agent: FeedlyApp/1.0 (http://www.feedly.com)
|
896
932
|
bot:
|
897
933
|
name: Feedly
|
@@ -900,7 +936,7 @@
|
|
900
936
|
producer:
|
901
937
|
name: ""
|
902
938
|
url: ""
|
903
|
-
-
|
939
|
+
-
|
904
940
|
user_agent: FeedlyBot/1.0 (http://feedly.com)
|
905
941
|
bot:
|
906
942
|
name: Feedly
|
@@ -909,7 +945,7 @@
|
|
909
945
|
producer:
|
910
946
|
name: ""
|
911
947
|
url: ""
|
912
|
-
-
|
948
|
+
-
|
913
949
|
user_agent: MetaFeedly/1.0 (http://www.feedly.com)
|
914
950
|
bot:
|
915
951
|
name: Feedly
|
@@ -918,7 +954,7 @@
|
|
918
954
|
producer:
|
919
955
|
name: ""
|
920
956
|
url: ""
|
921
|
-
-
|
957
|
+
-
|
922
958
|
user_agent: Feedspot http://www.feedspot.com
|
923
959
|
bot:
|
924
960
|
name: Feedspot
|
@@ -927,7 +963,7 @@
|
|
927
963
|
producer:
|
928
964
|
name: ""
|
929
965
|
url: ""
|
930
|
-
-
|
966
|
+
-
|
931
967
|
user_agent: Fever/1.38 (Feed Parser; http://feedafever.com; Allow like Gecko)
|
932
968
|
bot:
|
933
969
|
name: Fever
|
@@ -936,13 +972,13 @@
|
|
936
972
|
producer:
|
937
973
|
name: ""
|
938
974
|
url: ""
|
939
|
-
-
|
975
|
+
-
|
940
976
|
user_agent: Mozilla/5.0 (compatible; Findxbot/1.0; +http://www.findxbot.com)
|
941
977
|
bot:
|
942
978
|
name: Findxbot
|
943
979
|
category: Crawler
|
944
980
|
url: http://www.findxbot.com
|
945
|
-
-
|
981
|
+
-
|
946
982
|
user_agent: Mozilla/5.0 (compatible; FlipboardProxy/1.2; +http://flipboard.com/browserproxy)
|
947
983
|
bot:
|
948
984
|
name: Flipboard
|
@@ -951,7 +987,7 @@
|
|
951
987
|
producer:
|
952
988
|
name: Flipboard
|
953
989
|
url: http://flipboard.com/
|
954
|
-
-
|
990
|
+
-
|
955
991
|
user_agent: Mozilla/5.0 (compatible; FlipboardRSS/1.2; +http://flipboard.com/browserproxy)
|
956
992
|
bot:
|
957
993
|
name: Flipboard
|
@@ -960,19 +996,19 @@
|
|
960
996
|
producer:
|
961
997
|
name: Flipboard
|
962
998
|
url: http://flipboard.com/
|
963
|
-
-
|
999
|
+
-
|
964
1000
|
user_agent: freshrss/0.8-dev (Linux; http://freshrss.org) SimplePie/1.4-dev-FreshRSS
|
965
1001
|
bot:
|
966
1002
|
name: FreshRSS
|
967
1003
|
category: Feed Fetcher
|
968
1004
|
url: https://freshrss.org/
|
969
|
-
-
|
1005
|
+
-
|
970
1006
|
user_agent: FreshRSS/1.12.0 (Linux; https://freshrss.org)
|
971
1007
|
bot:
|
972
1008
|
name: FreshRSS
|
973
1009
|
category: Feed Fetcher
|
974
1010
|
url: https://freshrss.org/
|
975
|
-
-
|
1011
|
+
-
|
976
1012
|
user_agent: Mozilla/5.0 (X11; Linux x86_64; GTmetrix https://gtmetrix.com/) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/75.0.3770.100 Safari/537.36
|
977
1013
|
bot:
|
978
1014
|
name: GTmetrix
|
@@ -981,55 +1017,55 @@
|
|
981
1017
|
producer:
|
982
1018
|
name: Carbon60 Operating Co. Ltd.
|
983
1019
|
url: https://www.carbon60.com/
|
984
|
-
-
|
1020
|
+
-
|
985
1021
|
user_agent: 7Siters/1.07 (+https://7ooo.ru/siters/)
|
986
1022
|
bot:
|
987
1023
|
name: Generic Bot
|
988
|
-
-
|
1024
|
+
-
|
989
1025
|
user_agent: COMODO SSL Checker
|
990
1026
|
bot:
|
991
1027
|
name: Generic Bot
|
992
|
-
-
|
1028
|
+
-
|
993
1029
|
user_agent: help@dataminr.com
|
994
1030
|
bot:
|
995
1031
|
name: Generic Bot
|
996
|
-
-
|
1032
|
+
-
|
997
1033
|
user_agent: 'HybridBot (hybrid.ru/about. If our bot caused problems please contact us. Contact email: m.lyashkov@targetix.net)'
|
998
1034
|
bot:
|
999
1035
|
name: Generic Bot
|
1000
|
-
-
|
1036
|
+
-
|
1001
1037
|
user_agent: 'Mozilla/5.0 (compatible; +centuryb.o.t9[at]gmail.com)'
|
1002
1038
|
bot:
|
1003
1039
|
name: Generic Bot
|
1004
|
-
-
|
1040
|
+
-
|
1005
1041
|
user_agent: Mozilla/5.0 (compatible; +http://tweetedtimes.com)
|
1006
1042
|
bot:
|
1007
1043
|
name: Generic Bot
|
1008
|
-
-
|
1044
|
+
-
|
1009
1045
|
user_agent: Mozilla/5.0 (compatible; Shareaholicbot/2.0; +http://www.shareaholic.com/bot)
|
1010
1046
|
bot:
|
1011
1047
|
name: Generic Bot
|
1012
|
-
-
|
1048
|
+
-
|
1013
1049
|
user_agent: Mozilla/5.0 (compatible; TrendsmapResolver/0.1)
|
1014
1050
|
bot:
|
1015
1051
|
name: Generic Bot
|
1016
|
-
-
|
1052
|
+
-
|
1017
1053
|
user_agent: niki-bot
|
1018
1054
|
bot:
|
1019
1055
|
name: Generic Bot
|
1020
|
-
-
|
1056
|
+
-
|
1021
1057
|
user_agent: PHPCrawl
|
1022
1058
|
bot:
|
1023
1059
|
name: Generic Bot
|
1024
|
-
-
|
1060
|
+
-
|
1025
1061
|
user_agent: robots
|
1026
1062
|
bot:
|
1027
1063
|
name: Generic Bot
|
1028
|
-
-
|
1064
|
+
-
|
1029
1065
|
user_agent: SeopultContentAnalyzer/1.0
|
1030
1066
|
bot:
|
1031
1067
|
name: Generic Bot
|
1032
|
-
-
|
1068
|
+
-
|
1033
1069
|
user_agent: Mozilla/5.0 (compatible; Genieo/1.0 http://www.genieo.com/webfilter.html)
|
1034
1070
|
bot:
|
1035
1071
|
name: Genieo Web filter
|
@@ -1038,7 +1074,7 @@
|
|
1038
1074
|
producer:
|
1039
1075
|
name: Genieo
|
1040
1076
|
url: http://www.genieo.com
|
1041
|
-
-
|
1077
|
+
-
|
1042
1078
|
user_agent: GigablastOpenSource/1.0
|
1043
1079
|
bot:
|
1044
1080
|
name: Gigablast
|
@@ -1047,7 +1083,7 @@
|
|
1047
1083
|
producer:
|
1048
1084
|
name: Matt Wells
|
1049
1085
|
url: http://www.gigablast.com/faq.html
|
1050
|
-
-
|
1086
|
+
-
|
1051
1087
|
user_agent: Mozilla/5.0 (compatible; Gluten Free Crawler/1.0; +http://glutenfreepleasure.com/)
|
1052
1088
|
bot:
|
1053
1089
|
name: Gluten Free Crawler
|
@@ -1056,7 +1092,7 @@
|
|
1056
1092
|
producer:
|
1057
1093
|
name: ""
|
1058
1094
|
url: ""
|
1059
|
-
-
|
1095
|
+
-
|
1060
1096
|
user_agent: Mozilla/5.0 (Windows NT 5.1; rv:11.0) Gecko Firefox/11.0 (via ggpht.com GoogleImageProxy)
|
1061
1097
|
bot:
|
1062
1098
|
name: Gmail Image Proxy
|
@@ -1065,7 +1101,7 @@
|
|
1065
1101
|
producer:
|
1066
1102
|
name: Google Inc.
|
1067
1103
|
url: http://www.google.com
|
1068
|
-
-
|
1104
|
+
-
|
1069
1105
|
user_agent: DoCoMo/2.0 P900i(c100;TB;W24H11) (compatible; ichiro/mobile goo; +http://search.goo.ne.jp/option/use/sub4/sub4-1/)
|
1070
1106
|
bot:
|
1071
1107
|
name: Goo
|
@@ -1074,12 +1110,12 @@
|
|
1074
1110
|
producer:
|
1075
1111
|
name: NTT Resonant
|
1076
1112
|
url: http://goo.ne.jp
|
1077
|
-
-
|
1113
|
+
-
|
1078
1114
|
user_agent: Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/49.0.2623.75 Safari/537.36 Google Favicon
|
1079
1115
|
bot:
|
1080
1116
|
name: Google Favicon
|
1081
1117
|
category: Crawler
|
1082
|
-
-
|
1118
|
+
-
|
1083
1119
|
user_agent: Mozilla/5.0 (iPhone; U; CPU iPhone OS 4_0_1 like Mac OS X; en-us) AppleWebKit/537.4 (KHTML, like Gecko; Google Page Speed Insights) Version/4.0.5 Mobile/8A306 Safari/6531.22.7
|
1084
1120
|
bot:
|
1085
1121
|
name: Google PageSpeed Insights
|
@@ -1088,7 +1124,7 @@
|
|
1088
1124
|
producer:
|
1089
1125
|
name: Google Inc.
|
1090
1126
|
url: http://www.google.com
|
1091
|
-
-
|
1127
|
+
-
|
1092
1128
|
user_agent: Mozilla/5.0 (Windows NT 5.1) AppleWebKit/535.1 (KHTML, like Gecko) Chrome/14.0.835.202 Safari/535.1 google_partner_monitoring FWSzVTDDBz14547302713138T
|
1093
1129
|
bot:
|
1094
1130
|
name: Google Partner Monitoring
|
@@ -1097,7 +1133,7 @@
|
|
1097
1133
|
producer:
|
1098
1134
|
name: Google Inc.
|
1099
1135
|
url: http://www.google.com
|
1100
|
-
-
|
1136
|
+
-
|
1101
1137
|
user_agent: Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko; Google Search Console) Chrome/41.0.2272.118 Safari/537.36
|
1102
1138
|
bot:
|
1103
1139
|
name: Google Search Console
|
@@ -1106,7 +1142,7 @@
|
|
1106
1142
|
producer:
|
1107
1143
|
name: Google Inc.
|
1108
1144
|
url: http://www.google.com
|
1109
|
-
-
|
1145
|
+
-
|
1110
1146
|
user_agent: Google-Structured-Data-Testing-Tool +https://search.google.com/structured-data/testing-tool)
|
1111
1147
|
bot:
|
1112
1148
|
name: Google Structured Data Testing Tool
|
@@ -1115,7 +1151,7 @@
|
|
1115
1151
|
producer:
|
1116
1152
|
name: Google Inc.
|
1117
1153
|
url: http://www.google.com
|
1118
|
-
-
|
1154
|
+
-
|
1119
1155
|
user_agent: AdsBot-Google (+http://www.google.com/adsbot.html)
|
1120
1156
|
bot:
|
1121
1157
|
name: Googlebot
|
@@ -1124,7 +1160,7 @@
|
|
1124
1160
|
producer:
|
1125
1161
|
name: Google Inc.
|
1126
1162
|
url: http://www.google.com
|
1127
|
-
-
|
1163
|
+
-
|
1128
1164
|
user_agent: AdsBot-Google-Mobile (+http://www.google.com/mobile/adsbot.html) Mozilla (iPhone; U; CPU iPhone OS 3 0 like Mac OS X) AppleWebKit (KHTML, like Gecko) Mobile Safari
|
1129
1165
|
bot:
|
1130
1166
|
name: Googlebot
|
@@ -1133,7 +1169,7 @@
|
|
1133
1169
|
producer:
|
1134
1170
|
name: Google Inc.
|
1135
1171
|
url: http://www.google.com
|
1136
|
-
-
|
1172
|
+
-
|
1137
1173
|
user_agent: APIs-Google (+https://developers.google.com/webmasters/APIs-Google.html)
|
1138
1174
|
bot:
|
1139
1175
|
name: Googlebot
|
@@ -1142,7 +1178,7 @@
|
|
1142
1178
|
producer:
|
1143
1179
|
name: Google Inc.
|
1144
1180
|
url: http://www.google.com
|
1145
|
-
-
|
1181
|
+
-
|
1146
1182
|
user_agent: DoCoMo/2.0 N905i(c100;TB;W24H16) (compatible; Googlebot-Mobile/2.1; +http://www.google.com/bot.html)
|
1147
1183
|
bot:
|
1148
1184
|
name: Googlebot
|
@@ -1151,7 +1187,7 @@
|
|
1151
1187
|
producer:
|
1152
1188
|
name: Google Inc.
|
1153
1189
|
url: http://www.google.com
|
1154
|
-
-
|
1190
|
+
-
|
1155
1191
|
user_agent: Feedfetcher-Google; (+http://www.google.com/feedfetcher.html; 19 subscribers; feed-id=13965549748850348809)
|
1156
1192
|
bot:
|
1157
1193
|
name: Googlebot
|
@@ -1160,7 +1196,7 @@
|
|
1160
1196
|
producer:
|
1161
1197
|
name: Google Inc.
|
1162
1198
|
url: http://www.google.com
|
1163
|
-
-
|
1199
|
+
-
|
1164
1200
|
user_agent: Feedfetcher-Google; (+http://www.google.com/feedfetcher.html; 2 subscribers; feed-id=17860707833818568603)
|
1165
1201
|
bot:
|
1166
1202
|
name: Googlebot
|
@@ -1169,7 +1205,7 @@
|
|
1169
1205
|
producer:
|
1170
1206
|
name: Google Inc.
|
1171
1207
|
url: http://www.google.com
|
1172
|
-
-
|
1208
|
+
-
|
1173
1209
|
user_agent: Feedfetcher-Google; (+http://www.google.com/feedfetcher.html; 375 subscribers; feed-id=15381863289700640853)
|
1174
1210
|
bot:
|
1175
1211
|
name: Googlebot
|
@@ -1178,7 +1214,7 @@
|
|
1178
1214
|
producer:
|
1179
1215
|
name: Google Inc.
|
1180
1216
|
url: http://www.google.com
|
1181
|
-
-
|
1217
|
+
-
|
1182
1218
|
user_agent: Google-AdWords-Express
|
1183
1219
|
bot:
|
1184
1220
|
name: Googlebot
|
@@ -1187,7 +1223,7 @@
|
|
1187
1223
|
producer:
|
1188
1224
|
name: Google Inc.
|
1189
1225
|
url: http://www.google.com
|
1190
|
-
-
|
1226
|
+
-
|
1191
1227
|
user_agent: Google-Adwords-Instant (+http://www.google.com/adsbot.html)
|
1192
1228
|
bot:
|
1193
1229
|
name: Googlebot
|
@@ -1196,7 +1232,7 @@
|
|
1196
1232
|
producer:
|
1197
1233
|
name: Google Inc.
|
1198
1234
|
url: http://www.google.com
|
1199
|
-
-
|
1235
|
+
-
|
1200
1236
|
user_agent: Google-speakr
|
1201
1237
|
bot:
|
1202
1238
|
name: Googlebot
|
@@ -1205,7 +1241,7 @@
|
|
1205
1241
|
producer:
|
1206
1242
|
name: Google Inc.
|
1207
1243
|
url: http://www.google.com
|
1208
|
-
-
|
1244
|
+
-
|
1209
1245
|
user_agent: Googlebot (gocrawl v0.4)
|
1210
1246
|
bot:
|
1211
1247
|
name: Googlebot
|
@@ -1214,7 +1250,7 @@
|
|
1214
1250
|
producer:
|
1215
1251
|
name: Google Inc.
|
1216
1252
|
url: http://www.google.com
|
1217
|
-
-
|
1253
|
+
-
|
1218
1254
|
user_agent: Googlebot-Image/1.0
|
1219
1255
|
bot:
|
1220
1256
|
name: Googlebot
|
@@ -1223,7 +1259,7 @@
|
|
1223
1259
|
producer:
|
1224
1260
|
name: Google Inc.
|
1225
1261
|
url: http://www.google.com
|
1226
|
-
-
|
1262
|
+
-
|
1227
1263
|
user_agent: Googlebot-News (2.3.3, ruby 1.9.3 (2013-11-22))
|
1228
1264
|
bot:
|
1229
1265
|
name: Googlebot
|
@@ -1232,7 +1268,7 @@
|
|
1232
1268
|
producer:
|
1233
1269
|
name: Google Inc.
|
1234
1270
|
url: http://www.google.com
|
1235
|
-
-
|
1271
|
+
-
|
1236
1272
|
user_agent: Googlebot-Video/1.0
|
1237
1273
|
bot:
|
1238
1274
|
name: Googlebot
|
@@ -1241,7 +1277,7 @@
|
|
1241
1277
|
producer:
|
1242
1278
|
name: Google Inc.
|
1243
1279
|
url: http://www.google.com
|
1244
|
-
-
|
1280
|
+
-
|
1245
1281
|
user_agent: Googlebot/2.1 (http://www.googlebot.com/bot.html)
|
1246
1282
|
bot:
|
1247
1283
|
name: Googlebot
|
@@ -1250,7 +1286,7 @@
|
|
1250
1286
|
producer:
|
1251
1287
|
name: Google Inc.
|
1252
1288
|
url: http://www.google.com
|
1253
|
-
-
|
1289
|
+
-
|
1254
1290
|
user_agent: Googlebot/Nutch-1.7
|
1255
1291
|
bot:
|
1256
1292
|
name: Googlebot
|
@@ -1259,7 +1295,7 @@
|
|
1259
1295
|
producer:
|
1260
1296
|
name: Google Inc.
|
1261
1297
|
url: http://www.google.com
|
1262
|
-
-
|
1298
|
+
-
|
1263
1299
|
user_agent: GoogleProducer; (+http://goo.gl/7y4SX)
|
1264
1300
|
bot:
|
1265
1301
|
name: Googlebot
|
@@ -1268,7 +1304,7 @@
|
|
1268
1304
|
producer:
|
1269
1305
|
name: Google Inc.
|
1270
1306
|
url: http://www.google.com
|
1271
|
-
-
|
1307
|
+
-
|
1272
1308
|
user_agent: Mediapartners-Google
|
1273
1309
|
bot:
|
1274
1310
|
name: Googlebot
|
@@ -1277,7 +1313,7 @@
|
|
1277
1313
|
producer:
|
1278
1314
|
name: Google Inc.
|
1279
1315
|
url: http://www.google.com
|
1280
|
-
-
|
1316
|
+
-
|
1281
1317
|
user_agent: Mozilla/5.0 (compatible) Feedfetcher-Google;(+http://www.google.com/feedfetcher.html)
|
1282
1318
|
bot:
|
1283
1319
|
name: Googlebot
|
@@ -1286,7 +1322,7 @@
|
|
1286
1322
|
producer:
|
1287
1323
|
name: Google Inc.
|
1288
1324
|
url: http://www.google.com
|
1289
|
-
-
|
1325
|
+
-
|
1290
1326
|
user_agent: Mozilla/5.0 (compatible; Google-Youtube-Links)
|
1291
1327
|
bot:
|
1292
1328
|
name: Googlebot
|
@@ -1295,7 +1331,7 @@
|
|
1295
1331
|
producer:
|
1296
1332
|
name: Google Inc.
|
1297
1333
|
url: http://www.google.com
|
1298
|
-
-
|
1334
|
+
-
|
1299
1335
|
user_agent: Mozilla/5.0 (compatible; Googlebot/2.1; +http://www.google.com/bot.html)
|
1300
1336
|
bot:
|
1301
1337
|
name: Googlebot
|
@@ -1304,7 +1340,7 @@
|
|
1304
1340
|
producer:
|
1305
1341
|
name: Google Inc.
|
1306
1342
|
url: http://www.google.com
|
1307
|
-
-
|
1343
|
+
-
|
1308
1344
|
user_agent: Mozilla/5.0 (en-US) AppleWebKit/537.36 (KHTML, like Gecko; Google-Assess) Chrome/34.0.1847.116 Safari/537.36
|
1309
1345
|
bot:
|
1310
1346
|
name: Googlebot
|
@@ -1313,7 +1349,7 @@
|
|
1313
1349
|
producer:
|
1314
1350
|
name: Google Inc.
|
1315
1351
|
url: http://www.google.com
|
1316
|
-
-
|
1352
|
+
-
|
1317
1353
|
user_agent: Mozilla/5.0 (en-us) AppleWebKit/537.36(KHTML, like Gecko; Google-Adwords-DisplayAds-WebRender;) Chrome/41.0.2272.118Safari/537.36
|
1318
1354
|
bot:
|
1319
1355
|
name: Googlebot
|
@@ -1322,7 +1358,7 @@
|
|
1322
1358
|
producer:
|
1323
1359
|
name: Google Inc.
|
1324
1360
|
url: http://www.google.com
|
1325
|
-
-
|
1361
|
+
-
|
1326
1362
|
user_agent: Mozilla/5.0 (iPhone; CPU iPhone OS 6_0 like Mac OS X) AppleWebKit/536.26 (KHTML, like Gecko) Version/6.0 Mobile/10A5376e Safari/8536.25 (compatible; Googlebot-Mobile/2.1; +http://www.google.com/bot.html)
|
1327
1363
|
bot:
|
1328
1364
|
name: Googlebot
|
@@ -1331,7 +1367,7 @@
|
|
1331
1367
|
producer:
|
1332
1368
|
name: Google Inc.
|
1333
1369
|
url: http://www.google.com
|
1334
|
-
-
|
1370
|
+
-
|
1335
1371
|
user_agent: Mozilla/5.0 (Linux; Android 4.0.4; Galaxy Nexus Build/IMM76B) AppleWebKit/537.36 (KHTML, like Gecko; Google-Publisher-Plugin) Chrome/27.0.1453 Mobile Safari/537.36
|
1336
1372
|
bot:
|
1337
1373
|
name: Googlebot
|
@@ -1340,7 +1376,7 @@
|
|
1340
1376
|
producer:
|
1341
1377
|
name: Google Inc.
|
1342
1378
|
url: http://www.google.com
|
1343
|
-
-
|
1379
|
+
-
|
1344
1380
|
user_agent: Mozilla/5.0 (Linux; Android 6.0.1; Nexus 5X Build/MMB29P) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/41.0.2272.96 Mobile Safari/537.36 (compatible; Google-AMPHTML)
|
1345
1381
|
bot:
|
1346
1382
|
name: Googlebot
|
@@ -1349,7 +1385,7 @@
|
|
1349
1385
|
producer:
|
1350
1386
|
name: Google Inc.
|
1351
1387
|
url: http://www.google.com
|
1352
|
-
-
|
1388
|
+
-
|
1353
1389
|
user_agent: Mozilla/5.0 (Linux; Android 6.0.1; Nexus 5X Build/MMB29P) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/41.0.2272.96 Mobile Safari/537.36 (compatible; Google-Read-Aloud; +https://support.google.com/webmasters/answer/1061943)
|
1354
1390
|
bot:
|
1355
1391
|
name: Googlebot
|
@@ -1358,7 +1394,7 @@
|
|
1358
1394
|
producer:
|
1359
1395
|
name: Google Inc.
|
1360
1396
|
url: http://www.google.com
|
1361
|
-
-
|
1397
|
+
-
|
1362
1398
|
user_agent: Mozilla/5.0 (Linux; Android 8.0; Pixel 2 Build/OPD3.170816.012; DuplexWeb-Google/1.0) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/74.0.3729.131 Mobile Safari/537.36
|
1363
1399
|
bot:
|
1364
1400
|
name: Googlebot
|
@@ -1367,7 +1403,7 @@
|
|
1367
1403
|
producer:
|
1368
1404
|
name: Google Inc.
|
1369
1405
|
url: http://www.google.com
|
1370
|
-
-
|
1406
|
+
-
|
1371
1407
|
user_agent: Mozilla/5.0 (Windows NT 6.1; rv:6.0) Gecko/20110814 Firefox/6.0 Google (+https://developers.google.com/+/web/snippet/)
|
1372
1408
|
bot:
|
1373
1409
|
name: Googlebot
|
@@ -1376,7 +1412,7 @@
|
|
1376
1412
|
producer:
|
1377
1413
|
name: Google Inc.
|
1378
1414
|
url: http://www.google.com
|
1379
|
-
-
|
1415
|
+
-
|
1380
1416
|
user_agent: Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/27.0.1453 Safari/537.36 (compatible; Google-HotelAdsVerifier/2.0)
|
1381
1417
|
bot:
|
1382
1418
|
name: Googlebot
|
@@ -1385,7 +1421,7 @@
|
|
1385
1421
|
producer:
|
1386
1422
|
name: Google Inc.
|
1387
1423
|
url: http://www.google.com
|
1388
|
-
-
|
1424
|
+
-
|
1389
1425
|
user_agent: Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko; Google Web Preview) Chrome/27.0.1453 Safari/537.36
|
1390
1426
|
bot:
|
1391
1427
|
name: Googlebot
|
@@ -1394,7 +1430,7 @@
|
|
1394
1430
|
producer:
|
1395
1431
|
name: Google Inc.
|
1396
1432
|
url: http://www.google.com
|
1397
|
-
-
|
1433
|
+
-
|
1398
1434
|
user_agent: Mozilla/5.0 AppleWebKit/537.36 (KHTML, like Gecko) Chrome/41.0.2272.118 Safari/537.36 (compatible; Google-Shopping-Quality +http://www.google.com/merchants/tos/extend/DE/tos.html)
|
1399
1435
|
bot:
|
1400
1436
|
name: Googlebot
|
@@ -1403,7 +1439,7 @@
|
|
1403
1439
|
producer:
|
1404
1440
|
name: Google Inc.
|
1405
1441
|
url: http://www.google.com
|
1406
|
-
-
|
1442
|
+
-
|
1407
1443
|
user_agent: Mozilla/5.0 AppleWebKit/537.36 (KHTML, like Gecko; compatible; Googlebot/2.1; +http://www.google.com/bot.html) Safari/537.36
|
1408
1444
|
bot:
|
1409
1445
|
name: Googlebot
|
@@ -1412,7 +1448,7 @@
|
|
1412
1448
|
producer:
|
1413
1449
|
name: Google Inc.
|
1414
1450
|
url: http://www.google.com
|
1415
|
-
-
|
1451
|
+
-
|
1416
1452
|
user_agent: SAMSUNG-SGH-E250/1.0 Profile/MIDP-2.0 Configuration/CLDC-1.1 UP.Browser/6.2.3.3.c.1.101 (GUI) MMP/2.0 (compatible; Googlebot-Mobile/2.1; +http://www.google.com/bot.html)
|
1417
1453
|
bot:
|
1418
1454
|
name: Googlebot
|
@@ -1421,7 +1457,13 @@
|
|
1421
1457
|
producer:
|
1422
1458
|
name: Google Inc.
|
1423
1459
|
url: http://www.google.com
|
1424
|
-
-
|
1460
|
+
-
|
1461
|
+
user_agent: Grammarly/1.0 (http://www.grammarly.com)
|
1462
|
+
bot:
|
1463
|
+
name: Grammarly
|
1464
|
+
category: Service bot
|
1465
|
+
url: https://www.grammarly.com
|
1466
|
+
-
|
1425
1467
|
user_agent: Mozilla/5.0 (compatible; GrapeshotCrawler/2.0; +https://www.grapeshot.com/crawler/)
|
1426
1468
|
bot:
|
1427
1469
|
name: Grapeshot
|
@@ -1430,7 +1472,7 @@
|
|
1430
1472
|
producer:
|
1431
1473
|
name: Grapeshot
|
1432
1474
|
url: https://www.grapeshot.com
|
1433
|
-
-
|
1475
|
+
-
|
1434
1476
|
user_agent: Mozilla/5.0 (iPhone; CPU iPhone OS 8_3 like Mac OS X) AppleWebKit/600.1.4 (KHTML, like Gecko) Version/8.0 Mobile/12F70 Safari/600.1. 4 (compatible; GrapeshotCrawler/2.0; +https://www.grapeshot.com/crawler/)
|
1435
1477
|
bot:
|
1436
1478
|
name: Grapeshot
|
@@ -1439,7 +1481,7 @@
|
|
1439
1481
|
producer:
|
1440
1482
|
name: Grapeshot
|
1441
1483
|
url: https://www.grapeshot.com
|
1442
|
-
-
|
1484
|
+
-
|
1443
1485
|
user_agent: HTTPMon/1.0b (http://www.httpmon.com)
|
1444
1486
|
bot:
|
1445
1487
|
name: HTTPMon
|
@@ -1448,7 +1490,7 @@
|
|
1448
1490
|
producer:
|
1449
1491
|
name: towards GmbH
|
1450
1492
|
url: http://www.towards.ch/
|
1451
|
-
-
|
1493
|
+
-
|
1452
1494
|
user_agent: 'flieder - neofonie heritrix/1.14.3 (+http://spider.neofonie.de)'
|
1453
1495
|
bot:
|
1454
1496
|
name: Heritrix
|
@@ -1456,8 +1498,8 @@
|
|
1456
1498
|
url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
|
1457
1499
|
producer:
|
1458
1500
|
name: The Internet Archive
|
1459
|
-
url:
|
1460
|
-
-
|
1501
|
+
url: https://archive.org
|
1502
|
+
-
|
1461
1503
|
user_agent: Mozilla/5.0 (compatible; heritrix/1.14.4 +http://webarhive.nlc.gov.cn)
|
1462
1504
|
bot:
|
1463
1505
|
name: Heritrix
|
@@ -1465,8 +1507,8 @@
|
|
1465
1507
|
url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
|
1466
1508
|
producer:
|
1467
1509
|
name: The Internet Archive
|
1468
|
-
url:
|
1469
|
-
-
|
1510
|
+
url: https://archive.org
|
1511
|
+
-
|
1470
1512
|
user_agent: Mozilla/5.0 (compatible; heritrix/1.14.4 +http://www.dla-marbach.de)
|
1471
1513
|
bot:
|
1472
1514
|
name: Heritrix
|
@@ -1474,8 +1516,8 @@
|
|
1474
1516
|
url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
|
1475
1517
|
producer:
|
1476
1518
|
name: The Internet Archive
|
1477
|
-
url:
|
1478
|
-
-
|
1519
|
+
url: https://archive.org
|
1520
|
+
-
|
1479
1521
|
user_agent: mozilla/5.0 (compatible; heritrix/1.3.0 http://archive.crawler.org)
|
1480
1522
|
bot:
|
1481
1523
|
name: Heritrix
|
@@ -1483,8 +1525,8 @@
|
|
1483
1525
|
url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
|
1484
1526
|
producer:
|
1485
1527
|
name: The Internet Archive
|
1486
|
-
url:
|
1487
|
-
-
|
1528
|
+
url: https://archive.org
|
1529
|
+
-
|
1488
1530
|
user_agent: Mozilla/5.0 (compatible; heritrix/3.1.1 +http://www.baidu.com)
|
1489
1531
|
bot:
|
1490
1532
|
name: Heritrix
|
@@ -1492,8 +1534,8 @@
|
|
1492
1534
|
url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
|
1493
1535
|
producer:
|
1494
1536
|
name: The Internet Archive
|
1495
|
-
url:
|
1496
|
-
-
|
1537
|
+
url: https://archive.org
|
1538
|
+
-
|
1497
1539
|
user_agent: Mozilla/5.0 (compatible; heritrix/3.1.1 +http://www.run4dom.com)
|
1498
1540
|
bot:
|
1499
1541
|
name: Heritrix
|
@@ -1501,8 +1543,8 @@
|
|
1501
1543
|
url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
|
1502
1544
|
producer:
|
1503
1545
|
name: The Internet Archive
|
1504
|
-
url:
|
1505
|
-
-
|
1546
|
+
url: https://archive.org
|
1547
|
+
-
|
1506
1548
|
user_agent: Mozilla/5.0 (compatible; heritrix/3.1.2-SNAPSHOT-20130207.001528 +http://webarchiv.cz/kontakty/)
|
1507
1549
|
bot:
|
1508
1550
|
name: Heritrix
|
@@ -1510,8 +1552,8 @@
|
|
1510
1552
|
url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
|
1511
1553
|
producer:
|
1512
1554
|
name: The Internet Archive
|
1513
|
-
url:
|
1514
|
-
-
|
1555
|
+
url: https://archive.org
|
1556
|
+
-
|
1515
1557
|
user_agent: Mozilla/5.0 (compatible; worio bot heritrix/1.10.0 +http://worio.com)
|
1516
1558
|
bot:
|
1517
1559
|
name: Heritrix
|
@@ -1519,8 +1561,8 @@
|
|
1519
1561
|
url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
|
1520
1562
|
producer:
|
1521
1563
|
name: The Internet Archive
|
1522
|
-
url:
|
1523
|
-
-
|
1564
|
+
url: https://archive.org
|
1565
|
+
-
|
1524
1566
|
user_agent: Heurekabot-Feed/1.0 (+https://sluzby.heureka.cz/napoveda/heurekabot/)
|
1525
1567
|
bot:
|
1526
1568
|
name: Heureka Feed
|
@@ -1529,16 +1571,16 @@
|
|
1529
1571
|
producer:
|
1530
1572
|
name: Heureka.cz, a.s.
|
1531
1573
|
url: https://www.heureka.cz/
|
1532
|
-
-
|
1574
|
+
-
|
1533
1575
|
user_agent: HubPages V0.2.2 (http://hubpages.com/help/crawlingpolicy)
|
1534
1576
|
bot:
|
1535
1577
|
name: HubPages
|
1536
1578
|
category: Crawler
|
1537
|
-
url:
|
1579
|
+
url: https://hubpages.com/help/crawlingpolicy
|
1538
1580
|
producer:
|
1539
|
-
name: HubPages
|
1540
|
-
url:
|
1541
|
-
-
|
1581
|
+
name: HubPages, Inc.
|
1582
|
+
url: https://discover.hubpages.com/
|
1583
|
+
-
|
1542
1584
|
user_agent: HubSpot Website Grader (web-crawlers@hubspot.com)
|
1543
1585
|
bot:
|
1544
1586
|
name: HubSpot
|
@@ -1546,7 +1588,7 @@
|
|
1546
1588
|
producer:
|
1547
1589
|
name: HubSpot Inc.
|
1548
1590
|
url: https://www.hubspot.com
|
1549
|
-
-
|
1591
|
+
-
|
1550
1592
|
user_agent: ICC-Crawler/2.0 (Mozilla-compatible; ; http://www.nict.go.jp/en/univ-com/plan/crawl.html)
|
1551
1593
|
bot:
|
1552
1594
|
name: ICC-Crawler
|
@@ -1555,7 +1597,7 @@
|
|
1555
1597
|
producer:
|
1556
1598
|
name: ""
|
1557
1599
|
url: ""
|
1558
|
-
-
|
1600
|
+
-
|
1559
1601
|
user_agent: IDG/IT (http://spaziodati.eu/)
|
1560
1602
|
bot:
|
1561
1603
|
name: IDG/IT
|
@@ -1564,7 +1606,7 @@
|
|
1564
1606
|
producer:
|
1565
1607
|
name: SpazioDati S.r.l.
|
1566
1608
|
url: https://spaziodati.eu/
|
1567
|
-
-
|
1609
|
+
-
|
1568
1610
|
user_agent: iisbot/1.0 (+http://www.iis.net/iisbot.html)
|
1569
1611
|
bot:
|
1570
1612
|
name: IIS Site Analysis
|
@@ -1573,7 +1615,7 @@
|
|
1573
1615
|
producer:
|
1574
1616
|
name: Microsoft Corporation
|
1575
1617
|
url: http://www.microsoft.com
|
1576
|
-
-
|
1618
|
+
-
|
1577
1619
|
user_agent: IP-Guide.com Crawler/1.0 (https://ip-guide.com)
|
1578
1620
|
bot:
|
1579
1621
|
name: IP-Guide Crawler
|
@@ -1582,15 +1624,15 @@
|
|
1582
1624
|
producer:
|
1583
1625
|
name: ""
|
1584
1626
|
url: https://ip-guide.com
|
1585
|
-
-
|
1627
|
+
-
|
1586
1628
|
user_agent: Mozilla/5.0 (compatible; ips-agent)
|
1587
1629
|
bot:
|
1588
1630
|
name: IPS Agent
|
1589
|
-
category:
|
1631
|
+
category: Crawler
|
1590
1632
|
producer:
|
1591
1633
|
name: VeriSign, Inc
|
1592
1634
|
url: http://www.verisign.com/
|
1593
|
-
-
|
1635
|
+
-
|
1594
1636
|
user_agent: Kaspersky Lab CFR link resolver cfradmins@kaspersky.com
|
1595
1637
|
bot:
|
1596
1638
|
name: Kaspersky
|
@@ -1599,7 +1641,7 @@
|
|
1599
1641
|
producer:
|
1600
1642
|
name: AO Kaspersky Lab
|
1601
1643
|
url: https://www.kaspersky.com/
|
1602
|
-
-
|
1644
|
+
-
|
1603
1645
|
user_agent: kouio.com RSS reader
|
1604
1646
|
bot:
|
1605
1647
|
name: Kouio
|
@@ -1608,7 +1650,7 @@
|
|
1608
1650
|
producer:
|
1609
1651
|
name: ""
|
1610
1652
|
url: ""
|
1611
|
-
-
|
1653
|
+
-
|
1612
1654
|
user_agent: 'kouio.com RSS reader - 6 subscribers'
|
1613
1655
|
bot:
|
1614
1656
|
name: Kouio
|
@@ -1617,7 +1659,7 @@
|
|
1617
1659
|
producer:
|
1618
1660
|
name: ""
|
1619
1661
|
url: ""
|
1620
|
-
-
|
1662
|
+
-
|
1621
1663
|
user_agent: LCC (+http://corpora.informatik.uni-leipzig.de/crawler_faq.html)
|
1622
1664
|
bot:
|
1623
1665
|
name: LCC
|
@@ -1626,7 +1668,7 @@
|
|
1626
1668
|
producer:
|
1627
1669
|
name: Universität Leipzig
|
1628
1670
|
url: https://www.uni-leipzig.de/
|
1629
|
-
-
|
1671
|
+
-
|
1630
1672
|
user_agent: 'ltx71 - (http://ltx71.com/)'
|
1631
1673
|
bot:
|
1632
1674
|
name: LTX71
|
@@ -1634,7 +1676,7 @@
|
|
1634
1676
|
producer:
|
1635
1677
|
name: ""
|
1636
1678
|
url: ""
|
1637
|
-
-
|
1679
|
+
-
|
1638
1680
|
user_agent: larbin_2.6.3 larbin2.6.3@unspecified.mail
|
1639
1681
|
bot:
|
1640
1682
|
name: Larbin web crawler
|
@@ -1643,7 +1685,7 @@
|
|
1643
1685
|
producer:
|
1644
1686
|
name: ""
|
1645
1687
|
url: ""
|
1646
|
-
-
|
1688
|
+
-
|
1647
1689
|
user_agent: "Mozilla/5.0 (compatible; Let's Encrypt validation server; +https://www.letsencrypt.org)"
|
1648
1690
|
bot:
|
1649
1691
|
name: "Let's Encrypt Validation"
|
@@ -1652,7 +1694,7 @@
|
|
1652
1694
|
producer:
|
1653
1695
|
name: "Let's Encrypt"
|
1654
1696
|
url: https://letsencrypt.org
|
1655
|
-
-
|
1697
|
+
-
|
1656
1698
|
user_agent: Mozilla/5.0 (Linux; Android 6.0.1; Nexus 5 Build/MRA58N) AppleWebKit/537.36(KHTML, like Gecko) Chrome/61.0.3116.0 Mobile Safari/537.36 Chrome-Lighthouse
|
1657
1699
|
bot:
|
1658
1700
|
name: Lighthouse
|
@@ -1661,7 +1703,7 @@
|
|
1661
1703
|
producer:
|
1662
1704
|
name: Lighthouse
|
1663
1705
|
url: https://developers.google.com/web/tools/lighthouse
|
1664
|
-
-
|
1706
|
+
-
|
1665
1707
|
user_agent: linkdex.com/v2.0 and linkdex.com/v2.1
|
1666
1708
|
bot:
|
1667
1709
|
name: Linkdex Bot
|
@@ -1670,7 +1712,7 @@
|
|
1670
1712
|
producer:
|
1671
1713
|
name: Mojeek Ltd.
|
1672
1714
|
url: http://www.mojeek.com
|
1673
|
-
-
|
1715
|
+
-
|
1674
1716
|
user_agent: Mozilla/5.0 (compatible; linkdexbot/2.0; +http://www.linkdex.com/about/bots/)
|
1675
1717
|
bot:
|
1676
1718
|
name: Linkdex Bot
|
@@ -1679,7 +1721,7 @@
|
|
1679
1721
|
producer:
|
1680
1722
|
name: Mojeek Ltd.
|
1681
1723
|
url: http://www.mojeek.com
|
1682
|
-
-
|
1724
|
+
-
|
1683
1725
|
user_agent: Mozilla/5.0 (iPhone; U; CPU iPhone OS 4_1 like Mac OS X; en-us) AppleWebKit/532.9 (KHTML, like Gecko) Version/4.0.5 Mobile/8B117 Safari/6531.22.7 (compatible; linkdexbot-mobile/2.1; +http://www.linkdex.com/about/bots/)
|
1684
1726
|
bot:
|
1685
1727
|
name: Linkdex Bot
|
@@ -1688,7 +1730,7 @@
|
|
1688
1730
|
producer:
|
1689
1731
|
name: Mojeek Ltd.
|
1690
1732
|
url: http://www.mojeek.com
|
1691
|
-
-
|
1733
|
+
-
|
1692
1734
|
user_agent: LinkedInBot/1.0 (compatible; Mozilla/5.0; Jakarta Commons-HttpClient/3.1 +http://www.linkedin.com)
|
1693
1735
|
bot:
|
1694
1736
|
name: LinkedIn Bot
|
@@ -1697,7 +1739,7 @@
|
|
1697
1739
|
producer:
|
1698
1740
|
name: LinkedIn
|
1699
1741
|
url: http://www.linkedin.com
|
1700
|
-
-
|
1742
|
+
-
|
1701
1743
|
user_agent: Mozilla/5.0 (compatible; MJ12bot/v1.4.4; http://www.majestic12.co.uk/bot.php?+)
|
1702
1744
|
bot:
|
1703
1745
|
name: MJ12 Bot
|
@@ -1706,7 +1748,7 @@
|
|
1706
1748
|
producer:
|
1707
1749
|
name: Majestic-12
|
1708
1750
|
url: http://majestic12.co.uk
|
1709
|
-
-
|
1751
|
+
-
|
1710
1752
|
user_agent: magpie-crawler/1.1 (U; Linux amd64; en-GB; +http://www.brandwatch.net)
|
1711
1753
|
bot:
|
1712
1754
|
name: Magpie-Crawler
|
@@ -1715,7 +1757,7 @@
|
|
1715
1757
|
producer:
|
1716
1758
|
name: Brandwatch
|
1717
1759
|
url: http://www.brandwatch.com
|
1718
|
-
-
|
1760
|
+
-
|
1719
1761
|
user_agent: MagpieRSS/0.72 (+http://magpierss.sf.net)
|
1720
1762
|
bot:
|
1721
1763
|
name: MagpieRSS
|
@@ -1724,7 +1766,7 @@
|
|
1724
1766
|
producer:
|
1725
1767
|
name: ""
|
1726
1768
|
url: ""
|
1727
|
-
-
|
1769
|
+
-
|
1728
1770
|
user_agent: Mozilla/5.0 (compatible; Linux x86_64; Mail.RU_Bot/2.0; +http://go.mail.ru/help/robots)
|
1729
1771
|
bot:
|
1730
1772
|
name: Mail.Ru Bot
|
@@ -1733,7 +1775,7 @@
|
|
1733
1775
|
producer:
|
1734
1776
|
name: Mail.Ru Group
|
1735
1777
|
url: http://corp.mail.ru
|
1736
|
-
-
|
1778
|
+
-
|
1737
1779
|
user_agent: Mozilla/5.0 (compatible; Linux x86_64; Mail.RU_Bot/Fast/2.0; +http://go.mail.ru/help/robots)
|
1738
1780
|
bot:
|
1739
1781
|
name: Mail.Ru Bot
|
@@ -1742,17 +1784,17 @@
|
|
1742
1784
|
producer:
|
1743
1785
|
name: Mail.Ru Group
|
1744
1786
|
url: http://corp.mail.ru
|
1745
|
-
-
|
1787
|
+
-
|
1746
1788
|
user_agent: http.rb/2.2.2 (Mastodon/1.6.1; +https://mathtod.online/)
|
1747
1789
|
bot:
|
1748
1790
|
name: Mastodon Bot
|
1749
1791
|
category: Social Media Agent
|
1750
|
-
-
|
1792
|
+
-
|
1751
1793
|
user_agent: http.rb/3.2.0 (Mastodon/2.4.3; +https://uwu.social/)
|
1752
1794
|
bot:
|
1753
1795
|
name: Mastodon Bot
|
1754
1796
|
category: Social Media Agent
|
1755
|
-
-
|
1797
|
+
-
|
1756
1798
|
user_agent: Mozilla/5.0 (compatible; meanpathbot/1.0; +http://www.meanpath.com/meanpathbot.html)
|
1757
1799
|
bot:
|
1758
1800
|
name: Meanpath Bot
|
@@ -1761,13 +1803,13 @@
|
|
1761
1803
|
producer:
|
1762
1804
|
name: Meanpath
|
1763
1805
|
url: http://www.meanpath.com
|
1764
|
-
-
|
1806
|
+
-
|
1765
1807
|
user_agent: MetaInspector/5.4.0 (+https://github.com/jaimeiniesta/metainspector)
|
1766
1808
|
bot:
|
1767
1809
|
name: MetaInspector
|
1768
1810
|
category: Crawler
|
1769
1811
|
url: https://github.com/jaimeiniesta/metainspector
|
1770
|
-
-
|
1812
|
+
-
|
1771
1813
|
user_agent: Mozilla/5.0 (compatible; MetaJobBot; http://www.metajob.de/crawler)
|
1772
1814
|
bot:
|
1773
1815
|
name: MetaJobBot
|
@@ -1776,7 +1818,7 @@
|
|
1776
1818
|
producer:
|
1777
1819
|
name: MetaJob
|
1778
1820
|
url: http://www.metajob.at
|
1779
|
-
-
|
1821
|
+
-
|
1780
1822
|
user_agent: Mozilla/5.0 (compatible; MixrankBot; crawler@mixrank.com)
|
1781
1823
|
bot:
|
1782
1824
|
name: Mixrank Bot
|
@@ -1785,7 +1827,7 @@
|
|
1785
1827
|
producer:
|
1786
1828
|
name: Online Media Group, Inc.
|
1787
1829
|
url: ""
|
1788
|
-
-
|
1830
|
+
-
|
1789
1831
|
user_agent: Mnogosearch-3.1.21
|
1790
1832
|
bot:
|
1791
1833
|
name: Mnogosearch
|
@@ -1794,7 +1836,7 @@
|
|
1794
1836
|
producer:
|
1795
1837
|
name: Lavtech.Com Corp.
|
1796
1838
|
url: ""
|
1797
|
-
-
|
1839
|
+
-
|
1798
1840
|
user_agent: Mozilla/5.0 (compatible; MojeekBot/0.6; http://www.mojeek.com/bot.html)
|
1799
1841
|
bot:
|
1800
1842
|
name: MojeekBot
|
@@ -1803,7 +1845,7 @@
|
|
1803
1845
|
producer:
|
1804
1846
|
name: Mojeek Ltd.
|
1805
1847
|
url: http://www.mojeek.com
|
1806
|
-
-
|
1848
|
+
-
|
1807
1849
|
user_agent: 'Mozilla/5.0 (compatible; www.monitor.us - free monitoring service; http://www.monitor.us)'
|
1808
1850
|
bot:
|
1809
1851
|
name: Monitor.Us
|
@@ -1812,7 +1854,7 @@
|
|
1812
1854
|
producer:
|
1813
1855
|
name: Monitor.Us
|
1814
1856
|
url: http://www.monitor.us
|
1815
|
-
-
|
1857
|
+
-
|
1816
1858
|
user_agent: munin/2.0.30-1 (libwww-perl/6.15)
|
1817
1859
|
bot:
|
1818
1860
|
name: Munin
|
@@ -1821,7 +1863,7 @@
|
|
1821
1863
|
producer:
|
1822
1864
|
name: Munin
|
1823
1865
|
url: http://munin-monitoring.org/
|
1824
|
-
-
|
1866
|
+
-
|
1825
1867
|
user_agent: munin/http_loadtime
|
1826
1868
|
bot:
|
1827
1869
|
name: Munin
|
@@ -1830,7 +1872,7 @@
|
|
1830
1872
|
producer:
|
1831
1873
|
name: Munin
|
1832
1874
|
url: http://munin-monitoring.org/
|
1833
|
-
-
|
1875
|
+
-
|
1834
1876
|
user_agent: nlcrawler/1.0 (+http://northernlight.com/)
|
1835
1877
|
bot:
|
1836
1878
|
name: NLCrawler
|
@@ -1839,7 +1881,7 @@
|
|
1839
1881
|
producer:
|
1840
1882
|
name: Northern Light
|
1841
1883
|
url: http://northernlight.com
|
1842
|
-
-
|
1884
|
+
-
|
1843
1885
|
user_agent: check_http/v1.5 (nagios-plugins 1.5)
|
1844
1886
|
bot:
|
1845
1887
|
name: Nagios check_http
|
@@ -1848,7 +1890,7 @@
|
|
1848
1890
|
producer:
|
1849
1891
|
name: Nagios Plugins Development Team
|
1850
1892
|
url: https://nagios.org
|
1851
|
-
-
|
1893
|
+
-
|
1852
1894
|
user_agent: NalezenCzBot/1.0 (http://www.nalezen.cz/about-crawler)
|
1853
1895
|
bot:
|
1854
1896
|
name: NalezenCzBot
|
@@ -1857,11 +1899,11 @@
|
|
1857
1899
|
producer:
|
1858
1900
|
name: Jaroslav Kuboš
|
1859
1901
|
url: ""
|
1860
|
-
-
|
1902
|
+
-
|
1861
1903
|
user_agent: NetLyzer FastProbe
|
1862
1904
|
bot:
|
1863
1905
|
name: NetLyzer FastProbe
|
1864
|
-
-
|
1906
|
+
-
|
1865
1907
|
user_agent: Mozilla/4.0 (compatible; Netcraft Web Server Survey)
|
1866
1908
|
bot:
|
1867
1909
|
name: Netcraft Survey Bot
|
@@ -1870,7 +1912,7 @@
|
|
1870
1912
|
producer:
|
1871
1913
|
name: Netcraft
|
1872
1914
|
url: http://www.netcraft.com
|
1873
|
-
-
|
1915
|
+
-
|
1874
1916
|
user_agent: Mozilla/5.0 (compatible; NetcraftSurveyAgent/1.0; +info@netcraft.com)
|
1875
1917
|
bot:
|
1876
1918
|
name: Netcraft Survey Bot
|
@@ -1879,7 +1921,7 @@
|
|
1879
1921
|
producer:
|
1880
1922
|
name: Netcraft
|
1881
1923
|
url: http://www.netcraft.com
|
1882
|
-
-
|
1924
|
+
-
|
1883
1925
|
user_agent: 'Netcraft SSL Server Survey - contact info@netcraft.com'
|
1884
1926
|
bot:
|
1885
1927
|
name: Netcraft Survey Bot
|
@@ -1888,7 +1930,7 @@
|
|
1888
1930
|
producer:
|
1889
1931
|
name: Netcraft
|
1890
1932
|
url: http://www.netcraft.com
|
1891
|
-
-
|
1933
|
+
-
|
1892
1934
|
user_agent: Netvibes (http://www.netvibes.com)
|
1893
1935
|
bot:
|
1894
1936
|
name: Netvibes
|
@@ -1897,7 +1939,7 @@
|
|
1897
1939
|
producer:
|
1898
1940
|
name: ""
|
1899
1941
|
url: ""
|
1900
|
-
-
|
1942
|
+
-
|
1901
1943
|
user_agent: 'Netvibes (http://www.netvibes.com/; 8 subscribers; feedID: 2244192)'
|
1902
1944
|
bot:
|
1903
1945
|
name: Netvibes
|
@@ -1906,7 +1948,7 @@
|
|
1906
1948
|
producer:
|
1907
1949
|
name: ""
|
1908
1950
|
url: ""
|
1909
|
-
-
|
1951
|
+
-
|
1910
1952
|
user_agent: 'NewsBlur Favicon Fetcher - 7 subscribers - http://www.newsblur.com/site/1948420/analytics-piwik (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)'
|
1911
1953
|
bot:
|
1912
1954
|
name: NewsBlur
|
@@ -1915,7 +1957,7 @@
|
|
1915
1957
|
producer:
|
1916
1958
|
name: ""
|
1917
1959
|
url: ""
|
1918
|
-
-
|
1960
|
+
-
|
1919
1961
|
user_agent: 'NewsBlur Feed Fetcher - 7 subscribers - http://www.newsblur.com/site/1948420/analytics-piwik (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)'
|
1920
1962
|
bot:
|
1921
1963
|
name: NewsBlur
|
@@ -1924,7 +1966,7 @@
|
|
1924
1966
|
producer:
|
1925
1967
|
name: ""
|
1926
1968
|
url: ""
|
1927
|
-
-
|
1969
|
+
-
|
1928
1970
|
user_agent: NewsBlur Feed Finder (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)
|
1929
1971
|
bot:
|
1930
1972
|
name: NewsBlur
|
@@ -1933,7 +1975,7 @@
|
|
1933
1975
|
producer:
|
1934
1976
|
name: ""
|
1935
1977
|
url: ""
|
1936
|
-
-
|
1978
|
+
-
|
1937
1979
|
user_agent: 'NewsBlur Page Fetcher - 7 subscribers - http://www.newsblur.com/site/3966817/analytics-piwik (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)'
|
1938
1980
|
bot:
|
1939
1981
|
name: NewsBlur
|
@@ -1942,7 +1984,7 @@
|
|
1942
1984
|
producer:
|
1943
1985
|
name: ""
|
1944
1986
|
url: ""
|
1945
|
-
-
|
1987
|
+
-
|
1946
1988
|
user_agent: NewsGatorOnline/2.0 (http://www.newsgator.com; 2 subscribers)
|
1947
1989
|
bot:
|
1948
1990
|
name: NewsGator
|
@@ -1951,7 +1993,7 @@
|
|
1951
1993
|
producer:
|
1952
1994
|
name: ""
|
1953
1995
|
url: ""
|
1954
|
-
-
|
1996
|
+
-
|
1955
1997
|
user_agent: Mozilla/5.0 (compatible; Nmap Scripting Engine; https://nmap.org/book/nse.html)
|
1956
1998
|
bot:
|
1957
1999
|
name: Nmap
|
@@ -1960,7 +2002,7 @@
|
|
1960
2002
|
producer:
|
1961
2003
|
name: Nmap
|
1962
2004
|
url: https://nmap.org/
|
1963
|
-
-
|
2005
|
+
-
|
1964
2006
|
user_agent: 5acd734a-1ed3-4a17-ad9d-0b09ae7bc2d2/Nutch-1.7
|
1965
2007
|
bot:
|
1966
2008
|
name: Nutch-based Bot
|
@@ -1968,8 +2010,8 @@
|
|
1968
2010
|
url: https://nutch.apache.org
|
1969
2011
|
producer:
|
1970
2012
|
name: The Apache Software Foundation
|
1971
|
-
url:
|
1972
|
-
-
|
2013
|
+
url: https://www.apache.org/foundation/
|
2014
|
+
-
|
1973
2015
|
user_agent: CB/Nutch-1.7
|
1974
2016
|
bot:
|
1975
2017
|
name: Nutch-based Bot
|
@@ -1977,8 +2019,8 @@
|
|
1977
2019
|
url: https://nutch.apache.org
|
1978
2020
|
producer:
|
1979
2021
|
name: The Apache Software Foundation
|
1980
|
-
url:
|
1981
|
-
-
|
2022
|
+
url: https://www.apache.org/foundation/
|
2023
|
+
-
|
1982
2024
|
user_agent: Mozilla/5.0 (compatible; summers;)/Nutch-1.7
|
1983
2025
|
bot:
|
1984
2026
|
name: Nutch-based Bot
|
@@ -1986,8 +2028,8 @@
|
|
1986
2028
|
url: https://nutch.apache.org
|
1987
2029
|
producer:
|
1988
2030
|
name: The Apache Software Foundation
|
1989
|
-
url:
|
1990
|
-
-
|
2031
|
+
url: https://www.apache.org/foundation/
|
2032
|
+
-
|
1991
2033
|
user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1; zh-CN; rv:1.9.2.8) Firefox/3.6.8/Nutch-1.7
|
1992
2034
|
bot:
|
1993
2035
|
name: Nutch-based Bot
|
@@ -1995,8 +2037,8 @@
|
|
1995
2037
|
url: https://nutch.apache.org
|
1996
2038
|
producer:
|
1997
2039
|
name: The Apache Software Foundation
|
1998
|
-
url:
|
1999
|
-
-
|
2040
|
+
url: https://www.apache.org/foundation/
|
2041
|
+
-
|
2000
2042
|
user_agent: My Nutch Spider/Nutch-1.6
|
2001
2043
|
bot:
|
2002
2044
|
name: Nutch-based Bot
|
@@ -2004,8 +2046,8 @@
|
|
2004
2046
|
url: https://nutch.apache.org
|
2005
2047
|
producer:
|
2006
2048
|
name: The Apache Software Foundation
|
2007
|
-
url:
|
2008
|
-
-
|
2049
|
+
url: https://www.apache.org/foundation/
|
2050
|
+
-
|
2009
2051
|
user_agent: MySpider/Nutch-2.2
|
2010
2052
|
bot:
|
2011
2053
|
name: Nutch-based Bot
|
@@ -2013,8 +2055,8 @@
|
|
2013
2055
|
url: https://nutch.apache.org
|
2014
2056
|
producer:
|
2015
2057
|
name: The Apache Software Foundation
|
2016
|
-
url:
|
2017
|
-
-
|
2058
|
+
url: https://www.apache.org/foundation/
|
2059
|
+
-
|
2018
2060
|
user_agent: Nutch12/Nutch-1.2
|
2019
2061
|
bot:
|
2020
2062
|
name: Nutch-based Bot
|
@@ -2022,8 +2064,8 @@
|
|
2022
2064
|
url: https://nutch.apache.org
|
2023
2065
|
producer:
|
2024
2066
|
name: The Apache Software Foundation
|
2025
|
-
url:
|
2026
|
-
-
|
2067
|
+
url: https://www.apache.org/foundation/
|
2068
|
+
-
|
2027
2069
|
user_agent: NutchSpider/Nutch-1.4
|
2028
2070
|
bot:
|
2029
2071
|
name: Nutch-based Bot
|
@@ -2031,8 +2073,8 @@
|
|
2031
2073
|
url: https://nutch.apache.org
|
2032
2074
|
producer:
|
2033
2075
|
name: The Apache Software Foundation
|
2034
|
-
url:
|
2035
|
-
-
|
2076
|
+
url: https://www.apache.org/foundation/
|
2077
|
+
-
|
2036
2078
|
user_agent: spider/Nutch-1.5.1 (spider; http://www.xxx.com)
|
2037
2079
|
bot:
|
2038
2080
|
name: Nutch-based Bot
|
@@ -2040,8 +2082,8 @@
|
|
2040
2082
|
url: https://nutch.apache.org
|
2041
2083
|
producer:
|
2042
2084
|
name: The Apache Software Foundation
|
2043
|
-
url:
|
2044
|
-
-
|
2085
|
+
url: https://www.apache.org/foundation/
|
2086
|
+
-
|
2045
2087
|
user_agent: Spider/Nutch-2.3-SNAPSHOT (Webcrawler)
|
2046
2088
|
bot:
|
2047
2089
|
name: Nutch-based Bot
|
@@ -2049,8 +2091,8 @@
|
|
2049
2091
|
url: https://nutch.apache.org
|
2050
2092
|
producer:
|
2051
2093
|
name: The Apache Software Foundation
|
2052
|
-
url:
|
2053
|
-
-
|
2094
|
+
url: https://www.apache.org/foundation/
|
2095
|
+
-
|
2054
2096
|
user_agent: testnutch/Nutch-1.8
|
2055
2097
|
bot:
|
2056
2098
|
name: Nutch-based Bot
|
@@ -2058,8 +2100,8 @@
|
|
2058
2100
|
url: https://nutch.apache.org
|
2059
2101
|
producer:
|
2060
2102
|
name: The Apache Software Foundation
|
2061
|
-
url:
|
2062
|
-
-
|
2103
|
+
url: https://www.apache.org/foundation/
|
2104
|
+
-
|
2063
2105
|
user_agent: Your Nutch Spider/Nutch-2.2.1
|
2064
2106
|
bot:
|
2065
2107
|
name: Nutch-based Bot
|
@@ -2067,8 +2109,8 @@
|
|
2067
2109
|
url: https://nutch.apache.org
|
2068
2110
|
producer:
|
2069
2111
|
name: The Apache Software Foundation
|
2070
|
-
url:
|
2071
|
-
-
|
2112
|
+
url: https://www.apache.org/foundation/
|
2113
|
+
-
|
2072
2114
|
user_agent: your sipder name/Nutch-1.7
|
2073
2115
|
bot:
|
2074
2116
|
name: Nutch-based Bot
|
@@ -2076,8 +2118,8 @@
|
|
2076
2118
|
url: https://nutch.apache.org
|
2077
2119
|
producer:
|
2078
2120
|
name: The Apache Software Foundation
|
2079
|
-
url:
|
2080
|
-
-
|
2121
|
+
url: https://www.apache.org/foundation/
|
2122
|
+
-
|
2081
2123
|
user_agent: Nuzzel
|
2082
2124
|
bot:
|
2083
2125
|
name: Nuzzel
|
@@ -2085,11 +2127,11 @@
|
|
2085
2127
|
producer:
|
2086
2128
|
name: Nuzzel
|
2087
2129
|
url: https://www.nuzzel.com/
|
2088
|
-
-
|
2130
|
+
-
|
2089
2131
|
user_agent: Octopus 1.0.2
|
2090
2132
|
bot:
|
2091
2133
|
name: Octopus
|
2092
|
-
-
|
2134
|
+
-
|
2093
2135
|
user_agent: omgili/0.5 +http://omgili.com
|
2094
2136
|
bot:
|
2095
2137
|
name: Omgili bot
|
@@ -2098,7 +2140,7 @@
|
|
2098
2140
|
producer:
|
2099
2141
|
name: Omgili
|
2100
2142
|
url: http://www.omgili.com
|
2101
|
-
-
|
2143
|
+
-
|
2102
2144
|
user_agent: omgilibot/0.3 +http://www.omgili.com/Crawler.html
|
2103
2145
|
bot:
|
2104
2146
|
name: Omgili bot
|
@@ -2107,7 +2149,7 @@
|
|
2107
2149
|
producer:
|
2108
2150
|
name: Omgili
|
2109
2151
|
url: http://www.omgili.com
|
2110
|
-
-
|
2152
|
+
-
|
2111
2153
|
user_agent: Mozilla/5.0 (compatible; spbot/4.0.9; +http://OpenLinkProfiler.org/bot )
|
2112
2154
|
bot:
|
2113
2155
|
name: OpenLinkProfiler
|
@@ -2116,7 +2158,7 @@
|
|
2116
2158
|
producer:
|
2117
2159
|
name: Axandra GmbH
|
2118
2160
|
url: http://www.axandra.com
|
2119
|
-
-
|
2161
|
+
-
|
2120
2162
|
user_agent: OpenWebSpider v0.1.4 (http://www.openwebspider.org/)
|
2121
2163
|
bot:
|
2122
2164
|
name: OpenWebSpider
|
@@ -2125,7 +2167,7 @@
|
|
2125
2167
|
producer:
|
2126
2168
|
name: OpenWebSpider Lab
|
2127
2169
|
url: http://lab.openwebspider.org
|
2128
|
-
-
|
2170
|
+
-
|
2129
2171
|
user_agent: Mozilla/5.0 (compatible; OpenindexSpider; +http://www.openindex.io/en/webmasters/spider.html)
|
2130
2172
|
bot:
|
2131
2173
|
name: Openindex Spider
|
@@ -2134,7 +2176,7 @@
|
|
2134
2176
|
producer:
|
2135
2177
|
name: Openindex B.V.
|
2136
2178
|
url: http://www.openindex.io
|
2137
|
-
-
|
2179
|
+
-
|
2138
2180
|
user_agent: Mozilla/5.0 (compatible; OrangeBot-Collector/2.0; support.orangebot@orange.com)
|
2139
2181
|
bot:
|
2140
2182
|
name: Orange Bot
|
@@ -2143,7 +2185,7 @@
|
|
2143
2185
|
producer:
|
2144
2186
|
name: Orange
|
2145
2187
|
url: http://www.orange.fr
|
2146
|
-
-
|
2188
|
+
-
|
2147
2189
|
user_agent: Mozilla/5.0 (compatible; OrangeBot/2.0; support.orangebot@orange.com)
|
2148
2190
|
bot:
|
2149
2191
|
name: Orange Bot
|
@@ -2152,7 +2194,7 @@
|
|
2152
2194
|
producer:
|
2153
2195
|
name: Orange
|
2154
2196
|
url: http://www.orange.fr
|
2155
|
-
-
|
2197
|
+
-
|
2156
2198
|
user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1; fr; rv:1.8.1) VoilaBot BETA 1.2 (support.voilabot@orange-ftgroup.com)
|
2157
2199
|
bot:
|
2158
2200
|
name: Orange Bot
|
@@ -2161,7 +2203,7 @@
|
|
2161
2203
|
producer:
|
2162
2204
|
name: Orange
|
2163
2205
|
url: http://www.orange.fr
|
2164
|
-
-
|
2206
|
+
-
|
2165
2207
|
user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1;fr;rv:1.8.1) VoilaBotCollector BETA 0.1 (http://www.voila.com/)
|
2166
2208
|
bot:
|
2167
2209
|
name: Orange Bot
|
@@ -2170,7 +2212,7 @@
|
|
2170
2212
|
producer:
|
2171
2213
|
name: Orange
|
2172
2214
|
url: http://www.orange.fr
|
2173
|
-
-
|
2215
|
+
-
|
2174
2216
|
user_agent: Mozilla/5.0 (Java) outbrain
|
2175
2217
|
bot:
|
2176
2218
|
name: Outbrain
|
@@ -2179,7 +2221,7 @@
|
|
2179
2221
|
producer:
|
2180
2222
|
name: Outbrain
|
2181
2223
|
url: http://www.outbrain.com/
|
2182
|
-
-
|
2224
|
+
-
|
2183
2225
|
user_agent: Mozilla/5.0 (compatible; phpservermon/3.1.1; +http://www.phpservermonitor.org)
|
2184
2226
|
bot:
|
2185
2227
|
name: PHP Server Monitor
|
@@ -2188,7 +2230,16 @@
|
|
2188
2230
|
producer:
|
2189
2231
|
name: PHP Server Monitor
|
2190
2232
|
url: http://www.phpservermonitor.org/
|
2191
|
-
-
|
2233
|
+
-
|
2234
|
+
user_agent: Mozilla/5.0 (compatible; PRTG Network Monitor (www.paessler.com); Windows)
|
2235
|
+
bot:
|
2236
|
+
name: PRTG Network Monitor
|
2237
|
+
category: Network Monitor
|
2238
|
+
url: https://www.paessler.com/prtg
|
2239
|
+
producer:
|
2240
|
+
name: Paessler AG
|
2241
|
+
url: https://www.paessler.com
|
2242
|
+
-
|
2192
2243
|
user_agent: Mozilla/5.0 (compatible; PaperLiBot/2.1; http://support.paper.li/entries/20023257-what-is-paper-li)
|
2193
2244
|
bot:
|
2194
2245
|
name: PaperLiBot
|
@@ -2197,13 +2248,19 @@
|
|
2197
2248
|
producer:
|
2198
2249
|
name: Smallrivers SA
|
2199
2250
|
url: http://www.paper.li
|
2200
|
-
-
|
2251
|
+
-
|
2252
|
+
user_agent: Mozilla/5.0 (Linux; Android 7.0;) AppleWebKit/537.36 (KHTML, like Gecko) Mobile Safari/537.36 (compatible; PetalBot;+https://aspiegel.com/petalbot)
|
2253
|
+
bot:
|
2254
|
+
name: Petal Bot
|
2255
|
+
category: Crawler
|
2256
|
+
url: https://aspiegel.com/petalbot
|
2257
|
+
-
|
2201
2258
|
user_agent: phantomas/1.11.0 (PhantomJS/1.9.8; linux x64)
|
2202
2259
|
bot:
|
2203
2260
|
name: Phantomas
|
2204
2261
|
category: Site Monitor
|
2205
2262
|
url: https://github.com/macbre/phantomas
|
2206
|
-
-
|
2263
|
+
-
|
2207
2264
|
user_agent: psbot-page (+http://www.picsearch.com/bot.html)
|
2208
2265
|
bot:
|
2209
2266
|
name: Picsearch bot
|
@@ -2212,7 +2269,7 @@
|
|
2212
2269
|
producer:
|
2213
2270
|
name: Picsearch
|
2214
2271
|
url: http://www.picsearch.com
|
2215
|
-
-
|
2272
|
+
-
|
2216
2273
|
user_agent: psbot/0.1 (+http://www.picsearch.com/bot.html)
|
2217
2274
|
bot:
|
2218
2275
|
name: Picsearch bot
|
@@ -2221,7 +2278,7 @@
|
|
2221
2278
|
producer:
|
2222
2279
|
name: Picsearch
|
2223
2280
|
url: http://www.picsearch.com
|
2224
|
-
-
|
2281
|
+
-
|
2225
2282
|
user_agent: Pingdom.com_bot_version_1.4_(http://www.pingdom.com/)
|
2226
2283
|
bot:
|
2227
2284
|
name: Pingdom Bot
|
@@ -2230,25 +2287,34 @@
|
|
2230
2287
|
producer:
|
2231
2288
|
name: Pingdom AB
|
2232
2289
|
url: https://www.pingdom.com
|
2233
|
-
-
|
2290
|
+
-
|
2234
2291
|
user_agent: Mozilla/5.0 (compatible; Pinterestbot/1.0; http://www.pinterest.com/bot.html)
|
2235
2292
|
bot:
|
2236
2293
|
name: Pinterest
|
2237
|
-
url:
|
2294
|
+
url: https://help.pinterest.com/en/business/article/pinterest-crawler
|
2238
2295
|
category: Crawler
|
2239
2296
|
producer:
|
2240
2297
|
name: Pinterest
|
2241
|
-
url:
|
2242
|
-
-
|
2298
|
+
url: https://www.pinterest.com/
|
2299
|
+
-
|
2243
2300
|
user_agent: Pinterest/0.2 (+http://www.pinterest.com/)
|
2244
2301
|
bot:
|
2245
2302
|
name: Pinterest
|
2246
|
-
url:
|
2303
|
+
url: https://help.pinterest.com/en/business/article/pinterest-crawler
|
2304
|
+
category: Crawler
|
2305
|
+
producer:
|
2306
|
+
name: Pinterest
|
2307
|
+
url: https://www.pinterest.com/
|
2308
|
+
-
|
2309
|
+
user_agent: Mozilla/5.0 (Linux; Android 6.0.1; Nexus 5X Build/MMB29P) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/41.0.2272.96 Mobile Safari/537.36 (compatible; Pinterestbot/1.0; https://www.pinterest.com/bot.html)
|
2310
|
+
bot:
|
2311
|
+
name: Pinterest
|
2312
|
+
url: https://help.pinterest.com/en/business/article/pinterest-crawler
|
2247
2313
|
category: Crawler
|
2248
2314
|
producer:
|
2249
2315
|
name: Pinterest
|
2250
|
-
url:
|
2251
|
-
-
|
2316
|
+
url: https://www.pinterest.com/
|
2317
|
+
-
|
2252
2318
|
user_agent: PocketParser/2.0 (+https://getpocket.com/pocketparser_ua)
|
2253
2319
|
bot:
|
2254
2320
|
name: PocketParser
|
@@ -2257,7 +2323,7 @@
|
|
2257
2323
|
producer:
|
2258
2324
|
name: Pocket
|
2259
2325
|
url: https://getpocket.com/
|
2260
|
-
-
|
2326
|
+
-
|
2261
2327
|
user_agent: PritTorrent/1.0
|
2262
2328
|
bot:
|
2263
2329
|
name: PritTorrent
|
@@ -2266,7 +2332,7 @@
|
|
2266
2332
|
producer:
|
2267
2333
|
name: Bitlove
|
2268
2334
|
url: http://bitlove.org/
|
2269
|
-
-
|
2335
|
+
-
|
2270
2336
|
user_agent: QuerySeekerSpider ( http://queryseeker.com/bot.html )
|
2271
2337
|
bot:
|
2272
2338
|
name: QuerySeekerSpider
|
@@ -2275,7 +2341,7 @@
|
|
2275
2341
|
producer:
|
2276
2342
|
name: QueryEye Inc.
|
2277
2343
|
url: http://queryeye.com
|
2278
|
-
-
|
2344
|
+
-
|
2279
2345
|
user_agent: Quora Link Preview/1.0 (http://www.quora.com)
|
2280
2346
|
bot:
|
2281
2347
|
name: Quora Link Preview
|
@@ -2284,7 +2350,7 @@
|
|
2284
2350
|
producer:
|
2285
2351
|
name: Quora
|
2286
2352
|
url: http://www.quora.com
|
2287
|
-
-
|
2353
|
+
-
|
2288
2354
|
user_agent: 'Mozilla/5.0 (compatible; Qwantify/2.2w; +https://www.qwant.com/)/*'
|
2289
2355
|
bot:
|
2290
2356
|
name: Qwantify
|
@@ -2293,7 +2359,7 @@
|
|
2293
2359
|
producer:
|
2294
2360
|
name: Qwant Corporation
|
2295
2361
|
url: https://www.qwant.com/
|
2296
|
-
-
|
2362
|
+
-
|
2297
2363
|
user_agent: ROI Hunter; https://api-dev.roihunter.com
|
2298
2364
|
bot:
|
2299
2365
|
name: ROI Hunter
|
@@ -2302,17 +2368,17 @@
|
|
2302
2368
|
producer:
|
2303
2369
|
name: Roihunter a.s.
|
2304
2370
|
url: http://roihunter.com/
|
2305
|
-
-
|
2371
|
+
-
|
2306
2372
|
user_agent: RSSRadio (Push Notification Scanner;support@dorada.co.uk)
|
2307
2373
|
bot:
|
2308
2374
|
name: RSSRadio Bot
|
2309
|
-
-
|
2375
|
+
-
|
2310
2376
|
user_agent: Rainmeter WebParser plugin
|
2311
2377
|
bot:
|
2312
2378
|
name: Rainmeter
|
2313
2379
|
category: Crawler
|
2314
2380
|
url: https://www.rainmeter.net
|
2315
|
-
-
|
2381
|
+
-
|
2316
2382
|
user_agent: RamblerMail/6.0 (incompatible; ImageProxy/6.0)
|
2317
2383
|
bot:
|
2318
2384
|
name: RamblerMail Image Proxy
|
@@ -2321,7 +2387,7 @@
|
|
2321
2387
|
producer:
|
2322
2388
|
name: 'Rambler&Co'
|
2323
2389
|
url: https://rambler-co.ru/
|
2324
|
-
-
|
2390
|
+
-
|
2325
2391
|
user_agent: Mozilla/5.0 (compatible; redditbot/1.0; +http://www.reddit.com/feedback)
|
2326
2392
|
bot:
|
2327
2393
|
name: Reddit Bot
|
@@ -2330,7 +2396,12 @@
|
|
2330
2396
|
producer:
|
2331
2397
|
name: reddit inc.
|
2332
2398
|
url: http://www.reddit.com
|
2333
|
-
-
|
2399
|
+
-
|
2400
|
+
user_agent: Robozilla/1.0
|
2401
|
+
bot:
|
2402
|
+
name: Robozilla
|
2403
|
+
category: Crawler
|
2404
|
+
-
|
2334
2405
|
user_agent: Mozilla/5.0 (compatible; rogerBot/1.0; UrlCrawler; http://www.seomoz.org/dp/rogerbot)
|
2335
2406
|
bot:
|
2336
2407
|
name: Rogerbot
|
@@ -2339,7 +2410,7 @@
|
|
2339
2410
|
producer:
|
2340
2411
|
name: SEOmoz, Inc.
|
2341
2412
|
url: http://moz.com/
|
2342
|
-
-
|
2413
|
+
-
|
2343
2414
|
user_agent: rogerbot/1.0 (http://moz.com/help/pro/what-is-rogerbot-, rogerbot-crawler+shiny@moz.com)
|
2344
2415
|
bot:
|
2345
2416
|
name: Rogerbot
|
@@ -2348,7 +2419,7 @@
|
|
2348
2419
|
producer:
|
2349
2420
|
name: SEOmoz, Inc.
|
2350
2421
|
url: http://moz.com/
|
2351
|
-
-
|
2422
|
+
-
|
2352
2423
|
user_agent: rogerbot/1.0 (http://www.moz.com/dp/rogerbot, rogerbot-crawler@moz.com)
|
2353
2424
|
bot:
|
2354
2425
|
name: Rogerbot
|
@@ -2357,7 +2428,7 @@
|
|
2357
2428
|
producer:
|
2358
2429
|
name: SEOmoz, Inc.
|
2359
2430
|
url: http://moz.com/
|
2360
|
-
-
|
2431
|
+
-
|
2361
2432
|
user_agent: SEOENGWorldBot/1.0 (+http://www.seoengine.com/seoengbot.htm)
|
2362
2433
|
bot:
|
2363
2434
|
name: SEOENGBot
|
@@ -2366,7 +2437,7 @@
|
|
2366
2437
|
producer:
|
2367
2438
|
name: SEO Engine
|
2368
2439
|
url: http://www.seoengine.com
|
2369
|
-
-
|
2440
|
+
-
|
2370
2441
|
user_agent: Mozilla/5.0 (compatible; SEOkicks-Robot; +http://www.seokicks.de/robot.html)
|
2371
2442
|
bot:
|
2372
2443
|
name: SEOkicks-Robot
|
@@ -2375,7 +2446,7 @@
|
|
2375
2446
|
producer:
|
2376
2447
|
name: SEOkicks
|
2377
2448
|
url: https://www.seokicks.de/
|
2378
|
-
-
|
2449
|
+
-
|
2379
2450
|
user_agent: Mozilla/5.0 (compatible; SISTRIX Crawler; http://crawler.sistrix.net/)
|
2380
2451
|
bot:
|
2381
2452
|
name: SISTRIX Crawler
|
@@ -2402,7 +2473,7 @@
|
|
2402
2473
|
producer:
|
2403
2474
|
name: SISTRIX GmbH
|
2404
2475
|
url: http://www.sistrix.de
|
2405
|
-
-
|
2476
|
+
-
|
2406
2477
|
user_agent: Mozilla/5.0 (compatible; SISTRIX Optimizer; Uptime; +https://www.sistrix.com/faq/uptime)
|
2407
2478
|
bot:
|
2408
2479
|
name: SISTRIX Optimizer
|
@@ -2411,7 +2482,7 @@
|
|
2411
2482
|
producer:
|
2412
2483
|
name: SISTRIX GmbH
|
2413
2484
|
url: http://www.sistrix.de
|
2414
|
-
-
|
2485
|
+
-
|
2415
2486
|
user_agent: Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/68.0.3440.75 Safari/537.36 (compatible; SMTBot/1.0; +http://www.similartech.com/smtbot)
|
2416
2487
|
bot:
|
2417
2488
|
name: SMTBot
|
@@ -2420,7 +2491,7 @@
|
|
2420
2491
|
producer:
|
2421
2492
|
name: SimilarTech Ltd.
|
2422
2493
|
url: https://www.similartech.com/
|
2423
|
-
-
|
2494
|
+
-
|
2424
2495
|
user_agent: SSL Labs (https://www.ssllabs.com/about/assessment.html)
|
2425
2496
|
bot:
|
2426
2497
|
name: SSL Labs
|
@@ -2429,7 +2500,7 @@
|
|
2429
2500
|
producer:
|
2430
2501
|
name: SSL Labs
|
2431
2502
|
url: https://www.ssllabs.com/about/assessment.html
|
2432
|
-
-
|
2503
|
+
-
|
2433
2504
|
user_agent: SafeDNSBot (https://www.safedns.com/searchbot)
|
2434
2505
|
bot:
|
2435
2506
|
name: SafeDNSBot
|
@@ -2438,13 +2509,13 @@
|
|
2438
2509
|
producer:
|
2439
2510
|
name: SafeDNS, Inc.
|
2440
2511
|
url: https://www.safedns.com/
|
2441
|
-
-
|
2512
|
+
-
|
2442
2513
|
user_agent: Scrapy/1.0.3.post6+g2d688cd (+http://scrapy.org)
|
2443
2514
|
bot:
|
2444
2515
|
name: Scrapy
|
2445
2516
|
category: Crawler
|
2446
2517
|
url: http://scrapy.org
|
2447
|
-
-
|
2518
|
+
-
|
2448
2519
|
user_agent: Screaming Frog SEO Spider/2.22
|
2449
2520
|
bot:
|
2450
2521
|
name: Screaming Frog SEO Spider
|
@@ -2453,7 +2524,7 @@
|
|
2453
2524
|
producer:
|
2454
2525
|
name: Screaming Frog Ltd
|
2455
2526
|
url: http://www.screamingfrog.co.uk
|
2456
|
-
-
|
2527
|
+
-
|
2457
2528
|
user_agent: ScreenerBot Crawler Beta 2.0 (+http://www.ScreenerBot.com)
|
2458
2529
|
bot:
|
2459
2530
|
name: ScreenerBot
|
@@ -2462,7 +2533,13 @@
|
|
2462
2533
|
producer:
|
2463
2534
|
name: ""
|
2464
2535
|
url: ""
|
2465
|
-
-
|
2536
|
+
-
|
2537
|
+
user_agent: Mozilla/5.0 (compatible) SemanticScholarBot (+https://www.semanticscholar.org/crawler)
|
2538
|
+
bot:
|
2539
|
+
name: Semantic Scholar Bot
|
2540
|
+
category: Crawler
|
2541
|
+
url: https://www.semanticscholar.org/crawler
|
2542
|
+
-
|
2466
2543
|
user_agent: Mozilla/5.0 (compatible; SemrushBot/0.97; +http://www.semrush.com/bot.html)
|
2467
2544
|
bot:
|
2468
2545
|
name: Semrush Bot
|
@@ -2471,7 +2548,7 @@
|
|
2471
2548
|
producer:
|
2472
2549
|
name: SEMrush
|
2473
2550
|
url: http://www.semrush.com
|
2474
|
-
-
|
2551
|
+
-
|
2475
2552
|
user_agent: SensikaBot/x.33 (+http://sensika.com)
|
2476
2553
|
bot:
|
2477
2554
|
name: Sensika Bot
|
@@ -2480,24 +2557,36 @@
|
|
2480
2557
|
producer:
|
2481
2558
|
name: Sensika
|
2482
2559
|
url: http://sensika.com
|
2483
|
-
-
|
2560
|
+
-
|
2484
2561
|
user_agent: sentry/8.6.0 (https://getsentry.com)
|
2485
2562
|
bot:
|
2486
2563
|
name: Sentry Bot
|
2487
2564
|
producer:
|
2488
2565
|
name: Sentry
|
2489
2566
|
url: https://sentry.io
|
2490
|
-
-
|
2567
|
+
-
|
2568
|
+
user_agent: Seobility
|
2569
|
+
bot:
|
2570
|
+
name: Seobility
|
2571
|
+
category: Crawler
|
2572
|
+
url: 'https://www.seobility.net/en/faq/?category=crawling#!aboutourbot'
|
2573
|
+
-
|
2491
2574
|
user_agent: Mozilla/5.0 (compatible; seoscanners.net/1; +spider@seoscanners.net)
|
2492
2575
|
bot:
|
2493
2576
|
name: Seoscanners.net
|
2494
2577
|
category: Crawler
|
2495
2578
|
url: ""
|
2496
|
-
-
|
2579
|
+
-
|
2580
|
+
user_agent: SerendeputyBot/0.8.6 (http://serendeputy.com/about/serendeputy-bot)
|
2581
|
+
bot:
|
2582
|
+
name: Serendeputy Bot
|
2583
|
+
category: Crawler
|
2584
|
+
url: https://serendeputy.com/about/serendeputy-bot
|
2585
|
+
-
|
2497
2586
|
user_agent: Server Density Service Monitoring v2
|
2498
2587
|
bot:
|
2499
2588
|
name: Server Density
|
2500
|
-
-
|
2589
|
+
-
|
2501
2590
|
user_agent: Mozilla/5.0 (compatible; SeznamBot/3.1-test1; +http://fulltext.sblog.cz/)
|
2502
2591
|
bot:
|
2503
2592
|
name: Seznam Bot
|
@@ -2506,7 +2595,7 @@
|
|
2506
2595
|
producer:
|
2507
2596
|
name: Seznam.cz, a.s.
|
2508
2597
|
url: http://www.seznam.cz/
|
2509
|
-
-
|
2598
|
+
-
|
2510
2599
|
user_agent: Mozilla/5.0 (compatible; SeznamBot/3.2-test1; +http://fulltext.sblog.cz/)
|
2511
2600
|
bot:
|
2512
2601
|
name: Seznam Bot
|
@@ -2515,7 +2604,7 @@
|
|
2515
2604
|
producer:
|
2516
2605
|
name: Seznam.cz, a.s.
|
2517
2606
|
url: http://www.seznam.cz/
|
2518
|
-
-
|
2607
|
+
-
|
2519
2608
|
user_agent: Mozilla/5.0 (compatible; SeznamBot/3.2; +http://fulltext.sblog.cz/)
|
2520
2609
|
bot:
|
2521
2610
|
name: Seznam Bot
|
@@ -2524,7 +2613,7 @@
|
|
2524
2613
|
producer:
|
2525
2614
|
name: Seznam.cz, a.s.
|
2526
2615
|
url: http://www.seznam.cz/
|
2527
|
-
-
|
2616
|
+
-
|
2528
2617
|
user_agent: SeznamBot/3.0 (+http://fulltext.sblog.cz/)
|
2529
2618
|
bot:
|
2530
2619
|
name: Seznam Bot
|
@@ -2533,7 +2622,7 @@
|
|
2533
2622
|
producer:
|
2534
2623
|
name: Seznam.cz, a.s.
|
2535
2624
|
url: http://www.seznam.cz/
|
2536
|
-
-
|
2625
|
+
-
|
2537
2626
|
user_agent: Mozilla/5.0 SeznamEmailProxy/2.0.174
|
2538
2627
|
bot:
|
2539
2628
|
name: Seznam Email Proxy
|
@@ -2542,7 +2631,7 @@
|
|
2542
2631
|
producer:
|
2543
2632
|
name: Seznam.cz, a.s.
|
2544
2633
|
url: http://www.seznam.cz/
|
2545
|
-
-
|
2634
|
+
-
|
2546
2635
|
user_agent: Seznam-Zbozi-robot/3.0
|
2547
2636
|
bot:
|
2548
2637
|
name: Seznam Zbozi.cz
|
@@ -2551,7 +2640,7 @@
|
|
2551
2640
|
producer:
|
2552
2641
|
name: Seznam.cz, a.s.
|
2553
2642
|
url: https://www.zbozi.cz/
|
2554
|
-
-
|
2643
|
+
-
|
2555
2644
|
user_agent: Mozilla/5.0 (ShopAlike; LadenZeile) FeedBot
|
2556
2645
|
bot:
|
2557
2646
|
name: ShopAlike
|
@@ -2560,7 +2649,7 @@
|
|
2560
2649
|
producer:
|
2561
2650
|
name: Visual Meta
|
2562
2651
|
url: https://www.shopalike.cz/
|
2563
|
-
-
|
2652
|
+
-
|
2564
2653
|
user_agent: ShopWiki/1.0 ( +http://www.shopwiki.com/wiki/Help:Bot)
|
2565
2654
|
bot:
|
2566
2655
|
name: ShopWiki
|
@@ -2569,7 +2658,7 @@
|
|
2569
2658
|
producer:
|
2570
2659
|
name: ShopWiki Corp.
|
2571
2660
|
url: http://www.shopwiki.com
|
2572
|
-
-
|
2661
|
+
-
|
2573
2662
|
user_agent: shopify-partner-homepage-scraper
|
2574
2663
|
bot:
|
2575
2664
|
name: Shopify Partner
|
@@ -2578,7 +2667,7 @@
|
|
2578
2667
|
producer:
|
2579
2668
|
name: Shopify
|
2580
2669
|
url: https://www.shopify.com/
|
2581
|
-
-
|
2670
|
+
-
|
2582
2671
|
user_agent: SilverReader/1.0; http://silverreader.com
|
2583
2672
|
bot:
|
2584
2673
|
name: SilverReader
|
@@ -2587,7 +2676,7 @@
|
|
2587
2676
|
producer:
|
2588
2677
|
name: ""
|
2589
2678
|
url: ""
|
2590
|
-
-
|
2679
|
+
-
|
2591
2680
|
user_agent: SimplePie/1.2.1-dev (Feed Parser; http://simplepie.org; Allow like Gecko) Build/20130514092120
|
2592
2681
|
bot:
|
2593
2682
|
name: SimplePie
|
@@ -2596,7 +2685,7 @@
|
|
2596
2685
|
producer:
|
2597
2686
|
name: ""
|
2598
2687
|
url: ""
|
2599
|
-
-
|
2688
|
+
-
|
2600
2689
|
user_agent: SimplePie/1.3.1 (Feed Parser; http://simplepie.org; Allow like Gecko) Build/20121030175911
|
2601
2690
|
bot:
|
2602
2691
|
name: SimplePie
|
@@ -2605,7 +2694,7 @@
|
|
2605
2694
|
producer:
|
2606
2695
|
name: ""
|
2607
2696
|
url: ""
|
2608
|
-
-
|
2697
|
+
-
|
2609
2698
|
user_agent: Site24x7
|
2610
2699
|
bot:
|
2611
2700
|
name: Site24x7 Website Monitoring
|
@@ -2614,13 +2703,13 @@
|
|
2614
2703
|
producer:
|
2615
2704
|
name: Site24x7
|
2616
2705
|
url: https://www.site24x7.com
|
2617
|
-
-
|
2706
|
+
-
|
2618
2707
|
user_agent: SiteSucker for macOS/2.10.5
|
2619
2708
|
bot:
|
2620
2709
|
name: SiteSucker
|
2621
2710
|
category: Crawler
|
2622
2711
|
url: http://ricks-apps.com/osx/sitesucker/
|
2623
|
-
-
|
2712
|
+
-
|
2624
2713
|
user_agent: Mozilla/4.0 (compatible; MSIE 7.0; Windows NT 5.0) Match by Siteimprove.com
|
2625
2714
|
bot:
|
2626
2715
|
name: Siteimprove
|
@@ -2629,7 +2718,7 @@
|
|
2629
2718
|
producer:
|
2630
2719
|
name: Siteimprove GmbH
|
2631
2720
|
url: https://siteimprove.com/
|
2632
|
-
-
|
2721
|
+
-
|
2633
2722
|
user_agent: Mozilla/5.0 (compatible; MSIE 10.0; Windows NT 6.1; Trident/6.0) LinkCheck by Siteimprove.com
|
2634
2723
|
bot:
|
2635
2724
|
name: Siteimprove
|
@@ -2638,7 +2727,7 @@
|
|
2638
2727
|
producer:
|
2639
2728
|
name: Siteimprove GmbH
|
2640
2729
|
url: https://siteimprove.com/
|
2641
|
-
-
|
2730
|
+
-
|
2642
2731
|
user_agent: sixy.ch/1.0
|
2643
2732
|
bot:
|
2644
2733
|
name: Sixy.ch
|
@@ -2647,7 +2736,7 @@
|
|
2647
2736
|
producer:
|
2648
2737
|
name: Manuel Kasper
|
2649
2738
|
url: https://neon1.net/
|
2650
|
-
-
|
2739
|
+
-
|
2651
2740
|
user_agent: Mozilla/5.0 (Windows NT 6.1; WOW64) SkypeUriPreview Preview/0.5
|
2652
2741
|
bot:
|
2653
2742
|
name: Skype URI Preview
|
@@ -2656,7 +2745,7 @@
|
|
2656
2745
|
producer:
|
2657
2746
|
name: Skype Communications S.à.r.l.
|
2658
2747
|
url: https://www.skype.com
|
2659
|
-
-
|
2748
|
+
-
|
2660
2749
|
user_agent: Slackbot-LinkExpanding 1.0 (+https://api.slack.com/robots)
|
2661
2750
|
bot:
|
2662
2751
|
name: Slackbot
|
@@ -2665,7 +2754,7 @@
|
|
2665
2754
|
producer:
|
2666
2755
|
name: Slack Technologies
|
2667
2756
|
url: http://slack.com
|
2668
|
-
-
|
2757
|
+
-
|
2669
2758
|
user_agent: 'AppEngine-Google; (+http://code.google.com/appengine; appid: s~snapchat-proxy)'
|
2670
2759
|
bot:
|
2671
2760
|
name: Snapchat Proxy
|
@@ -2674,7 +2763,7 @@
|
|
2674
2763
|
producer:
|
2675
2764
|
name: Snapchat Inc.
|
2676
2765
|
url: https://www.snapchat.com
|
2677
|
-
-
|
2766
|
+
-
|
2678
2767
|
user_agent: New-Sogou-Spider/1.0 (compatible; MSIE 5.5; Windows 98)
|
2679
2768
|
bot:
|
2680
2769
|
name: Sogou Spider
|
@@ -2683,7 +2772,7 @@
|
|
2683
2772
|
producer:
|
2684
2773
|
name: Sohu, Inc.
|
2685
2774
|
url: http://www.sogou.com
|
2686
|
-
-
|
2775
|
+
-
|
2687
2776
|
user_agent: Sogou inst spider/4.0(+http://www.sogou.com/docs/help/webmasters.htm
|
2688
2777
|
bot:
|
2689
2778
|
name: Sogou Spider
|
@@ -2692,7 +2781,7 @@
|
|
2692
2781
|
producer:
|
2693
2782
|
name: Sohu, Inc.
|
2694
2783
|
url: http://www.sogou.com
|
2695
|
-
-
|
2784
|
+
-
|
2696
2785
|
user_agent: Sogou Pic Spider/3.0(+http://www.sogou.com/docs/help/webmasters.htm
|
2697
2786
|
bot:
|
2698
2787
|
name: Sogou Spider
|
@@ -2701,7 +2790,7 @@
|
|
2701
2790
|
producer:
|
2702
2791
|
name: Sohu, Inc.
|
2703
2792
|
url: http://www.sogou.com
|
2704
|
-
-
|
2793
|
+
-
|
2705
2794
|
user_agent: Sogou web spider/4.0(+http://www.sogou.com/docs/help/webmasters.htm
|
2706
2795
|
bot:
|
2707
2796
|
name: Sogou Spider
|
@@ -2710,7 +2799,7 @@
|
|
2710
2799
|
producer:
|
2711
2800
|
name: Sohu, Inc.
|
2712
2801
|
url: http://www.sogou.com
|
2713
|
-
-
|
2802
|
+
-
|
2714
2803
|
user_agent: Sosospider+(+http://help.soso.com/webspider.htm)
|
2715
2804
|
bot:
|
2716
2805
|
name: Soso Spider
|
@@ -2719,13 +2808,13 @@
|
|
2719
2808
|
producer:
|
2720
2809
|
name: Tencent Holdings
|
2721
2810
|
url: http://www.soso.com
|
2722
|
-
-
|
2811
|
+
-
|
2723
2812
|
user_agent: Mozilla/5.0 (Macintosh; Intel Mac OS X 10_11_6) AppleWebKit/537.36 (KHTML, like Gecko) Sparkler/0.2.0-SNAPSHOT
|
2724
2813
|
bot:
|
2725
2814
|
name: Sparkler
|
2726
2815
|
category: Crawler
|
2727
2816
|
url: https://github.com/USCDataScience/sparkler
|
2728
|
-
-
|
2817
|
+
-
|
2729
2818
|
user_agent: Mozilla/5.0 (X11; U; Linux x86_64; en-US; rv:1.9.0.19; aggregator:Spinn3r (Spinn3r 3.1); http://spinn3r.com/robot) Gecko/2010040121 Firefox/3.0.19
|
2730
2819
|
bot:
|
2731
2820
|
name: Spinn3r
|
@@ -2734,32 +2823,26 @@
|
|
2734
2823
|
producer:
|
2735
2824
|
name: Tailrank Inc
|
2736
2825
|
url: http://spinn3r.com
|
2737
|
-
-
|
2826
|
+
-
|
2738
2827
|
user_agent: Spotify/1.0
|
2739
2828
|
bot:
|
2740
2829
|
name: Spotify
|
2741
2830
|
producer:
|
2742
2831
|
name: Spotify
|
2743
2832
|
url: https://www.spotify.com
|
2744
|
-
-
|
2833
|
+
-
|
2745
2834
|
user_agent: Mozilla/5.0 (compatible; SputnikBot/2.2)
|
2746
2835
|
bot:
|
2747
2836
|
name: Sputnik Bot
|
2748
|
-
category: ""
|
2837
|
+
category: "Crawler"
|
2749
2838
|
url: ""
|
2750
|
-
|
2751
|
-
name: ""
|
2752
|
-
url: ""
|
2753
|
-
-
|
2839
|
+
-
|
2754
2840
|
user_agent: Mozilla/5.0 (compatible; SputnikImageBot/2.2)
|
2755
2841
|
bot:
|
2756
|
-
name: Sputnik Bot
|
2757
|
-
category: ""
|
2842
|
+
name: Sputnik Image Bot
|
2843
|
+
category: "Crawler"
|
2758
2844
|
url: ""
|
2759
|
-
|
2760
|
-
name: ""
|
2761
|
-
url: ""
|
2762
|
-
-
|
2845
|
+
-
|
2763
2846
|
user_agent: Mozilla/5.0 (Macintosh; Intel Mac OS X 10_8_5) AppleWebKit/536.30.1 (KHTML, like Gecko) (compatible; Startpagina-Linkchecker/1.0; +https://www.startpagina.nl/linkchecker)
|
2764
2847
|
bot:
|
2765
2848
|
name: Startpagina Linkchecker
|
@@ -2768,7 +2851,7 @@
|
|
2768
2851
|
producer:
|
2769
2852
|
name: Startpagina B.V.
|
2770
2853
|
url: https://www.startpagina.nl/
|
2771
|
-
-
|
2854
|
+
-
|
2772
2855
|
user_agent: Mozilla/5.0 (Windows NT 6.2; WOW64) AppleWebKit/537.4 (KHTML, like Gecko) Chrome/98 Safari/537.4 (StatusCake)
|
2773
2856
|
bot:
|
2774
2857
|
name: StatusCake
|
@@ -2777,7 +2860,7 @@
|
|
2777
2860
|
producer:
|
2778
2861
|
name: StatusCake
|
2779
2862
|
url: https://www.statuscake.com
|
2780
|
-
-
|
2863
|
+
-
|
2781
2864
|
user_agent: 'Superfeedr bot/2.0 http://superfeedr.com - Make your feeds realtime: get in touch!'
|
2782
2865
|
bot:
|
2783
2866
|
name: Superfeedr Bot
|
@@ -2786,7 +2869,7 @@
|
|
2786
2869
|
producer:
|
2787
2870
|
name: Superfeedr
|
2788
2871
|
url: https://superfeedr.com/
|
2789
|
-
-
|
2872
|
+
-
|
2790
2873
|
user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1; en; rv:1.9.0.13) Gecko/2009073022 Firefox/3.5.2 (.NET CLR 3.5.30729) SurveyBot/2.3 (DomainTools)
|
2791
2874
|
bot:
|
2792
2875
|
name: Survey Bot
|
@@ -2795,7 +2878,7 @@
|
|
2795
2878
|
producer:
|
2796
2879
|
name: Domain Tools
|
2797
2880
|
url: http://www.domaintools.com
|
2798
|
-
-
|
2881
|
+
-
|
2799
2882
|
user_agent: TLSProbe/1.0 (+https://scan.trustnet.venafi.com/)
|
2800
2883
|
bot:
|
2801
2884
|
name: TLSProbe
|
@@ -2804,23 +2887,23 @@
|
|
2804
2887
|
producer:
|
2805
2888
|
name: Venafi TrustNet
|
2806
2889
|
url: https://www.venafi.com
|
2807
|
-
-
|
2890
|
+
-
|
2808
2891
|
user_agent: Tarmot Gezgin/1.0 (compatible; TarmotGezgin/1.1; +http://www.tarmot.com/gezgin)
|
2809
2892
|
bot:
|
2810
2893
|
name: Tarmot Gezgin
|
2811
2894
|
url: http://www.tarmot.com/gezgin/
|
2812
2895
|
category: Search bot
|
2813
|
-
-
|
2896
|
+
-
|
2814
2897
|
user_agent: TelegramBot (like TwitterBot)
|
2815
2898
|
bot:
|
2816
2899
|
name: TelegramBot
|
2817
2900
|
url: https://telegram.org/blog/bot-revolution
|
2818
|
-
-
|
2901
|
+
-
|
2819
2902
|
user_agent: The Knowledge AI
|
2820
2903
|
bot:
|
2821
2904
|
name: The Knowledge AI
|
2822
2905
|
category: Crawler
|
2823
|
-
-
|
2906
|
+
-
|
2824
2907
|
user_agent: TinEye-bot/0.02 (see http://www.tineye.com/crawler.html)
|
2825
2908
|
bot:
|
2826
2909
|
name: TinEye Crawler
|
@@ -2829,7 +2912,7 @@
|
|
2829
2912
|
producer:
|
2830
2913
|
name: Idée Inc.
|
2831
2914
|
url: http://ideeinc.com
|
2832
|
-
-
|
2915
|
+
-
|
2833
2916
|
user_agent: Tiny Tiny RSS/1.10 (http://tt-rss.org/)
|
2834
2917
|
bot:
|
2835
2918
|
name: Tiny Tiny RSS
|
@@ -2838,7 +2921,7 @@
|
|
2838
2921
|
producer:
|
2839
2922
|
name: ""
|
2840
2923
|
url: ""
|
2841
|
-
-
|
2924
|
+
-
|
2842
2925
|
user_agent: Tiny Tiny RSS/1.11.4c63934 (http://tt-rss.org/)
|
2843
2926
|
bot:
|
2844
2927
|
name: Tiny Tiny RSS
|
@@ -2847,7 +2930,7 @@
|
|
2847
2930
|
producer:
|
2848
2931
|
name: ""
|
2849
2932
|
url: ""
|
2850
|
-
-
|
2933
|
+
-
|
2851
2934
|
user_agent: Mozilla/5.0 (compatible; tracemyfile/1.0)
|
2852
2935
|
bot:
|
2853
2936
|
name: TraceMyFile
|
@@ -2856,7 +2939,7 @@
|
|
2856
2939
|
producer:
|
2857
2940
|
name: Idee Inc.
|
2858
2941
|
url: http://ideeinc.com/
|
2859
|
-
-
|
2942
|
+
-
|
2860
2943
|
user_agent: Mozilla/5.0 (Windows; U; Windows NT 6.0; en-GB; rv:1.0; trendictionbot0.5.0; trendiction search; http://www.trendiction.de/bot; please let us know of any problems; web at trendiction.com) Gecko/20071127 Firefox/3.0.0.11
|
2861
2944
|
bot:
|
2862
2945
|
name: Trendiction Bot
|
@@ -2865,7 +2948,7 @@
|
|
2865
2948
|
producer:
|
2866
2949
|
name: Talkwalker Inc.
|
2867
2950
|
url: http://www.talkwalker.com
|
2868
|
-
-
|
2951
|
+
-
|
2869
2952
|
user_agent: TurnitinBot/3.0 (http://www.turnitin.com/robot/crawlerinfo.html)
|
2870
2953
|
bot:
|
2871
2954
|
name: TurnitinBot
|
@@ -2874,7 +2957,7 @@
|
|
2874
2957
|
producer:
|
2875
2958
|
name: iParadigms, LLC.
|
2876
2959
|
url: http://www.turnitin.com
|
2877
|
-
-
|
2960
|
+
-
|
2878
2961
|
user_agent: Mozilla/5.0 (compatible; TweetedTimes Bot/1.0; +http://tweetedtimes.com)
|
2879
2962
|
bot:
|
2880
2963
|
name: TweetedTimes Bot
|
@@ -2883,7 +2966,7 @@
|
|
2883
2966
|
producer:
|
2884
2967
|
name: TweetedTimes
|
2885
2968
|
url: http://tweetedtimes.com/
|
2886
|
-
-
|
2969
|
+
-
|
2887
2970
|
user_agent: TweetedTimes Bot/1.0 (Mozilla/5.0 Compatible, +http://tweetedtimes.com)
|
2888
2971
|
bot:
|
2889
2972
|
name: TweetedTimes Bot
|
@@ -2892,7 +2975,7 @@
|
|
2892
2975
|
producer:
|
2893
2976
|
name: TweetedTimes
|
2894
2977
|
url: http://tweetedtimes.com/
|
2895
|
-
-
|
2978
|
+
-
|
2896
2979
|
user_agent: Mozilla/5.0 (compatible; TweetmemeBot/3.0; +http://tweetmeme.com/)
|
2897
2980
|
bot:
|
2898
2981
|
name: Tweetmeme Bot
|
@@ -2901,7 +2984,7 @@
|
|
2901
2984
|
producer:
|
2902
2985
|
name: Mediasift
|
2903
2986
|
url: ""
|
2904
|
-
-
|
2987
|
+
-
|
2905
2988
|
user_agent: Mozilla/5.0 (compatible; Twingly Recon; twingly.com)
|
2906
2989
|
bot:
|
2907
2990
|
name: Twingly Recon
|
@@ -2909,7 +2992,7 @@
|
|
2909
2992
|
producer:
|
2910
2993
|
name: Twingly
|
2911
2994
|
url: https://www.twingly.com
|
2912
|
-
-
|
2995
|
+
-
|
2913
2996
|
user_agent: Twitterbot/1.0
|
2914
2997
|
bot:
|
2915
2998
|
name: Twitterbot
|
@@ -2918,7 +3001,7 @@
|
|
2918
3001
|
producer:
|
2919
3002
|
name: Twitter
|
2920
3003
|
url: http://www.twitter.com
|
2921
|
-
-
|
3004
|
+
-
|
2922
3005
|
user_agent: Mozilla/5.0 (compatible; URLAppendBot/1.0; +http://www.profound.net/urlappendbot.html)
|
2923
3006
|
bot:
|
2924
3007
|
name: URLAppendBot
|
@@ -2927,7 +3010,7 @@
|
|
2927
3010
|
producer:
|
2928
3011
|
name: Profound Networks
|
2929
3012
|
url: http://www.profound.net
|
2930
|
-
-
|
3013
|
+
-
|
2931
3014
|
user_agent: 'Mozilla/5.0 (Windows NT 10.0) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/55.0.2883.87 Safari/537.36 (via secureurl.fwdcdn.com - mail.ukr.net proxy)'
|
2932
3015
|
bot:
|
2933
3016
|
name: UkrNet Mail Proxy
|
@@ -2936,7 +3019,7 @@
|
|
2936
3019
|
producer:
|
2937
3020
|
name: UkrNet Ltd
|
2938
3021
|
url: https://www.ukr.net/
|
2939
|
-
-
|
3022
|
+
-
|
2940
3023
|
user_agent: UniversalFeedParser/5.2.1 +https://code.google.com/p/feedparser/
|
2941
3024
|
bot:
|
2942
3025
|
name: UniversalFeedParser
|
@@ -2945,7 +3028,7 @@
|
|
2945
3028
|
producer:
|
2946
3029
|
name: Kurt McKee
|
2947
3030
|
url: https://github.com/kurtmckee
|
2948
|
-
-
|
3031
|
+
-
|
2949
3032
|
user_agent: Mozilla/5.0+(compatible; UptimeRobot/2.0; http://www.uptimerobot.com/)
|
2950
3033
|
bot:
|
2951
3034
|
name: Uptime Robot
|
@@ -2954,7 +3037,7 @@
|
|
2954
3037
|
producer:
|
2955
3038
|
name: Uptime Robot
|
2956
3039
|
url: http://uptimerobot.com
|
2957
|
-
-
|
3040
|
+
-
|
2958
3041
|
user_agent: Mozilla/5.0 (compatible; Uptimebot/1.0; +http://www.uptime.com/uptimebot)
|
2959
3042
|
bot:
|
2960
3043
|
name: Uptimebot
|
@@ -2963,7 +3046,7 @@
|
|
2963
3046
|
producer:
|
2964
3047
|
name: Uptime
|
2965
3048
|
url: https://uptime.com
|
2966
|
-
-
|
3049
|
+
-
|
2967
3050
|
user_agent: Mozilla/5.0 (compatible; vkShare; +http://vk.com/dev/Share)
|
2968
3051
|
bot:
|
2969
3052
|
name: VK Share Button
|
@@ -2972,7 +3055,7 @@
|
|
2972
3055
|
producer:
|
2973
3056
|
name: VK
|
2974
3057
|
url: http://vk.com/
|
2975
|
-
-
|
3058
|
+
-
|
2976
3059
|
user_agent: 'Mozilla/4.0 (compatible; Vagabondo/4.0; http://webagent.wise-guys.nl/; http://www.wise-guys.nl/)'
|
2977
3060
|
bot:
|
2978
3061
|
name: Vagabondo
|
@@ -2981,7 +3064,19 @@
|
|
2981
3064
|
producer:
|
2982
3065
|
name: WiseGuys
|
2983
3066
|
url: http://www.wise-guys.nl/
|
2984
|
-
-
|
3067
|
+
-
|
3068
|
+
user_agent: Mozilla/5.0 (compatible; VelenPublicWebCrawler/1.0; +https://velen.io)
|
3069
|
+
bot:
|
3070
|
+
name: Velen Public Web Crawler
|
3071
|
+
category: Crawler
|
3072
|
+
url: https://hunter.io/robot
|
3073
|
+
-
|
3074
|
+
user_agent: Vercelbot (+https://vercel.com)
|
3075
|
+
bot:
|
3076
|
+
name: Vercel Bot
|
3077
|
+
category: Service bot
|
3078
|
+
url: https://vercel.com
|
3079
|
+
-
|
2985
3080
|
user_agent: Mozilla/5.0 (compatible; VSMCrawler; http://www.visualsitemapper.com/crawler/)
|
2986
3081
|
bot:
|
2987
3082
|
name: Visual Site Mapper Crawler
|
@@ -2990,7 +3085,7 @@
|
|
2990
3085
|
producer:
|
2991
3086
|
name: Alentum Software Ltd.
|
2992
3087
|
url: http://www.alentum.com
|
2993
|
-
-
|
3088
|
+
-
|
2994
3089
|
user_agent: 'Jigsaw/2.3.0 W3C_CSS_Validator_JFouffa/2.0 (See <http://validator.w3.org/services>)'
|
2995
3090
|
bot:
|
2996
3091
|
name: W3C CSS Validator
|
@@ -2999,7 +3094,7 @@
|
|
2999
3094
|
producer:
|
3000
3095
|
name: W3C
|
3001
3096
|
url: http://www.w3.org
|
3002
|
-
-
|
3097
|
+
-
|
3003
3098
|
user_agent: W3C_I18n-Checker/1.0 (http://validator.w3.org/services)
|
3004
3099
|
bot:
|
3005
3100
|
name: W3C I18N Checker
|
@@ -3008,7 +3103,7 @@
|
|
3008
3103
|
producer:
|
3009
3104
|
name: W3C
|
3010
3105
|
url: http://www.w3.org
|
3011
|
-
-
|
3106
|
+
-
|
3012
3107
|
user_agent: 'W3C-checklink/4.0 [4.4] libwww-perl/5.803'
|
3013
3108
|
bot:
|
3014
3109
|
name: W3C Link Checker
|
@@ -3017,7 +3112,7 @@
|
|
3017
3112
|
producer:
|
3018
3113
|
name: W3C
|
3019
3114
|
url: http://www.w3.org
|
3020
|
-
-
|
3115
|
+
-
|
3021
3116
|
user_agent: W3C-checklink/4.81 libwww-perl/5.836
|
3022
3117
|
bot:
|
3023
3118
|
name: W3C Link Checker
|
@@ -3026,7 +3121,7 @@
|
|
3026
3121
|
producer:
|
3027
3122
|
name: W3C
|
3028
3123
|
url: http://www.w3.org
|
3029
|
-
-
|
3124
|
+
-
|
3030
3125
|
user_agent: Validator.nu/LV http://validator.w3.org/services
|
3031
3126
|
bot:
|
3032
3127
|
name: W3C Markup Validation Service
|
@@ -3035,7 +3130,7 @@
|
|
3035
3130
|
producer:
|
3036
3131
|
name: W3C
|
3037
3132
|
url: http://www.w3.org
|
3038
|
-
-
|
3133
|
+
-
|
3039
3134
|
user_agent: W3C_Validator/1.3 http://validator.w3.org/services
|
3040
3135
|
bot:
|
3041
3136
|
name: W3C Markup Validation Service
|
@@ -3044,7 +3139,7 @@
|
|
3044
3139
|
producer:
|
3045
3140
|
name: W3C
|
3046
3141
|
url: http://www.w3.org
|
3047
|
-
-
|
3142
|
+
-
|
3048
3143
|
user_agent: W3C_Validator/1.767
|
3049
3144
|
bot:
|
3050
3145
|
name: W3C Markup Validation Service
|
@@ -3053,7 +3148,7 @@
|
|
3053
3148
|
producer:
|
3054
3149
|
name: W3C
|
3055
3150
|
url: http://www.w3.org
|
3056
|
-
-
|
3151
|
+
-
|
3057
3152
|
user_agent: W3C-mobileOK/DDC-1.0 (see http://www.w3.org/2006/07/mobileok-ddc)
|
3058
3153
|
bot:
|
3059
3154
|
name: W3C MobileOK Checker
|
@@ -3062,7 +3157,7 @@
|
|
3062
3157
|
producer:
|
3063
3158
|
name: W3C
|
3064
3159
|
url: http://www.w3.org
|
3065
|
-
-
|
3160
|
+
-
|
3066
3161
|
user_agent: W3C_Unicorn/1.0 (http://validator.w3.org/services)
|
3067
3162
|
bot:
|
3068
3163
|
name: W3C Unified Validator
|
@@ -3071,7 +3166,7 @@
|
|
3071
3166
|
producer:
|
3072
3167
|
name: W3C
|
3073
3168
|
url: http://www.w3.org
|
3074
|
-
-
|
3169
|
+
-
|
3075
3170
|
user_agent: Mozilla/5.0 (compatible; Wappalyzer; +https://github.com/AliasIO/Wappalyzer)
|
3076
3171
|
bot:
|
3077
3172
|
name: Wappalyzer
|
@@ -3079,7 +3174,7 @@
|
|
3079
3174
|
producer:
|
3080
3175
|
name: AliasIO
|
3081
3176
|
url: https://github.com/AliasIO
|
3082
|
-
-
|
3177
|
+
-
|
3083
3178
|
user_agent: WeSEE:Search/0.1 (Alpha, http://www.wesee.com/en/support/bot/)
|
3084
3179
|
bot:
|
3085
3180
|
name: WeSEE:Search
|
@@ -3088,13 +3183,13 @@
|
|
3088
3183
|
producer:
|
3089
3184
|
name: WeSEE Ltd
|
3090
3185
|
url: http://www.wesee.com
|
3091
|
-
-
|
3186
|
+
-
|
3092
3187
|
user_agent: Mozilla/5.0 (Linux; Android 6.0.1; Moto G (4) Build/MPJ24.139-64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/65.0.3325.146 Mobile Safari/537.36 PTST/180829.190838
|
3093
3188
|
bot:
|
3094
3189
|
name: WebPageTest
|
3095
3190
|
category: Site Monitor
|
3096
3191
|
url: https://www.webpagetest.org
|
3097
|
-
-
|
3192
|
+
-
|
3098
3193
|
user_agent: websitepulse checker/1.1 (compatible; MSIE 5.5; Netscape 4.75; Linux)
|
3099
3194
|
bot:
|
3100
3195
|
name: WebSitePulse
|
@@ -3103,7 +3198,7 @@
|
|
3103
3198
|
producer:
|
3104
3199
|
name: WebSitePulse
|
3105
3200
|
url: http://www.websitepulse.com/
|
3106
|
-
-
|
3201
|
+
-
|
3107
3202
|
user_agent: WebbCrawler 1.0 ( http://badcheese.com/crawler.html )
|
3108
3203
|
bot:
|
3109
3204
|
name: WebbCrawler
|
@@ -3112,7 +3207,7 @@
|
|
3112
3207
|
producer:
|
3113
3208
|
name: Steve Webb
|
3114
3209
|
url: http://badcheese.com
|
3115
|
-
-
|
3210
|
+
-
|
3116
3211
|
user_agent: weborama-fetcher (+http://www.weborama.com)
|
3117
3212
|
bot:
|
3118
3213
|
name: Weborama
|
@@ -3121,7 +3216,7 @@
|
|
3121
3216
|
producer:
|
3122
3217
|
name: Weborama SA
|
3123
3218
|
url: https://weborama.com/
|
3124
|
-
-
|
3219
|
+
-
|
3125
3220
|
user_agent: WikiDo/1.1 (http://wikido.com; crawler@wikido.com)
|
3126
3221
|
bot:
|
3127
3222
|
name: WikiDo
|
@@ -3130,7 +3225,7 @@
|
|
3130
3225
|
producer:
|
3131
3226
|
name: Fotolitografie Fiorentine di Becchi Antonio s.n.c.
|
3132
3227
|
url: https://www.wikido.com/
|
3133
|
-
-
|
3228
|
+
-
|
3134
3229
|
user_agent: Mozilla/5.0 (compatible; woorankreview/2.0; +https://www.woorank.com/)
|
3135
3230
|
bot:
|
3136
3231
|
name: WooRank
|
@@ -3139,7 +3234,7 @@
|
|
3139
3234
|
producer:
|
3140
3235
|
name: WooRank sprl
|
3141
3236
|
url: https://www.woorank.com/
|
3142
|
-
-
|
3237
|
+
-
|
3143
3238
|
user_agent: Mozilla/5.0 (iPhone; CPU iPhone OS 11_0 like Mac OS X) AppleWebKit/604.1.38 (KHTML, like Gecko) Version/11.0 Mobile/15A372 Safari/604.1 (compatible; woorankreview/2.0; +https://www.woorank.com/)
|
3144
3239
|
bot:
|
3145
3240
|
name: WooRank
|
@@ -3148,7 +3243,7 @@
|
|
3148
3243
|
producer:
|
3149
3244
|
name: WooRank sprl
|
3150
3245
|
url: https://www.woorank.com/
|
3151
|
-
-
|
3246
|
+
-
|
3152
3247
|
user_agent: WordPress/4.7.2; https://example.com
|
3153
3248
|
bot:
|
3154
3249
|
name: WordPress
|
@@ -3157,7 +3252,7 @@
|
|
3157
3252
|
producer:
|
3158
3253
|
name: Wordpress.org
|
3159
3254
|
url: https://wordpress.org/
|
3160
|
-
-
|
3255
|
+
-
|
3161
3256
|
user_agent: Wotbox/2.01 (+http://www.wotbox.com/bot/)
|
3162
3257
|
bot:
|
3163
3258
|
name: Wotbox
|
@@ -3166,7 +3261,7 @@
|
|
3166
3261
|
producer:
|
3167
3262
|
name: Wotbox
|
3168
3263
|
url: http://www.wotbox.com
|
3169
|
-
-
|
3264
|
+
-
|
3170
3265
|
user_agent: XenForo/2.x (https://www.example.com)
|
3171
3266
|
bot:
|
3172
3267
|
name: XenForo
|
@@ -3175,7 +3270,7 @@
|
|
3175
3270
|
producer:
|
3176
3271
|
name: XenForo Ltd.
|
3177
3272
|
url: https://xenforo.com/
|
3178
|
-
-
|
3273
|
+
-
|
3179
3274
|
user_agent: yacybot (freeworld/global; amd64 Linux 3.2.0-4-amd64; java 1.7.0_25; Europe/en) http://yacy.net/bot.html
|
3180
3275
|
bot:
|
3181
3276
|
name: YaCy
|
@@ -3184,7 +3279,7 @@
|
|
3184
3279
|
producer:
|
3185
3280
|
name: YaCy
|
3186
3281
|
url: http://yacy.net
|
3187
|
-
-
|
3282
|
+
-
|
3188
3283
|
user_agent: yacybot (freeworld/global; x86 Windows XP 5.1; java 1.7.0_21; GMT+04:00/ru) http://yacy.net/bot.html
|
3189
3284
|
bot:
|
3190
3285
|
name: YaCy
|
@@ -3193,7 +3288,7 @@
|
|
3193
3288
|
producer:
|
3194
3289
|
name: YaCy
|
3195
3290
|
url: http://yacy.net
|
3196
|
-
-
|
3291
|
+
-
|
3197
3292
|
user_agent: Mozilla/5.0 (compatible; Yahoo Ad monitoring; https://help.yahoo.com/kb/yahoo-ad-monitoring-SLN24857.html)
|
3198
3293
|
bot:
|
3199
3294
|
name: Yahoo Gemini
|
@@ -3202,7 +3297,7 @@
|
|
3202
3297
|
producer:
|
3203
3298
|
name: Yahoo! Inc.
|
3204
3299
|
url: http://www.yahoo.com
|
3205
|
-
-
|
3300
|
+
-
|
3206
3301
|
user_agent: Y!J-BRW/1.0 (https://www.yahoo-help.jp/app/answers/detail/p/595/a_id/42716)
|
3207
3302
|
bot:
|
3208
3303
|
name: Yahoo! Japan BRW
|
@@ -3211,7 +3306,7 @@
|
|
3211
3306
|
producer:
|
3212
3307
|
name: Yahoo! Japan Corp.
|
3213
3308
|
url: https://www.yahoo.co.jp/
|
3214
|
-
-
|
3309
|
+
-
|
3215
3310
|
user_agent: Mozilla/5.0 (compatible; Yahoo Link Preview; https://help.yahoo.com/kb/mail/yahoo-link-preview-SLN23615.html)
|
3216
3311
|
bot:
|
3217
3312
|
name: Yahoo! Link Preview
|
@@ -3220,7 +3315,7 @@
|
|
3220
3315
|
producer:
|
3221
3316
|
name: Yahoo! Inc.
|
3222
3317
|
url: http://www.yahoo.com
|
3223
|
-
-
|
3318
|
+
-
|
3224
3319
|
user_agent: Yahoo:LinkExpander:Slingstone
|
3225
3320
|
bot:
|
3226
3321
|
name: Yahoo! Link Preview
|
@@ -3229,7 +3324,7 @@
|
|
3229
3324
|
producer:
|
3230
3325
|
name: Yahoo! Inc.
|
3231
3326
|
url: http://www.yahoo.com
|
3232
|
-
-
|
3327
|
+
-
|
3233
3328
|
user_agent: Mozilla/5.0 (compatible; Yahoo! Slurp/3.0; http://help.yahoo.com/help/us/ysearch/slurp) NOT Firefox/3.5
|
3234
3329
|
bot:
|
3235
3330
|
name: Yahoo! Slurp
|
@@ -3238,7 +3333,7 @@
|
|
3238
3333
|
producer:
|
3239
3334
|
name: Yahoo! Inc.
|
3240
3335
|
url: http://www.yahoo.com
|
3241
|
-
-
|
3336
|
+
-
|
3242
3337
|
user_agent: Mozilla/5.0 (compatible; Yahoo! Slurp; http://help.yahoo.com/help/us/ysearch/slurp)
|
3243
3338
|
bot:
|
3244
3339
|
name: Yahoo! Slurp
|
@@ -3247,7 +3342,7 @@
|
|
3247
3342
|
producer:
|
3248
3343
|
name: Yahoo! Inc.
|
3249
3344
|
url: http://www.yahoo.com
|
3250
|
-
-
|
3345
|
+
-
|
3251
3346
|
user_agent: Mozilla/5.0 (compatible; Linux i686; Yandex.Gazeta Bot/1.0; +http://gazeta.yandex.ru)
|
3252
3347
|
bot:
|
3253
3348
|
name: Yandex Bot
|
@@ -3256,7 +3351,7 @@
|
|
3256
3351
|
producer:
|
3257
3352
|
name: Yandex LLC
|
3258
3353
|
url: http://company.yandex.com
|
3259
|
-
-
|
3354
|
+
-
|
3260
3355
|
user_agent: Mozilla/5.0 (compatible; YaDirectFetcher/1.0; +http://yandex.com/bots)
|
3261
3356
|
bot:
|
3262
3357
|
name: Yandex Bot
|
@@ -3265,7 +3360,7 @@
|
|
3265
3360
|
producer:
|
3266
3361
|
name: Yandex LLC
|
3267
3362
|
url: http://company.yandex.com
|
3268
|
-
-
|
3363
|
+
-
|
3269
3364
|
user_agent: Mozilla/5.0 (compatible; YandexAntivirus/2.0; +http://yandex.com/bots)
|
3270
3365
|
bot:
|
3271
3366
|
name: Yandex Bot
|
@@ -3274,7 +3369,7 @@
|
|
3274
3369
|
producer:
|
3275
3370
|
name: Yandex LLC
|
3276
3371
|
url: http://company.yandex.com
|
3277
|
-
-
|
3372
|
+
-
|
3278
3373
|
user_agent: Mozilla/5.0 (compatible; YandexAntivirus/2.0; +http://yandex.com/bots)
|
3279
3374
|
bot:
|
3280
3375
|
name: Yandex Bot
|
@@ -3283,7 +3378,7 @@
|
|
3283
3378
|
producer:
|
3284
3379
|
name: Yandex LLC
|
3285
3380
|
url: http://company.yandex.com
|
3286
|
-
-
|
3381
|
+
-
|
3287
3382
|
user_agent: Mozilla/5.0 (compatible; YandexBlogs/0.99; robot; B; +http://yandex.com/bots)
|
3288
3383
|
bot:
|
3289
3384
|
name: Yandex Bot
|
@@ -3292,7 +3387,7 @@
|
|
3292
3387
|
producer:
|
3293
3388
|
name: Yandex LLC
|
3294
3389
|
url: http://company.yandex.com
|
3295
|
-
-
|
3390
|
+
-
|
3296
3391
|
user_agent: Mozilla/5.0 (compatible; YandexBlogs/0.99; robot; B; +http://yandex.com/bots)
|
3297
3392
|
bot:
|
3298
3393
|
name: Yandex Bot
|
@@ -3301,7 +3396,7 @@
|
|
3301
3396
|
producer:
|
3302
3397
|
name: Yandex LLC
|
3303
3398
|
url: http://company.yandex.com
|
3304
|
-
-
|
3399
|
+
-
|
3305
3400
|
user_agent: Mozilla/5.0 (compatible; YandexBot/3.0; +http://yandex.com/bots)
|
3306
3401
|
bot:
|
3307
3402
|
name: Yandex Bot
|
@@ -3310,7 +3405,7 @@
|
|
3310
3405
|
producer:
|
3311
3406
|
name: Yandex LLC
|
3312
3407
|
url: http://company.yandex.com
|
3313
|
-
-
|
3408
|
+
-
|
3314
3409
|
user_agent: Mozilla/5.0 (compatible; YandexDirect/3.0; +http://yandex.com/bots)
|
3315
3410
|
bot:
|
3316
3411
|
name: Yandex Bot
|
@@ -3319,7 +3414,7 @@
|
|
3319
3414
|
producer:
|
3320
3415
|
name: Yandex LLC
|
3321
3416
|
url: http://company.yandex.com
|
3322
|
-
-
|
3417
|
+
-
|
3323
3418
|
user_agent: Mozilla/5.0 (compatible; YandexFavicons/1.0; +http://yandex.com/bots)
|
3324
3419
|
bot:
|
3325
3420
|
name: Yandex Bot
|
@@ -3328,7 +3423,7 @@
|
|
3328
3423
|
producer:
|
3329
3424
|
name: Yandex LLC
|
3330
3425
|
url: http://company.yandex.com
|
3331
|
-
-
|
3426
|
+
-
|
3332
3427
|
user_agent: Mozilla/5.0 (compatible; YandexImageResizer/2.0; +http://yandex.com/bots)
|
3333
3428
|
bot:
|
3334
3429
|
name: Yandex Bot
|
@@ -3337,7 +3432,7 @@
|
|
3337
3432
|
producer:
|
3338
3433
|
name: Yandex LLC
|
3339
3434
|
url: http://company.yandex.com
|
3340
|
-
-
|
3435
|
+
-
|
3341
3436
|
user_agent: Mozilla/5.0 (compatible; YandexImages/3.0; +http://yandex.com/bots)
|
3342
3437
|
bot:
|
3343
3438
|
name: Yandex Bot
|
@@ -3346,7 +3441,7 @@
|
|
3346
3441
|
producer:
|
3347
3442
|
name: Yandex LLC
|
3348
3443
|
url: http://company.yandex.com
|
3349
|
-
-
|
3444
|
+
-
|
3350
3445
|
user_agent: Mozilla/5.0 (compatible; YandexMetrika/2.0; +http://yandex.com/bots)
|
3351
3446
|
bot:
|
3352
3447
|
name: Yandex Bot
|
@@ -3355,7 +3450,7 @@
|
|
3355
3450
|
producer:
|
3356
3451
|
name: Yandex LLC
|
3357
3452
|
url: http://company.yandex.com
|
3358
|
-
-
|
3453
|
+
-
|
3359
3454
|
user_agent: Mozilla/5.0 (compatible; YandexMobileScreenShotBot/1.0; +http://yandex.com/bots)
|
3360
3455
|
bot:
|
3361
3456
|
name: Yandex Bot
|
@@ -3364,7 +3459,7 @@
|
|
3364
3459
|
producer:
|
3365
3460
|
name: Yandex LLC
|
3366
3461
|
url: http://company.yandex.com
|
3367
|
-
-
|
3462
|
+
-
|
3368
3463
|
user_agent: Mozilla/5.0 (compatible; YandexNews/3.0; +http://yandex.com/bots)
|
3369
3464
|
bot:
|
3370
3465
|
name: Yandex Bot
|
@@ -3373,7 +3468,7 @@
|
|
3373
3468
|
producer:
|
3374
3469
|
name: Yandex LLC
|
3375
3470
|
url: http://company.yandex.com
|
3376
|
-
-
|
3471
|
+
-
|
3377
3472
|
user_agent: Mozilla/5.0 (compatible; YandexNewslinks; +http://yandex.com/bots)
|
3378
3473
|
bot:
|
3379
3474
|
name: Yandex Bot
|
@@ -3382,7 +3477,7 @@
|
|
3382
3477
|
producer:
|
3383
3478
|
name: Yandex LLC
|
3384
3479
|
url: http://company.yandex.com
|
3385
|
-
-
|
3480
|
+
-
|
3386
3481
|
user_agent: Mozilla/5.0 (compatible; YandexOntoDB/1.0; +http://yandex.com/bots)
|
3387
3482
|
bot:
|
3388
3483
|
name: Yandex Bot
|
@@ -3391,7 +3486,7 @@
|
|
3391
3486
|
producer:
|
3392
3487
|
name: Yandex LLC
|
3393
3488
|
url: http://company.yandex.com
|
3394
|
-
-
|
3489
|
+
-
|
3395
3490
|
user_agent: Mozilla/5.0 (compatible; YandexOntoDBAPI/1.0; +http://yandex.com/bots)
|
3396
3491
|
bot:
|
3397
3492
|
name: Yandex Bot
|
@@ -3400,7 +3495,7 @@
|
|
3400
3495
|
producer:
|
3401
3496
|
name: Yandex LLC
|
3402
3497
|
url: http://company.yandex.com
|
3403
|
-
-
|
3498
|
+
-
|
3404
3499
|
user_agent: Mozilla/5.0 (compatible; YandexPartner/3.0; +http://yandex.com/bots)
|
3405
3500
|
bot:
|
3406
3501
|
name: Yandex Bot
|
@@ -3409,7 +3504,7 @@
|
|
3409
3504
|
producer:
|
3410
3505
|
name: Yandex LLC
|
3411
3506
|
url: http://company.yandex.com
|
3412
|
-
-
|
3507
|
+
-
|
3413
3508
|
user_agent: Mozilla/5.0 (compatible; YandexRCA/1.0; +http://yandex.com/bots)
|
3414
3509
|
bot:
|
3415
3510
|
name: Yandex Bot
|
@@ -3418,7 +3513,7 @@
|
|
3418
3513
|
producer:
|
3419
3514
|
name: Yandex LLC
|
3420
3515
|
url: http://company.yandex.com
|
3421
|
-
-
|
3516
|
+
-
|
3422
3517
|
user_agent: Mozilla/5.0 (compatible; YandexSearchShop/1.0; +http://yandex.com/bots)
|
3423
3518
|
bot:
|
3424
3519
|
name: Yandex Bot
|
@@ -3427,7 +3522,7 @@
|
|
3427
3522
|
producer:
|
3428
3523
|
name: Yandex LLC
|
3429
3524
|
url: http://company.yandex.com
|
3430
|
-
-
|
3525
|
+
-
|
3431
3526
|
user_agent: Mozilla/5.0 (compatible; YandexTracker/1.0; +http://yandex.com/bots)
|
3432
3527
|
bot:
|
3433
3528
|
name: Yandex Bot
|
@@ -3436,7 +3531,7 @@
|
|
3436
3531
|
producer:
|
3437
3532
|
name: Yandex LLC
|
3438
3533
|
url: http://company.yandex.com
|
3439
|
-
-
|
3534
|
+
-
|
3440
3535
|
user_agent: Mozilla/5.0 (compatible; YandexTurbo/1.0; +http://yandex.com/bots)
|
3441
3536
|
bot:
|
3442
3537
|
name: Yandex Bot
|
@@ -3445,7 +3540,7 @@
|
|
3445
3540
|
producer:
|
3446
3541
|
name: Yandex LLC
|
3447
3542
|
url: http://company.yandex.com
|
3448
|
-
-
|
3543
|
+
-
|
3449
3544
|
user_agent: Mozilla/5.0 (compatible; YandexVerticals/1.0; http://yandex.com/bots)
|
3450
3545
|
bot:
|
3451
3546
|
name: Yandex Bot
|
@@ -3454,7 +3549,7 @@
|
|
3454
3549
|
producer:
|
3455
3550
|
name: Yandex LLC
|
3456
3551
|
url: http://company.yandex.com
|
3457
|
-
-
|
3552
|
+
-
|
3458
3553
|
user_agent: Mozilla/5.0 (compatible; NaverJapan/1.0; +http://corp.naver.jp/)
|
3459
3554
|
bot:
|
3460
3555
|
name: Yeti/Naverbot
|
@@ -3463,7 +3558,7 @@
|
|
3463
3558
|
producer:
|
3464
3559
|
name: Naver
|
3465
3560
|
url: http://www.naver.com
|
3466
|
-
-
|
3561
|
+
-
|
3467
3562
|
user_agent: Yeti/1.1 (Naver Corp.; http://help.naver.com/robots/)
|
3468
3563
|
bot:
|
3469
3564
|
name: Yeti/Naverbot
|
@@ -3472,7 +3567,7 @@
|
|
3472
3567
|
producer:
|
3473
3568
|
name: Naver
|
3474
3569
|
url: http://www.naver.com
|
3475
|
-
-
|
3570
|
+
-
|
3476
3571
|
user_agent: Mozilla/5.0 (compatible; YoudaoBot/1.0; http://www.youdao.com/help/webmaster/spider/; )
|
3477
3572
|
bot:
|
3478
3573
|
name: Youdao Bot
|
@@ -3481,13 +3576,13 @@
|
|
3481
3576
|
producer:
|
3482
3577
|
name: NetEase, Inc.
|
3483
3578
|
url: http://corp.163.com
|
3484
|
-
-
|
3579
|
+
-
|
3485
3580
|
user_agent: YOURLS v1.5.1 +http://yourls.org/ (running on http://fhort.com)
|
3486
3581
|
bot:
|
3487
3582
|
name: Yourls
|
3488
3583
|
category: Crawler
|
3489
3584
|
url: http://yourls.org
|
3490
|
-
-
|
3585
|
+
-
|
3491
3586
|
user_agent: Mozilla/5.0 (compatible; YRSpider; +http://www.yunrang.com/yrspider.html)
|
3492
3587
|
bot:
|
3493
3588
|
name: Yunyun Bot
|
@@ -3496,7 +3591,7 @@
|
|
3496
3591
|
producer:
|
3497
3592
|
name: YunYun
|
3498
3593
|
url: http://www.yunyun.com
|
3499
|
-
-
|
3594
|
+
-
|
3500
3595
|
user_agent: Mozilla/5.0 (compatible; YRSpider; +http://www.yunyun.com/SiteInfo.php?r=about)
|
3501
3596
|
bot:
|
3502
3597
|
name: Yunyun Bot
|
@@ -3505,7 +3600,7 @@
|
|
3505
3600
|
producer:
|
3506
3601
|
name: YunYun
|
3507
3602
|
url: http://www.yunyun.com
|
3508
|
-
-
|
3603
|
+
-
|
3509
3604
|
user_agent: Mozilla/5.0 (compatible; YYSpider; +http://www.yunyun.com/spider.html)
|
3510
3605
|
bot:
|
3511
3606
|
name: Yunyun Bot
|
@@ -3514,21 +3609,21 @@
|
|
3514
3609
|
producer:
|
3515
3610
|
name: YunYun
|
3516
3611
|
url: http://www.yunyun.com
|
3517
|
-
-
|
3612
|
+
-
|
3518
3613
|
user_agent: Zao/0.1 (http://www.kototol.org/zao)
|
3519
3614
|
bot:
|
3520
3615
|
name: Zao
|
3521
3616
|
category: Crawler
|
3522
|
-
-
|
3617
|
+
-
|
3523
3618
|
user_agent: zelist.ro feed parser (+http://www.zelist.ro)
|
3524
3619
|
bot:
|
3525
3620
|
name: Ze List
|
3526
|
-
category: Feed Fetcher
|
3527
3621
|
url: https://www.zelist.ro/
|
3622
|
+
category: Feed Fetcher
|
3528
3623
|
producer:
|
3529
3624
|
name: Treeworks SRL
|
3530
3625
|
url: https://www.tree.ro/
|
3531
|
-
-
|
3626
|
+
-
|
3532
3627
|
user_agent: Zookabot/2.5;++http://zookabot.com
|
3533
3628
|
bot:
|
3534
3629
|
name: Zookabot
|
@@ -3537,7 +3632,7 @@
|
|
3537
3632
|
producer:
|
3538
3633
|
name: Hwacha ApS
|
3539
3634
|
url: http://hwacha.dk
|
3540
|
-
-
|
3635
|
+
-
|
3541
3636
|
user_agent: Mozilla/5.0 (compatible; ZumBot/1.0; http://help.zum.com/inquiry)
|
3542
3637
|
bot:
|
3543
3638
|
name: ZumBot
|
@@ -3546,7 +3641,7 @@
|
|
3546
3641
|
producer:
|
3547
3642
|
name: ZUM internet
|
3548
3643
|
url: http://www.zuminternet.com/
|
3549
|
-
-
|
3644
|
+
-
|
3550
3645
|
user_agent: ZumBot/1.0 (ZUM Search; http://help.zum.com/inquiry)
|
3551
3646
|
bot:
|
3552
3647
|
name: ZumBot
|
@@ -3555,106 +3650,106 @@
|
|
3555
3650
|
producer:
|
3556
3651
|
name: ZUM internet
|
3557
3652
|
url: http://www.zuminternet.com/
|
3558
|
-
-
|
3653
|
+
-
|
3559
3654
|
user_agent: AhrefsBot.Feeds v0.1; http://ahrefs.com/
|
3560
3655
|
bot:
|
3561
3656
|
name: aHrefs Bot
|
3562
3657
|
category: Crawler
|
3563
|
-
url:
|
3658
|
+
url: https://ahrefs.com/robot
|
3564
3659
|
producer:
|
3565
3660
|
name: Ahrefs Pte Ltd
|
3566
|
-
url:
|
3567
|
-
-
|
3661
|
+
url: https://ahrefs.com/robot
|
3662
|
+
-
|
3568
3663
|
user_agent: Mozilla/5.0 (compatible; AhrefsBot/3.1; +http://ahrefs.com/robot/
|
3569
3664
|
bot:
|
3570
3665
|
name: aHrefs Bot
|
3571
3666
|
category: Crawler
|
3572
|
-
url:
|
3667
|
+
url: https://ahrefs.com/robot
|
3573
3668
|
producer:
|
3574
3669
|
name: Ahrefs Pte Ltd
|
3575
|
-
url:
|
3576
|
-
-
|
3670
|
+
url: https://ahrefs.com/robot
|
3671
|
+
-
|
3577
3672
|
user_agent: Mozilla/5.0 (compatible; AhrefsBot/5.0; +http://ahrefs.com/robot/)
|
3578
3673
|
bot:
|
3579
3674
|
name: aHrefs Bot
|
3580
3675
|
category: Crawler
|
3581
|
-
url:
|
3676
|
+
url: https://ahrefs.com/robot
|
3582
3677
|
producer:
|
3583
3678
|
name: Ahrefs Pte Ltd
|
3584
|
-
url:
|
3585
|
-
-
|
3679
|
+
url: https://ahrefs.com/robot
|
3680
|
+
-
|
3586
3681
|
user_agent: 'Mozilla/5.0 (compatible; AhrefsBot/5.0; +http://ahrefs.com/robot/) AppEngine-Google; (+http://code.google.com/appengine; appid: s~proxyfile1-hrd)'
|
3587
3682
|
bot:
|
3588
3683
|
name: aHrefs Bot
|
3589
3684
|
category: Crawler
|
3590
|
-
url:
|
3685
|
+
url: https://ahrefs.com/robot
|
3591
3686
|
producer:
|
3592
3687
|
name: Ahrefs Pte Ltd
|
3593
|
-
url:
|
3594
|
-
-
|
3688
|
+
url: https://ahrefs.com/robot
|
3689
|
+
-
|
3595
3690
|
user_agent: Mozilla/5.0 (compatible; archive.org_bot +http://www.archive.org/details/archive.org_bot)
|
3596
3691
|
bot:
|
3597
3692
|
name: archive.org bot
|
3598
3693
|
category: Crawler
|
3599
|
-
url:
|
3694
|
+
url: https://archive.org/details/archive.org_bot
|
3600
3695
|
producer:
|
3601
3696
|
name: The Internet Archive
|
3602
|
-
url:
|
3603
|
-
-
|
3697
|
+
url: https://archive.org
|
3698
|
+
-
|
3604
3699
|
user_agent: Mozilla/5.0 (compatible; archive.org_bot/3.3.0 +http://pandora.nla.gov.au/crawl.html)
|
3605
3700
|
bot:
|
3606
3701
|
name: archive.org bot
|
3607
3702
|
category: Crawler
|
3608
|
-
url:
|
3703
|
+
url: https://archive.org/details/archive.org_bot
|
3609
3704
|
producer:
|
3610
3705
|
name: The Internet Archive
|
3611
|
-
url:
|
3612
|
-
-
|
3706
|
+
url: https://archive.org
|
3707
|
+
-
|
3613
3708
|
user_agent: Mozilla/5.0 (compatible; archive.org_bot; Archive-It; +http://archive-it.org/files/site-owners.html)
|
3614
3709
|
bot:
|
3615
3710
|
name: archive.org bot
|
3616
3711
|
category: Crawler
|
3617
|
-
url:
|
3712
|
+
url: https://archive.org/details/archive.org_bot
|
3618
3713
|
producer:
|
3619
3714
|
name: The Internet Archive
|
3620
|
-
url:
|
3621
|
-
-
|
3715
|
+
url: https://archive.org
|
3716
|
+
-
|
3622
3717
|
user_agent: Mozilla/5.0 (compatible; archive.org_bot; Wayback Machine Live Record; +http://archive.org/details/archive.org_bot)
|
3623
3718
|
bot:
|
3624
3719
|
name: archive.org bot
|
3625
3720
|
category: Crawler
|
3626
|
-
url:
|
3721
|
+
url: https://archive.org/details/archive.org_bot
|
3627
3722
|
producer:
|
3628
3723
|
name: The Internet Archive
|
3629
|
-
url:
|
3630
|
-
-
|
3724
|
+
url: https://archive.org
|
3725
|
+
-
|
3631
3726
|
user_agent: Mozilla/5.0 (compatible; heritrix/3.1.2-SNAPSHOT-20131029-0036 +http://archive.org/details/archive.org_bot)
|
3632
3727
|
bot:
|
3633
3728
|
name: archive.org bot
|
3634
3729
|
category: Crawler
|
3635
|
-
url:
|
3730
|
+
url: https://archive.org/details/archive.org_bot
|
3636
3731
|
producer:
|
3637
3732
|
name: The Internet Archive
|
3638
|
-
url:
|
3639
|
-
-
|
3733
|
+
url: https://archive.org
|
3734
|
+
-
|
3640
3735
|
user_agent: Mozilla/5.0 (compatible; special_archiver/3.1.1 +http://www.archive.org/details/archive.org_bot)
|
3641
3736
|
bot:
|
3642
3737
|
name: archive.org bot
|
3643
3738
|
category: Crawler
|
3644
|
-
url:
|
3739
|
+
url: https://archive.org/details/archive.org_bot
|
3645
3740
|
producer:
|
3646
3741
|
name: The Internet Archive
|
3647
|
-
url:
|
3648
|
-
-
|
3742
|
+
url: https://archive.org
|
3743
|
+
-
|
3649
3744
|
user_agent: Mozilla/5.0 (compatible; special_archiver/3.2.0 +http://www.loc.gov/webarchiving/notice_to_webmasters.html)
|
3650
3745
|
bot:
|
3651
3746
|
name: archive.org bot
|
3652
3747
|
category: Crawler
|
3653
|
-
url:
|
3748
|
+
url: https://archive.org/details/archive.org_bot
|
3654
3749
|
producer:
|
3655
3750
|
name: The Internet Archive
|
3656
|
-
url:
|
3657
|
-
-
|
3751
|
+
url: https://archive.org
|
3752
|
+
-
|
3658
3753
|
user_agent: CCBot/2.0 (http://commoncrawl.org/faq/)
|
3659
3754
|
bot:
|
3660
3755
|
name: ccBot crawler
|
@@ -3663,7 +3758,7 @@
|
|
3663
3758
|
producer:
|
3664
3759
|
name: reddit inc.
|
3665
3760
|
url: http://www.reddit.com
|
3666
|
-
-
|
3761
|
+
-
|
3667
3762
|
user_agent: Mozilla/5.0 eCairn-Grabber/1.0 (+http://ecairn.com/grabber)
|
3668
3763
|
bot:
|
3669
3764
|
name: eCairn-Grabber
|
@@ -3671,7 +3766,7 @@
|
|
3671
3766
|
producer:
|
3672
3767
|
name: eCairn
|
3673
3768
|
url: https://ecairn.com
|
3674
|
-
-
|
3769
|
+
-
|
3675
3770
|
user_agent: eZ Publish Link Validator
|
3676
3771
|
bot:
|
3677
3772
|
name: eZ Publish Link Validator
|
@@ -3680,7 +3775,7 @@
|
|
3680
3775
|
producer:
|
3681
3776
|
name: eZ Systems AS
|
3682
3777
|
url: https://ez.no/
|
3683
|
-
-
|
3778
|
+
-
|
3684
3779
|
user_agent: Mozilla/5.0 (compatible; evc-batch/2.0)
|
3685
3780
|
bot:
|
3686
3781
|
name: evc-batch
|
@@ -3689,13 +3784,13 @@
|
|
3689
3784
|
producer:
|
3690
3785
|
name: eVenture Capital Partners II, LLC
|
3691
3786
|
url: http://www.eventures.vc/
|
3692
|
-
-
|
3787
|
+
-
|
3693
3788
|
user_agent: Mozilla/5.0 (compatible; inoreader.com; 2 subscribers)
|
3694
3789
|
bot:
|
3695
3790
|
name: inoreader
|
3696
3791
|
category: Feed Reader
|
3697
3792
|
url: https://www.inoreader.com
|
3698
|
-
-
|
3793
|
+
-
|
3699
3794
|
user_agent: masscan/1.0 (https://github.com/robertdavidgraham/masscan)
|
3700
3795
|
bot:
|
3701
3796
|
name: masscan
|
@@ -3704,21 +3799,21 @@
|
|
3704
3799
|
producer:
|
3705
3800
|
name: Robert Graham
|
3706
3801
|
url: https://github.com/robertdavidgraham
|
3707
|
-
-
|
3802
|
+
-
|
3708
3803
|
user_agent: 'Mozilla/5.0/Firefox/42.0 - nbertaupete95(at)gmail.com'
|
3709
3804
|
bot:
|
3710
3805
|
name: nbertaupete95
|
3711
3806
|
category: Crawler
|
3712
|
-
-
|
3807
|
+
-
|
3713
3808
|
user_agent: Mozilla/5.0 (compatible; oBot/2.3.1; http://www.xforce-security.com/crawler/)
|
3714
3809
|
bot:
|
3715
3810
|
name: oBot
|
3716
3811
|
category: Search bot
|
3717
|
-
url:
|
3812
|
+
url: https://www.xforce-security.com/crawler/
|
3718
3813
|
producer:
|
3719
3814
|
name: 'IBM Germany Research & Development GmbH'
|
3720
3815
|
url: https://exchange.xforce.ibmcloud.com/
|
3721
|
-
-
|
3816
|
+
-
|
3722
3817
|
user_agent: 'sqlmap/1.1.8.2#dev (http://sqlmap.org)'
|
3723
3818
|
bot:
|
3724
3819
|
name: sqlmap
|
@@ -3727,87 +3822,613 @@
|
|
3727
3822
|
producer:
|
3728
3823
|
name: sqlmap
|
3729
3824
|
url: http://sqlmap.org/
|
3730
|
-
-
|
3825
|
+
-
|
3731
3826
|
user_agent: Mozilla/5.0 (compatible; theoldreader.com; 1 subscribers; feed-id=aaa)
|
3732
3827
|
bot:
|
3733
3828
|
name: theoldreader
|
3734
3829
|
category: Feed Reader
|
3735
3830
|
url: https://theoldreader.com
|
3736
|
-
|
3737
3831
|
-
|
3738
|
-
user_agent:
|
3832
|
+
user_agent: Sprinklr 2.0
|
3739
3833
|
bot:
|
3740
|
-
name:
|
3834
|
+
name: Sprinklr
|
3741
3835
|
category: Crawler
|
3742
|
-
url:
|
3743
|
-
|
3836
|
+
url: ""
|
3837
|
+
producer:
|
3838
|
+
name: Sprinklr, Inc.
|
3839
|
+
url: https://www.sprinklr.com/
|
3744
3840
|
-
|
3745
|
-
user_agent:
|
3841
|
+
user_agent: Mozilla/5.0 (X11; Linux x86_64)AppleWebKit/537.36 (KHTML, like Gecko; Google-Ads-Qualify)Chrome/85.0.4183.140 Safari/537.36
|
3746
3842
|
bot:
|
3747
|
-
name:
|
3748
|
-
category:
|
3749
|
-
url:
|
3750
|
-
|
3843
|
+
name: Googlebot
|
3844
|
+
category: Search bot
|
3845
|
+
url: http://www.google.com/bot.html
|
3846
|
+
producer:
|
3847
|
+
name: Google Inc.
|
3848
|
+
url: http://www.google.com
|
3751
3849
|
-
|
3752
|
-
user_agent:
|
3850
|
+
user_agent: Mozilla/5.0 (Windows NT 10.0; Win64; x64; BDCbot/1.0; +http://bigweb.bigdatacorp.com.br/faq.aspx) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/69.0.3497.100 Safari/537.36
|
3753
3851
|
bot:
|
3754
|
-
name:
|
3755
|
-
category:
|
3756
|
-
url:
|
3757
|
-
|
3852
|
+
name: BDCbot
|
3853
|
+
category: Crawler
|
3854
|
+
url: https://bigweb.bigdatacorp.com.br/pages/faq.aspx
|
3855
|
+
producer:
|
3856
|
+
name: BIG Data Solucoes Em Tecnologia de Informatica LTDA
|
3857
|
+
url: https://bigdatacorp.com.br/
|
3758
3858
|
-
|
3759
|
-
user_agent:
|
3859
|
+
user_agent: Mozilla/5.0 (Macintosh; Intel Mac OS X 10_13_6) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/67.0.3396.99 Safari/537.36 CloudflareDiagnostics/1.0
|
3760
3860
|
bot:
|
3761
|
-
name:
|
3861
|
+
name: Cloudflare Diagnostics
|
3862
|
+
category: Site Monitor
|
3863
|
+
url: https://www.cloudflare.com/
|
3864
|
+
producer:
|
3865
|
+
name: Cloudflare
|
3866
|
+
url: https://www.cloudflare.com
|
3867
|
+
-
|
3868
|
+
user_agent: Mozilla/5.0 (iPhone; CPU iPhone OS 12_0 like Mac OS X) adbeat.com/policy AppleWebKit/605.1.15 (KHTML, like Gecko) CriOS/69.0.3497.105 Mobile/15E148 Safari/605.1
|
3869
|
+
bot:
|
3870
|
+
name: Adbeat
|
3762
3871
|
category: Crawler
|
3763
|
-
|
3872
|
+
url: https://www.adbeat.com/operation_policy
|
3873
|
+
producer:
|
3874
|
+
name: PPC Labs LLC
|
3875
|
+
url: https://www.adbeat.com/
|
3764
3876
|
-
|
3765
|
-
user_agent: Mozilla/5.0 (
|
3877
|
+
user_agent: Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko; compatible; BW/1.1; bit.ly/2W6Px8S) Chrome/84.0.4147.105 Safari/537.36
|
3766
3878
|
bot:
|
3767
|
-
name:
|
3879
|
+
name: BuiltWith
|
3768
3880
|
category: Crawler
|
3769
|
-
url: https://
|
3770
|
-
|
3881
|
+
url: https://builtwith.com/biup
|
3882
|
+
producer:
|
3883
|
+
name: BuiltWith Pty Ltd
|
3884
|
+
url: https://builtwith.com/
|
3771
3885
|
-
|
3772
|
-
user_agent: Mozilla/5.0 (
|
3886
|
+
user_agent: Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/60.0.3112.113 Safari/537.36 (+https://whatis.contentkingapp.com)
|
3773
3887
|
bot:
|
3774
|
-
name:
|
3888
|
+
name: ContentKing
|
3889
|
+
category: Site Monitor
|
3890
|
+
url: https://whatis.contentkingapp.com/
|
3891
|
+
producer:
|
3892
|
+
name: ContentKing BV
|
3893
|
+
url: https://www.contentkingapp.com/
|
3894
|
+
-
|
3895
|
+
user_agent: Mozilla/5.0 (Windows NT 6.1; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/84.0.4147.89 Safari/537.36 MicroAdBot/1.1 (https://www.microad.co.jp/contact/)
|
3896
|
+
bot:
|
3897
|
+
name: MicroAdBot
|
3775
3898
|
category: Crawler
|
3776
|
-
url: https://
|
3777
|
-
|
3899
|
+
url: https://www.microad.co.jp/
|
3900
|
+
producer:
|
3901
|
+
name: MicroAd, Inc.
|
3902
|
+
url: https://www.microad.co.jp/
|
3778
3903
|
-
|
3779
|
-
user_agent:
|
3904
|
+
user_agent: Mozilla/5.0 (compatible; PingAdmin.Ru/1.2; +http://pingadmin.ru/free_test/)
|
3780
3905
|
bot:
|
3781
|
-
name:
|
3906
|
+
name: PingAdmin.Ru
|
3907
|
+
category: Site Monitor
|
3908
|
+
url: https://ping-admin.ru/
|
3909
|
+
-
|
3910
|
+
user_agent: Mozilla/5.0 (compatible; WebDataStats/1.0 ; +https://webdatastats.com/policy.html)
|
3911
|
+
bot:
|
3912
|
+
name: WebDataStats
|
3782
3913
|
category: Crawler
|
3783
|
-
url:
|
3784
|
-
|
3914
|
+
url: https://webdatastats.com/policy.html
|
3915
|
+
producer:
|
3916
|
+
name: WebTehRazrabotka LLC
|
3917
|
+
url: https://webdatastats.com/
|
3785
3918
|
-
|
3786
|
-
user_agent:
|
3919
|
+
user_agent: Mozilla/5.0 (compatible; parse.ly scraper/0.14; +http://parsely.com)
|
3787
3920
|
bot:
|
3788
|
-
name:
|
3789
|
-
category:
|
3790
|
-
url: https://www.
|
3791
|
-
|
3921
|
+
name: parse.ly
|
3922
|
+
category: Crawler
|
3923
|
+
url: https://www.parse.ly/help/integration/crawler
|
3924
|
+
producer:
|
3925
|
+
name: Parsely, Inc.
|
3926
|
+
url: https://www.parse.ly/
|
3792
3927
|
-
|
3793
|
-
user_agent: Mozilla/5.0 (compatible
|
3928
|
+
user_agent: Mozilla/5.0 (compatible; Nimbostratus-Bot/v1.3.2; http://cloudsystemnetworks.com)
|
3794
3929
|
bot:
|
3795
|
-
name:
|
3930
|
+
name: Nimbostratus Bot
|
3931
|
+
category: Site Monitor
|
3932
|
+
url: http://cloudsystemnetworks.com
|
3933
|
+
-
|
3934
|
+
user_agent: Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.9.2.17) Gecko/20110515 HeartRails_Capture/1.0.4 (+http://capture.heartrails.com/) Namoroka/3.6.17
|
3935
|
+
bot:
|
3936
|
+
name: Heart Rails Capture
|
3937
|
+
category: Service Agent
|
3938
|
+
url: http://capture.heartrails.com
|
3939
|
+
-
|
3940
|
+
user_agent: Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/43.0.2357.134 Safari/537.36 http://notifyninja.com/monitoring
|
3941
|
+
bot:
|
3942
|
+
name: Notify Ninja
|
3943
|
+
category: Site Monitor
|
3944
|
+
url: http://notifyninja.com
|
3945
|
+
-
|
3946
|
+
user_agent: Mozilla/5.0 (Macintosh; Intel Mac OS X 10_14_6) Project-Resonance (http://project-resonance.com/) (KHTML, like Gecko) Chrome/83.0.4103.61 Safari/537.36
|
3947
|
+
bot:
|
3948
|
+
name: Project Resonance
|
3796
3949
|
category: Crawler
|
3797
|
-
url:
|
3798
|
-
|
3950
|
+
url: http://project-resonance.com
|
3799
3951
|
-
|
3800
|
-
user_agent: Mozilla/5.0 (compatible;
|
3952
|
+
user_agent: Mozilla/5.0 (compatible; DataXu/1.0; +http://dataxu.com)
|
3801
3953
|
bot:
|
3802
|
-
name:
|
3954
|
+
name: DataXu
|
3955
|
+
category: Service Agent
|
3956
|
+
url: https://advertising.roku.com/dataxu
|
3957
|
+
producer:
|
3958
|
+
name: Roku, Inc.
|
3959
|
+
url: https://roku.com
|
3960
|
+
-
|
3961
|
+
user_agent: Mozilla/5.0 (Unknown; Linux x86_64) AppleWebKit/534.34 (KHTML, like Gecko) PingdomTMS/0.8.5 Safari/534.34
|
3962
|
+
bot:
|
3963
|
+
name: Pingdom Bot
|
3964
|
+
category: Site Monitor
|
3965
|
+
url: ""
|
3966
|
+
producer:
|
3967
|
+
name: Pingdom AB
|
3968
|
+
url: https://www.pingdom.com
|
3969
|
+
-
|
3970
|
+
user_agent: Mozilla/5.0 (compatible; Cocolyzebot/1.0; https://cocolyze.com/bot)
|
3971
|
+
bot:
|
3972
|
+
name: Cocolyzebot
|
3803
3973
|
category: Crawler
|
3804
|
-
url: https://
|
3805
|
-
|
3974
|
+
url: https://cocolyze.com/en/cocolyzebot
|
3975
|
+
producer:
|
3976
|
+
name: VSI INNOVATION SAS
|
3977
|
+
url: https://vsi-innovation.com/
|
3806
3978
|
-
|
3807
|
-
user_agent:
|
3979
|
+
user_agent: veryhip (http://veryhip.com/)
|
3808
3980
|
bot:
|
3809
|
-
name:
|
3981
|
+
name: VeryHip
|
3810
3982
|
category: Crawler
|
3811
|
-
url:
|
3812
|
-
|
3813
|
-
|
3983
|
+
url: https://veryhip.com/
|
3984
|
+
producer:
|
3985
|
+
name: VeryHip
|
3986
|
+
url: https://veryhip.com/
|
3987
|
+
-
|
3988
|
+
user_agent: Mozilla/5.0 (compatible; LinkpadBot/2.3; +http://linkpad.org/robot/)
|
3989
|
+
bot:
|
3990
|
+
name: LinkpadBot
|
3991
|
+
category: Crawler
|
3992
|
+
url: https://www.linkpad.org/
|
3993
|
+
producer:
|
3994
|
+
name: Solomono LLC
|
3995
|
+
url: https://www.linkpad.org/
|
3996
|
+
-
|
3997
|
+
user_agent: Mozilla/4.0 (compatible; MuscatFerret/1.7; http://www.webtop.com/)
|
3998
|
+
bot:
|
3999
|
+
name: MuscatFerret
|
4000
|
+
category: Crawler
|
4001
|
+
url: http://www.webtop.com/
|
4002
|
+
-
|
4003
|
+
user_agent: Quora-Bot/1.0 (http://www.quora.com)
|
4004
|
+
bot:
|
4005
|
+
name: Quora Bot
|
4006
|
+
category: Crawler
|
4007
|
+
url: ""
|
4008
|
+
producer:
|
4009
|
+
name: Quora
|
4010
|
+
url: https://www.quora.com/
|
4011
|
+
-
|
4012
|
+
user_agent: PageThing.com
|
4013
|
+
bot:
|
4014
|
+
name: PageThing
|
4015
|
+
category: Crawler
|
4016
|
+
url: https://www.pagething.com/
|
4017
|
+
producer:
|
4018
|
+
name: SPECIALNOISE LTD
|
4019
|
+
url: https://www.specialnoise.com/
|
4020
|
+
-
|
4021
|
+
user_agent: ArchiveBox/0.5.3 (+https://github.com/ArchiveBox/ArchiveBox/)
|
4022
|
+
bot:
|
4023
|
+
name: ArchiveBox
|
4024
|
+
url: https://archivebox.io/
|
4025
|
+
category: Crawler
|
4026
|
+
producer:
|
4027
|
+
name: ""
|
4028
|
+
url: ""
|
4029
|
+
-
|
4030
|
+
user_agent: Choosito/1.0 +http://www.choosito.com/
|
4031
|
+
bot:
|
4032
|
+
name: Choosito
|
4033
|
+
url: https://www.choosito.com/
|
4034
|
+
category: Crawler
|
4035
|
+
producer:
|
4036
|
+
name: Choosito! Inc.
|
4037
|
+
url: https://www.choosito.com/
|
4038
|
+
-
|
4039
|
+
user_agent: datagnionbot (+http://www.datagnion.com/bot.html)
|
4040
|
+
bot:
|
4041
|
+
name: datagnionbot
|
4042
|
+
url: https://www.datagnion.com/bot.html
|
4043
|
+
category: Crawler
|
4044
|
+
producer:
|
4045
|
+
name: DATAGNION GMBH
|
4046
|
+
url: https://www.datagnion.com/
|
4047
|
+
-
|
4048
|
+
user_agent: InterNaetBoten/0.99 (http://www.xn--internt-bxa.nu)
|
4049
|
+
bot:
|
4050
|
+
name: Generic Bot
|
4051
|
+
-
|
4052
|
+
user_agent: EasyBib AutoCite (http://autocite-info.citation-api.com/)
|
4053
|
+
bot:
|
4054
|
+
name: Generic Bot
|
4055
|
+
-
|
4056
|
+
user_agent: Bidtellect/0.0.643.0
|
4057
|
+
bot:
|
4058
|
+
name: Generic Bot
|
4059
|
+
-
|
4060
|
+
user_agent: Mozilla/5.0 (compatible; meg/0.2; +https://github.com/tomnomnom/meg)
|
4061
|
+
bot:
|
4062
|
+
name: Generic Bot
|
4063
|
+
-
|
4064
|
+
user_agent: Mozilla/5.0 (X11; Ubuntu; Linux x86_64; rv:66.0) WhatCMS/1.0
|
4065
|
+
bot:
|
4066
|
+
name: WhatCMS
|
4067
|
+
url: https://whatcms.org/
|
4068
|
+
category: Crawler
|
4069
|
+
producer:
|
4070
|
+
name: "Nineteen Ten LLC"
|
4071
|
+
url: "https://whatcms.org/"
|
4072
|
+
-
|
4073
|
+
user_agent: httpx - Open-source project (github.com/projectdiscovery/httpx)
|
4074
|
+
bot:
|
4075
|
+
name: httpx
|
4076
|
+
url: https://github.com/projectdiscovery/httpx
|
4077
|
+
category: Crawler
|
4078
|
+
producer:
|
4079
|
+
name: ""
|
4080
|
+
url: ""
|
4081
|
+
-
|
4082
|
+
user_agent: 'Expanse indexes the network perimeters of our customers. If you have any questions or concerns, please reach out to: scaninfo@expanseinc.com'
|
4083
|
+
bot:
|
4084
|
+
name: Expanse
|
4085
|
+
category: Security Checker
|
4086
|
+
url: https://expanse.co/
|
4087
|
+
producer:
|
4088
|
+
name: Expanse Inc.
|
4089
|
+
url: https://expanse.co/
|
4090
|
+
-
|
4091
|
+
user_agent: 'HuaweiWebCatBot/6.0) (To acquire the allowed html pages as reliable information of URL categorization in the automatic process for Huawei Web Categorization.; https://isecurity.huawei.com/; sec at huawei dot com)'
|
4092
|
+
bot:
|
4093
|
+
name: HuaweiWebCatBot
|
4094
|
+
category: Crawler
|
4095
|
+
url: https://isecurity.huawei.com
|
4096
|
+
producer:
|
4097
|
+
name: Huawei Technologies Co., Ltd.
|
4098
|
+
url: https://huawei.com
|
4099
|
+
-
|
4100
|
+
user_agent: Mozilla/5.0 (compatible; SputnikFaviconBot/1.2; +http://corp.sputnik.ru/webmaster)
|
4101
|
+
bot:
|
4102
|
+
name: Sputnik Favicon Bot
|
4103
|
+
url: ""
|
4104
|
+
category: Crawler
|
4105
|
+
-
|
4106
|
+
user_agent: Hatena-Favicon2 (http://www.hatena.ne.jp/faq/)
|
4107
|
+
bot:
|
4108
|
+
name: Hatena Favicon
|
4109
|
+
category: Crawler
|
4110
|
+
url: https://www.hatena.ne.jp/faq/
|
4111
|
+
producer:
|
4112
|
+
name: Hatena Co., Ltd.
|
4113
|
+
url: https://www.hatena.ne.jp
|
4114
|
+
-
|
4115
|
+
user_agent: Mozilla/5.0 (compatible; RyowlEngine/1.0; +https://ryowl.org)
|
4116
|
+
bot:
|
4117
|
+
name: Ryowl
|
4118
|
+
category: Crawler
|
4119
|
+
url: https://ryowl.org
|
4120
|
+
-
|
4121
|
+
user_agent: Mozilla/5.0 (compatible; OdklBot/1.0 like Linux; klass@odnoklassniki.ru)
|
4122
|
+
bot:
|
4123
|
+
name: Odnoklassniki Bot
|
4124
|
+
category: Crawler
|
4125
|
+
url: https://odnoklassniki.ru
|
4126
|
+
-
|
4127
|
+
user_agent: Mediatoolkitbot (complaints@mediatoolkit.com)
|
4128
|
+
bot:
|
4129
|
+
name: Mediatoolkit Bot
|
4130
|
+
category: Crawler
|
4131
|
+
url: https://mediatoolkit.com
|
4132
|
+
-
|
4133
|
+
user_agent: ZoominfoBot (zoominfobot at zoominfo dot com)
|
4134
|
+
bot:
|
4135
|
+
name: ZoominfoBot
|
4136
|
+
category: Crawler
|
4137
|
+
url: https://www.zoominfo.com
|
4138
|
+
-
|
4139
|
+
user_agent: Mozilla/5.0 (compatible; WeViKaBot/1.0; +http://www.wevika.de/)
|
4140
|
+
bot:
|
4141
|
+
name: WeViKaBot
|
4142
|
+
category: Crawler
|
4143
|
+
url: http://www.wevika.de
|
4144
|
+
-
|
4145
|
+
user_agent: Mozilla/5.0 (compatible; SEOkicks; +https://www.seokicks.de/robot.html)
|
4146
|
+
bot:
|
4147
|
+
name: SEOkicks
|
4148
|
+
category: Crawler
|
4149
|
+
url: https://www.seokicks.de/robot.html
|
4150
|
+
-
|
4151
|
+
user_agent: Mozilla/5.0 (compatible; Plukkie/1.6; http://www.botje.com/plukkie.htm)
|
4152
|
+
bot:
|
4153
|
+
name: Plukkie
|
4154
|
+
category: Crawler
|
4155
|
+
url: http://www.botje.com/plukkie.htm
|
4156
|
+
-
|
4157
|
+
user_agent: Mozilla/5.0 (compatible; proximic; https://www.comscore.com/Web-Crawler)
|
4158
|
+
bot:
|
4159
|
+
name: Comscore
|
4160
|
+
category: Crawler
|
4161
|
+
url: https://www.comscore.com/Web-Crawler
|
4162
|
+
-
|
4163
|
+
user_agent: Mozilla/5.0 (compatible; SurdotlyBot/1.0; +http://sur.ly/bot.html)
|
4164
|
+
bot:
|
4165
|
+
name: SurdotlyBot
|
4166
|
+
category: Crawler
|
4167
|
+
url: http://sur.ly/bot.html
|
4168
|
+
-
|
4169
|
+
user_agent: Mozilla/5.0 (compatible; Gowikibot/1.0; +http://www.gowikibot.com)
|
4170
|
+
bot:
|
4171
|
+
name: Gowikibot
|
4172
|
+
category: Crawler
|
4173
|
+
url: http:/www.gowikibot.com
|
4174
|
+
-
|
4175
|
+
user_agent: Mozilla/5.0 (compatible; SabsimBot/3.0; +https://sabsim.com)
|
4176
|
+
bot:
|
4177
|
+
name: SabsimBot
|
4178
|
+
category: Crawler
|
4179
|
+
url: https://sabsim.com
|
4180
|
+
-
|
4181
|
+
user_agent: Mozilla/5.0 (compatible; LumtelBot/1.0; +http://lumtel.com)
|
4182
|
+
bot:
|
4183
|
+
name: LumtelBot
|
4184
|
+
category: Crawler
|
4185
|
+
url: https://umtel.com
|
4186
|
+
-
|
4187
|
+
user_agent: Mozilla/5.0+(compatible;+PiplBot;+http://www.pipl.com/bot/)
|
4188
|
+
bot:
|
4189
|
+
name: PiplBot
|
4190
|
+
category: Crawler
|
4191
|
+
url: http://www.pipl.com/bot
|
4192
|
+
-
|
4193
|
+
user_agent: Mozilla/5.0 (compatible; woobot/2.0; +https://www.woorank.com/bot)
|
4194
|
+
bot:
|
4195
|
+
name: WooRank
|
4196
|
+
category: Crawler
|
4197
|
+
url: https://www.woorank.com/bot
|
4198
|
+
-
|
4199
|
+
user_agent: YahooMailProxy; https://help.yahoo.com/kb/yahoo-mail-proxy-SLN28749.html
|
4200
|
+
bot:
|
4201
|
+
name: Yahoo! Mail Proxy
|
4202
|
+
category: Service Agent
|
4203
|
+
url: https://help.yahoo.com/kb/yahoo-mail-proxy-SLN28749.html
|
4204
|
+
producer:
|
4205
|
+
name: Yahoo! Inc.
|
4206
|
+
url: http://www.yahoo.com
|
4207
|
+
-
|
4208
|
+
user_agent: 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko; compatible; Cookiebot/1.0; http://cookiebot.com/) Chrome/79.0.3945.117 Safari/537.36'
|
4209
|
+
bot:
|
4210
|
+
name: Cookiebot
|
4211
|
+
category: Crawler
|
4212
|
+
url: https://support.cookiebot.com/hc/en-us/articles/360014264140-Scanner-User-Agent
|
4213
|
+
producer:
|
4214
|
+
name: Cybot A/S
|
4215
|
+
url: https://www.cybot.com/
|
4216
|
+
-
|
4217
|
+
user_agent: NetSystemsResearch studies the availability of various services across the internet. Our website is netsystemsresearch.com
|
4218
|
+
bot:
|
4219
|
+
name: NetSystemsResearch
|
4220
|
+
category: Security Checker
|
4221
|
+
url: https://www.netsystemsresearch.com/
|
4222
|
+
producer:
|
4223
|
+
name: NET SYSTEMS RESEARCH LLC
|
4224
|
+
url: https://www.netsystemsresearch.com/
|
4225
|
+
-
|
4226
|
+
user_agent: 'Mozilla/5.0 (compatible; CensysInspect/1.1; https://about.censys.io/)'
|
4227
|
+
bot:
|
4228
|
+
name: CensysInspect
|
4229
|
+
category: Security Checker
|
4230
|
+
url: https://about.censys.io/
|
4231
|
+
producer:
|
4232
|
+
name: Censys, Inc.
|
4233
|
+
url: https://censys.io/
|
4234
|
+
-
|
4235
|
+
user_agent: https://gdnplus.com:Gather Analyze Provide.
|
4236
|
+
bot:
|
4237
|
+
name: GDNP
|
4238
|
+
category: Crawler
|
4239
|
+
url: https://gdnplus.com/
|
4240
|
+
producer:
|
4241
|
+
name: Global Digital Network Plus, LLC
|
4242
|
+
url: https://gdnplus.com/
|
4243
|
+
-
|
4244
|
+
user_agent: WellKnownBot/0.1 (https://well-known.dev)
|
4245
|
+
bot:
|
4246
|
+
name: WellKnownBot
|
4247
|
+
category: Crawler
|
4248
|
+
url: https://well-known.dev
|
4249
|
+
-
|
4250
|
+
user_agent: Mozilla/5.0 (compatible; Adsbot/3.1; https://seostar.co/robot/)
|
4251
|
+
bot:
|
4252
|
+
name: Adsbot
|
4253
|
+
category: Crawler
|
4254
|
+
url: https://seostar.co/robot/
|
4255
|
+
-
|
4256
|
+
user_agent: MTRobot/0.2 (Metrics Tools Analytics Crawler; https://metrics-tools.de/robot.html; crawler@metrics-tools.de)
|
4257
|
+
bot:
|
4258
|
+
name: MTRobot
|
4259
|
+
category: Crawler
|
4260
|
+
url: https://metrics-tools.de/robot.html
|
4261
|
+
producer:
|
4262
|
+
name: Metrics Tools
|
4263
|
+
url: https://metrics-tools.de/
|
4264
|
+
-
|
4265
|
+
user_agent: My User Agent 1.0
|
4266
|
+
bot:
|
4267
|
+
name: Generic Bot
|
4268
|
+
-
|
4269
|
+
user_agent: serpstatbot/1.0 (advanced backlink tracking bot; curl/7.58.0; http://serpstatbot.com/; abuse@serpstatbot.com)
|
4270
|
+
bot:
|
4271
|
+
name: serpstatbot
|
4272
|
+
category: Crawler
|
4273
|
+
url: http://serpstatbot.com/
|
4274
|
+
producer:
|
4275
|
+
name: Netpeak Ltd
|
4276
|
+
url: https://netpeak.net/
|
4277
|
+
-
|
4278
|
+
user_agent: colly - https://github.com/gocolly/colly/v2
|
4279
|
+
bot:
|
4280
|
+
name: colly
|
4281
|
+
category: Crawler
|
4282
|
+
url: https://github.com/gocolly/colly/
|
4283
|
+
-
|
4284
|
+
user_agent: l9tcpid/v1.0.0
|
4285
|
+
bot:
|
4286
|
+
name: l9tcpid
|
4287
|
+
category: Security Checker
|
4288
|
+
url: https://github.com/LeakIX/l9tcpid
|
4289
|
+
-
|
4290
|
+
user_agent: Mozilla/5.0 (compatible; MegaIndex.ru/2.0; +http://megaindex.com/crawler)
|
4291
|
+
bot:
|
4292
|
+
name: MegaIndex
|
4293
|
+
category: Crawler
|
4294
|
+
url: https://megaindex.com/crawler
|
4295
|
+
-
|
4296
|
+
user_agent: Mozilla/5.0 (compatible; Seekport Crawler; http://seekport.com/)
|
4297
|
+
bot:
|
4298
|
+
name: Seekport
|
4299
|
+
category: Crawler
|
4300
|
+
url: http://www.seekport.com/
|
4301
|
+
producer:
|
4302
|
+
name: SISTRIX GmbH
|
4303
|
+
url: https://www.sistrix.de/
|
4304
|
+
-
|
4305
|
+
user_agent: Mozilla/5.0 (compatible; seolyt/1.1; +https://seolyt.com)
|
4306
|
+
bot:
|
4307
|
+
name: seolyt
|
4308
|
+
category: Crawler
|
4309
|
+
url: https://seolyt.com/
|
4310
|
+
-
|
4311
|
+
user_agent: Mozilla/5.0 (compatible; YaK/1.0; http://linkfluence.com/; bot@linkfluence.com)
|
4312
|
+
bot:
|
4313
|
+
name: YaK
|
4314
|
+
category: Crawler
|
4315
|
+
url: https://www.linkfluence.com/
|
4316
|
+
producer:
|
4317
|
+
name: Linkfluence SAS
|
4318
|
+
url: https://www.linkfluence.com/
|
4319
|
+
-
|
4320
|
+
user_agent: Mozilla/5.0 (Windows NT 6.1; Win64; x64; +http://www.komodia.com/newwiki/index.php/URL_server_crawler) KomodiaBot/1.0
|
4321
|
+
bot:
|
4322
|
+
name: KomodiaBot
|
4323
|
+
category: Crawler
|
4324
|
+
url: http://www.komodia.com/newwiki/index.php/URL_server_crawler
|
4325
|
+
producer:
|
4326
|
+
name: Komodia Inc.
|
4327
|
+
url: https://www.komodia.com/
|
4328
|
+
-
|
4329
|
+
user_agent: Mozilla/5.0 (Windows NT 6.3; WOW64; Trident/7.0; rv:11.0; Catchpoint) like Gecko
|
4330
|
+
bot:
|
4331
|
+
name: Catchpoint
|
4332
|
+
category: Site Monitor
|
4333
|
+
url: https://www.catchpoint.com/
|
4334
|
+
producer:
|
4335
|
+
name: Catchpoint Systems
|
4336
|
+
url: https://www.catchpoint.com/
|
4337
|
+
-
|
4338
|
+
user_agent: Better Uptime Bot Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/74.0.3729.169 Safari/537.36
|
4339
|
+
bot:
|
4340
|
+
name: Better Uptime Bot
|
4341
|
+
category: Site Monitor
|
4342
|
+
url: https://betteruptime.com/faq
|
4343
|
+
producer:
|
4344
|
+
name: Better Uptime
|
4345
|
+
url: https://betteruptime.com/
|
4346
|
+
-
|
4347
|
+
user_agent: gobuster/3.1.0
|
4348
|
+
bot:
|
4349
|
+
name: Gobuster
|
4350
|
+
url: https://github.com/OJ/gobuster
|
4351
|
+
-
|
4352
|
+
user_agent: k6/0.31.1 (https://k6.io/)
|
4353
|
+
bot:
|
4354
|
+
name: K6
|
4355
|
+
url: https://k6.io/
|
4356
|
+
-
|
4357
|
+
user_agent: Mozilla/5.0 (compatible; Neevabot/1.0; https://neeva.com/neevabot)
|
4358
|
+
bot:
|
4359
|
+
name: Neevabot
|
4360
|
+
category: Search bot
|
4361
|
+
url: https://neeva.com/neevabot
|
4362
|
+
producer:
|
4363
|
+
name: Neeva Inc.
|
4364
|
+
url: https://neeva.com/
|
4365
|
+
-
|
4366
|
+
user_agent: LinkPreview/1.5 (http://linkpreview.net)
|
4367
|
+
bot:
|
4368
|
+
name: LinkPreview
|
4369
|
+
category: Service Agent
|
4370
|
+
url: https://www.linkpreview.net/
|
4371
|
+
-
|
4372
|
+
user_agent: Mozilla/5.0 (compatible; JungleKeyThumbnail/1.1; +http://www.junglekey.fr/)
|
4373
|
+
bot:
|
4374
|
+
name: JungleKeyThumbnail
|
4375
|
+
category: Crawler
|
4376
|
+
url: https://junglekey.com/
|
4377
|
+
-
|
4378
|
+
user_agent: rocketmonitor 1.0
|
4379
|
+
bot:
|
4380
|
+
name: RocketMonitorBot
|
4381
|
+
category: Site Monitor
|
4382
|
+
url: https://www.radiomast.io/docs/stream-monitoring/technical_details.html
|
4383
|
+
producer:
|
4384
|
+
name: Radio Mast, Inc.
|
4385
|
+
url: https://www.radiomast.io/
|
4386
|
+
-
|
4387
|
+
user_agent: RocketMonitorBot/1.0 ( https://www.radiomast.io)
|
4388
|
+
bot:
|
4389
|
+
name: RocketMonitorBot
|
4390
|
+
category: Site Monitor
|
4391
|
+
url: https://www.radiomast.io/docs/stream-monitoring/technical_details.html
|
4392
|
+
producer:
|
4393
|
+
name: Radio Mast, Inc.
|
4394
|
+
url: https://www.radiomast.io/
|
4395
|
+
-
|
4396
|
+
user_agent: SitemapParser-VIPnytt/1.1 ( https://github.com/VIPnytt/SitemapParser/blob/master/README.md)
|
4397
|
+
bot:
|
4398
|
+
name: SitemapParser-VIPnytt
|
4399
|
+
category: Crawler
|
4400
|
+
url: https://github.com/VIPnytt/SitemapParser/
|
4401
|
+
-
|
4402
|
+
user_agent: Turnitin (https://bit.ly/2UvnfoQ)
|
4403
|
+
bot:
|
4404
|
+
name: Turnitin
|
4405
|
+
category: Crawler
|
4406
|
+
url: https://turnitin.com/robot/crawlerinfo.html
|
4407
|
+
-
|
4408
|
+
user_agent: Mozilla/5.0 (Linux; Android 8.0; Pixel 2 Build/OPD3.170816.012; Storebot-Google/1.0) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/81.0.4044.138 Mobile Safari/537.36
|
4409
|
+
bot:
|
4410
|
+
name: Google StoreBot
|
4411
|
+
category: Crawler
|
4412
|
+
-
|
4413
|
+
user_agent: Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/77.0.3865.56 Safari/537.36 DMBrowser/2.1 (UV)
|
4414
|
+
bot:
|
4415
|
+
name: Dotcom Monitor
|
4416
|
+
category: Site Monitor
|
4417
|
+
url: https://www.dotcom-monitor.com
|
4418
|
+
-
|
4419
|
+
user_agent: Mozilla/5.0 (Windows NT 6.2; WOW64; rv:29.0) Gecko/20100101 /29.0 DMBrowser-BV
|
4420
|
+
bot:
|
4421
|
+
name: Dotcom Monitor
|
4422
|
+
category: Site Monitor
|
4423
|
+
url: https://www.dotcom-monitor.com
|
4424
|
+
-
|
4425
|
+
user_agent: Mozilla/5.0 (compatible; ThinkChaos/0.3.0; +In_the_test_phase,_if_the_ThinkChaos_brings_you_trouble,_please_add_disallow_to_the_robots.txt._Thank_you.)
|
4426
|
+
bot:
|
4427
|
+
name: ThinkChaos
|
4428
|
+
category: Crawler
|
4429
|
+
-
|
4430
|
+
user_agent: Mozilla/5.0 (compatible; DataForSeoBot/1.0; +https://dataforseo.com/dataforseo-bot)
|
4431
|
+
bot:
|
4432
|
+
name: DataForSeoBot
|
4433
|
+
category: Crawler
|
4434
|
+
url: https://dataforseo.com/dataforseo-bot
|