device_detector 1.0.5 → 1.0.6
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/README.md +7 -6
- data/lib/device_detector/browser.rb +364 -0
- data/lib/device_detector/client.rb +8 -0
- data/lib/device_detector/device.rb +1124 -4
- data/lib/device_detector/os.rb +36 -11
- data/lib/device_detector/version.rb +1 -1
- data/lib/device_detector/version_extractor.rb +9 -0
- data/lib/device_detector.rb +57 -13
- data/regexes/bots.yml +551 -58
- data/regexes/client/browser_engine.yml +7 -1
- data/regexes/client/browsers.yml +594 -71
- data/regexes/client/feed_readers.yml +4 -10
- data/regexes/client/libraries.yml +47 -2
- data/regexes/client/mediaplayers.yml +25 -1
- data/regexes/client/mobile_apps.yml +447 -77
- data/regexes/client/pim.yml +49 -1
- data/regexes/device/cameras.yml +5 -5
- data/regexes/device/car_browsers.yml +16 -0
- data/regexes/device/consoles.yml +6 -0
- data/regexes/device/mobiles.yml +12905 -4561
- data/regexes/device/portable_media_player.yml +20 -3
- data/regexes/device/shell_tv.yml +117 -0
- data/regexes/device/televisions.yml +426 -35
- data/regexes/oss.yml +567 -139
- data/spec/device_detector/concrete_user_agent_spec.rb +30 -42
- data/spec/device_detector/detector_fixtures_spec.rb +9 -5
- data/spec/device_detector/device_spec.rb +26 -10
- data/spec/fixtures/client/browser.yml +1463 -391
- data/spec/fixtures/client/feed_reader.yml +0 -12
- data/spec/fixtures/client/library.yml +91 -37
- data/spec/fixtures/client/mediaplayer.yml +30 -0
- data/spec/fixtures/client/mobile_app.yml +498 -45
- data/spec/fixtures/client/pim.yml +60 -0
- data/spec/fixtures/detector/bots.yml +1189 -568
- data/spec/fixtures/detector/camera.yml +12 -26
- data/spec/fixtures/detector/car_browser.yml +151 -15
- data/spec/fixtures/detector/console.yml +70 -48
- data/spec/fixtures/detector/desktop.yml +2041 -916
- data/spec/fixtures/detector/feature_phone.yml +895 -189
- data/spec/fixtures/detector/feed_reader.yml +50 -77
- data/spec/fixtures/detector/mediaplayer.yml +79 -26
- data/spec/fixtures/detector/mobile_apps.yml +726 -72
- data/spec/fixtures/detector/peripheral.yml +271 -0
- data/spec/fixtures/detector/phablet.yml +3635 -1596
- data/spec/fixtures/detector/portable_media_player.yml +355 -46
- data/spec/fixtures/detector/smart_display.yml +183 -9
- data/spec/fixtures/detector/smart_speaker.yml +13 -8
- data/spec/fixtures/detector/smartphone-1.yml +4002 -4286
- data/spec/fixtures/detector/smartphone-10.yml +3771 -4763
- data/spec/fixtures/detector/smartphone-11.yml +3615 -4692
- data/spec/fixtures/detector/smartphone-12.yml +3856 -4764
- data/spec/fixtures/detector/smartphone-13.yml +4213 -4713
- data/spec/fixtures/detector/smartphone-14.yml +4039 -4497
- data/spec/fixtures/detector/smartphone-15.yml +5642 -2956
- data/spec/fixtures/detector/smartphone-16.yml +4739 -5082
- data/spec/fixtures/detector/smartphone-17.yml +4832 -4275
- data/spec/fixtures/detector/smartphone-18.yml +9806 -0
- data/spec/fixtures/detector/smartphone-19.yml +9965 -0
- data/spec/fixtures/detector/smartphone-2.yml +4842 -2589
- data/spec/fixtures/detector/smartphone-20.yml +9710 -0
- data/spec/fixtures/detector/smartphone-21.yml +8693 -0
- data/spec/fixtures/detector/smartphone-22.yml +10178 -0
- data/spec/fixtures/detector/smartphone-23.yml +9453 -0
- data/spec/fixtures/detector/smartphone-24.yml +9843 -0
- data/spec/fixtures/detector/smartphone-25.yml +9703 -0
- data/spec/fixtures/detector/smartphone-26.yml +10007 -0
- data/spec/fixtures/detector/smartphone-27.yml +4927 -0
- data/spec/fixtures/detector/smartphone-3.yml +4387 -4427
- data/spec/fixtures/detector/smartphone-4.yml +3597 -4582
- data/spec/fixtures/detector/smartphone-5.yml +4066 -5022
- data/spec/fixtures/detector/smartphone-6.yml +3455 -4621
- data/spec/fixtures/detector/smartphone-7.yml +3574 -4574
- data/spec/fixtures/detector/smartphone-8.yml +4617 -4704
- data/spec/fixtures/detector/smartphone-9.yml +4080 -5035
- data/spec/fixtures/detector/smartphone.yml +3244 -4234
- data/spec/fixtures/detector/tablet-1.yml +4652 -4492
- data/spec/fixtures/detector/tablet-2.yml +3515 -4434
- data/spec/fixtures/detector/tablet-3.yml +3418 -4351
- data/spec/fixtures/detector/tablet-4.yml +5149 -3200
- data/spec/fixtures/detector/tablet-5.yml +9273 -0
- data/spec/fixtures/detector/tablet-6.yml +4588 -0
- data/spec/fixtures/detector/tablet.yml +1621 -2613
- data/spec/fixtures/detector/tv-1.yml +2501 -0
- data/spec/fixtures/detector/tv.yml +7826 -3114
- data/spec/fixtures/detector/unknown.yml +370 -531
- data/spec/fixtures/detector/wearable.yml +863 -9
- data/spec/fixtures/parser/oss.yml +1350 -21
- data/spec/fixtures/parser/vendorfragments.yml +53 -53
- metadata +35 -5
|
@@ -1,45 +1,51 @@
|
|
|
1
1
|
---
|
|
2
|
-
-
|
|
2
|
+
-
|
|
3
3
|
user_agent: 360spider-image
|
|
4
4
|
bot:
|
|
5
5
|
name: 360Spider
|
|
6
6
|
category: Search bot
|
|
7
|
-
url:
|
|
7
|
+
url: https://www.so.com/help/help_3_2.html
|
|
8
8
|
producer:
|
|
9
9
|
name: Online Media Group, Inc.
|
|
10
10
|
url: ""
|
|
11
|
-
-
|
|
11
|
+
-
|
|
12
12
|
user_agent: Mozilla/4.0 (compatible; MSIE 8.0; Windows NT 6.1; Trident/4.0; SLCC2; .NET CLR 2.0.50727; .NET CLR 3.5.30729; .NET CLR 3.0.30729; Media Center PC 6.0; MDDR; .NET4.0C; .NET4.0E; .NET CLR 1.1.4322; Tablet PC 2.0); 360Spider
|
|
13
13
|
bot:
|
|
14
14
|
name: 360Spider
|
|
15
15
|
category: Search bot
|
|
16
|
-
url:
|
|
16
|
+
url: https://www.so.com/help/help_3_2.html
|
|
17
17
|
producer:
|
|
18
18
|
name: Online Media Group, Inc.
|
|
19
19
|
url: ""
|
|
20
|
-
-
|
|
20
|
+
-
|
|
21
21
|
user_agent: Mozilla/5.0 (compatible; MSIE 9.0; Windows NT 6.1; Trident/5.0); 360Spider
|
|
22
22
|
bot:
|
|
23
23
|
name: 360Spider
|
|
24
24
|
category: Search bot
|
|
25
|
-
url:
|
|
25
|
+
url: https://www.so.com/help/help_3_2.html
|
|
26
26
|
producer:
|
|
27
27
|
name: Online Media Group, Inc.
|
|
28
28
|
url: ""
|
|
29
|
-
-
|
|
29
|
+
-
|
|
30
30
|
user_agent: Mozilla/5.0 (Windows NT 6.1) AppleWebKit/537.1 (KHTML, like Gecko) Chrome/21.0.1180.89 Safari/537.1; 360Spider
|
|
31
31
|
bot:
|
|
32
32
|
name: 360Spider
|
|
33
33
|
category: Search bot
|
|
34
|
-
url:
|
|
34
|
+
url: https://www.so.com/help/help_3_2.html
|
|
35
35
|
producer:
|
|
36
36
|
name: Online Media Group, Inc.
|
|
37
37
|
url: ""
|
|
38
|
-
-
|
|
38
|
+
-
|
|
39
39
|
user_agent: 'ADmantX Platform Semantic Analyzer - ADmantX Inc. - www.admantx.com - support@admantx.com'
|
|
40
40
|
bot:
|
|
41
41
|
name: ADMantX
|
|
42
|
-
-
|
|
42
|
+
-
|
|
43
|
+
user_agent: ias-va/3.1 (+https://www.admantx.com/service-fetcher.html)
|
|
44
|
+
bot:
|
|
45
|
+
name: ADmantX Service Fetcher
|
|
46
|
+
category: Service bot
|
|
47
|
+
url: https://www.admantx.com/service-fetcher.html
|
|
48
|
+
-
|
|
43
49
|
user_agent: Aboundex/0.3 (http://www.aboundex.com/crawler/)
|
|
44
50
|
bot:
|
|
45
51
|
name: Aboundexbot
|
|
@@ -48,7 +54,7 @@
|
|
|
48
54
|
producer:
|
|
49
55
|
name: Aboundex.com
|
|
50
56
|
url: http://www.aboundex.com
|
|
51
|
-
-
|
|
57
|
+
-
|
|
52
58
|
user_agent: Mozilla/5.0 (compatible; AcoonBot/4.11.1; +http://www.acoon.de/robot.asp)
|
|
53
59
|
bot:
|
|
54
60
|
name: Acoon
|
|
@@ -57,7 +63,7 @@
|
|
|
57
63
|
producer:
|
|
58
64
|
name: Acoon GmbH
|
|
59
65
|
url: http://www.acoon.de
|
|
60
|
-
-
|
|
66
|
+
-
|
|
61
67
|
user_agent: AddThis.com robot tech.support@clearspring.com
|
|
62
68
|
bot:
|
|
63
69
|
name: AddThis.com
|
|
@@ -66,25 +72,34 @@
|
|
|
66
72
|
producer:
|
|
67
73
|
name: Clearspring Technologies, Inc.
|
|
68
74
|
url: http://www.clearspring.com
|
|
69
|
-
-
|
|
75
|
+
-
|
|
70
76
|
user_agent: ia_archiver (+http://www.alexa.com/site/help/webmasters; crawler@alexa.com)
|
|
71
77
|
bot:
|
|
72
78
|
name: Alexa Crawler
|
|
73
79
|
category: Search bot
|
|
74
|
-
url: https://alexa.
|
|
80
|
+
url: https://support.alexa.com/hc/en-us/sections/200100794-Crawlers
|
|
75
81
|
producer:
|
|
76
82
|
name: Alexa Internet
|
|
77
|
-
url:
|
|
78
|
-
-
|
|
83
|
+
url: https://www.alexa.com
|
|
84
|
+
-
|
|
79
85
|
user_agent: Mozilla/5.0 (compatible; alexa site audit/1.0; http://www.alexa.com/help/webmasters; )
|
|
80
86
|
bot:
|
|
81
87
|
name: Alexa Site Audit
|
|
82
88
|
category: Site Monitor
|
|
83
|
-
url:
|
|
89
|
+
url: https://support.alexa.com/hc/en-us/articles/200450194
|
|
84
90
|
producer:
|
|
85
91
|
name: Alexa Internet
|
|
86
|
-
url:
|
|
87
|
-
-
|
|
92
|
+
url: https://www.alexa.com
|
|
93
|
+
-
|
|
94
|
+
user_agent: Mozilla/5.0 (Macintosh; Intel Mac OS X 10_10_1) AppleWebKit/600.2.5 (KHTML, like Gecko) Version/8.0.2 Safari/600.2.5 (Amazonbot/0.1; +https://developer.amazon.com/support/amazonbot)
|
|
95
|
+
bot:
|
|
96
|
+
name: Amazon Bot
|
|
97
|
+
category: Crawler
|
|
98
|
+
url: https://developer.amazon.com/support/amazonbot
|
|
99
|
+
producer:
|
|
100
|
+
name: Amazon.com, Inc.
|
|
101
|
+
url: https://www.amazon.com/
|
|
102
|
+
-
|
|
88
103
|
user_agent: Amazon Route 53 Health Check Service; ref:xxxxxxxx-xxxx-xxxxxxxxx-xxxxxxxxxxxx; report http://amzn.to/xxxxxxx
|
|
89
104
|
bot:
|
|
90
105
|
name: Amazon Route53 Health Check
|
|
@@ -92,7 +107,7 @@
|
|
|
92
107
|
producer:
|
|
93
108
|
name: Amazon Web Services
|
|
94
109
|
url: https://aws.amazon.com/
|
|
95
|
-
-
|
|
110
|
+
-
|
|
96
111
|
user_agent: Amazon-Route53-Health-Check-Service (ref b0eb04d5-cb5e-40e7-839b-558e52fc3f0d; report http://amzn.to/1vsZADi)
|
|
97
112
|
bot:
|
|
98
113
|
name: Amazon Route53 Health Check
|
|
@@ -100,7 +115,7 @@
|
|
|
100
115
|
producer:
|
|
101
116
|
name: Amazon Web Services
|
|
102
117
|
url: https://aws.amazon.com/
|
|
103
|
-
-
|
|
118
|
+
-
|
|
104
119
|
user_agent: AmorankSpider/0.1; +http://amorank.com/webcrawler.html
|
|
105
120
|
bot:
|
|
106
121
|
name: Amorank Spider
|
|
@@ -109,7 +124,7 @@
|
|
|
109
124
|
producer:
|
|
110
125
|
name: Amorank
|
|
111
126
|
url: http://www.amorank.com
|
|
112
|
-
-
|
|
127
|
+
-
|
|
113
128
|
user_agent: 'Curious George - www.analyticsseo.com/crawler'
|
|
114
129
|
bot:
|
|
115
130
|
name: Analytics SEO Crawler
|
|
@@ -118,7 +133,7 @@
|
|
|
118
133
|
producer:
|
|
119
134
|
name: Analytics SEO
|
|
120
135
|
url: http://www.analyticsseo.com
|
|
121
|
-
-
|
|
136
|
+
-
|
|
122
137
|
user_agent: ApacheBench/2.3
|
|
123
138
|
bot:
|
|
124
139
|
name: ApacheBench
|
|
@@ -126,35 +141,44 @@
|
|
|
126
141
|
url: https://httpd.apache.org/docs/2.4/programs/ab.html
|
|
127
142
|
producer:
|
|
128
143
|
name: The Apache Software Foundation
|
|
129
|
-
url:
|
|
130
|
-
-
|
|
144
|
+
url: https://www.apache.org/foundation/
|
|
145
|
+
-
|
|
131
146
|
user_agent: Mozilla/5.0 (Macintosh; Intel Mac OS X 10_10 _1) AppleWebKit/600.2.5 (KHTML, like Gecko) Version/8.0.2 Safari/600.2.5 (Applebot/0.1; +http://www.apple.com/go/applebot)
|
|
132
147
|
bot:
|
|
133
148
|
name: Applebot
|
|
134
149
|
category: Crawler
|
|
135
|
-
url:
|
|
150
|
+
url: https://support.apple.com/en-us/HT204683
|
|
136
151
|
producer:
|
|
137
152
|
name: Apple Inc
|
|
138
|
-
url:
|
|
139
|
-
-
|
|
153
|
+
url: https://www.apple.com
|
|
154
|
+
-
|
|
155
|
+
user_agent: AppSignalBot/1.0 (+https://appsignal.com)
|
|
156
|
+
bot:
|
|
157
|
+
name: AppSignalBot
|
|
158
|
+
category: Site Monitor
|
|
159
|
+
url: https://docs.appsignal.com/uptime-monitoring/
|
|
160
|
+
producer:
|
|
161
|
+
name: AppSignal
|
|
162
|
+
url: https://appsignal.com/
|
|
163
|
+
-
|
|
140
164
|
user_agent: Mozilla/5.0 (Macintosh; Intel Mac OS X 10_10_1) AppleWebKit/600.2.5 (KHTML, like Gecko) Version/8.0.2 Safari/600.2.5 (Applebot/0.1)
|
|
141
165
|
bot:
|
|
142
166
|
name: Applebot
|
|
143
167
|
category: Crawler
|
|
144
|
-
url:
|
|
168
|
+
url: https://support.apple.com/en-us/HT204683
|
|
145
169
|
producer:
|
|
146
170
|
name: Apple Inc
|
|
147
|
-
url:
|
|
148
|
-
-
|
|
171
|
+
url: https://www.apple.com
|
|
172
|
+
-
|
|
149
173
|
user_agent: Arachni/v1.5.1
|
|
150
174
|
bot:
|
|
151
175
|
name: Arachni
|
|
152
176
|
category: Security Checker
|
|
153
|
-
url:
|
|
177
|
+
url: https://www.arachni-scanner.com/
|
|
154
178
|
producer:
|
|
155
179
|
name: Sarosys LLC
|
|
156
|
-
url:
|
|
157
|
-
-
|
|
180
|
+
url: https://www.sarosys.com/
|
|
181
|
+
-
|
|
158
182
|
user_agent: Mozilla/2.0 (compatible; Ask Jeeves/Teoma)
|
|
159
183
|
bot:
|
|
160
184
|
name: Ask Jeeves
|
|
@@ -163,7 +187,7 @@
|
|
|
163
187
|
producer:
|
|
164
188
|
name: Ask Jeeves Inc.
|
|
165
189
|
url: http://www.ask.com
|
|
166
|
-
-
|
|
190
|
+
-
|
|
167
191
|
user_agent: Mozilla/5.0 (compatible;AspiegelBot)
|
|
168
192
|
bot:
|
|
169
193
|
name: AspiegelBot
|
|
@@ -172,7 +196,7 @@
|
|
|
172
196
|
producer:
|
|
173
197
|
name: Huawei
|
|
174
198
|
url: https://www.huawei.com/
|
|
175
|
-
-
|
|
199
|
+
-
|
|
176
200
|
user_agent: Mozilla/5.0 (Linux; Android 7.0;) AppleWebKit/537.36 (KHTML, like Gecko) Mobile Safari/537.36 (compatible; AspiegelBot)
|
|
177
201
|
bot:
|
|
178
202
|
name: AspiegelBot
|
|
@@ -181,7 +205,7 @@
|
|
|
181
205
|
producer:
|
|
182
206
|
name: Huawei
|
|
183
207
|
url: https://www.huawei.com/
|
|
184
|
-
-
|
|
208
|
+
-
|
|
185
209
|
user_agent: AwarioRssBot/1.0 (+https://awario.com/bots.html; bots@awario.com)
|
|
186
210
|
bot:
|
|
187
211
|
name: Awario
|
|
@@ -190,7 +214,7 @@
|
|
|
190
214
|
producer:
|
|
191
215
|
name: Awario
|
|
192
216
|
url: https://awario.com/
|
|
193
|
-
-
|
|
217
|
+
-
|
|
194
218
|
user_agent: AwarioSmartBot/1.0 (+https://awario.com/bots.html; bots@awario.com)
|
|
195
219
|
bot:
|
|
196
220
|
name: Awario
|
|
@@ -199,7 +223,7 @@
|
|
|
199
223
|
producer:
|
|
200
224
|
name: Awario
|
|
201
225
|
url: https://awario.com/
|
|
202
|
-
-
|
|
226
|
+
-
|
|
203
227
|
user_agent: Mozilla/5.0 (compatible; BLEXBot/1.0; +http://webmeup-crawler.com/)
|
|
204
228
|
bot:
|
|
205
229
|
name: BLEXBot Crawler
|
|
@@ -208,7 +232,7 @@
|
|
|
208
232
|
producer:
|
|
209
233
|
name: WebMeUp
|
|
210
234
|
url: http://webmeup.com
|
|
211
|
-
-
|
|
235
|
+
-
|
|
212
236
|
user_agent: BUbiNG (+http://law.di.unimi.it/BUbiNG.html)
|
|
213
237
|
bot:
|
|
214
238
|
name: BUbiNG
|
|
@@ -217,7 +241,7 @@
|
|
|
217
241
|
producer:
|
|
218
242
|
name: The Laboratory for Web Algorithmics (LAW)
|
|
219
243
|
url: 'http://law.di.unimi.it/software.php#buging'
|
|
220
|
-
-
|
|
244
|
+
-
|
|
221
245
|
user_agent: Backlink-Check.de (+http://www.backlink-check.de/bot.html)
|
|
222
246
|
bot:
|
|
223
247
|
name: Backlink-Check.de
|
|
@@ -226,7 +250,7 @@
|
|
|
226
250
|
producer:
|
|
227
251
|
name: Mediagreen Medienservice
|
|
228
252
|
url: http://www.backlink-check.de
|
|
229
|
-
-
|
|
253
|
+
-
|
|
230
254
|
user_agent: BacklinkCrawler (http://www.backlinktest.com/crawler.html)
|
|
231
255
|
bot:
|
|
232
256
|
name: BacklinkCrawler
|
|
@@ -235,7 +259,7 @@
|
|
|
235
259
|
producer:
|
|
236
260
|
name: 2.0Promotion GbR
|
|
237
261
|
url: http://www.backlinktest.com
|
|
238
|
-
-
|
|
262
|
+
-
|
|
239
263
|
user_agent: Baiduspider+(+http://www.baidu.com/search/spider.htm)
|
|
240
264
|
bot:
|
|
241
265
|
name: Baidu Spider
|
|
@@ -244,7 +268,7 @@
|
|
|
244
268
|
producer:
|
|
245
269
|
name: Baidu
|
|
246
270
|
url: http://www.baidu.com
|
|
247
|
-
-
|
|
271
|
+
-
|
|
248
272
|
user_agent: Baiduspider-image+(+http://www.baidu.com/search/spider.htm)
|
|
249
273
|
bot:
|
|
250
274
|
name: Baidu Spider
|
|
@@ -253,7 +277,7 @@
|
|
|
253
277
|
producer:
|
|
254
278
|
name: Baidu
|
|
255
279
|
url: http://www.baidu.com
|
|
256
|
-
-
|
|
280
|
+
-
|
|
257
281
|
user_agent: Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.0; baidu Transcoder;)
|
|
258
282
|
bot:
|
|
259
283
|
name: Baidu Spider
|
|
@@ -262,7 +286,7 @@
|
|
|
262
286
|
producer:
|
|
263
287
|
name: Baidu
|
|
264
288
|
url: http://www.baidu.com
|
|
265
|
-
-
|
|
289
|
+
-
|
|
266
290
|
user_agent: Mozilla/5.0 (compatible; Baiduspider/2.0; +http://www.baidu.com/search
|
|
267
291
|
bot:
|
|
268
292
|
name: Baidu Spider
|
|
@@ -271,7 +295,7 @@
|
|
|
271
295
|
producer:
|
|
272
296
|
name: Baidu
|
|
273
297
|
url: http://www.baidu.com
|
|
274
|
-
-
|
|
298
|
+
-
|
|
275
299
|
user_agent: Mozilla/5.0 (compatible; Baiduspider/2.0; +http://www.baidu.com/search/spider.html)
|
|
276
300
|
bot:
|
|
277
301
|
name: Baidu Spider
|
|
@@ -280,7 +304,7 @@
|
|
|
280
304
|
producer:
|
|
281
305
|
name: Baidu
|
|
282
306
|
url: http://www.baidu.com
|
|
283
|
-
-
|
|
307
|
+
-
|
|
284
308
|
user_agent: Mozilla/5.0 (Linux;u;Android 2.3.7;zh-cn;) AppleWebKit/533.1 (KHTML,like Gecko) Version/4.0 Mobile Safari/533.1 (compatible; +http://www.baidu.com/search/spider.html)
|
|
285
309
|
bot:
|
|
286
310
|
name: Baidu Spider
|
|
@@ -289,7 +313,7 @@
|
|
|
289
313
|
producer:
|
|
290
314
|
name: Baidu
|
|
291
315
|
url: http://www.baidu.com
|
|
292
|
-
-
|
|
316
|
+
-
|
|
293
317
|
user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1; zh-CN; rv:1.9.2.8;baidu Transcoder) Gecko/20100722 Firefox/3.6.8 ( .NET CLR 3.5.30729)
|
|
294
318
|
bot:
|
|
295
319
|
name: Baidu Spider
|
|
@@ -298,7 +322,13 @@
|
|
|
298
322
|
producer:
|
|
299
323
|
name: Baidu
|
|
300
324
|
url: http://www.baidu.com
|
|
301
|
-
-
|
|
325
|
+
-
|
|
326
|
+
user_agent: Barkrowler/0.9 (+http://www.exensa.com/crawl)
|
|
327
|
+
bot:
|
|
328
|
+
name: Barkrowler
|
|
329
|
+
category: Crawler
|
|
330
|
+
url: http://www.exensa.com/crawl
|
|
331
|
+
-
|
|
302
332
|
user_agent: Mozilla/5.0 (compatible; BazQux/2.4; +https://bazqux.com/fetcher; 2 subscribers)
|
|
303
333
|
bot:
|
|
304
334
|
name: BazQux Reader
|
|
@@ -307,7 +337,7 @@
|
|
|
307
337
|
producer:
|
|
308
338
|
name: ""
|
|
309
339
|
url: ""
|
|
310
|
-
-
|
|
340
|
+
-
|
|
311
341
|
user_agent: Mozilla/5.0 (compatible; bingbot/2.0; +http://www.bing.com/bingbot.htm)
|
|
312
342
|
bot:
|
|
313
343
|
name: BingBot
|
|
@@ -316,7 +346,7 @@
|
|
|
316
346
|
producer:
|
|
317
347
|
name: Microsoft Corporation
|
|
318
348
|
url: http://www.microsoft.com
|
|
319
|
-
-
|
|
349
|
+
-
|
|
320
350
|
user_agent: Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/534+ (KHTML, like Gecko) BingPreview/1.0b
|
|
321
351
|
bot:
|
|
322
352
|
name: BingBot
|
|
@@ -325,7 +355,7 @@
|
|
|
325
355
|
producer:
|
|
326
356
|
name: Microsoft Corporation
|
|
327
357
|
url: http://www.microsoft.com
|
|
328
|
-
-
|
|
358
|
+
-
|
|
329
359
|
user_agent: msnbot-media/1.1 (+http://search.msn.com/msnbot.htm)
|
|
330
360
|
bot:
|
|
331
361
|
name: BingBot
|
|
@@ -334,7 +364,7 @@
|
|
|
334
364
|
producer:
|
|
335
365
|
name: Microsoft Corporation
|
|
336
366
|
url: http://www.microsoft.com
|
|
337
|
-
-
|
|
367
|
+
-
|
|
338
368
|
user_agent: msnbot-NewsBlogs/2.0b (+http://search.msn.com/msnbot.htm)
|
|
339
369
|
bot:
|
|
340
370
|
name: BingBot
|
|
@@ -343,7 +373,7 @@
|
|
|
343
373
|
producer:
|
|
344
374
|
name: Microsoft Corporation
|
|
345
375
|
url: http://www.microsoft.com
|
|
346
|
-
-
|
|
376
|
+
-
|
|
347
377
|
user_agent: msnbot/1.1 (+http://search.msn.com/msnbot.htm)
|
|
348
378
|
bot:
|
|
349
379
|
name: BingBot
|
|
@@ -352,7 +382,7 @@
|
|
|
352
382
|
producer:
|
|
353
383
|
name: Microsoft Corporation
|
|
354
384
|
url: http://www.microsoft.com
|
|
355
|
-
-
|
|
385
|
+
-
|
|
356
386
|
user_agent: msnbot/2.0b (+http://search.msn.com/msnbot.htm)
|
|
357
387
|
bot:
|
|
358
388
|
name: BingBot
|
|
@@ -361,7 +391,7 @@
|
|
|
361
391
|
producer:
|
|
362
392
|
name: Microsoft Corporation
|
|
363
393
|
url: http://www.microsoft.com
|
|
364
|
-
-
|
|
394
|
+
-
|
|
365
395
|
user_agent: msnbot/2.0b v1394720947.6703
|
|
366
396
|
bot:
|
|
367
397
|
name: BingBot
|
|
@@ -370,7 +400,7 @@
|
|
|
370
400
|
producer:
|
|
371
401
|
name: Microsoft Corporation
|
|
372
402
|
url: http://www.microsoft.com
|
|
373
|
-
-
|
|
403
|
+
-
|
|
374
404
|
user_agent: MSNBot/Nutch-1.5.1
|
|
375
405
|
bot:
|
|
376
406
|
name: BingBot
|
|
@@ -379,7 +409,7 @@
|
|
|
379
409
|
producer:
|
|
380
410
|
name: Microsoft Corporation
|
|
381
411
|
url: http://www.microsoft.com
|
|
382
|
-
-
|
|
412
|
+
-
|
|
383
413
|
user_agent: bitlybot/3.0
|
|
384
414
|
bot:
|
|
385
415
|
name: BitlyBot
|
|
@@ -388,7 +418,7 @@
|
|
|
388
418
|
producer:
|
|
389
419
|
name: Bitly, Inc.
|
|
390
420
|
url: https://bitly.com
|
|
391
|
-
-
|
|
421
|
+
-
|
|
392
422
|
user_agent: Mozilla/5.0 (compatible; Blekkobot; ScoutJet; +http://blekko.com/about/blekkobot)
|
|
393
423
|
bot:
|
|
394
424
|
name: Blekkobot
|
|
@@ -397,7 +427,7 @@
|
|
|
397
427
|
producer:
|
|
398
428
|
name: Blekko
|
|
399
429
|
url: http://blekko.com
|
|
400
|
-
-
|
|
430
|
+
-
|
|
401
431
|
user_agent: Bloglovin/1.0 (http://www.bloglovin.com; 1 subscribers)
|
|
402
432
|
bot:
|
|
403
433
|
name: Bloglovin
|
|
@@ -406,7 +436,7 @@
|
|
|
406
436
|
producer:
|
|
407
437
|
name: ""
|
|
408
438
|
url: ""
|
|
409
|
-
-
|
|
439
|
+
-
|
|
410
440
|
user_agent: Blogtrottr/2.0
|
|
411
441
|
bot:
|
|
412
442
|
name: Blogtrottr
|
|
@@ -415,24 +445,24 @@
|
|
|
415
445
|
producer:
|
|
416
446
|
name: Blogtrottr Ltd
|
|
417
447
|
url: https://blogtrottr.com/
|
|
418
|
-
-
|
|
448
|
+
-
|
|
419
449
|
user_agent: BoardReader Favicon Fetcher /1.0 info@boardreader.com
|
|
420
450
|
bot:
|
|
421
451
|
name: BoardReader
|
|
422
452
|
category: Search bot
|
|
423
|
-
url:
|
|
453
|
+
url: https://boardreader.com/
|
|
424
454
|
producer:
|
|
425
455
|
name: Effyis Inc
|
|
426
|
-
url:
|
|
427
|
-
-
|
|
456
|
+
url: https://boardreader.com/
|
|
457
|
+
-
|
|
428
458
|
user_agent: BoardReader Blog Indexer(http://boardreader.com)
|
|
429
459
|
bot:
|
|
430
460
|
name: BoardReader Blog Indexer
|
|
431
461
|
category: Crawler
|
|
432
462
|
producer:
|
|
433
463
|
name: BoardReader
|
|
434
|
-
url:
|
|
435
|
-
-
|
|
464
|
+
url: https://boardreader.com/
|
|
465
|
+
-
|
|
436
466
|
user_agent: Mozilla/5.0 (compatible; BountiiBot/1.1; +http://bountii.com/contact.php)
|
|
437
467
|
bot:
|
|
438
468
|
name: Bountii Bot
|
|
@@ -441,7 +471,7 @@
|
|
|
441
471
|
producer:
|
|
442
472
|
name: Bountii Inc.
|
|
443
473
|
url: http://bountii.com
|
|
444
|
-
-
|
|
474
|
+
-
|
|
445
475
|
user_agent: Mozilla/5.0 (Macintosh; Intel Mac OS X 10.10; rv:41.0) Gecko/20100101 Firefox/55.0 BrandVerity/1.0 (http://www.brandverity.com/why-is-brandverity-visiting-me)
|
|
446
476
|
bot:
|
|
447
477
|
name: BrandVerity
|
|
@@ -450,7 +480,7 @@
|
|
|
450
480
|
producer:
|
|
451
481
|
name: BrandVerity, Inc.
|
|
452
482
|
url: https://www.brandverity.com/
|
|
453
|
-
-
|
|
483
|
+
-
|
|
454
484
|
user_agent: Browsershots
|
|
455
485
|
bot:
|
|
456
486
|
name: Browsershots
|
|
@@ -459,7 +489,7 @@
|
|
|
459
489
|
producer:
|
|
460
490
|
name: Browsershots.org
|
|
461
491
|
url: http://browsershots.org
|
|
462
|
-
-
|
|
492
|
+
-
|
|
463
493
|
user_agent: Buck/2.2; (+https://app.hypefactors.com/media-monitoring/about.html)
|
|
464
494
|
bot:
|
|
465
495
|
name: Buck
|
|
@@ -468,7 +498,7 @@
|
|
|
468
498
|
producer:
|
|
469
499
|
name: Hypefactors A/S
|
|
470
500
|
url: https://hypefactors.com/
|
|
471
|
-
-
|
|
501
|
+
-
|
|
472
502
|
user_agent: Mozilla/5.0 (compatible; Butterfly/1.0; +http://labs.topsy.com/butterfly/) Gecko/2009032608 Firefox/3.0.8
|
|
473
503
|
bot:
|
|
474
504
|
name: Butterfly Robot
|
|
@@ -477,7 +507,7 @@
|
|
|
477
507
|
producer:
|
|
478
508
|
name: Topsy Labs
|
|
479
509
|
url: http://labs.topsy.com
|
|
480
|
-
-
|
|
510
|
+
-
|
|
481
511
|
user_agent: Mozilla/5.0 (Macintosh; Butterfly/1.0; +http://labs.topsy.com/butterfly/) Gecko/2009032608 Firefox/3.0.8
|
|
482
512
|
bot:
|
|
483
513
|
name: Butterfly Robot
|
|
@@ -486,7 +516,7 @@
|
|
|
486
516
|
producer:
|
|
487
517
|
name: Topsy Labs
|
|
488
518
|
url: http://labs.topsy.com
|
|
489
|
-
-
|
|
519
|
+
-
|
|
490
520
|
user_agent: Mozilla/5.0 (Linux; Android 6.0; Nexus 5 Build/MRA58N) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/51.0.5668.1446 Mobile Safari/537.36; Bytespider;bytespider@bytedance.com
|
|
491
521
|
bot:
|
|
492
522
|
name: Bytespider
|
|
@@ -495,7 +525,7 @@
|
|
|
495
525
|
producer:
|
|
496
526
|
name: ByteDance Ltd.
|
|
497
527
|
url: https://bytedance.com/
|
|
498
|
-
-
|
|
528
|
+
-
|
|
499
529
|
user_agent: CATExplorador/1.0beta (sistemes at domini dot cat; http://domini.cat/catexplorador.html)
|
|
500
530
|
bot:
|
|
501
531
|
name: CATExplorador
|
|
@@ -504,7 +534,7 @@
|
|
|
504
534
|
producer:
|
|
505
535
|
name: Fundació puntCAT
|
|
506
536
|
url: https://fundacio.cat/ca/domini/
|
|
507
|
-
-
|
|
537
|
+
-
|
|
508
538
|
user_agent: Mozilla/5.0 (compatible; CareerBot/1.1; +http://www.career-x.de/bot.html)
|
|
509
539
|
bot:
|
|
510
540
|
name: CareerBot
|
|
@@ -513,7 +543,7 @@
|
|
|
513
543
|
producer:
|
|
514
544
|
name: career-x GmbH
|
|
515
545
|
url: http://www.career-x.de
|
|
516
|
-
-
|
|
546
|
+
-
|
|
517
547
|
user_agent: Castro 2, Episode Duration Lookup
|
|
518
548
|
bot:
|
|
519
549
|
name: Castro 2
|
|
@@ -522,7 +552,7 @@
|
|
|
522
552
|
producer:
|
|
523
553
|
name: Supertop
|
|
524
554
|
url: http://supertop.co
|
|
525
|
-
-
|
|
555
|
+
-
|
|
526
556
|
user_agent: Cliqzbot/0.1 (+http://cliqz.com/company/cliqzbot)
|
|
527
557
|
bot:
|
|
528
558
|
name: Cliqzbot
|
|
@@ -531,7 +561,7 @@
|
|
|
531
561
|
producer:
|
|
532
562
|
name: 10betterpages GmbH
|
|
533
563
|
url: http://cliqz.com
|
|
534
|
-
-
|
|
564
|
+
-
|
|
535
565
|
user_agent: Mozilla/5.0 (compatible; Cloudflare-AMP/1.0; +https://amp.cloudflare.com/doc/fetcher.html) AppleWebKit/534.34
|
|
536
566
|
bot:
|
|
537
567
|
name: CloudFlare AMP Fetcher
|
|
@@ -540,7 +570,7 @@
|
|
|
540
570
|
producer:
|
|
541
571
|
name: CloudFlare
|
|
542
572
|
url: http://www.cloudflare.com
|
|
543
|
-
-
|
|
573
|
+
-
|
|
544
574
|
user_agent: Mozilla/5.0 (compatible; CloudFlare-AlwaysOnline/1.0; +http://www.cloudflare.com/always-online) AppleWebKit/534.34
|
|
545
575
|
bot:
|
|
546
576
|
name: CloudFlare Always Online
|
|
@@ -549,7 +579,7 @@
|
|
|
549
579
|
producer:
|
|
550
580
|
name: CloudFlare
|
|
551
581
|
url: http://www.cloudflare.com
|
|
552
|
-
-
|
|
582
|
+
-
|
|
553
583
|
user_agent: collectd/5.5.1
|
|
554
584
|
bot:
|
|
555
585
|
name: Collectd
|
|
@@ -558,7 +588,7 @@
|
|
|
558
588
|
producer:
|
|
559
589
|
name: Collectd
|
|
560
590
|
url: https://collectd.org/
|
|
561
|
-
-
|
|
591
|
+
-
|
|
562
592
|
user_agent: CommaFeed/1.0 (http://www.commafeed.com)
|
|
563
593
|
bot:
|
|
564
594
|
name: CommaFeed
|
|
@@ -567,79 +597,79 @@
|
|
|
567
597
|
producer:
|
|
568
598
|
name: ""
|
|
569
599
|
url: ""
|
|
570
|
-
-
|
|
600
|
+
-
|
|
571
601
|
user_agent: coccocbot-web/1.0 (+http://help.coccoc.com/searchengine)
|
|
572
602
|
bot:
|
|
573
603
|
name: Cốc Cốc Bot
|
|
574
|
-
category: Search bot
|
|
575
604
|
url: https://help.coccoc.com/en/search-engine/coccoc-robots
|
|
605
|
+
category: Search bot
|
|
576
606
|
producer:
|
|
577
607
|
name: Cốc Cốc
|
|
578
608
|
url: https://coccoc.com/
|
|
579
|
-
-
|
|
609
|
+
-
|
|
580
610
|
user_agent: Mozilla/5.0 (compatible; coccoc/1.0; +http://help.coccoc.com/)
|
|
581
611
|
bot:
|
|
582
612
|
name: Cốc Cốc Bot
|
|
583
|
-
category: Search bot
|
|
584
613
|
url: https://help.coccoc.com/en/search-engine/coccoc-robots
|
|
614
|
+
category: Search bot
|
|
585
615
|
producer:
|
|
586
616
|
name: Cốc Cốc
|
|
587
617
|
url: https://coccoc.com/
|
|
588
|
-
-
|
|
618
|
+
-
|
|
589
619
|
user_agent: Mozilla/5.0 (compatible; coccocbot-ads/1.0; +http://help.coccoc.com/searchengine)
|
|
590
620
|
bot:
|
|
591
621
|
name: Cốc Cốc Bot
|
|
592
|
-
category: Search bot
|
|
593
622
|
url: https://help.coccoc.com/en/search-engine/coccoc-robots
|
|
623
|
+
category: Search bot
|
|
594
624
|
producer:
|
|
595
625
|
name: Cốc Cốc
|
|
596
626
|
url: https://coccoc.com/
|
|
597
|
-
-
|
|
627
|
+
-
|
|
598
628
|
user_agent: Mozilla/5.0 (compatible; coccocbot-fast/1.0; +http://help.coccoc.com/searchengine)
|
|
599
629
|
bot:
|
|
600
630
|
name: Cốc Cốc Bot
|
|
601
|
-
category: Search bot
|
|
602
631
|
url: https://help.coccoc.com/en/search-engine/coccoc-robots
|
|
632
|
+
category: Search bot
|
|
603
633
|
producer:
|
|
604
634
|
name: Cốc Cốc
|
|
605
635
|
url: https://coccoc.com/
|
|
606
|
-
-
|
|
636
|
+
-
|
|
607
637
|
user_agent: Mozilla/5.0 (compatible; coccocbot-image/1.0; +http://help.coccoc.com/searchengine)
|
|
608
638
|
bot:
|
|
609
639
|
name: Cốc Cốc Bot
|
|
610
|
-
category: Search bot
|
|
611
640
|
url: https://help.coccoc.com/en/search-engine/coccoc-robots
|
|
641
|
+
category: Search bot
|
|
612
642
|
producer:
|
|
613
643
|
name: Cốc Cốc
|
|
614
644
|
url: https://coccoc.com/
|
|
615
|
-
-
|
|
645
|
+
-
|
|
616
646
|
user_agent: Mozilla/5.0 (compatible; coccocbot-shopping/1.0; +http://help.coccoc.com/searchengine)
|
|
617
647
|
bot:
|
|
618
648
|
name: Cốc Cốc Bot
|
|
619
|
-
category: Search bot
|
|
620
649
|
url: https://help.coccoc.com/en/search-engine/coccoc-robots
|
|
650
|
+
category: Search bot
|
|
621
651
|
producer:
|
|
622
652
|
name: Cốc Cốc
|
|
623
653
|
url: https://coccoc.com/
|
|
624
|
-
-
|
|
654
|
+
-
|
|
625
655
|
user_agent: Mozilla/5.0 (compatible; coccocbot-web/1.0; +http://help.coccoc.com/searchengine)
|
|
626
656
|
bot:
|
|
627
657
|
name: Cốc Cốc Bot
|
|
628
|
-
category: Search bot
|
|
629
658
|
url: https://help.coccoc.com/en/search-engine/coccoc-robots
|
|
659
|
+
category: Search bot
|
|
630
660
|
producer:
|
|
631
661
|
name: Cốc Cốc
|
|
632
662
|
url: https://coccoc.com/
|
|
633
|
-
-
|
|
663
|
+
-
|
|
634
664
|
user_agent: Mozilla/5.0 (compatible; coccocbot/1.0; +http://help.coccoc.com/searchengine)
|
|
635
665
|
bot:
|
|
636
666
|
name: Cốc Cốc Bot
|
|
637
|
-
category: Search bot
|
|
638
667
|
url: https://help.coccoc.com/en/search-engine/coccoc-robots
|
|
668
|
+
category: Search bot
|
|
639
669
|
producer:
|
|
640
670
|
name: Cốc Cốc
|
|
641
671
|
url: https://coccoc.com/
|
|
642
|
-
-
|
|
672
|
+
-
|
|
643
673
|
user_agent: Datadog Agent/5.10.1
|
|
644
674
|
bot:
|
|
645
675
|
name: Datadog Agent
|
|
@@ -648,7 +678,7 @@
|
|
|
648
678
|
producer:
|
|
649
679
|
name: Datadog
|
|
650
680
|
url: https://www.datadoghq.com/
|
|
651
|
-
-
|
|
681
|
+
-
|
|
652
682
|
user_agent: Mozilla/5.0 (X11; Datanyze; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/65.0.3325.181 Safari/537.36
|
|
653
683
|
bot:
|
|
654
684
|
name: Datanyze
|
|
@@ -657,7 +687,7 @@
|
|
|
657
687
|
producer:
|
|
658
688
|
name: Datanyze
|
|
659
689
|
url: https://www.datanyze.com
|
|
660
|
-
-
|
|
690
|
+
-
|
|
661
691
|
user_agent: Mozilla/5.0 (compatible; Dataprovider/6.92; +https://www.dataprovider.com/)
|
|
662
692
|
bot:
|
|
663
693
|
name: Dataprovider
|
|
@@ -666,7 +696,7 @@
|
|
|
666
696
|
producer:
|
|
667
697
|
name: Dataprovider B.V.
|
|
668
698
|
url: https://www.dataprovider.com/
|
|
669
|
-
-
|
|
699
|
+
-
|
|
670
700
|
user_agent: Mozilla/5.0 (compatible; MSIE or Firefox mutant; not on Windows server;) Daumoa/4.0;
|
|
671
701
|
bot:
|
|
672
702
|
name: Daum
|
|
@@ -675,7 +705,7 @@
|
|
|
675
705
|
producer:
|
|
676
706
|
name: Daum Communications Corp.
|
|
677
707
|
url: http://www.kakaocorp.com/main
|
|
678
|
-
-
|
|
708
|
+
-
|
|
679
709
|
user_agent: Mozilla/5.0 (compatible; MSIE or Firefox mutant;) Daum 4.1
|
|
680
710
|
bot:
|
|
681
711
|
name: Daum
|
|
@@ -684,7 +714,7 @@
|
|
|
684
714
|
producer:
|
|
685
715
|
name: Daum Communications Corp.
|
|
686
716
|
url: http://www.kakaocorp.com/main
|
|
687
|
-
-
|
|
717
|
+
-
|
|
688
718
|
user_agent: Mozilla/5.0 (compatible; Dazoobot/0.1; +http://dazoo.fr)
|
|
689
719
|
bot:
|
|
690
720
|
name: Dazoobot
|
|
@@ -693,7 +723,7 @@
|
|
|
693
723
|
producer:
|
|
694
724
|
name: DAZOO.FR
|
|
695
725
|
url: http://dazoo.fr
|
|
696
|
-
-
|
|
726
|
+
-
|
|
697
727
|
user_agent: Mozilla/5.0 (compatible; discobot/1.0; +http://discoveryengine.com/discobot.html)
|
|
698
728
|
bot:
|
|
699
729
|
name: Discobot
|
|
@@ -702,7 +732,7 @@
|
|
|
702
732
|
producer:
|
|
703
733
|
name: Discovery Engine
|
|
704
734
|
url: http://discoveryengine.com
|
|
705
|
-
-
|
|
735
|
+
-
|
|
706
736
|
user_agent: 'Domain Re-Animator Bot (http://domainreanimator.com) - support@domainreanimator.com'
|
|
707
737
|
bot:
|
|
708
738
|
name: Domain Re-Animator Bot
|
|
@@ -711,7 +741,7 @@
|
|
|
711
741
|
producer:
|
|
712
742
|
name: Domain Re-Animator, LLC
|
|
713
743
|
url: http://domainreanimator.com
|
|
714
|
-
-
|
|
744
|
+
-
|
|
715
745
|
user_agent: support@domainreanimator.com
|
|
716
746
|
bot:
|
|
717
747
|
name: Domain Re-Animator Bot
|
|
@@ -720,7 +750,13 @@
|
|
|
720
750
|
producer:
|
|
721
751
|
name: Domain Re-Animator, LLC
|
|
722
752
|
url: http://domainreanimator.com
|
|
723
|
-
-
|
|
753
|
+
-
|
|
754
|
+
user_agent: Mozilla/5.0 (compatible; Domains Project/1.1.0; +https://domainsproject.org)
|
|
755
|
+
bot:
|
|
756
|
+
name: Domains Project
|
|
757
|
+
category: Crawler
|
|
758
|
+
url: https://domainsproject.org
|
|
759
|
+
-
|
|
724
760
|
user_agent: dotbot
|
|
725
761
|
bot:
|
|
726
762
|
name: DotBot
|
|
@@ -729,7 +765,7 @@
|
|
|
729
765
|
producer:
|
|
730
766
|
name: SEOmoz, Inc.
|
|
731
767
|
url: http://moz.com/
|
|
732
|
-
-
|
|
768
|
+
-
|
|
733
769
|
user_agent: DuckDuckBot/1.0; (+http://duckduckgo.com/duckduckbot.html)
|
|
734
770
|
bot:
|
|
735
771
|
name: DuckDuckGo Bot
|
|
@@ -738,7 +774,7 @@
|
|
|
738
774
|
producer:
|
|
739
775
|
name: DuckDuckGo
|
|
740
776
|
url: https://duckduckgo.com/
|
|
741
|
-
-
|
|
777
|
+
-
|
|
742
778
|
user_agent: Mozilla/5.0 (compatible; DuckDuckGo-Favicons-Bot/1.0; +http://duckduckgo.com)
|
|
743
779
|
bot:
|
|
744
780
|
name: DuckDuckGo Bot
|
|
@@ -747,7 +783,7 @@
|
|
|
747
783
|
producer:
|
|
748
784
|
name: DuckDuckGo
|
|
749
785
|
url: https://duckduckgo.com/
|
|
750
|
-
-
|
|
786
|
+
-
|
|
751
787
|
user_agent: EMail Exractor
|
|
752
788
|
bot:
|
|
753
789
|
name: EMail Exractor
|
|
@@ -756,7 +792,7 @@
|
|
|
756
792
|
producer:
|
|
757
793
|
name: ""
|
|
758
794
|
url: ""
|
|
759
|
-
-
|
|
795
|
+
-
|
|
760
796
|
user_agent: Mozilla/5.0 (compatible; EasouSpider; +http://www.easou.com/search/spider.html)
|
|
761
797
|
bot:
|
|
762
798
|
name: Easou Spider
|
|
@@ -765,7 +801,7 @@
|
|
|
765
801
|
producer:
|
|
766
802
|
name: easou ICP
|
|
767
803
|
url: http://www.easou.com
|
|
768
|
-
-
|
|
804
|
+
-
|
|
769
805
|
user_agent: Mozilla/5.0 (iPhone; U; CPU iPhone OS 3_0 like Mac OS X; en-us; EasouSpider; +http://www.easou.com/search/spider.html)
|
|
770
806
|
bot:
|
|
771
807
|
name: Easou Spider
|
|
@@ -774,7 +810,7 @@
|
|
|
774
810
|
producer:
|
|
775
811
|
name: easou ICP
|
|
776
812
|
url: http://www.easou.com
|
|
777
|
-
-
|
|
813
|
+
-
|
|
778
814
|
user_agent: Mozilla/5.0 (compatible; Embedly/0.2; +http://support.embed.ly/)
|
|
779
815
|
bot:
|
|
780
816
|
name: Embedly
|
|
@@ -783,7 +819,7 @@
|
|
|
783
819
|
producer:
|
|
784
820
|
name: A Medium, Corp.
|
|
785
821
|
url: https://medium.com/
|
|
786
|
-
-
|
|
822
|
+
-
|
|
787
823
|
user_agent: Mozilla/5.0 (compatible; Exabot/3.0 (BiggerBetter); +http://www.exabot.com/go/robot)
|
|
788
824
|
bot:
|
|
789
825
|
name: ExaBot
|
|
@@ -792,7 +828,7 @@
|
|
|
792
828
|
producer:
|
|
793
829
|
name: Dassault Systèmes
|
|
794
830
|
url: http://www.3ds.com
|
|
795
|
-
-
|
|
831
|
+
-
|
|
796
832
|
user_agent: Mozilla/5.0 (compatible; Exabot/3.0; +http://www.exabot.com/go/robot)
|
|
797
833
|
bot:
|
|
798
834
|
name: ExaBot
|
|
@@ -801,7 +837,7 @@
|
|
|
801
837
|
producer:
|
|
802
838
|
name: Dassault Systèmes
|
|
803
839
|
url: http://www.3ds.com
|
|
804
|
-
-
|
|
840
|
+
-
|
|
805
841
|
user_agent: Mozilla/5.0 (compatible; Konqueror/3.5; Linux) KHTML/3.5.5 (like Gecko) (Exabot-Thumbnails)
|
|
806
842
|
bot:
|
|
807
843
|
name: ExaBot
|
|
@@ -810,7 +846,7 @@
|
|
|
810
846
|
producer:
|
|
811
847
|
name: Dassault Systèmes
|
|
812
848
|
url: http://www.3ds.com
|
|
813
|
-
-
|
|
849
|
+
-
|
|
814
850
|
user_agent: ExactSeek Crawler (nutch 1.4)/Nutch-1.4 (ExactSeek Crawler; http://www.exactseek.com)
|
|
815
851
|
bot:
|
|
816
852
|
name: ExactSeek Crawler
|
|
@@ -819,7 +855,7 @@
|
|
|
819
855
|
producer:
|
|
820
856
|
name: Jayde Online, Inc.
|
|
821
857
|
url: http://www.jaydeonlineinc.com
|
|
822
|
-
-
|
|
858
|
+
-
|
|
823
859
|
user_agent: Mozilla/5.0 (compatible; Ezooms/1.0; help@moz.com)
|
|
824
860
|
bot:
|
|
825
861
|
name: Ezooms
|
|
@@ -828,7 +864,7 @@
|
|
|
828
864
|
producer:
|
|
829
865
|
name: SEOmoz, Inc.
|
|
830
866
|
url: http://moz.com/
|
|
831
|
-
-
|
|
867
|
+
-
|
|
832
868
|
user_agent: facebookexternalhit/1.1 (+http://www.facebook.com/externalhit_uatext.php)
|
|
833
869
|
bot:
|
|
834
870
|
name: Facebook External Hit
|
|
@@ -837,7 +873,7 @@
|
|
|
837
873
|
producer:
|
|
838
874
|
name: Facebook
|
|
839
875
|
url: http://www.facebook.com
|
|
840
|
-
-
|
|
876
|
+
-
|
|
841
877
|
user_agent: facebookexternalua
|
|
842
878
|
bot:
|
|
843
879
|
name: Facebook External Hit
|
|
@@ -846,7 +882,7 @@
|
|
|
846
882
|
producer:
|
|
847
883
|
name: Facebook
|
|
848
884
|
url: http://www.facebook.com
|
|
849
|
-
-
|
|
885
|
+
-
|
|
850
886
|
user_agent: facebookplatform/1.0 (+http://developers.facebook.com)
|
|
851
887
|
bot:
|
|
852
888
|
name: Facebook External Hit
|
|
@@ -855,7 +891,7 @@
|
|
|
855
891
|
producer:
|
|
856
892
|
name: Facebook
|
|
857
893
|
url: http://www.facebook.com
|
|
858
|
-
-
|
|
894
|
+
-
|
|
859
895
|
user_agent: Feed Wrangler/1.0 (3 subscribers; feed-id=248559; http://feedwrangler.net; Allow like Gecko)
|
|
860
896
|
bot:
|
|
861
897
|
name: Feed Wrangler
|
|
@@ -864,7 +900,7 @@
|
|
|
864
900
|
producer:
|
|
865
901
|
name: 'David Smith & Developing Perspective, LLC'
|
|
866
902
|
url: https://david-smith.org
|
|
867
|
-
-
|
|
903
|
+
-
|
|
868
904
|
user_agent: FeedBurner/1.0 (http://www.FeedBurner.com)
|
|
869
905
|
bot:
|
|
870
906
|
name: FeedBurner
|
|
@@ -873,7 +909,7 @@
|
|
|
873
909
|
producer:
|
|
874
910
|
name: ""
|
|
875
911
|
url: ""
|
|
876
|
-
-
|
|
912
|
+
-
|
|
877
913
|
user_agent: 'Feedbin - 9 subscribers'
|
|
878
914
|
bot:
|
|
879
915
|
name: Feedbin
|
|
@@ -882,7 +918,7 @@
|
|
|
882
918
|
producer:
|
|
883
919
|
name: ""
|
|
884
920
|
url: ""
|
|
885
|
-
-
|
|
921
|
+
-
|
|
886
922
|
user_agent: Feedly/1.0 (+http://www.feedly.com/fetcher.html; like FeedFetcher-Google)
|
|
887
923
|
bot:
|
|
888
924
|
name: Feedly
|
|
@@ -891,7 +927,7 @@
|
|
|
891
927
|
producer:
|
|
892
928
|
name: ""
|
|
893
929
|
url: ""
|
|
894
|
-
-
|
|
930
|
+
-
|
|
895
931
|
user_agent: FeedlyApp/1.0 (http://www.feedly.com)
|
|
896
932
|
bot:
|
|
897
933
|
name: Feedly
|
|
@@ -900,7 +936,7 @@
|
|
|
900
936
|
producer:
|
|
901
937
|
name: ""
|
|
902
938
|
url: ""
|
|
903
|
-
-
|
|
939
|
+
-
|
|
904
940
|
user_agent: FeedlyBot/1.0 (http://feedly.com)
|
|
905
941
|
bot:
|
|
906
942
|
name: Feedly
|
|
@@ -909,7 +945,7 @@
|
|
|
909
945
|
producer:
|
|
910
946
|
name: ""
|
|
911
947
|
url: ""
|
|
912
|
-
-
|
|
948
|
+
-
|
|
913
949
|
user_agent: MetaFeedly/1.0 (http://www.feedly.com)
|
|
914
950
|
bot:
|
|
915
951
|
name: Feedly
|
|
@@ -918,7 +954,7 @@
|
|
|
918
954
|
producer:
|
|
919
955
|
name: ""
|
|
920
956
|
url: ""
|
|
921
|
-
-
|
|
957
|
+
-
|
|
922
958
|
user_agent: Feedspot http://www.feedspot.com
|
|
923
959
|
bot:
|
|
924
960
|
name: Feedspot
|
|
@@ -927,7 +963,7 @@
|
|
|
927
963
|
producer:
|
|
928
964
|
name: ""
|
|
929
965
|
url: ""
|
|
930
|
-
-
|
|
966
|
+
-
|
|
931
967
|
user_agent: Fever/1.38 (Feed Parser; http://feedafever.com; Allow like Gecko)
|
|
932
968
|
bot:
|
|
933
969
|
name: Fever
|
|
@@ -936,13 +972,13 @@
|
|
|
936
972
|
producer:
|
|
937
973
|
name: ""
|
|
938
974
|
url: ""
|
|
939
|
-
-
|
|
975
|
+
-
|
|
940
976
|
user_agent: Mozilla/5.0 (compatible; Findxbot/1.0; +http://www.findxbot.com)
|
|
941
977
|
bot:
|
|
942
978
|
name: Findxbot
|
|
943
979
|
category: Crawler
|
|
944
980
|
url: http://www.findxbot.com
|
|
945
|
-
-
|
|
981
|
+
-
|
|
946
982
|
user_agent: Mozilla/5.0 (compatible; FlipboardProxy/1.2; +http://flipboard.com/browserproxy)
|
|
947
983
|
bot:
|
|
948
984
|
name: Flipboard
|
|
@@ -951,7 +987,7 @@
|
|
|
951
987
|
producer:
|
|
952
988
|
name: Flipboard
|
|
953
989
|
url: http://flipboard.com/
|
|
954
|
-
-
|
|
990
|
+
-
|
|
955
991
|
user_agent: Mozilla/5.0 (compatible; FlipboardRSS/1.2; +http://flipboard.com/browserproxy)
|
|
956
992
|
bot:
|
|
957
993
|
name: Flipboard
|
|
@@ -960,19 +996,19 @@
|
|
|
960
996
|
producer:
|
|
961
997
|
name: Flipboard
|
|
962
998
|
url: http://flipboard.com/
|
|
963
|
-
-
|
|
999
|
+
-
|
|
964
1000
|
user_agent: freshrss/0.8-dev (Linux; http://freshrss.org) SimplePie/1.4-dev-FreshRSS
|
|
965
1001
|
bot:
|
|
966
1002
|
name: FreshRSS
|
|
967
1003
|
category: Feed Fetcher
|
|
968
1004
|
url: https://freshrss.org/
|
|
969
|
-
-
|
|
1005
|
+
-
|
|
970
1006
|
user_agent: FreshRSS/1.12.0 (Linux; https://freshrss.org)
|
|
971
1007
|
bot:
|
|
972
1008
|
name: FreshRSS
|
|
973
1009
|
category: Feed Fetcher
|
|
974
1010
|
url: https://freshrss.org/
|
|
975
|
-
-
|
|
1011
|
+
-
|
|
976
1012
|
user_agent: Mozilla/5.0 (X11; Linux x86_64; GTmetrix https://gtmetrix.com/) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/75.0.3770.100 Safari/537.36
|
|
977
1013
|
bot:
|
|
978
1014
|
name: GTmetrix
|
|
@@ -981,55 +1017,55 @@
|
|
|
981
1017
|
producer:
|
|
982
1018
|
name: Carbon60 Operating Co. Ltd.
|
|
983
1019
|
url: https://www.carbon60.com/
|
|
984
|
-
-
|
|
1020
|
+
-
|
|
985
1021
|
user_agent: 7Siters/1.07 (+https://7ooo.ru/siters/)
|
|
986
1022
|
bot:
|
|
987
1023
|
name: Generic Bot
|
|
988
|
-
-
|
|
1024
|
+
-
|
|
989
1025
|
user_agent: COMODO SSL Checker
|
|
990
1026
|
bot:
|
|
991
1027
|
name: Generic Bot
|
|
992
|
-
-
|
|
1028
|
+
-
|
|
993
1029
|
user_agent: help@dataminr.com
|
|
994
1030
|
bot:
|
|
995
1031
|
name: Generic Bot
|
|
996
|
-
-
|
|
1032
|
+
-
|
|
997
1033
|
user_agent: 'HybridBot (hybrid.ru/about. If our bot caused problems please contact us. Contact email: m.lyashkov@targetix.net)'
|
|
998
1034
|
bot:
|
|
999
1035
|
name: Generic Bot
|
|
1000
|
-
-
|
|
1036
|
+
-
|
|
1001
1037
|
user_agent: 'Mozilla/5.0 (compatible; +centuryb.o.t9[at]gmail.com)'
|
|
1002
1038
|
bot:
|
|
1003
1039
|
name: Generic Bot
|
|
1004
|
-
-
|
|
1040
|
+
-
|
|
1005
1041
|
user_agent: Mozilla/5.0 (compatible; +http://tweetedtimes.com)
|
|
1006
1042
|
bot:
|
|
1007
1043
|
name: Generic Bot
|
|
1008
|
-
-
|
|
1044
|
+
-
|
|
1009
1045
|
user_agent: Mozilla/5.0 (compatible; Shareaholicbot/2.0; +http://www.shareaholic.com/bot)
|
|
1010
1046
|
bot:
|
|
1011
1047
|
name: Generic Bot
|
|
1012
|
-
-
|
|
1048
|
+
-
|
|
1013
1049
|
user_agent: Mozilla/5.0 (compatible; TrendsmapResolver/0.1)
|
|
1014
1050
|
bot:
|
|
1015
1051
|
name: Generic Bot
|
|
1016
|
-
-
|
|
1052
|
+
-
|
|
1017
1053
|
user_agent: niki-bot
|
|
1018
1054
|
bot:
|
|
1019
1055
|
name: Generic Bot
|
|
1020
|
-
-
|
|
1056
|
+
-
|
|
1021
1057
|
user_agent: PHPCrawl
|
|
1022
1058
|
bot:
|
|
1023
1059
|
name: Generic Bot
|
|
1024
|
-
-
|
|
1060
|
+
-
|
|
1025
1061
|
user_agent: robots
|
|
1026
1062
|
bot:
|
|
1027
1063
|
name: Generic Bot
|
|
1028
|
-
-
|
|
1064
|
+
-
|
|
1029
1065
|
user_agent: SeopultContentAnalyzer/1.0
|
|
1030
1066
|
bot:
|
|
1031
1067
|
name: Generic Bot
|
|
1032
|
-
-
|
|
1068
|
+
-
|
|
1033
1069
|
user_agent: Mozilla/5.0 (compatible; Genieo/1.0 http://www.genieo.com/webfilter.html)
|
|
1034
1070
|
bot:
|
|
1035
1071
|
name: Genieo Web filter
|
|
@@ -1038,7 +1074,7 @@
|
|
|
1038
1074
|
producer:
|
|
1039
1075
|
name: Genieo
|
|
1040
1076
|
url: http://www.genieo.com
|
|
1041
|
-
-
|
|
1077
|
+
-
|
|
1042
1078
|
user_agent: GigablastOpenSource/1.0
|
|
1043
1079
|
bot:
|
|
1044
1080
|
name: Gigablast
|
|
@@ -1047,7 +1083,7 @@
|
|
|
1047
1083
|
producer:
|
|
1048
1084
|
name: Matt Wells
|
|
1049
1085
|
url: http://www.gigablast.com/faq.html
|
|
1050
|
-
-
|
|
1086
|
+
-
|
|
1051
1087
|
user_agent: Mozilla/5.0 (compatible; Gluten Free Crawler/1.0; +http://glutenfreepleasure.com/)
|
|
1052
1088
|
bot:
|
|
1053
1089
|
name: Gluten Free Crawler
|
|
@@ -1056,7 +1092,7 @@
|
|
|
1056
1092
|
producer:
|
|
1057
1093
|
name: ""
|
|
1058
1094
|
url: ""
|
|
1059
|
-
-
|
|
1095
|
+
-
|
|
1060
1096
|
user_agent: Mozilla/5.0 (Windows NT 5.1; rv:11.0) Gecko Firefox/11.0 (via ggpht.com GoogleImageProxy)
|
|
1061
1097
|
bot:
|
|
1062
1098
|
name: Gmail Image Proxy
|
|
@@ -1065,7 +1101,7 @@
|
|
|
1065
1101
|
producer:
|
|
1066
1102
|
name: Google Inc.
|
|
1067
1103
|
url: http://www.google.com
|
|
1068
|
-
-
|
|
1104
|
+
-
|
|
1069
1105
|
user_agent: DoCoMo/2.0 P900i(c100;TB;W24H11) (compatible; ichiro/mobile goo; +http://search.goo.ne.jp/option/use/sub4/sub4-1/)
|
|
1070
1106
|
bot:
|
|
1071
1107
|
name: Goo
|
|
@@ -1074,12 +1110,12 @@
|
|
|
1074
1110
|
producer:
|
|
1075
1111
|
name: NTT Resonant
|
|
1076
1112
|
url: http://goo.ne.jp
|
|
1077
|
-
-
|
|
1113
|
+
-
|
|
1078
1114
|
user_agent: Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/49.0.2623.75 Safari/537.36 Google Favicon
|
|
1079
1115
|
bot:
|
|
1080
1116
|
name: Google Favicon
|
|
1081
1117
|
category: Crawler
|
|
1082
|
-
-
|
|
1118
|
+
-
|
|
1083
1119
|
user_agent: Mozilla/5.0 (iPhone; U; CPU iPhone OS 4_0_1 like Mac OS X; en-us) AppleWebKit/537.4 (KHTML, like Gecko; Google Page Speed Insights) Version/4.0.5 Mobile/8A306 Safari/6531.22.7
|
|
1084
1120
|
bot:
|
|
1085
1121
|
name: Google PageSpeed Insights
|
|
@@ -1088,7 +1124,7 @@
|
|
|
1088
1124
|
producer:
|
|
1089
1125
|
name: Google Inc.
|
|
1090
1126
|
url: http://www.google.com
|
|
1091
|
-
-
|
|
1127
|
+
-
|
|
1092
1128
|
user_agent: Mozilla/5.0 (Windows NT 5.1) AppleWebKit/535.1 (KHTML, like Gecko) Chrome/14.0.835.202 Safari/535.1 google_partner_monitoring FWSzVTDDBz14547302713138T
|
|
1093
1129
|
bot:
|
|
1094
1130
|
name: Google Partner Monitoring
|
|
@@ -1097,7 +1133,7 @@
|
|
|
1097
1133
|
producer:
|
|
1098
1134
|
name: Google Inc.
|
|
1099
1135
|
url: http://www.google.com
|
|
1100
|
-
-
|
|
1136
|
+
-
|
|
1101
1137
|
user_agent: Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko; Google Search Console) Chrome/41.0.2272.118 Safari/537.36
|
|
1102
1138
|
bot:
|
|
1103
1139
|
name: Google Search Console
|
|
@@ -1106,7 +1142,7 @@
|
|
|
1106
1142
|
producer:
|
|
1107
1143
|
name: Google Inc.
|
|
1108
1144
|
url: http://www.google.com
|
|
1109
|
-
-
|
|
1145
|
+
-
|
|
1110
1146
|
user_agent: Google-Structured-Data-Testing-Tool +https://search.google.com/structured-data/testing-tool)
|
|
1111
1147
|
bot:
|
|
1112
1148
|
name: Google Structured Data Testing Tool
|
|
@@ -1115,7 +1151,7 @@
|
|
|
1115
1151
|
producer:
|
|
1116
1152
|
name: Google Inc.
|
|
1117
1153
|
url: http://www.google.com
|
|
1118
|
-
-
|
|
1154
|
+
-
|
|
1119
1155
|
user_agent: AdsBot-Google (+http://www.google.com/adsbot.html)
|
|
1120
1156
|
bot:
|
|
1121
1157
|
name: Googlebot
|
|
@@ -1124,7 +1160,7 @@
|
|
|
1124
1160
|
producer:
|
|
1125
1161
|
name: Google Inc.
|
|
1126
1162
|
url: http://www.google.com
|
|
1127
|
-
-
|
|
1163
|
+
-
|
|
1128
1164
|
user_agent: AdsBot-Google-Mobile (+http://www.google.com/mobile/adsbot.html) Mozilla (iPhone; U; CPU iPhone OS 3 0 like Mac OS X) AppleWebKit (KHTML, like Gecko) Mobile Safari
|
|
1129
1165
|
bot:
|
|
1130
1166
|
name: Googlebot
|
|
@@ -1133,7 +1169,7 @@
|
|
|
1133
1169
|
producer:
|
|
1134
1170
|
name: Google Inc.
|
|
1135
1171
|
url: http://www.google.com
|
|
1136
|
-
-
|
|
1172
|
+
-
|
|
1137
1173
|
user_agent: APIs-Google (+https://developers.google.com/webmasters/APIs-Google.html)
|
|
1138
1174
|
bot:
|
|
1139
1175
|
name: Googlebot
|
|
@@ -1142,7 +1178,7 @@
|
|
|
1142
1178
|
producer:
|
|
1143
1179
|
name: Google Inc.
|
|
1144
1180
|
url: http://www.google.com
|
|
1145
|
-
-
|
|
1181
|
+
-
|
|
1146
1182
|
user_agent: DoCoMo/2.0 N905i(c100;TB;W24H16) (compatible; Googlebot-Mobile/2.1; +http://www.google.com/bot.html)
|
|
1147
1183
|
bot:
|
|
1148
1184
|
name: Googlebot
|
|
@@ -1151,7 +1187,7 @@
|
|
|
1151
1187
|
producer:
|
|
1152
1188
|
name: Google Inc.
|
|
1153
1189
|
url: http://www.google.com
|
|
1154
|
-
-
|
|
1190
|
+
-
|
|
1155
1191
|
user_agent: Feedfetcher-Google; (+http://www.google.com/feedfetcher.html; 19 subscribers; feed-id=13965549748850348809)
|
|
1156
1192
|
bot:
|
|
1157
1193
|
name: Googlebot
|
|
@@ -1160,7 +1196,7 @@
|
|
|
1160
1196
|
producer:
|
|
1161
1197
|
name: Google Inc.
|
|
1162
1198
|
url: http://www.google.com
|
|
1163
|
-
-
|
|
1199
|
+
-
|
|
1164
1200
|
user_agent: Feedfetcher-Google; (+http://www.google.com/feedfetcher.html; 2 subscribers; feed-id=17860707833818568603)
|
|
1165
1201
|
bot:
|
|
1166
1202
|
name: Googlebot
|
|
@@ -1169,7 +1205,7 @@
|
|
|
1169
1205
|
producer:
|
|
1170
1206
|
name: Google Inc.
|
|
1171
1207
|
url: http://www.google.com
|
|
1172
|
-
-
|
|
1208
|
+
-
|
|
1173
1209
|
user_agent: Feedfetcher-Google; (+http://www.google.com/feedfetcher.html; 375 subscribers; feed-id=15381863289700640853)
|
|
1174
1210
|
bot:
|
|
1175
1211
|
name: Googlebot
|
|
@@ -1178,7 +1214,7 @@
|
|
|
1178
1214
|
producer:
|
|
1179
1215
|
name: Google Inc.
|
|
1180
1216
|
url: http://www.google.com
|
|
1181
|
-
-
|
|
1217
|
+
-
|
|
1182
1218
|
user_agent: Google-AdWords-Express
|
|
1183
1219
|
bot:
|
|
1184
1220
|
name: Googlebot
|
|
@@ -1187,7 +1223,7 @@
|
|
|
1187
1223
|
producer:
|
|
1188
1224
|
name: Google Inc.
|
|
1189
1225
|
url: http://www.google.com
|
|
1190
|
-
-
|
|
1226
|
+
-
|
|
1191
1227
|
user_agent: Google-Adwords-Instant (+http://www.google.com/adsbot.html)
|
|
1192
1228
|
bot:
|
|
1193
1229
|
name: Googlebot
|
|
@@ -1196,7 +1232,7 @@
|
|
|
1196
1232
|
producer:
|
|
1197
1233
|
name: Google Inc.
|
|
1198
1234
|
url: http://www.google.com
|
|
1199
|
-
-
|
|
1235
|
+
-
|
|
1200
1236
|
user_agent: Google-speakr
|
|
1201
1237
|
bot:
|
|
1202
1238
|
name: Googlebot
|
|
@@ -1205,7 +1241,7 @@
|
|
|
1205
1241
|
producer:
|
|
1206
1242
|
name: Google Inc.
|
|
1207
1243
|
url: http://www.google.com
|
|
1208
|
-
-
|
|
1244
|
+
-
|
|
1209
1245
|
user_agent: Googlebot (gocrawl v0.4)
|
|
1210
1246
|
bot:
|
|
1211
1247
|
name: Googlebot
|
|
@@ -1214,7 +1250,7 @@
|
|
|
1214
1250
|
producer:
|
|
1215
1251
|
name: Google Inc.
|
|
1216
1252
|
url: http://www.google.com
|
|
1217
|
-
-
|
|
1253
|
+
-
|
|
1218
1254
|
user_agent: Googlebot-Image/1.0
|
|
1219
1255
|
bot:
|
|
1220
1256
|
name: Googlebot
|
|
@@ -1223,7 +1259,7 @@
|
|
|
1223
1259
|
producer:
|
|
1224
1260
|
name: Google Inc.
|
|
1225
1261
|
url: http://www.google.com
|
|
1226
|
-
-
|
|
1262
|
+
-
|
|
1227
1263
|
user_agent: Googlebot-News (2.3.3, ruby 1.9.3 (2013-11-22))
|
|
1228
1264
|
bot:
|
|
1229
1265
|
name: Googlebot
|
|
@@ -1232,7 +1268,7 @@
|
|
|
1232
1268
|
producer:
|
|
1233
1269
|
name: Google Inc.
|
|
1234
1270
|
url: http://www.google.com
|
|
1235
|
-
-
|
|
1271
|
+
-
|
|
1236
1272
|
user_agent: Googlebot-Video/1.0
|
|
1237
1273
|
bot:
|
|
1238
1274
|
name: Googlebot
|
|
@@ -1241,7 +1277,7 @@
|
|
|
1241
1277
|
producer:
|
|
1242
1278
|
name: Google Inc.
|
|
1243
1279
|
url: http://www.google.com
|
|
1244
|
-
-
|
|
1280
|
+
-
|
|
1245
1281
|
user_agent: Googlebot/2.1 (http://www.googlebot.com/bot.html)
|
|
1246
1282
|
bot:
|
|
1247
1283
|
name: Googlebot
|
|
@@ -1250,7 +1286,7 @@
|
|
|
1250
1286
|
producer:
|
|
1251
1287
|
name: Google Inc.
|
|
1252
1288
|
url: http://www.google.com
|
|
1253
|
-
-
|
|
1289
|
+
-
|
|
1254
1290
|
user_agent: Googlebot/Nutch-1.7
|
|
1255
1291
|
bot:
|
|
1256
1292
|
name: Googlebot
|
|
@@ -1259,7 +1295,7 @@
|
|
|
1259
1295
|
producer:
|
|
1260
1296
|
name: Google Inc.
|
|
1261
1297
|
url: http://www.google.com
|
|
1262
|
-
-
|
|
1298
|
+
-
|
|
1263
1299
|
user_agent: GoogleProducer; (+http://goo.gl/7y4SX)
|
|
1264
1300
|
bot:
|
|
1265
1301
|
name: Googlebot
|
|
@@ -1268,7 +1304,7 @@
|
|
|
1268
1304
|
producer:
|
|
1269
1305
|
name: Google Inc.
|
|
1270
1306
|
url: http://www.google.com
|
|
1271
|
-
-
|
|
1307
|
+
-
|
|
1272
1308
|
user_agent: Mediapartners-Google
|
|
1273
1309
|
bot:
|
|
1274
1310
|
name: Googlebot
|
|
@@ -1277,7 +1313,7 @@
|
|
|
1277
1313
|
producer:
|
|
1278
1314
|
name: Google Inc.
|
|
1279
1315
|
url: http://www.google.com
|
|
1280
|
-
-
|
|
1316
|
+
-
|
|
1281
1317
|
user_agent: Mozilla/5.0 (compatible) Feedfetcher-Google;(+http://www.google.com/feedfetcher.html)
|
|
1282
1318
|
bot:
|
|
1283
1319
|
name: Googlebot
|
|
@@ -1286,7 +1322,7 @@
|
|
|
1286
1322
|
producer:
|
|
1287
1323
|
name: Google Inc.
|
|
1288
1324
|
url: http://www.google.com
|
|
1289
|
-
-
|
|
1325
|
+
-
|
|
1290
1326
|
user_agent: Mozilla/5.0 (compatible; Google-Youtube-Links)
|
|
1291
1327
|
bot:
|
|
1292
1328
|
name: Googlebot
|
|
@@ -1295,7 +1331,7 @@
|
|
|
1295
1331
|
producer:
|
|
1296
1332
|
name: Google Inc.
|
|
1297
1333
|
url: http://www.google.com
|
|
1298
|
-
-
|
|
1334
|
+
-
|
|
1299
1335
|
user_agent: Mozilla/5.0 (compatible; Googlebot/2.1; +http://www.google.com/bot.html)
|
|
1300
1336
|
bot:
|
|
1301
1337
|
name: Googlebot
|
|
@@ -1304,7 +1340,7 @@
|
|
|
1304
1340
|
producer:
|
|
1305
1341
|
name: Google Inc.
|
|
1306
1342
|
url: http://www.google.com
|
|
1307
|
-
-
|
|
1343
|
+
-
|
|
1308
1344
|
user_agent: Mozilla/5.0 (en-US) AppleWebKit/537.36 (KHTML, like Gecko; Google-Assess) Chrome/34.0.1847.116 Safari/537.36
|
|
1309
1345
|
bot:
|
|
1310
1346
|
name: Googlebot
|
|
@@ -1313,7 +1349,7 @@
|
|
|
1313
1349
|
producer:
|
|
1314
1350
|
name: Google Inc.
|
|
1315
1351
|
url: http://www.google.com
|
|
1316
|
-
-
|
|
1352
|
+
-
|
|
1317
1353
|
user_agent: Mozilla/5.0 (en-us) AppleWebKit/537.36(KHTML, like Gecko; Google-Adwords-DisplayAds-WebRender;) Chrome/41.0.2272.118Safari/537.36
|
|
1318
1354
|
bot:
|
|
1319
1355
|
name: Googlebot
|
|
@@ -1322,7 +1358,7 @@
|
|
|
1322
1358
|
producer:
|
|
1323
1359
|
name: Google Inc.
|
|
1324
1360
|
url: http://www.google.com
|
|
1325
|
-
-
|
|
1361
|
+
-
|
|
1326
1362
|
user_agent: Mozilla/5.0 (iPhone; CPU iPhone OS 6_0 like Mac OS X) AppleWebKit/536.26 (KHTML, like Gecko) Version/6.0 Mobile/10A5376e Safari/8536.25 (compatible; Googlebot-Mobile/2.1; +http://www.google.com/bot.html)
|
|
1327
1363
|
bot:
|
|
1328
1364
|
name: Googlebot
|
|
@@ -1331,7 +1367,7 @@
|
|
|
1331
1367
|
producer:
|
|
1332
1368
|
name: Google Inc.
|
|
1333
1369
|
url: http://www.google.com
|
|
1334
|
-
-
|
|
1370
|
+
-
|
|
1335
1371
|
user_agent: Mozilla/5.0 (Linux; Android 4.0.4; Galaxy Nexus Build/IMM76B) AppleWebKit/537.36 (KHTML, like Gecko; Google-Publisher-Plugin) Chrome/27.0.1453 Mobile Safari/537.36
|
|
1336
1372
|
bot:
|
|
1337
1373
|
name: Googlebot
|
|
@@ -1340,7 +1376,7 @@
|
|
|
1340
1376
|
producer:
|
|
1341
1377
|
name: Google Inc.
|
|
1342
1378
|
url: http://www.google.com
|
|
1343
|
-
-
|
|
1379
|
+
-
|
|
1344
1380
|
user_agent: Mozilla/5.0 (Linux; Android 6.0.1; Nexus 5X Build/MMB29P) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/41.0.2272.96 Mobile Safari/537.36 (compatible; Google-AMPHTML)
|
|
1345
1381
|
bot:
|
|
1346
1382
|
name: Googlebot
|
|
@@ -1349,7 +1385,7 @@
|
|
|
1349
1385
|
producer:
|
|
1350
1386
|
name: Google Inc.
|
|
1351
1387
|
url: http://www.google.com
|
|
1352
|
-
-
|
|
1388
|
+
-
|
|
1353
1389
|
user_agent: Mozilla/5.0 (Linux; Android 6.0.1; Nexus 5X Build/MMB29P) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/41.0.2272.96 Mobile Safari/537.36 (compatible; Google-Read-Aloud; +https://support.google.com/webmasters/answer/1061943)
|
|
1354
1390
|
bot:
|
|
1355
1391
|
name: Googlebot
|
|
@@ -1358,7 +1394,7 @@
|
|
|
1358
1394
|
producer:
|
|
1359
1395
|
name: Google Inc.
|
|
1360
1396
|
url: http://www.google.com
|
|
1361
|
-
-
|
|
1397
|
+
-
|
|
1362
1398
|
user_agent: Mozilla/5.0 (Linux; Android 8.0; Pixel 2 Build/OPD3.170816.012; DuplexWeb-Google/1.0) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/74.0.3729.131 Mobile Safari/537.36
|
|
1363
1399
|
bot:
|
|
1364
1400
|
name: Googlebot
|
|
@@ -1367,7 +1403,7 @@
|
|
|
1367
1403
|
producer:
|
|
1368
1404
|
name: Google Inc.
|
|
1369
1405
|
url: http://www.google.com
|
|
1370
|
-
-
|
|
1406
|
+
-
|
|
1371
1407
|
user_agent: Mozilla/5.0 (Windows NT 6.1; rv:6.0) Gecko/20110814 Firefox/6.0 Google (+https://developers.google.com/+/web/snippet/)
|
|
1372
1408
|
bot:
|
|
1373
1409
|
name: Googlebot
|
|
@@ -1376,7 +1412,7 @@
|
|
|
1376
1412
|
producer:
|
|
1377
1413
|
name: Google Inc.
|
|
1378
1414
|
url: http://www.google.com
|
|
1379
|
-
-
|
|
1415
|
+
-
|
|
1380
1416
|
user_agent: Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/27.0.1453 Safari/537.36 (compatible; Google-HotelAdsVerifier/2.0)
|
|
1381
1417
|
bot:
|
|
1382
1418
|
name: Googlebot
|
|
@@ -1385,7 +1421,7 @@
|
|
|
1385
1421
|
producer:
|
|
1386
1422
|
name: Google Inc.
|
|
1387
1423
|
url: http://www.google.com
|
|
1388
|
-
-
|
|
1424
|
+
-
|
|
1389
1425
|
user_agent: Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko; Google Web Preview) Chrome/27.0.1453 Safari/537.36
|
|
1390
1426
|
bot:
|
|
1391
1427
|
name: Googlebot
|
|
@@ -1394,7 +1430,7 @@
|
|
|
1394
1430
|
producer:
|
|
1395
1431
|
name: Google Inc.
|
|
1396
1432
|
url: http://www.google.com
|
|
1397
|
-
-
|
|
1433
|
+
-
|
|
1398
1434
|
user_agent: Mozilla/5.0 AppleWebKit/537.36 (KHTML, like Gecko) Chrome/41.0.2272.118 Safari/537.36 (compatible; Google-Shopping-Quality +http://www.google.com/merchants/tos/extend/DE/tos.html)
|
|
1399
1435
|
bot:
|
|
1400
1436
|
name: Googlebot
|
|
@@ -1403,7 +1439,7 @@
|
|
|
1403
1439
|
producer:
|
|
1404
1440
|
name: Google Inc.
|
|
1405
1441
|
url: http://www.google.com
|
|
1406
|
-
-
|
|
1442
|
+
-
|
|
1407
1443
|
user_agent: Mozilla/5.0 AppleWebKit/537.36 (KHTML, like Gecko; compatible; Googlebot/2.1; +http://www.google.com/bot.html) Safari/537.36
|
|
1408
1444
|
bot:
|
|
1409
1445
|
name: Googlebot
|
|
@@ -1412,7 +1448,7 @@
|
|
|
1412
1448
|
producer:
|
|
1413
1449
|
name: Google Inc.
|
|
1414
1450
|
url: http://www.google.com
|
|
1415
|
-
-
|
|
1451
|
+
-
|
|
1416
1452
|
user_agent: SAMSUNG-SGH-E250/1.0 Profile/MIDP-2.0 Configuration/CLDC-1.1 UP.Browser/6.2.3.3.c.1.101 (GUI) MMP/2.0 (compatible; Googlebot-Mobile/2.1; +http://www.google.com/bot.html)
|
|
1417
1453
|
bot:
|
|
1418
1454
|
name: Googlebot
|
|
@@ -1421,7 +1457,13 @@
|
|
|
1421
1457
|
producer:
|
|
1422
1458
|
name: Google Inc.
|
|
1423
1459
|
url: http://www.google.com
|
|
1424
|
-
-
|
|
1460
|
+
-
|
|
1461
|
+
user_agent: Grammarly/1.0 (http://www.grammarly.com)
|
|
1462
|
+
bot:
|
|
1463
|
+
name: Grammarly
|
|
1464
|
+
category: Service bot
|
|
1465
|
+
url: https://www.grammarly.com
|
|
1466
|
+
-
|
|
1425
1467
|
user_agent: Mozilla/5.0 (compatible; GrapeshotCrawler/2.0; +https://www.grapeshot.com/crawler/)
|
|
1426
1468
|
bot:
|
|
1427
1469
|
name: Grapeshot
|
|
@@ -1430,7 +1472,7 @@
|
|
|
1430
1472
|
producer:
|
|
1431
1473
|
name: Grapeshot
|
|
1432
1474
|
url: https://www.grapeshot.com
|
|
1433
|
-
-
|
|
1475
|
+
-
|
|
1434
1476
|
user_agent: Mozilla/5.0 (iPhone; CPU iPhone OS 8_3 like Mac OS X) AppleWebKit/600.1.4 (KHTML, like Gecko) Version/8.0 Mobile/12F70 Safari/600.1. 4 (compatible; GrapeshotCrawler/2.0; +https://www.grapeshot.com/crawler/)
|
|
1435
1477
|
bot:
|
|
1436
1478
|
name: Grapeshot
|
|
@@ -1439,7 +1481,7 @@
|
|
|
1439
1481
|
producer:
|
|
1440
1482
|
name: Grapeshot
|
|
1441
1483
|
url: https://www.grapeshot.com
|
|
1442
|
-
-
|
|
1484
|
+
-
|
|
1443
1485
|
user_agent: HTTPMon/1.0b (http://www.httpmon.com)
|
|
1444
1486
|
bot:
|
|
1445
1487
|
name: HTTPMon
|
|
@@ -1448,7 +1490,7 @@
|
|
|
1448
1490
|
producer:
|
|
1449
1491
|
name: towards GmbH
|
|
1450
1492
|
url: http://www.towards.ch/
|
|
1451
|
-
-
|
|
1493
|
+
-
|
|
1452
1494
|
user_agent: 'flieder - neofonie heritrix/1.14.3 (+http://spider.neofonie.de)'
|
|
1453
1495
|
bot:
|
|
1454
1496
|
name: Heritrix
|
|
@@ -1456,8 +1498,8 @@
|
|
|
1456
1498
|
url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
|
|
1457
1499
|
producer:
|
|
1458
1500
|
name: The Internet Archive
|
|
1459
|
-
url:
|
|
1460
|
-
-
|
|
1501
|
+
url: https://archive.org
|
|
1502
|
+
-
|
|
1461
1503
|
user_agent: Mozilla/5.0 (compatible; heritrix/1.14.4 +http://webarhive.nlc.gov.cn)
|
|
1462
1504
|
bot:
|
|
1463
1505
|
name: Heritrix
|
|
@@ -1465,8 +1507,8 @@
|
|
|
1465
1507
|
url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
|
|
1466
1508
|
producer:
|
|
1467
1509
|
name: The Internet Archive
|
|
1468
|
-
url:
|
|
1469
|
-
-
|
|
1510
|
+
url: https://archive.org
|
|
1511
|
+
-
|
|
1470
1512
|
user_agent: Mozilla/5.0 (compatible; heritrix/1.14.4 +http://www.dla-marbach.de)
|
|
1471
1513
|
bot:
|
|
1472
1514
|
name: Heritrix
|
|
@@ -1474,8 +1516,8 @@
|
|
|
1474
1516
|
url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
|
|
1475
1517
|
producer:
|
|
1476
1518
|
name: The Internet Archive
|
|
1477
|
-
url:
|
|
1478
|
-
-
|
|
1519
|
+
url: https://archive.org
|
|
1520
|
+
-
|
|
1479
1521
|
user_agent: mozilla/5.0 (compatible; heritrix/1.3.0 http://archive.crawler.org)
|
|
1480
1522
|
bot:
|
|
1481
1523
|
name: Heritrix
|
|
@@ -1483,8 +1525,8 @@
|
|
|
1483
1525
|
url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
|
|
1484
1526
|
producer:
|
|
1485
1527
|
name: The Internet Archive
|
|
1486
|
-
url:
|
|
1487
|
-
-
|
|
1528
|
+
url: https://archive.org
|
|
1529
|
+
-
|
|
1488
1530
|
user_agent: Mozilla/5.0 (compatible; heritrix/3.1.1 +http://www.baidu.com)
|
|
1489
1531
|
bot:
|
|
1490
1532
|
name: Heritrix
|
|
@@ -1492,8 +1534,8 @@
|
|
|
1492
1534
|
url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
|
|
1493
1535
|
producer:
|
|
1494
1536
|
name: The Internet Archive
|
|
1495
|
-
url:
|
|
1496
|
-
-
|
|
1537
|
+
url: https://archive.org
|
|
1538
|
+
-
|
|
1497
1539
|
user_agent: Mozilla/5.0 (compatible; heritrix/3.1.1 +http://www.run4dom.com)
|
|
1498
1540
|
bot:
|
|
1499
1541
|
name: Heritrix
|
|
@@ -1501,8 +1543,8 @@
|
|
|
1501
1543
|
url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
|
|
1502
1544
|
producer:
|
|
1503
1545
|
name: The Internet Archive
|
|
1504
|
-
url:
|
|
1505
|
-
-
|
|
1546
|
+
url: https://archive.org
|
|
1547
|
+
-
|
|
1506
1548
|
user_agent: Mozilla/5.0 (compatible; heritrix/3.1.2-SNAPSHOT-20130207.001528 +http://webarchiv.cz/kontakty/)
|
|
1507
1549
|
bot:
|
|
1508
1550
|
name: Heritrix
|
|
@@ -1510,8 +1552,8 @@
|
|
|
1510
1552
|
url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
|
|
1511
1553
|
producer:
|
|
1512
1554
|
name: The Internet Archive
|
|
1513
|
-
url:
|
|
1514
|
-
-
|
|
1555
|
+
url: https://archive.org
|
|
1556
|
+
-
|
|
1515
1557
|
user_agent: Mozilla/5.0 (compatible; worio bot heritrix/1.10.0 +http://worio.com)
|
|
1516
1558
|
bot:
|
|
1517
1559
|
name: Heritrix
|
|
@@ -1519,8 +1561,8 @@
|
|
|
1519
1561
|
url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
|
|
1520
1562
|
producer:
|
|
1521
1563
|
name: The Internet Archive
|
|
1522
|
-
url:
|
|
1523
|
-
-
|
|
1564
|
+
url: https://archive.org
|
|
1565
|
+
-
|
|
1524
1566
|
user_agent: Heurekabot-Feed/1.0 (+https://sluzby.heureka.cz/napoveda/heurekabot/)
|
|
1525
1567
|
bot:
|
|
1526
1568
|
name: Heureka Feed
|
|
@@ -1529,16 +1571,16 @@
|
|
|
1529
1571
|
producer:
|
|
1530
1572
|
name: Heureka.cz, a.s.
|
|
1531
1573
|
url: https://www.heureka.cz/
|
|
1532
|
-
-
|
|
1574
|
+
-
|
|
1533
1575
|
user_agent: HubPages V0.2.2 (http://hubpages.com/help/crawlingpolicy)
|
|
1534
1576
|
bot:
|
|
1535
1577
|
name: HubPages
|
|
1536
1578
|
category: Crawler
|
|
1537
|
-
url:
|
|
1579
|
+
url: https://hubpages.com/help/crawlingpolicy
|
|
1538
1580
|
producer:
|
|
1539
|
-
name: HubPages
|
|
1540
|
-
url:
|
|
1541
|
-
-
|
|
1581
|
+
name: HubPages, Inc.
|
|
1582
|
+
url: https://discover.hubpages.com/
|
|
1583
|
+
-
|
|
1542
1584
|
user_agent: HubSpot Website Grader (web-crawlers@hubspot.com)
|
|
1543
1585
|
bot:
|
|
1544
1586
|
name: HubSpot
|
|
@@ -1546,7 +1588,7 @@
|
|
|
1546
1588
|
producer:
|
|
1547
1589
|
name: HubSpot Inc.
|
|
1548
1590
|
url: https://www.hubspot.com
|
|
1549
|
-
-
|
|
1591
|
+
-
|
|
1550
1592
|
user_agent: ICC-Crawler/2.0 (Mozilla-compatible; ; http://www.nict.go.jp/en/univ-com/plan/crawl.html)
|
|
1551
1593
|
bot:
|
|
1552
1594
|
name: ICC-Crawler
|
|
@@ -1555,7 +1597,7 @@
|
|
|
1555
1597
|
producer:
|
|
1556
1598
|
name: ""
|
|
1557
1599
|
url: ""
|
|
1558
|
-
-
|
|
1600
|
+
-
|
|
1559
1601
|
user_agent: IDG/IT (http://spaziodati.eu/)
|
|
1560
1602
|
bot:
|
|
1561
1603
|
name: IDG/IT
|
|
@@ -1564,7 +1606,7 @@
|
|
|
1564
1606
|
producer:
|
|
1565
1607
|
name: SpazioDati S.r.l.
|
|
1566
1608
|
url: https://spaziodati.eu/
|
|
1567
|
-
-
|
|
1609
|
+
-
|
|
1568
1610
|
user_agent: iisbot/1.0 (+http://www.iis.net/iisbot.html)
|
|
1569
1611
|
bot:
|
|
1570
1612
|
name: IIS Site Analysis
|
|
@@ -1573,7 +1615,7 @@
|
|
|
1573
1615
|
producer:
|
|
1574
1616
|
name: Microsoft Corporation
|
|
1575
1617
|
url: http://www.microsoft.com
|
|
1576
|
-
-
|
|
1618
|
+
-
|
|
1577
1619
|
user_agent: IP-Guide.com Crawler/1.0 (https://ip-guide.com)
|
|
1578
1620
|
bot:
|
|
1579
1621
|
name: IP-Guide Crawler
|
|
@@ -1582,15 +1624,15 @@
|
|
|
1582
1624
|
producer:
|
|
1583
1625
|
name: ""
|
|
1584
1626
|
url: https://ip-guide.com
|
|
1585
|
-
-
|
|
1627
|
+
-
|
|
1586
1628
|
user_agent: Mozilla/5.0 (compatible; ips-agent)
|
|
1587
1629
|
bot:
|
|
1588
1630
|
name: IPS Agent
|
|
1589
|
-
category:
|
|
1631
|
+
category: Crawler
|
|
1590
1632
|
producer:
|
|
1591
1633
|
name: VeriSign, Inc
|
|
1592
1634
|
url: http://www.verisign.com/
|
|
1593
|
-
-
|
|
1635
|
+
-
|
|
1594
1636
|
user_agent: Kaspersky Lab CFR link resolver cfradmins@kaspersky.com
|
|
1595
1637
|
bot:
|
|
1596
1638
|
name: Kaspersky
|
|
@@ -1599,7 +1641,7 @@
|
|
|
1599
1641
|
producer:
|
|
1600
1642
|
name: AO Kaspersky Lab
|
|
1601
1643
|
url: https://www.kaspersky.com/
|
|
1602
|
-
-
|
|
1644
|
+
-
|
|
1603
1645
|
user_agent: kouio.com RSS reader
|
|
1604
1646
|
bot:
|
|
1605
1647
|
name: Kouio
|
|
@@ -1608,7 +1650,7 @@
|
|
|
1608
1650
|
producer:
|
|
1609
1651
|
name: ""
|
|
1610
1652
|
url: ""
|
|
1611
|
-
-
|
|
1653
|
+
-
|
|
1612
1654
|
user_agent: 'kouio.com RSS reader - 6 subscribers'
|
|
1613
1655
|
bot:
|
|
1614
1656
|
name: Kouio
|
|
@@ -1617,7 +1659,7 @@
|
|
|
1617
1659
|
producer:
|
|
1618
1660
|
name: ""
|
|
1619
1661
|
url: ""
|
|
1620
|
-
-
|
|
1662
|
+
-
|
|
1621
1663
|
user_agent: LCC (+http://corpora.informatik.uni-leipzig.de/crawler_faq.html)
|
|
1622
1664
|
bot:
|
|
1623
1665
|
name: LCC
|
|
@@ -1626,7 +1668,7 @@
|
|
|
1626
1668
|
producer:
|
|
1627
1669
|
name: Universität Leipzig
|
|
1628
1670
|
url: https://www.uni-leipzig.de/
|
|
1629
|
-
-
|
|
1671
|
+
-
|
|
1630
1672
|
user_agent: 'ltx71 - (http://ltx71.com/)'
|
|
1631
1673
|
bot:
|
|
1632
1674
|
name: LTX71
|
|
@@ -1634,7 +1676,7 @@
|
|
|
1634
1676
|
producer:
|
|
1635
1677
|
name: ""
|
|
1636
1678
|
url: ""
|
|
1637
|
-
-
|
|
1679
|
+
-
|
|
1638
1680
|
user_agent: larbin_2.6.3 larbin2.6.3@unspecified.mail
|
|
1639
1681
|
bot:
|
|
1640
1682
|
name: Larbin web crawler
|
|
@@ -1643,7 +1685,7 @@
|
|
|
1643
1685
|
producer:
|
|
1644
1686
|
name: ""
|
|
1645
1687
|
url: ""
|
|
1646
|
-
-
|
|
1688
|
+
-
|
|
1647
1689
|
user_agent: "Mozilla/5.0 (compatible; Let's Encrypt validation server; +https://www.letsencrypt.org)"
|
|
1648
1690
|
bot:
|
|
1649
1691
|
name: "Let's Encrypt Validation"
|
|
@@ -1652,7 +1694,7 @@
|
|
|
1652
1694
|
producer:
|
|
1653
1695
|
name: "Let's Encrypt"
|
|
1654
1696
|
url: https://letsencrypt.org
|
|
1655
|
-
-
|
|
1697
|
+
-
|
|
1656
1698
|
user_agent: Mozilla/5.0 (Linux; Android 6.0.1; Nexus 5 Build/MRA58N) AppleWebKit/537.36(KHTML, like Gecko) Chrome/61.0.3116.0 Mobile Safari/537.36 Chrome-Lighthouse
|
|
1657
1699
|
bot:
|
|
1658
1700
|
name: Lighthouse
|
|
@@ -1661,7 +1703,7 @@
|
|
|
1661
1703
|
producer:
|
|
1662
1704
|
name: Lighthouse
|
|
1663
1705
|
url: https://developers.google.com/web/tools/lighthouse
|
|
1664
|
-
-
|
|
1706
|
+
-
|
|
1665
1707
|
user_agent: linkdex.com/v2.0 and linkdex.com/v2.1
|
|
1666
1708
|
bot:
|
|
1667
1709
|
name: Linkdex Bot
|
|
@@ -1670,7 +1712,7 @@
|
|
|
1670
1712
|
producer:
|
|
1671
1713
|
name: Mojeek Ltd.
|
|
1672
1714
|
url: http://www.mojeek.com
|
|
1673
|
-
-
|
|
1715
|
+
-
|
|
1674
1716
|
user_agent: Mozilla/5.0 (compatible; linkdexbot/2.0; +http://www.linkdex.com/about/bots/)
|
|
1675
1717
|
bot:
|
|
1676
1718
|
name: Linkdex Bot
|
|
@@ -1679,7 +1721,7 @@
|
|
|
1679
1721
|
producer:
|
|
1680
1722
|
name: Mojeek Ltd.
|
|
1681
1723
|
url: http://www.mojeek.com
|
|
1682
|
-
-
|
|
1724
|
+
-
|
|
1683
1725
|
user_agent: Mozilla/5.0 (iPhone; U; CPU iPhone OS 4_1 like Mac OS X; en-us) AppleWebKit/532.9 (KHTML, like Gecko) Version/4.0.5 Mobile/8B117 Safari/6531.22.7 (compatible; linkdexbot-mobile/2.1; +http://www.linkdex.com/about/bots/)
|
|
1684
1726
|
bot:
|
|
1685
1727
|
name: Linkdex Bot
|
|
@@ -1688,7 +1730,7 @@
|
|
|
1688
1730
|
producer:
|
|
1689
1731
|
name: Mojeek Ltd.
|
|
1690
1732
|
url: http://www.mojeek.com
|
|
1691
|
-
-
|
|
1733
|
+
-
|
|
1692
1734
|
user_agent: LinkedInBot/1.0 (compatible; Mozilla/5.0; Jakarta Commons-HttpClient/3.1 +http://www.linkedin.com)
|
|
1693
1735
|
bot:
|
|
1694
1736
|
name: LinkedIn Bot
|
|
@@ -1697,7 +1739,7 @@
|
|
|
1697
1739
|
producer:
|
|
1698
1740
|
name: LinkedIn
|
|
1699
1741
|
url: http://www.linkedin.com
|
|
1700
|
-
-
|
|
1742
|
+
-
|
|
1701
1743
|
user_agent: Mozilla/5.0 (compatible; MJ12bot/v1.4.4; http://www.majestic12.co.uk/bot.php?+)
|
|
1702
1744
|
bot:
|
|
1703
1745
|
name: MJ12 Bot
|
|
@@ -1706,7 +1748,7 @@
|
|
|
1706
1748
|
producer:
|
|
1707
1749
|
name: Majestic-12
|
|
1708
1750
|
url: http://majestic12.co.uk
|
|
1709
|
-
-
|
|
1751
|
+
-
|
|
1710
1752
|
user_agent: magpie-crawler/1.1 (U; Linux amd64; en-GB; +http://www.brandwatch.net)
|
|
1711
1753
|
bot:
|
|
1712
1754
|
name: Magpie-Crawler
|
|
@@ -1715,7 +1757,7 @@
|
|
|
1715
1757
|
producer:
|
|
1716
1758
|
name: Brandwatch
|
|
1717
1759
|
url: http://www.brandwatch.com
|
|
1718
|
-
-
|
|
1760
|
+
-
|
|
1719
1761
|
user_agent: MagpieRSS/0.72 (+http://magpierss.sf.net)
|
|
1720
1762
|
bot:
|
|
1721
1763
|
name: MagpieRSS
|
|
@@ -1724,7 +1766,7 @@
|
|
|
1724
1766
|
producer:
|
|
1725
1767
|
name: ""
|
|
1726
1768
|
url: ""
|
|
1727
|
-
-
|
|
1769
|
+
-
|
|
1728
1770
|
user_agent: Mozilla/5.0 (compatible; Linux x86_64; Mail.RU_Bot/2.0; +http://go.mail.ru/help/robots)
|
|
1729
1771
|
bot:
|
|
1730
1772
|
name: Mail.Ru Bot
|
|
@@ -1733,7 +1775,7 @@
|
|
|
1733
1775
|
producer:
|
|
1734
1776
|
name: Mail.Ru Group
|
|
1735
1777
|
url: http://corp.mail.ru
|
|
1736
|
-
-
|
|
1778
|
+
-
|
|
1737
1779
|
user_agent: Mozilla/5.0 (compatible; Linux x86_64; Mail.RU_Bot/Fast/2.0; +http://go.mail.ru/help/robots)
|
|
1738
1780
|
bot:
|
|
1739
1781
|
name: Mail.Ru Bot
|
|
@@ -1742,17 +1784,17 @@
|
|
|
1742
1784
|
producer:
|
|
1743
1785
|
name: Mail.Ru Group
|
|
1744
1786
|
url: http://corp.mail.ru
|
|
1745
|
-
-
|
|
1787
|
+
-
|
|
1746
1788
|
user_agent: http.rb/2.2.2 (Mastodon/1.6.1; +https://mathtod.online/)
|
|
1747
1789
|
bot:
|
|
1748
1790
|
name: Mastodon Bot
|
|
1749
1791
|
category: Social Media Agent
|
|
1750
|
-
-
|
|
1792
|
+
-
|
|
1751
1793
|
user_agent: http.rb/3.2.0 (Mastodon/2.4.3; +https://uwu.social/)
|
|
1752
1794
|
bot:
|
|
1753
1795
|
name: Mastodon Bot
|
|
1754
1796
|
category: Social Media Agent
|
|
1755
|
-
-
|
|
1797
|
+
-
|
|
1756
1798
|
user_agent: Mozilla/5.0 (compatible; meanpathbot/1.0; +http://www.meanpath.com/meanpathbot.html)
|
|
1757
1799
|
bot:
|
|
1758
1800
|
name: Meanpath Bot
|
|
@@ -1761,13 +1803,13 @@
|
|
|
1761
1803
|
producer:
|
|
1762
1804
|
name: Meanpath
|
|
1763
1805
|
url: http://www.meanpath.com
|
|
1764
|
-
-
|
|
1806
|
+
-
|
|
1765
1807
|
user_agent: MetaInspector/5.4.0 (+https://github.com/jaimeiniesta/metainspector)
|
|
1766
1808
|
bot:
|
|
1767
1809
|
name: MetaInspector
|
|
1768
1810
|
category: Crawler
|
|
1769
1811
|
url: https://github.com/jaimeiniesta/metainspector
|
|
1770
|
-
-
|
|
1812
|
+
-
|
|
1771
1813
|
user_agent: Mozilla/5.0 (compatible; MetaJobBot; http://www.metajob.de/crawler)
|
|
1772
1814
|
bot:
|
|
1773
1815
|
name: MetaJobBot
|
|
@@ -1776,7 +1818,7 @@
|
|
|
1776
1818
|
producer:
|
|
1777
1819
|
name: MetaJob
|
|
1778
1820
|
url: http://www.metajob.at
|
|
1779
|
-
-
|
|
1821
|
+
-
|
|
1780
1822
|
user_agent: Mozilla/5.0 (compatible; MixrankBot; crawler@mixrank.com)
|
|
1781
1823
|
bot:
|
|
1782
1824
|
name: Mixrank Bot
|
|
@@ -1785,7 +1827,7 @@
|
|
|
1785
1827
|
producer:
|
|
1786
1828
|
name: Online Media Group, Inc.
|
|
1787
1829
|
url: ""
|
|
1788
|
-
-
|
|
1830
|
+
-
|
|
1789
1831
|
user_agent: Mnogosearch-3.1.21
|
|
1790
1832
|
bot:
|
|
1791
1833
|
name: Mnogosearch
|
|
@@ -1794,7 +1836,7 @@
|
|
|
1794
1836
|
producer:
|
|
1795
1837
|
name: Lavtech.Com Corp.
|
|
1796
1838
|
url: ""
|
|
1797
|
-
-
|
|
1839
|
+
-
|
|
1798
1840
|
user_agent: Mozilla/5.0 (compatible; MojeekBot/0.6; http://www.mojeek.com/bot.html)
|
|
1799
1841
|
bot:
|
|
1800
1842
|
name: MojeekBot
|
|
@@ -1803,7 +1845,7 @@
|
|
|
1803
1845
|
producer:
|
|
1804
1846
|
name: Mojeek Ltd.
|
|
1805
1847
|
url: http://www.mojeek.com
|
|
1806
|
-
-
|
|
1848
|
+
-
|
|
1807
1849
|
user_agent: 'Mozilla/5.0 (compatible; www.monitor.us - free monitoring service; http://www.monitor.us)'
|
|
1808
1850
|
bot:
|
|
1809
1851
|
name: Monitor.Us
|
|
@@ -1812,7 +1854,7 @@
|
|
|
1812
1854
|
producer:
|
|
1813
1855
|
name: Monitor.Us
|
|
1814
1856
|
url: http://www.monitor.us
|
|
1815
|
-
-
|
|
1857
|
+
-
|
|
1816
1858
|
user_agent: munin/2.0.30-1 (libwww-perl/6.15)
|
|
1817
1859
|
bot:
|
|
1818
1860
|
name: Munin
|
|
@@ -1821,7 +1863,7 @@
|
|
|
1821
1863
|
producer:
|
|
1822
1864
|
name: Munin
|
|
1823
1865
|
url: http://munin-monitoring.org/
|
|
1824
|
-
-
|
|
1866
|
+
-
|
|
1825
1867
|
user_agent: munin/http_loadtime
|
|
1826
1868
|
bot:
|
|
1827
1869
|
name: Munin
|
|
@@ -1830,7 +1872,7 @@
|
|
|
1830
1872
|
producer:
|
|
1831
1873
|
name: Munin
|
|
1832
1874
|
url: http://munin-monitoring.org/
|
|
1833
|
-
-
|
|
1875
|
+
-
|
|
1834
1876
|
user_agent: nlcrawler/1.0 (+http://northernlight.com/)
|
|
1835
1877
|
bot:
|
|
1836
1878
|
name: NLCrawler
|
|
@@ -1839,7 +1881,7 @@
|
|
|
1839
1881
|
producer:
|
|
1840
1882
|
name: Northern Light
|
|
1841
1883
|
url: http://northernlight.com
|
|
1842
|
-
-
|
|
1884
|
+
-
|
|
1843
1885
|
user_agent: check_http/v1.5 (nagios-plugins 1.5)
|
|
1844
1886
|
bot:
|
|
1845
1887
|
name: Nagios check_http
|
|
@@ -1848,7 +1890,7 @@
|
|
|
1848
1890
|
producer:
|
|
1849
1891
|
name: Nagios Plugins Development Team
|
|
1850
1892
|
url: https://nagios.org
|
|
1851
|
-
-
|
|
1893
|
+
-
|
|
1852
1894
|
user_agent: NalezenCzBot/1.0 (http://www.nalezen.cz/about-crawler)
|
|
1853
1895
|
bot:
|
|
1854
1896
|
name: NalezenCzBot
|
|
@@ -1857,11 +1899,11 @@
|
|
|
1857
1899
|
producer:
|
|
1858
1900
|
name: Jaroslav Kuboš
|
|
1859
1901
|
url: ""
|
|
1860
|
-
-
|
|
1902
|
+
-
|
|
1861
1903
|
user_agent: NetLyzer FastProbe
|
|
1862
1904
|
bot:
|
|
1863
1905
|
name: NetLyzer FastProbe
|
|
1864
|
-
-
|
|
1906
|
+
-
|
|
1865
1907
|
user_agent: Mozilla/4.0 (compatible; Netcraft Web Server Survey)
|
|
1866
1908
|
bot:
|
|
1867
1909
|
name: Netcraft Survey Bot
|
|
@@ -1870,7 +1912,7 @@
|
|
|
1870
1912
|
producer:
|
|
1871
1913
|
name: Netcraft
|
|
1872
1914
|
url: http://www.netcraft.com
|
|
1873
|
-
-
|
|
1915
|
+
-
|
|
1874
1916
|
user_agent: Mozilla/5.0 (compatible; NetcraftSurveyAgent/1.0; +info@netcraft.com)
|
|
1875
1917
|
bot:
|
|
1876
1918
|
name: Netcraft Survey Bot
|
|
@@ -1879,7 +1921,7 @@
|
|
|
1879
1921
|
producer:
|
|
1880
1922
|
name: Netcraft
|
|
1881
1923
|
url: http://www.netcraft.com
|
|
1882
|
-
-
|
|
1924
|
+
-
|
|
1883
1925
|
user_agent: 'Netcraft SSL Server Survey - contact info@netcraft.com'
|
|
1884
1926
|
bot:
|
|
1885
1927
|
name: Netcraft Survey Bot
|
|
@@ -1888,7 +1930,7 @@
|
|
|
1888
1930
|
producer:
|
|
1889
1931
|
name: Netcraft
|
|
1890
1932
|
url: http://www.netcraft.com
|
|
1891
|
-
-
|
|
1933
|
+
-
|
|
1892
1934
|
user_agent: Netvibes (http://www.netvibes.com)
|
|
1893
1935
|
bot:
|
|
1894
1936
|
name: Netvibes
|
|
@@ -1897,7 +1939,7 @@
|
|
|
1897
1939
|
producer:
|
|
1898
1940
|
name: ""
|
|
1899
1941
|
url: ""
|
|
1900
|
-
-
|
|
1942
|
+
-
|
|
1901
1943
|
user_agent: 'Netvibes (http://www.netvibes.com/; 8 subscribers; feedID: 2244192)'
|
|
1902
1944
|
bot:
|
|
1903
1945
|
name: Netvibes
|
|
@@ -1906,7 +1948,7 @@
|
|
|
1906
1948
|
producer:
|
|
1907
1949
|
name: ""
|
|
1908
1950
|
url: ""
|
|
1909
|
-
-
|
|
1951
|
+
-
|
|
1910
1952
|
user_agent: 'NewsBlur Favicon Fetcher - 7 subscribers - http://www.newsblur.com/site/1948420/analytics-piwik (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)'
|
|
1911
1953
|
bot:
|
|
1912
1954
|
name: NewsBlur
|
|
@@ -1915,7 +1957,7 @@
|
|
|
1915
1957
|
producer:
|
|
1916
1958
|
name: ""
|
|
1917
1959
|
url: ""
|
|
1918
|
-
-
|
|
1960
|
+
-
|
|
1919
1961
|
user_agent: 'NewsBlur Feed Fetcher - 7 subscribers - http://www.newsblur.com/site/1948420/analytics-piwik (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)'
|
|
1920
1962
|
bot:
|
|
1921
1963
|
name: NewsBlur
|
|
@@ -1924,7 +1966,7 @@
|
|
|
1924
1966
|
producer:
|
|
1925
1967
|
name: ""
|
|
1926
1968
|
url: ""
|
|
1927
|
-
-
|
|
1969
|
+
-
|
|
1928
1970
|
user_agent: NewsBlur Feed Finder (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)
|
|
1929
1971
|
bot:
|
|
1930
1972
|
name: NewsBlur
|
|
@@ -1933,7 +1975,7 @@
|
|
|
1933
1975
|
producer:
|
|
1934
1976
|
name: ""
|
|
1935
1977
|
url: ""
|
|
1936
|
-
-
|
|
1978
|
+
-
|
|
1937
1979
|
user_agent: 'NewsBlur Page Fetcher - 7 subscribers - http://www.newsblur.com/site/3966817/analytics-piwik (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)'
|
|
1938
1980
|
bot:
|
|
1939
1981
|
name: NewsBlur
|
|
@@ -1942,7 +1984,7 @@
|
|
|
1942
1984
|
producer:
|
|
1943
1985
|
name: ""
|
|
1944
1986
|
url: ""
|
|
1945
|
-
-
|
|
1987
|
+
-
|
|
1946
1988
|
user_agent: NewsGatorOnline/2.0 (http://www.newsgator.com; 2 subscribers)
|
|
1947
1989
|
bot:
|
|
1948
1990
|
name: NewsGator
|
|
@@ -1951,7 +1993,7 @@
|
|
|
1951
1993
|
producer:
|
|
1952
1994
|
name: ""
|
|
1953
1995
|
url: ""
|
|
1954
|
-
-
|
|
1996
|
+
-
|
|
1955
1997
|
user_agent: Mozilla/5.0 (compatible; Nmap Scripting Engine; https://nmap.org/book/nse.html)
|
|
1956
1998
|
bot:
|
|
1957
1999
|
name: Nmap
|
|
@@ -1960,7 +2002,7 @@
|
|
|
1960
2002
|
producer:
|
|
1961
2003
|
name: Nmap
|
|
1962
2004
|
url: https://nmap.org/
|
|
1963
|
-
-
|
|
2005
|
+
-
|
|
1964
2006
|
user_agent: 5acd734a-1ed3-4a17-ad9d-0b09ae7bc2d2/Nutch-1.7
|
|
1965
2007
|
bot:
|
|
1966
2008
|
name: Nutch-based Bot
|
|
@@ -1968,8 +2010,8 @@
|
|
|
1968
2010
|
url: https://nutch.apache.org
|
|
1969
2011
|
producer:
|
|
1970
2012
|
name: The Apache Software Foundation
|
|
1971
|
-
url:
|
|
1972
|
-
-
|
|
2013
|
+
url: https://www.apache.org/foundation/
|
|
2014
|
+
-
|
|
1973
2015
|
user_agent: CB/Nutch-1.7
|
|
1974
2016
|
bot:
|
|
1975
2017
|
name: Nutch-based Bot
|
|
@@ -1977,8 +2019,8 @@
|
|
|
1977
2019
|
url: https://nutch.apache.org
|
|
1978
2020
|
producer:
|
|
1979
2021
|
name: The Apache Software Foundation
|
|
1980
|
-
url:
|
|
1981
|
-
-
|
|
2022
|
+
url: https://www.apache.org/foundation/
|
|
2023
|
+
-
|
|
1982
2024
|
user_agent: Mozilla/5.0 (compatible; summers;)/Nutch-1.7
|
|
1983
2025
|
bot:
|
|
1984
2026
|
name: Nutch-based Bot
|
|
@@ -1986,8 +2028,8 @@
|
|
|
1986
2028
|
url: https://nutch.apache.org
|
|
1987
2029
|
producer:
|
|
1988
2030
|
name: The Apache Software Foundation
|
|
1989
|
-
url:
|
|
1990
|
-
-
|
|
2031
|
+
url: https://www.apache.org/foundation/
|
|
2032
|
+
-
|
|
1991
2033
|
user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1; zh-CN; rv:1.9.2.8) Firefox/3.6.8/Nutch-1.7
|
|
1992
2034
|
bot:
|
|
1993
2035
|
name: Nutch-based Bot
|
|
@@ -1995,8 +2037,8 @@
|
|
|
1995
2037
|
url: https://nutch.apache.org
|
|
1996
2038
|
producer:
|
|
1997
2039
|
name: The Apache Software Foundation
|
|
1998
|
-
url:
|
|
1999
|
-
-
|
|
2040
|
+
url: https://www.apache.org/foundation/
|
|
2041
|
+
-
|
|
2000
2042
|
user_agent: My Nutch Spider/Nutch-1.6
|
|
2001
2043
|
bot:
|
|
2002
2044
|
name: Nutch-based Bot
|
|
@@ -2004,8 +2046,8 @@
|
|
|
2004
2046
|
url: https://nutch.apache.org
|
|
2005
2047
|
producer:
|
|
2006
2048
|
name: The Apache Software Foundation
|
|
2007
|
-
url:
|
|
2008
|
-
-
|
|
2049
|
+
url: https://www.apache.org/foundation/
|
|
2050
|
+
-
|
|
2009
2051
|
user_agent: MySpider/Nutch-2.2
|
|
2010
2052
|
bot:
|
|
2011
2053
|
name: Nutch-based Bot
|
|
@@ -2013,8 +2055,8 @@
|
|
|
2013
2055
|
url: https://nutch.apache.org
|
|
2014
2056
|
producer:
|
|
2015
2057
|
name: The Apache Software Foundation
|
|
2016
|
-
url:
|
|
2017
|
-
-
|
|
2058
|
+
url: https://www.apache.org/foundation/
|
|
2059
|
+
-
|
|
2018
2060
|
user_agent: Nutch12/Nutch-1.2
|
|
2019
2061
|
bot:
|
|
2020
2062
|
name: Nutch-based Bot
|
|
@@ -2022,8 +2064,8 @@
|
|
|
2022
2064
|
url: https://nutch.apache.org
|
|
2023
2065
|
producer:
|
|
2024
2066
|
name: The Apache Software Foundation
|
|
2025
|
-
url:
|
|
2026
|
-
-
|
|
2067
|
+
url: https://www.apache.org/foundation/
|
|
2068
|
+
-
|
|
2027
2069
|
user_agent: NutchSpider/Nutch-1.4
|
|
2028
2070
|
bot:
|
|
2029
2071
|
name: Nutch-based Bot
|
|
@@ -2031,8 +2073,8 @@
|
|
|
2031
2073
|
url: https://nutch.apache.org
|
|
2032
2074
|
producer:
|
|
2033
2075
|
name: The Apache Software Foundation
|
|
2034
|
-
url:
|
|
2035
|
-
-
|
|
2076
|
+
url: https://www.apache.org/foundation/
|
|
2077
|
+
-
|
|
2036
2078
|
user_agent: spider/Nutch-1.5.1 (spider; http://www.xxx.com)
|
|
2037
2079
|
bot:
|
|
2038
2080
|
name: Nutch-based Bot
|
|
@@ -2040,8 +2082,8 @@
|
|
|
2040
2082
|
url: https://nutch.apache.org
|
|
2041
2083
|
producer:
|
|
2042
2084
|
name: The Apache Software Foundation
|
|
2043
|
-
url:
|
|
2044
|
-
-
|
|
2085
|
+
url: https://www.apache.org/foundation/
|
|
2086
|
+
-
|
|
2045
2087
|
user_agent: Spider/Nutch-2.3-SNAPSHOT (Webcrawler)
|
|
2046
2088
|
bot:
|
|
2047
2089
|
name: Nutch-based Bot
|
|
@@ -2049,8 +2091,8 @@
|
|
|
2049
2091
|
url: https://nutch.apache.org
|
|
2050
2092
|
producer:
|
|
2051
2093
|
name: The Apache Software Foundation
|
|
2052
|
-
url:
|
|
2053
|
-
-
|
|
2094
|
+
url: https://www.apache.org/foundation/
|
|
2095
|
+
-
|
|
2054
2096
|
user_agent: testnutch/Nutch-1.8
|
|
2055
2097
|
bot:
|
|
2056
2098
|
name: Nutch-based Bot
|
|
@@ -2058,8 +2100,8 @@
|
|
|
2058
2100
|
url: https://nutch.apache.org
|
|
2059
2101
|
producer:
|
|
2060
2102
|
name: The Apache Software Foundation
|
|
2061
|
-
url:
|
|
2062
|
-
-
|
|
2103
|
+
url: https://www.apache.org/foundation/
|
|
2104
|
+
-
|
|
2063
2105
|
user_agent: Your Nutch Spider/Nutch-2.2.1
|
|
2064
2106
|
bot:
|
|
2065
2107
|
name: Nutch-based Bot
|
|
@@ -2067,8 +2109,8 @@
|
|
|
2067
2109
|
url: https://nutch.apache.org
|
|
2068
2110
|
producer:
|
|
2069
2111
|
name: The Apache Software Foundation
|
|
2070
|
-
url:
|
|
2071
|
-
-
|
|
2112
|
+
url: https://www.apache.org/foundation/
|
|
2113
|
+
-
|
|
2072
2114
|
user_agent: your sipder name/Nutch-1.7
|
|
2073
2115
|
bot:
|
|
2074
2116
|
name: Nutch-based Bot
|
|
@@ -2076,8 +2118,8 @@
|
|
|
2076
2118
|
url: https://nutch.apache.org
|
|
2077
2119
|
producer:
|
|
2078
2120
|
name: The Apache Software Foundation
|
|
2079
|
-
url:
|
|
2080
|
-
-
|
|
2121
|
+
url: https://www.apache.org/foundation/
|
|
2122
|
+
-
|
|
2081
2123
|
user_agent: Nuzzel
|
|
2082
2124
|
bot:
|
|
2083
2125
|
name: Nuzzel
|
|
@@ -2085,11 +2127,11 @@
|
|
|
2085
2127
|
producer:
|
|
2086
2128
|
name: Nuzzel
|
|
2087
2129
|
url: https://www.nuzzel.com/
|
|
2088
|
-
-
|
|
2130
|
+
-
|
|
2089
2131
|
user_agent: Octopus 1.0.2
|
|
2090
2132
|
bot:
|
|
2091
2133
|
name: Octopus
|
|
2092
|
-
-
|
|
2134
|
+
-
|
|
2093
2135
|
user_agent: omgili/0.5 +http://omgili.com
|
|
2094
2136
|
bot:
|
|
2095
2137
|
name: Omgili bot
|
|
@@ -2098,7 +2140,7 @@
|
|
|
2098
2140
|
producer:
|
|
2099
2141
|
name: Omgili
|
|
2100
2142
|
url: http://www.omgili.com
|
|
2101
|
-
-
|
|
2143
|
+
-
|
|
2102
2144
|
user_agent: omgilibot/0.3 +http://www.omgili.com/Crawler.html
|
|
2103
2145
|
bot:
|
|
2104
2146
|
name: Omgili bot
|
|
@@ -2107,7 +2149,7 @@
|
|
|
2107
2149
|
producer:
|
|
2108
2150
|
name: Omgili
|
|
2109
2151
|
url: http://www.omgili.com
|
|
2110
|
-
-
|
|
2152
|
+
-
|
|
2111
2153
|
user_agent: Mozilla/5.0 (compatible; spbot/4.0.9; +http://OpenLinkProfiler.org/bot )
|
|
2112
2154
|
bot:
|
|
2113
2155
|
name: OpenLinkProfiler
|
|
@@ -2116,7 +2158,7 @@
|
|
|
2116
2158
|
producer:
|
|
2117
2159
|
name: Axandra GmbH
|
|
2118
2160
|
url: http://www.axandra.com
|
|
2119
|
-
-
|
|
2161
|
+
-
|
|
2120
2162
|
user_agent: OpenWebSpider v0.1.4 (http://www.openwebspider.org/)
|
|
2121
2163
|
bot:
|
|
2122
2164
|
name: OpenWebSpider
|
|
@@ -2125,7 +2167,7 @@
|
|
|
2125
2167
|
producer:
|
|
2126
2168
|
name: OpenWebSpider Lab
|
|
2127
2169
|
url: http://lab.openwebspider.org
|
|
2128
|
-
-
|
|
2170
|
+
-
|
|
2129
2171
|
user_agent: Mozilla/5.0 (compatible; OpenindexSpider; +http://www.openindex.io/en/webmasters/spider.html)
|
|
2130
2172
|
bot:
|
|
2131
2173
|
name: Openindex Spider
|
|
@@ -2134,7 +2176,7 @@
|
|
|
2134
2176
|
producer:
|
|
2135
2177
|
name: Openindex B.V.
|
|
2136
2178
|
url: http://www.openindex.io
|
|
2137
|
-
-
|
|
2179
|
+
-
|
|
2138
2180
|
user_agent: Mozilla/5.0 (compatible; OrangeBot-Collector/2.0; support.orangebot@orange.com)
|
|
2139
2181
|
bot:
|
|
2140
2182
|
name: Orange Bot
|
|
@@ -2143,7 +2185,7 @@
|
|
|
2143
2185
|
producer:
|
|
2144
2186
|
name: Orange
|
|
2145
2187
|
url: http://www.orange.fr
|
|
2146
|
-
-
|
|
2188
|
+
-
|
|
2147
2189
|
user_agent: Mozilla/5.0 (compatible; OrangeBot/2.0; support.orangebot@orange.com)
|
|
2148
2190
|
bot:
|
|
2149
2191
|
name: Orange Bot
|
|
@@ -2152,7 +2194,7 @@
|
|
|
2152
2194
|
producer:
|
|
2153
2195
|
name: Orange
|
|
2154
2196
|
url: http://www.orange.fr
|
|
2155
|
-
-
|
|
2197
|
+
-
|
|
2156
2198
|
user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1; fr; rv:1.8.1) VoilaBot BETA 1.2 (support.voilabot@orange-ftgroup.com)
|
|
2157
2199
|
bot:
|
|
2158
2200
|
name: Orange Bot
|
|
@@ -2161,7 +2203,7 @@
|
|
|
2161
2203
|
producer:
|
|
2162
2204
|
name: Orange
|
|
2163
2205
|
url: http://www.orange.fr
|
|
2164
|
-
-
|
|
2206
|
+
-
|
|
2165
2207
|
user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1;fr;rv:1.8.1) VoilaBotCollector BETA 0.1 (http://www.voila.com/)
|
|
2166
2208
|
bot:
|
|
2167
2209
|
name: Orange Bot
|
|
@@ -2170,7 +2212,7 @@
|
|
|
2170
2212
|
producer:
|
|
2171
2213
|
name: Orange
|
|
2172
2214
|
url: http://www.orange.fr
|
|
2173
|
-
-
|
|
2215
|
+
-
|
|
2174
2216
|
user_agent: Mozilla/5.0 (Java) outbrain
|
|
2175
2217
|
bot:
|
|
2176
2218
|
name: Outbrain
|
|
@@ -2179,7 +2221,7 @@
|
|
|
2179
2221
|
producer:
|
|
2180
2222
|
name: Outbrain
|
|
2181
2223
|
url: http://www.outbrain.com/
|
|
2182
|
-
-
|
|
2224
|
+
-
|
|
2183
2225
|
user_agent: Mozilla/5.0 (compatible; phpservermon/3.1.1; +http://www.phpservermonitor.org)
|
|
2184
2226
|
bot:
|
|
2185
2227
|
name: PHP Server Monitor
|
|
@@ -2188,7 +2230,16 @@
|
|
|
2188
2230
|
producer:
|
|
2189
2231
|
name: PHP Server Monitor
|
|
2190
2232
|
url: http://www.phpservermonitor.org/
|
|
2191
|
-
-
|
|
2233
|
+
-
|
|
2234
|
+
user_agent: Mozilla/5.0 (compatible; PRTG Network Monitor (www.paessler.com); Windows)
|
|
2235
|
+
bot:
|
|
2236
|
+
name: PRTG Network Monitor
|
|
2237
|
+
category: Network Monitor
|
|
2238
|
+
url: https://www.paessler.com/prtg
|
|
2239
|
+
producer:
|
|
2240
|
+
name: Paessler AG
|
|
2241
|
+
url: https://www.paessler.com
|
|
2242
|
+
-
|
|
2192
2243
|
user_agent: Mozilla/5.0 (compatible; PaperLiBot/2.1; http://support.paper.li/entries/20023257-what-is-paper-li)
|
|
2193
2244
|
bot:
|
|
2194
2245
|
name: PaperLiBot
|
|
@@ -2197,13 +2248,19 @@
|
|
|
2197
2248
|
producer:
|
|
2198
2249
|
name: Smallrivers SA
|
|
2199
2250
|
url: http://www.paper.li
|
|
2200
|
-
-
|
|
2251
|
+
-
|
|
2252
|
+
user_agent: Mozilla/5.0 (Linux; Android 7.0;) AppleWebKit/537.36 (KHTML, like Gecko) Mobile Safari/537.36 (compatible; PetalBot;+https://aspiegel.com/petalbot)
|
|
2253
|
+
bot:
|
|
2254
|
+
name: Petal Bot
|
|
2255
|
+
category: Crawler
|
|
2256
|
+
url: https://aspiegel.com/petalbot
|
|
2257
|
+
-
|
|
2201
2258
|
user_agent: phantomas/1.11.0 (PhantomJS/1.9.8; linux x64)
|
|
2202
2259
|
bot:
|
|
2203
2260
|
name: Phantomas
|
|
2204
2261
|
category: Site Monitor
|
|
2205
2262
|
url: https://github.com/macbre/phantomas
|
|
2206
|
-
-
|
|
2263
|
+
-
|
|
2207
2264
|
user_agent: psbot-page (+http://www.picsearch.com/bot.html)
|
|
2208
2265
|
bot:
|
|
2209
2266
|
name: Picsearch bot
|
|
@@ -2212,7 +2269,7 @@
|
|
|
2212
2269
|
producer:
|
|
2213
2270
|
name: Picsearch
|
|
2214
2271
|
url: http://www.picsearch.com
|
|
2215
|
-
-
|
|
2272
|
+
-
|
|
2216
2273
|
user_agent: psbot/0.1 (+http://www.picsearch.com/bot.html)
|
|
2217
2274
|
bot:
|
|
2218
2275
|
name: Picsearch bot
|
|
@@ -2221,7 +2278,7 @@
|
|
|
2221
2278
|
producer:
|
|
2222
2279
|
name: Picsearch
|
|
2223
2280
|
url: http://www.picsearch.com
|
|
2224
|
-
-
|
|
2281
|
+
-
|
|
2225
2282
|
user_agent: Pingdom.com_bot_version_1.4_(http://www.pingdom.com/)
|
|
2226
2283
|
bot:
|
|
2227
2284
|
name: Pingdom Bot
|
|
@@ -2230,25 +2287,34 @@
|
|
|
2230
2287
|
producer:
|
|
2231
2288
|
name: Pingdom AB
|
|
2232
2289
|
url: https://www.pingdom.com
|
|
2233
|
-
-
|
|
2290
|
+
-
|
|
2234
2291
|
user_agent: Mozilla/5.0 (compatible; Pinterestbot/1.0; http://www.pinterest.com/bot.html)
|
|
2235
2292
|
bot:
|
|
2236
2293
|
name: Pinterest
|
|
2237
|
-
url:
|
|
2294
|
+
url: https://help.pinterest.com/en/business/article/pinterest-crawler
|
|
2238
2295
|
category: Crawler
|
|
2239
2296
|
producer:
|
|
2240
2297
|
name: Pinterest
|
|
2241
|
-
url:
|
|
2242
|
-
-
|
|
2298
|
+
url: https://www.pinterest.com/
|
|
2299
|
+
-
|
|
2243
2300
|
user_agent: Pinterest/0.2 (+http://www.pinterest.com/)
|
|
2244
2301
|
bot:
|
|
2245
2302
|
name: Pinterest
|
|
2246
|
-
url:
|
|
2303
|
+
url: https://help.pinterest.com/en/business/article/pinterest-crawler
|
|
2304
|
+
category: Crawler
|
|
2305
|
+
producer:
|
|
2306
|
+
name: Pinterest
|
|
2307
|
+
url: https://www.pinterest.com/
|
|
2308
|
+
-
|
|
2309
|
+
user_agent: Mozilla/5.0 (Linux; Android 6.0.1; Nexus 5X Build/MMB29P) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/41.0.2272.96 Mobile Safari/537.36 (compatible; Pinterestbot/1.0; https://www.pinterest.com/bot.html)
|
|
2310
|
+
bot:
|
|
2311
|
+
name: Pinterest
|
|
2312
|
+
url: https://help.pinterest.com/en/business/article/pinterest-crawler
|
|
2247
2313
|
category: Crawler
|
|
2248
2314
|
producer:
|
|
2249
2315
|
name: Pinterest
|
|
2250
|
-
url:
|
|
2251
|
-
-
|
|
2316
|
+
url: https://www.pinterest.com/
|
|
2317
|
+
-
|
|
2252
2318
|
user_agent: PocketParser/2.0 (+https://getpocket.com/pocketparser_ua)
|
|
2253
2319
|
bot:
|
|
2254
2320
|
name: PocketParser
|
|
@@ -2257,7 +2323,7 @@
|
|
|
2257
2323
|
producer:
|
|
2258
2324
|
name: Pocket
|
|
2259
2325
|
url: https://getpocket.com/
|
|
2260
|
-
-
|
|
2326
|
+
-
|
|
2261
2327
|
user_agent: PritTorrent/1.0
|
|
2262
2328
|
bot:
|
|
2263
2329
|
name: PritTorrent
|
|
@@ -2266,7 +2332,7 @@
|
|
|
2266
2332
|
producer:
|
|
2267
2333
|
name: Bitlove
|
|
2268
2334
|
url: http://bitlove.org/
|
|
2269
|
-
-
|
|
2335
|
+
-
|
|
2270
2336
|
user_agent: QuerySeekerSpider ( http://queryseeker.com/bot.html )
|
|
2271
2337
|
bot:
|
|
2272
2338
|
name: QuerySeekerSpider
|
|
@@ -2275,7 +2341,7 @@
|
|
|
2275
2341
|
producer:
|
|
2276
2342
|
name: QueryEye Inc.
|
|
2277
2343
|
url: http://queryeye.com
|
|
2278
|
-
-
|
|
2344
|
+
-
|
|
2279
2345
|
user_agent: Quora Link Preview/1.0 (http://www.quora.com)
|
|
2280
2346
|
bot:
|
|
2281
2347
|
name: Quora Link Preview
|
|
@@ -2284,7 +2350,7 @@
|
|
|
2284
2350
|
producer:
|
|
2285
2351
|
name: Quora
|
|
2286
2352
|
url: http://www.quora.com
|
|
2287
|
-
-
|
|
2353
|
+
-
|
|
2288
2354
|
user_agent: 'Mozilla/5.0 (compatible; Qwantify/2.2w; +https://www.qwant.com/)/*'
|
|
2289
2355
|
bot:
|
|
2290
2356
|
name: Qwantify
|
|
@@ -2293,7 +2359,7 @@
|
|
|
2293
2359
|
producer:
|
|
2294
2360
|
name: Qwant Corporation
|
|
2295
2361
|
url: https://www.qwant.com/
|
|
2296
|
-
-
|
|
2362
|
+
-
|
|
2297
2363
|
user_agent: ROI Hunter; https://api-dev.roihunter.com
|
|
2298
2364
|
bot:
|
|
2299
2365
|
name: ROI Hunter
|
|
@@ -2302,17 +2368,17 @@
|
|
|
2302
2368
|
producer:
|
|
2303
2369
|
name: Roihunter a.s.
|
|
2304
2370
|
url: http://roihunter.com/
|
|
2305
|
-
-
|
|
2371
|
+
-
|
|
2306
2372
|
user_agent: RSSRadio (Push Notification Scanner;support@dorada.co.uk)
|
|
2307
2373
|
bot:
|
|
2308
2374
|
name: RSSRadio Bot
|
|
2309
|
-
-
|
|
2375
|
+
-
|
|
2310
2376
|
user_agent: Rainmeter WebParser plugin
|
|
2311
2377
|
bot:
|
|
2312
2378
|
name: Rainmeter
|
|
2313
2379
|
category: Crawler
|
|
2314
2380
|
url: https://www.rainmeter.net
|
|
2315
|
-
-
|
|
2381
|
+
-
|
|
2316
2382
|
user_agent: RamblerMail/6.0 (incompatible; ImageProxy/6.0)
|
|
2317
2383
|
bot:
|
|
2318
2384
|
name: RamblerMail Image Proxy
|
|
@@ -2321,7 +2387,7 @@
|
|
|
2321
2387
|
producer:
|
|
2322
2388
|
name: 'Rambler&Co'
|
|
2323
2389
|
url: https://rambler-co.ru/
|
|
2324
|
-
-
|
|
2390
|
+
-
|
|
2325
2391
|
user_agent: Mozilla/5.0 (compatible; redditbot/1.0; +http://www.reddit.com/feedback)
|
|
2326
2392
|
bot:
|
|
2327
2393
|
name: Reddit Bot
|
|
@@ -2330,7 +2396,12 @@
|
|
|
2330
2396
|
producer:
|
|
2331
2397
|
name: reddit inc.
|
|
2332
2398
|
url: http://www.reddit.com
|
|
2333
|
-
-
|
|
2399
|
+
-
|
|
2400
|
+
user_agent: Robozilla/1.0
|
|
2401
|
+
bot:
|
|
2402
|
+
name: Robozilla
|
|
2403
|
+
category: Crawler
|
|
2404
|
+
-
|
|
2334
2405
|
user_agent: Mozilla/5.0 (compatible; rogerBot/1.0; UrlCrawler; http://www.seomoz.org/dp/rogerbot)
|
|
2335
2406
|
bot:
|
|
2336
2407
|
name: Rogerbot
|
|
@@ -2339,7 +2410,7 @@
|
|
|
2339
2410
|
producer:
|
|
2340
2411
|
name: SEOmoz, Inc.
|
|
2341
2412
|
url: http://moz.com/
|
|
2342
|
-
-
|
|
2413
|
+
-
|
|
2343
2414
|
user_agent: rogerbot/1.0 (http://moz.com/help/pro/what-is-rogerbot-, rogerbot-crawler+shiny@moz.com)
|
|
2344
2415
|
bot:
|
|
2345
2416
|
name: Rogerbot
|
|
@@ -2348,7 +2419,7 @@
|
|
|
2348
2419
|
producer:
|
|
2349
2420
|
name: SEOmoz, Inc.
|
|
2350
2421
|
url: http://moz.com/
|
|
2351
|
-
-
|
|
2422
|
+
-
|
|
2352
2423
|
user_agent: rogerbot/1.0 (http://www.moz.com/dp/rogerbot, rogerbot-crawler@moz.com)
|
|
2353
2424
|
bot:
|
|
2354
2425
|
name: Rogerbot
|
|
@@ -2357,7 +2428,7 @@
|
|
|
2357
2428
|
producer:
|
|
2358
2429
|
name: SEOmoz, Inc.
|
|
2359
2430
|
url: http://moz.com/
|
|
2360
|
-
-
|
|
2431
|
+
-
|
|
2361
2432
|
user_agent: SEOENGWorldBot/1.0 (+http://www.seoengine.com/seoengbot.htm)
|
|
2362
2433
|
bot:
|
|
2363
2434
|
name: SEOENGBot
|
|
@@ -2366,7 +2437,7 @@
|
|
|
2366
2437
|
producer:
|
|
2367
2438
|
name: SEO Engine
|
|
2368
2439
|
url: http://www.seoengine.com
|
|
2369
|
-
-
|
|
2440
|
+
-
|
|
2370
2441
|
user_agent: Mozilla/5.0 (compatible; SEOkicks-Robot; +http://www.seokicks.de/robot.html)
|
|
2371
2442
|
bot:
|
|
2372
2443
|
name: SEOkicks-Robot
|
|
@@ -2375,7 +2446,7 @@
|
|
|
2375
2446
|
producer:
|
|
2376
2447
|
name: SEOkicks
|
|
2377
2448
|
url: https://www.seokicks.de/
|
|
2378
|
-
-
|
|
2449
|
+
-
|
|
2379
2450
|
user_agent: Mozilla/5.0 (compatible; SISTRIX Crawler; http://crawler.sistrix.net/)
|
|
2380
2451
|
bot:
|
|
2381
2452
|
name: SISTRIX Crawler
|
|
@@ -2402,7 +2473,7 @@
|
|
|
2402
2473
|
producer:
|
|
2403
2474
|
name: SISTRIX GmbH
|
|
2404
2475
|
url: http://www.sistrix.de
|
|
2405
|
-
-
|
|
2476
|
+
-
|
|
2406
2477
|
user_agent: Mozilla/5.0 (compatible; SISTRIX Optimizer; Uptime; +https://www.sistrix.com/faq/uptime)
|
|
2407
2478
|
bot:
|
|
2408
2479
|
name: SISTRIX Optimizer
|
|
@@ -2411,7 +2482,7 @@
|
|
|
2411
2482
|
producer:
|
|
2412
2483
|
name: SISTRIX GmbH
|
|
2413
2484
|
url: http://www.sistrix.de
|
|
2414
|
-
-
|
|
2485
|
+
-
|
|
2415
2486
|
user_agent: Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/68.0.3440.75 Safari/537.36 (compatible; SMTBot/1.0; +http://www.similartech.com/smtbot)
|
|
2416
2487
|
bot:
|
|
2417
2488
|
name: SMTBot
|
|
@@ -2420,7 +2491,7 @@
|
|
|
2420
2491
|
producer:
|
|
2421
2492
|
name: SimilarTech Ltd.
|
|
2422
2493
|
url: https://www.similartech.com/
|
|
2423
|
-
-
|
|
2494
|
+
-
|
|
2424
2495
|
user_agent: SSL Labs (https://www.ssllabs.com/about/assessment.html)
|
|
2425
2496
|
bot:
|
|
2426
2497
|
name: SSL Labs
|
|
@@ -2429,7 +2500,7 @@
|
|
|
2429
2500
|
producer:
|
|
2430
2501
|
name: SSL Labs
|
|
2431
2502
|
url: https://www.ssllabs.com/about/assessment.html
|
|
2432
|
-
-
|
|
2503
|
+
-
|
|
2433
2504
|
user_agent: SafeDNSBot (https://www.safedns.com/searchbot)
|
|
2434
2505
|
bot:
|
|
2435
2506
|
name: SafeDNSBot
|
|
@@ -2438,13 +2509,13 @@
|
|
|
2438
2509
|
producer:
|
|
2439
2510
|
name: SafeDNS, Inc.
|
|
2440
2511
|
url: https://www.safedns.com/
|
|
2441
|
-
-
|
|
2512
|
+
-
|
|
2442
2513
|
user_agent: Scrapy/1.0.3.post6+g2d688cd (+http://scrapy.org)
|
|
2443
2514
|
bot:
|
|
2444
2515
|
name: Scrapy
|
|
2445
2516
|
category: Crawler
|
|
2446
2517
|
url: http://scrapy.org
|
|
2447
|
-
-
|
|
2518
|
+
-
|
|
2448
2519
|
user_agent: Screaming Frog SEO Spider/2.22
|
|
2449
2520
|
bot:
|
|
2450
2521
|
name: Screaming Frog SEO Spider
|
|
@@ -2453,7 +2524,7 @@
|
|
|
2453
2524
|
producer:
|
|
2454
2525
|
name: Screaming Frog Ltd
|
|
2455
2526
|
url: http://www.screamingfrog.co.uk
|
|
2456
|
-
-
|
|
2527
|
+
-
|
|
2457
2528
|
user_agent: ScreenerBot Crawler Beta 2.0 (+http://www.ScreenerBot.com)
|
|
2458
2529
|
bot:
|
|
2459
2530
|
name: ScreenerBot
|
|
@@ -2462,7 +2533,13 @@
|
|
|
2462
2533
|
producer:
|
|
2463
2534
|
name: ""
|
|
2464
2535
|
url: ""
|
|
2465
|
-
-
|
|
2536
|
+
-
|
|
2537
|
+
user_agent: Mozilla/5.0 (compatible) SemanticScholarBot (+https://www.semanticscholar.org/crawler)
|
|
2538
|
+
bot:
|
|
2539
|
+
name: Semantic Scholar Bot
|
|
2540
|
+
category: Crawler
|
|
2541
|
+
url: https://www.semanticscholar.org/crawler
|
|
2542
|
+
-
|
|
2466
2543
|
user_agent: Mozilla/5.0 (compatible; SemrushBot/0.97; +http://www.semrush.com/bot.html)
|
|
2467
2544
|
bot:
|
|
2468
2545
|
name: Semrush Bot
|
|
@@ -2471,7 +2548,7 @@
|
|
|
2471
2548
|
producer:
|
|
2472
2549
|
name: SEMrush
|
|
2473
2550
|
url: http://www.semrush.com
|
|
2474
|
-
-
|
|
2551
|
+
-
|
|
2475
2552
|
user_agent: SensikaBot/x.33 (+http://sensika.com)
|
|
2476
2553
|
bot:
|
|
2477
2554
|
name: Sensika Bot
|
|
@@ -2480,24 +2557,36 @@
|
|
|
2480
2557
|
producer:
|
|
2481
2558
|
name: Sensika
|
|
2482
2559
|
url: http://sensika.com
|
|
2483
|
-
-
|
|
2560
|
+
-
|
|
2484
2561
|
user_agent: sentry/8.6.0 (https://getsentry.com)
|
|
2485
2562
|
bot:
|
|
2486
2563
|
name: Sentry Bot
|
|
2487
2564
|
producer:
|
|
2488
2565
|
name: Sentry
|
|
2489
2566
|
url: https://sentry.io
|
|
2490
|
-
-
|
|
2567
|
+
-
|
|
2568
|
+
user_agent: Seobility
|
|
2569
|
+
bot:
|
|
2570
|
+
name: Seobility
|
|
2571
|
+
category: Crawler
|
|
2572
|
+
url: 'https://www.seobility.net/en/faq/?category=crawling#!aboutourbot'
|
|
2573
|
+
-
|
|
2491
2574
|
user_agent: Mozilla/5.0 (compatible; seoscanners.net/1; +spider@seoscanners.net)
|
|
2492
2575
|
bot:
|
|
2493
2576
|
name: Seoscanners.net
|
|
2494
2577
|
category: Crawler
|
|
2495
2578
|
url: ""
|
|
2496
|
-
-
|
|
2579
|
+
-
|
|
2580
|
+
user_agent: SerendeputyBot/0.8.6 (http://serendeputy.com/about/serendeputy-bot)
|
|
2581
|
+
bot:
|
|
2582
|
+
name: Serendeputy Bot
|
|
2583
|
+
category: Crawler
|
|
2584
|
+
url: https://serendeputy.com/about/serendeputy-bot
|
|
2585
|
+
-
|
|
2497
2586
|
user_agent: Server Density Service Monitoring v2
|
|
2498
2587
|
bot:
|
|
2499
2588
|
name: Server Density
|
|
2500
|
-
-
|
|
2589
|
+
-
|
|
2501
2590
|
user_agent: Mozilla/5.0 (compatible; SeznamBot/3.1-test1; +http://fulltext.sblog.cz/)
|
|
2502
2591
|
bot:
|
|
2503
2592
|
name: Seznam Bot
|
|
@@ -2506,7 +2595,7 @@
|
|
|
2506
2595
|
producer:
|
|
2507
2596
|
name: Seznam.cz, a.s.
|
|
2508
2597
|
url: http://www.seznam.cz/
|
|
2509
|
-
-
|
|
2598
|
+
-
|
|
2510
2599
|
user_agent: Mozilla/5.0 (compatible; SeznamBot/3.2-test1; +http://fulltext.sblog.cz/)
|
|
2511
2600
|
bot:
|
|
2512
2601
|
name: Seznam Bot
|
|
@@ -2515,7 +2604,7 @@
|
|
|
2515
2604
|
producer:
|
|
2516
2605
|
name: Seznam.cz, a.s.
|
|
2517
2606
|
url: http://www.seznam.cz/
|
|
2518
|
-
-
|
|
2607
|
+
-
|
|
2519
2608
|
user_agent: Mozilla/5.0 (compatible; SeznamBot/3.2; +http://fulltext.sblog.cz/)
|
|
2520
2609
|
bot:
|
|
2521
2610
|
name: Seznam Bot
|
|
@@ -2524,7 +2613,7 @@
|
|
|
2524
2613
|
producer:
|
|
2525
2614
|
name: Seznam.cz, a.s.
|
|
2526
2615
|
url: http://www.seznam.cz/
|
|
2527
|
-
-
|
|
2616
|
+
-
|
|
2528
2617
|
user_agent: SeznamBot/3.0 (+http://fulltext.sblog.cz/)
|
|
2529
2618
|
bot:
|
|
2530
2619
|
name: Seznam Bot
|
|
@@ -2533,7 +2622,7 @@
|
|
|
2533
2622
|
producer:
|
|
2534
2623
|
name: Seznam.cz, a.s.
|
|
2535
2624
|
url: http://www.seznam.cz/
|
|
2536
|
-
-
|
|
2625
|
+
-
|
|
2537
2626
|
user_agent: Mozilla/5.0 SeznamEmailProxy/2.0.174
|
|
2538
2627
|
bot:
|
|
2539
2628
|
name: Seznam Email Proxy
|
|
@@ -2542,7 +2631,7 @@
|
|
|
2542
2631
|
producer:
|
|
2543
2632
|
name: Seznam.cz, a.s.
|
|
2544
2633
|
url: http://www.seznam.cz/
|
|
2545
|
-
-
|
|
2634
|
+
-
|
|
2546
2635
|
user_agent: Seznam-Zbozi-robot/3.0
|
|
2547
2636
|
bot:
|
|
2548
2637
|
name: Seznam Zbozi.cz
|
|
@@ -2551,7 +2640,7 @@
|
|
|
2551
2640
|
producer:
|
|
2552
2641
|
name: Seznam.cz, a.s.
|
|
2553
2642
|
url: https://www.zbozi.cz/
|
|
2554
|
-
-
|
|
2643
|
+
-
|
|
2555
2644
|
user_agent: Mozilla/5.0 (ShopAlike; LadenZeile) FeedBot
|
|
2556
2645
|
bot:
|
|
2557
2646
|
name: ShopAlike
|
|
@@ -2560,7 +2649,7 @@
|
|
|
2560
2649
|
producer:
|
|
2561
2650
|
name: Visual Meta
|
|
2562
2651
|
url: https://www.shopalike.cz/
|
|
2563
|
-
-
|
|
2652
|
+
-
|
|
2564
2653
|
user_agent: ShopWiki/1.0 ( +http://www.shopwiki.com/wiki/Help:Bot)
|
|
2565
2654
|
bot:
|
|
2566
2655
|
name: ShopWiki
|
|
@@ -2569,7 +2658,7 @@
|
|
|
2569
2658
|
producer:
|
|
2570
2659
|
name: ShopWiki Corp.
|
|
2571
2660
|
url: http://www.shopwiki.com
|
|
2572
|
-
-
|
|
2661
|
+
-
|
|
2573
2662
|
user_agent: shopify-partner-homepage-scraper
|
|
2574
2663
|
bot:
|
|
2575
2664
|
name: Shopify Partner
|
|
@@ -2578,7 +2667,7 @@
|
|
|
2578
2667
|
producer:
|
|
2579
2668
|
name: Shopify
|
|
2580
2669
|
url: https://www.shopify.com/
|
|
2581
|
-
-
|
|
2670
|
+
-
|
|
2582
2671
|
user_agent: SilverReader/1.0; http://silverreader.com
|
|
2583
2672
|
bot:
|
|
2584
2673
|
name: SilverReader
|
|
@@ -2587,7 +2676,7 @@
|
|
|
2587
2676
|
producer:
|
|
2588
2677
|
name: ""
|
|
2589
2678
|
url: ""
|
|
2590
|
-
-
|
|
2679
|
+
-
|
|
2591
2680
|
user_agent: SimplePie/1.2.1-dev (Feed Parser; http://simplepie.org; Allow like Gecko) Build/20130514092120
|
|
2592
2681
|
bot:
|
|
2593
2682
|
name: SimplePie
|
|
@@ -2596,7 +2685,7 @@
|
|
|
2596
2685
|
producer:
|
|
2597
2686
|
name: ""
|
|
2598
2687
|
url: ""
|
|
2599
|
-
-
|
|
2688
|
+
-
|
|
2600
2689
|
user_agent: SimplePie/1.3.1 (Feed Parser; http://simplepie.org; Allow like Gecko) Build/20121030175911
|
|
2601
2690
|
bot:
|
|
2602
2691
|
name: SimplePie
|
|
@@ -2605,7 +2694,7 @@
|
|
|
2605
2694
|
producer:
|
|
2606
2695
|
name: ""
|
|
2607
2696
|
url: ""
|
|
2608
|
-
-
|
|
2697
|
+
-
|
|
2609
2698
|
user_agent: Site24x7
|
|
2610
2699
|
bot:
|
|
2611
2700
|
name: Site24x7 Website Monitoring
|
|
@@ -2614,13 +2703,13 @@
|
|
|
2614
2703
|
producer:
|
|
2615
2704
|
name: Site24x7
|
|
2616
2705
|
url: https://www.site24x7.com
|
|
2617
|
-
-
|
|
2706
|
+
-
|
|
2618
2707
|
user_agent: SiteSucker for macOS/2.10.5
|
|
2619
2708
|
bot:
|
|
2620
2709
|
name: SiteSucker
|
|
2621
2710
|
category: Crawler
|
|
2622
2711
|
url: http://ricks-apps.com/osx/sitesucker/
|
|
2623
|
-
-
|
|
2712
|
+
-
|
|
2624
2713
|
user_agent: Mozilla/4.0 (compatible; MSIE 7.0; Windows NT 5.0) Match by Siteimprove.com
|
|
2625
2714
|
bot:
|
|
2626
2715
|
name: Siteimprove
|
|
@@ -2629,7 +2718,7 @@
|
|
|
2629
2718
|
producer:
|
|
2630
2719
|
name: Siteimprove GmbH
|
|
2631
2720
|
url: https://siteimprove.com/
|
|
2632
|
-
-
|
|
2721
|
+
-
|
|
2633
2722
|
user_agent: Mozilla/5.0 (compatible; MSIE 10.0; Windows NT 6.1; Trident/6.0) LinkCheck by Siteimprove.com
|
|
2634
2723
|
bot:
|
|
2635
2724
|
name: Siteimprove
|
|
@@ -2638,7 +2727,7 @@
|
|
|
2638
2727
|
producer:
|
|
2639
2728
|
name: Siteimprove GmbH
|
|
2640
2729
|
url: https://siteimprove.com/
|
|
2641
|
-
-
|
|
2730
|
+
-
|
|
2642
2731
|
user_agent: sixy.ch/1.0
|
|
2643
2732
|
bot:
|
|
2644
2733
|
name: Sixy.ch
|
|
@@ -2647,7 +2736,7 @@
|
|
|
2647
2736
|
producer:
|
|
2648
2737
|
name: Manuel Kasper
|
|
2649
2738
|
url: https://neon1.net/
|
|
2650
|
-
-
|
|
2739
|
+
-
|
|
2651
2740
|
user_agent: Mozilla/5.0 (Windows NT 6.1; WOW64) SkypeUriPreview Preview/0.5
|
|
2652
2741
|
bot:
|
|
2653
2742
|
name: Skype URI Preview
|
|
@@ -2656,7 +2745,7 @@
|
|
|
2656
2745
|
producer:
|
|
2657
2746
|
name: Skype Communications S.à.r.l.
|
|
2658
2747
|
url: https://www.skype.com
|
|
2659
|
-
-
|
|
2748
|
+
-
|
|
2660
2749
|
user_agent: Slackbot-LinkExpanding 1.0 (+https://api.slack.com/robots)
|
|
2661
2750
|
bot:
|
|
2662
2751
|
name: Slackbot
|
|
@@ -2665,7 +2754,7 @@
|
|
|
2665
2754
|
producer:
|
|
2666
2755
|
name: Slack Technologies
|
|
2667
2756
|
url: http://slack.com
|
|
2668
|
-
-
|
|
2757
|
+
-
|
|
2669
2758
|
user_agent: 'AppEngine-Google; (+http://code.google.com/appengine; appid: s~snapchat-proxy)'
|
|
2670
2759
|
bot:
|
|
2671
2760
|
name: Snapchat Proxy
|
|
@@ -2674,7 +2763,7 @@
|
|
|
2674
2763
|
producer:
|
|
2675
2764
|
name: Snapchat Inc.
|
|
2676
2765
|
url: https://www.snapchat.com
|
|
2677
|
-
-
|
|
2766
|
+
-
|
|
2678
2767
|
user_agent: New-Sogou-Spider/1.0 (compatible; MSIE 5.5; Windows 98)
|
|
2679
2768
|
bot:
|
|
2680
2769
|
name: Sogou Spider
|
|
@@ -2683,7 +2772,7 @@
|
|
|
2683
2772
|
producer:
|
|
2684
2773
|
name: Sohu, Inc.
|
|
2685
2774
|
url: http://www.sogou.com
|
|
2686
|
-
-
|
|
2775
|
+
-
|
|
2687
2776
|
user_agent: Sogou inst spider/4.0(+http://www.sogou.com/docs/help/webmasters.htm
|
|
2688
2777
|
bot:
|
|
2689
2778
|
name: Sogou Spider
|
|
@@ -2692,7 +2781,7 @@
|
|
|
2692
2781
|
producer:
|
|
2693
2782
|
name: Sohu, Inc.
|
|
2694
2783
|
url: http://www.sogou.com
|
|
2695
|
-
-
|
|
2784
|
+
-
|
|
2696
2785
|
user_agent: Sogou Pic Spider/3.0(+http://www.sogou.com/docs/help/webmasters.htm
|
|
2697
2786
|
bot:
|
|
2698
2787
|
name: Sogou Spider
|
|
@@ -2701,7 +2790,7 @@
|
|
|
2701
2790
|
producer:
|
|
2702
2791
|
name: Sohu, Inc.
|
|
2703
2792
|
url: http://www.sogou.com
|
|
2704
|
-
-
|
|
2793
|
+
-
|
|
2705
2794
|
user_agent: Sogou web spider/4.0(+http://www.sogou.com/docs/help/webmasters.htm
|
|
2706
2795
|
bot:
|
|
2707
2796
|
name: Sogou Spider
|
|
@@ -2710,7 +2799,7 @@
|
|
|
2710
2799
|
producer:
|
|
2711
2800
|
name: Sohu, Inc.
|
|
2712
2801
|
url: http://www.sogou.com
|
|
2713
|
-
-
|
|
2802
|
+
-
|
|
2714
2803
|
user_agent: Sosospider+(+http://help.soso.com/webspider.htm)
|
|
2715
2804
|
bot:
|
|
2716
2805
|
name: Soso Spider
|
|
@@ -2719,13 +2808,13 @@
|
|
|
2719
2808
|
producer:
|
|
2720
2809
|
name: Tencent Holdings
|
|
2721
2810
|
url: http://www.soso.com
|
|
2722
|
-
-
|
|
2811
|
+
-
|
|
2723
2812
|
user_agent: Mozilla/5.0 (Macintosh; Intel Mac OS X 10_11_6) AppleWebKit/537.36 (KHTML, like Gecko) Sparkler/0.2.0-SNAPSHOT
|
|
2724
2813
|
bot:
|
|
2725
2814
|
name: Sparkler
|
|
2726
2815
|
category: Crawler
|
|
2727
2816
|
url: https://github.com/USCDataScience/sparkler
|
|
2728
|
-
-
|
|
2817
|
+
-
|
|
2729
2818
|
user_agent: Mozilla/5.0 (X11; U; Linux x86_64; en-US; rv:1.9.0.19; aggregator:Spinn3r (Spinn3r 3.1); http://spinn3r.com/robot) Gecko/2010040121 Firefox/3.0.19
|
|
2730
2819
|
bot:
|
|
2731
2820
|
name: Spinn3r
|
|
@@ -2734,32 +2823,26 @@
|
|
|
2734
2823
|
producer:
|
|
2735
2824
|
name: Tailrank Inc
|
|
2736
2825
|
url: http://spinn3r.com
|
|
2737
|
-
-
|
|
2826
|
+
-
|
|
2738
2827
|
user_agent: Spotify/1.0
|
|
2739
2828
|
bot:
|
|
2740
2829
|
name: Spotify
|
|
2741
2830
|
producer:
|
|
2742
2831
|
name: Spotify
|
|
2743
2832
|
url: https://www.spotify.com
|
|
2744
|
-
-
|
|
2833
|
+
-
|
|
2745
2834
|
user_agent: Mozilla/5.0 (compatible; SputnikBot/2.2)
|
|
2746
2835
|
bot:
|
|
2747
2836
|
name: Sputnik Bot
|
|
2748
|
-
category: ""
|
|
2837
|
+
category: "Crawler"
|
|
2749
2838
|
url: ""
|
|
2750
|
-
|
|
2751
|
-
name: ""
|
|
2752
|
-
url: ""
|
|
2753
|
-
-
|
|
2839
|
+
-
|
|
2754
2840
|
user_agent: Mozilla/5.0 (compatible; SputnikImageBot/2.2)
|
|
2755
2841
|
bot:
|
|
2756
|
-
name: Sputnik Bot
|
|
2757
|
-
category: ""
|
|
2842
|
+
name: Sputnik Image Bot
|
|
2843
|
+
category: "Crawler"
|
|
2758
2844
|
url: ""
|
|
2759
|
-
|
|
2760
|
-
name: ""
|
|
2761
|
-
url: ""
|
|
2762
|
-
-
|
|
2845
|
+
-
|
|
2763
2846
|
user_agent: Mozilla/5.0 (Macintosh; Intel Mac OS X 10_8_5) AppleWebKit/536.30.1 (KHTML, like Gecko) (compatible; Startpagina-Linkchecker/1.0; +https://www.startpagina.nl/linkchecker)
|
|
2764
2847
|
bot:
|
|
2765
2848
|
name: Startpagina Linkchecker
|
|
@@ -2768,7 +2851,7 @@
|
|
|
2768
2851
|
producer:
|
|
2769
2852
|
name: Startpagina B.V.
|
|
2770
2853
|
url: https://www.startpagina.nl/
|
|
2771
|
-
-
|
|
2854
|
+
-
|
|
2772
2855
|
user_agent: Mozilla/5.0 (Windows NT 6.2; WOW64) AppleWebKit/537.4 (KHTML, like Gecko) Chrome/98 Safari/537.4 (StatusCake)
|
|
2773
2856
|
bot:
|
|
2774
2857
|
name: StatusCake
|
|
@@ -2777,7 +2860,7 @@
|
|
|
2777
2860
|
producer:
|
|
2778
2861
|
name: StatusCake
|
|
2779
2862
|
url: https://www.statuscake.com
|
|
2780
|
-
-
|
|
2863
|
+
-
|
|
2781
2864
|
user_agent: 'Superfeedr bot/2.0 http://superfeedr.com - Make your feeds realtime: get in touch!'
|
|
2782
2865
|
bot:
|
|
2783
2866
|
name: Superfeedr Bot
|
|
@@ -2786,7 +2869,7 @@
|
|
|
2786
2869
|
producer:
|
|
2787
2870
|
name: Superfeedr
|
|
2788
2871
|
url: https://superfeedr.com/
|
|
2789
|
-
-
|
|
2872
|
+
-
|
|
2790
2873
|
user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1; en; rv:1.9.0.13) Gecko/2009073022 Firefox/3.5.2 (.NET CLR 3.5.30729) SurveyBot/2.3 (DomainTools)
|
|
2791
2874
|
bot:
|
|
2792
2875
|
name: Survey Bot
|
|
@@ -2795,7 +2878,7 @@
|
|
|
2795
2878
|
producer:
|
|
2796
2879
|
name: Domain Tools
|
|
2797
2880
|
url: http://www.domaintools.com
|
|
2798
|
-
-
|
|
2881
|
+
-
|
|
2799
2882
|
user_agent: TLSProbe/1.0 (+https://scan.trustnet.venafi.com/)
|
|
2800
2883
|
bot:
|
|
2801
2884
|
name: TLSProbe
|
|
@@ -2804,23 +2887,23 @@
|
|
|
2804
2887
|
producer:
|
|
2805
2888
|
name: Venafi TrustNet
|
|
2806
2889
|
url: https://www.venafi.com
|
|
2807
|
-
-
|
|
2890
|
+
-
|
|
2808
2891
|
user_agent: Tarmot Gezgin/1.0 (compatible; TarmotGezgin/1.1; +http://www.tarmot.com/gezgin)
|
|
2809
2892
|
bot:
|
|
2810
2893
|
name: Tarmot Gezgin
|
|
2811
2894
|
url: http://www.tarmot.com/gezgin/
|
|
2812
2895
|
category: Search bot
|
|
2813
|
-
-
|
|
2896
|
+
-
|
|
2814
2897
|
user_agent: TelegramBot (like TwitterBot)
|
|
2815
2898
|
bot:
|
|
2816
2899
|
name: TelegramBot
|
|
2817
2900
|
url: https://telegram.org/blog/bot-revolution
|
|
2818
|
-
-
|
|
2901
|
+
-
|
|
2819
2902
|
user_agent: The Knowledge AI
|
|
2820
2903
|
bot:
|
|
2821
2904
|
name: The Knowledge AI
|
|
2822
2905
|
category: Crawler
|
|
2823
|
-
-
|
|
2906
|
+
-
|
|
2824
2907
|
user_agent: TinEye-bot/0.02 (see http://www.tineye.com/crawler.html)
|
|
2825
2908
|
bot:
|
|
2826
2909
|
name: TinEye Crawler
|
|
@@ -2829,7 +2912,7 @@
|
|
|
2829
2912
|
producer:
|
|
2830
2913
|
name: Idée Inc.
|
|
2831
2914
|
url: http://ideeinc.com
|
|
2832
|
-
-
|
|
2915
|
+
-
|
|
2833
2916
|
user_agent: Tiny Tiny RSS/1.10 (http://tt-rss.org/)
|
|
2834
2917
|
bot:
|
|
2835
2918
|
name: Tiny Tiny RSS
|
|
@@ -2838,7 +2921,7 @@
|
|
|
2838
2921
|
producer:
|
|
2839
2922
|
name: ""
|
|
2840
2923
|
url: ""
|
|
2841
|
-
-
|
|
2924
|
+
-
|
|
2842
2925
|
user_agent: Tiny Tiny RSS/1.11.4c63934 (http://tt-rss.org/)
|
|
2843
2926
|
bot:
|
|
2844
2927
|
name: Tiny Tiny RSS
|
|
@@ -2847,7 +2930,7 @@
|
|
|
2847
2930
|
producer:
|
|
2848
2931
|
name: ""
|
|
2849
2932
|
url: ""
|
|
2850
|
-
-
|
|
2933
|
+
-
|
|
2851
2934
|
user_agent: Mozilla/5.0 (compatible; tracemyfile/1.0)
|
|
2852
2935
|
bot:
|
|
2853
2936
|
name: TraceMyFile
|
|
@@ -2856,7 +2939,7 @@
|
|
|
2856
2939
|
producer:
|
|
2857
2940
|
name: Idee Inc.
|
|
2858
2941
|
url: http://ideeinc.com/
|
|
2859
|
-
-
|
|
2942
|
+
-
|
|
2860
2943
|
user_agent: Mozilla/5.0 (Windows; U; Windows NT 6.0; en-GB; rv:1.0; trendictionbot0.5.0; trendiction search; http://www.trendiction.de/bot; please let us know of any problems; web at trendiction.com) Gecko/20071127 Firefox/3.0.0.11
|
|
2861
2944
|
bot:
|
|
2862
2945
|
name: Trendiction Bot
|
|
@@ -2865,7 +2948,7 @@
|
|
|
2865
2948
|
producer:
|
|
2866
2949
|
name: Talkwalker Inc.
|
|
2867
2950
|
url: http://www.talkwalker.com
|
|
2868
|
-
-
|
|
2951
|
+
-
|
|
2869
2952
|
user_agent: TurnitinBot/3.0 (http://www.turnitin.com/robot/crawlerinfo.html)
|
|
2870
2953
|
bot:
|
|
2871
2954
|
name: TurnitinBot
|
|
@@ -2874,7 +2957,7 @@
|
|
|
2874
2957
|
producer:
|
|
2875
2958
|
name: iParadigms, LLC.
|
|
2876
2959
|
url: http://www.turnitin.com
|
|
2877
|
-
-
|
|
2960
|
+
-
|
|
2878
2961
|
user_agent: Mozilla/5.0 (compatible; TweetedTimes Bot/1.0; +http://tweetedtimes.com)
|
|
2879
2962
|
bot:
|
|
2880
2963
|
name: TweetedTimes Bot
|
|
@@ -2883,7 +2966,7 @@
|
|
|
2883
2966
|
producer:
|
|
2884
2967
|
name: TweetedTimes
|
|
2885
2968
|
url: http://tweetedtimes.com/
|
|
2886
|
-
-
|
|
2969
|
+
-
|
|
2887
2970
|
user_agent: TweetedTimes Bot/1.0 (Mozilla/5.0 Compatible, +http://tweetedtimes.com)
|
|
2888
2971
|
bot:
|
|
2889
2972
|
name: TweetedTimes Bot
|
|
@@ -2892,7 +2975,7 @@
|
|
|
2892
2975
|
producer:
|
|
2893
2976
|
name: TweetedTimes
|
|
2894
2977
|
url: http://tweetedtimes.com/
|
|
2895
|
-
-
|
|
2978
|
+
-
|
|
2896
2979
|
user_agent: Mozilla/5.0 (compatible; TweetmemeBot/3.0; +http://tweetmeme.com/)
|
|
2897
2980
|
bot:
|
|
2898
2981
|
name: Tweetmeme Bot
|
|
@@ -2901,7 +2984,7 @@
|
|
|
2901
2984
|
producer:
|
|
2902
2985
|
name: Mediasift
|
|
2903
2986
|
url: ""
|
|
2904
|
-
-
|
|
2987
|
+
-
|
|
2905
2988
|
user_agent: Mozilla/5.0 (compatible; Twingly Recon; twingly.com)
|
|
2906
2989
|
bot:
|
|
2907
2990
|
name: Twingly Recon
|
|
@@ -2909,7 +2992,7 @@
|
|
|
2909
2992
|
producer:
|
|
2910
2993
|
name: Twingly
|
|
2911
2994
|
url: https://www.twingly.com
|
|
2912
|
-
-
|
|
2995
|
+
-
|
|
2913
2996
|
user_agent: Twitterbot/1.0
|
|
2914
2997
|
bot:
|
|
2915
2998
|
name: Twitterbot
|
|
@@ -2918,7 +3001,7 @@
|
|
|
2918
3001
|
producer:
|
|
2919
3002
|
name: Twitter
|
|
2920
3003
|
url: http://www.twitter.com
|
|
2921
|
-
-
|
|
3004
|
+
-
|
|
2922
3005
|
user_agent: Mozilla/5.0 (compatible; URLAppendBot/1.0; +http://www.profound.net/urlappendbot.html)
|
|
2923
3006
|
bot:
|
|
2924
3007
|
name: URLAppendBot
|
|
@@ -2927,7 +3010,7 @@
|
|
|
2927
3010
|
producer:
|
|
2928
3011
|
name: Profound Networks
|
|
2929
3012
|
url: http://www.profound.net
|
|
2930
|
-
-
|
|
3013
|
+
-
|
|
2931
3014
|
user_agent: 'Mozilla/5.0 (Windows NT 10.0) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/55.0.2883.87 Safari/537.36 (via secureurl.fwdcdn.com - mail.ukr.net proxy)'
|
|
2932
3015
|
bot:
|
|
2933
3016
|
name: UkrNet Mail Proxy
|
|
@@ -2936,7 +3019,7 @@
|
|
|
2936
3019
|
producer:
|
|
2937
3020
|
name: UkrNet Ltd
|
|
2938
3021
|
url: https://www.ukr.net/
|
|
2939
|
-
-
|
|
3022
|
+
-
|
|
2940
3023
|
user_agent: UniversalFeedParser/5.2.1 +https://code.google.com/p/feedparser/
|
|
2941
3024
|
bot:
|
|
2942
3025
|
name: UniversalFeedParser
|
|
@@ -2945,7 +3028,7 @@
|
|
|
2945
3028
|
producer:
|
|
2946
3029
|
name: Kurt McKee
|
|
2947
3030
|
url: https://github.com/kurtmckee
|
|
2948
|
-
-
|
|
3031
|
+
-
|
|
2949
3032
|
user_agent: Mozilla/5.0+(compatible; UptimeRobot/2.0; http://www.uptimerobot.com/)
|
|
2950
3033
|
bot:
|
|
2951
3034
|
name: Uptime Robot
|
|
@@ -2954,7 +3037,7 @@
|
|
|
2954
3037
|
producer:
|
|
2955
3038
|
name: Uptime Robot
|
|
2956
3039
|
url: http://uptimerobot.com
|
|
2957
|
-
-
|
|
3040
|
+
-
|
|
2958
3041
|
user_agent: Mozilla/5.0 (compatible; Uptimebot/1.0; +http://www.uptime.com/uptimebot)
|
|
2959
3042
|
bot:
|
|
2960
3043
|
name: Uptimebot
|
|
@@ -2963,7 +3046,7 @@
|
|
|
2963
3046
|
producer:
|
|
2964
3047
|
name: Uptime
|
|
2965
3048
|
url: https://uptime.com
|
|
2966
|
-
-
|
|
3049
|
+
-
|
|
2967
3050
|
user_agent: Mozilla/5.0 (compatible; vkShare; +http://vk.com/dev/Share)
|
|
2968
3051
|
bot:
|
|
2969
3052
|
name: VK Share Button
|
|
@@ -2972,7 +3055,7 @@
|
|
|
2972
3055
|
producer:
|
|
2973
3056
|
name: VK
|
|
2974
3057
|
url: http://vk.com/
|
|
2975
|
-
-
|
|
3058
|
+
-
|
|
2976
3059
|
user_agent: 'Mozilla/4.0 (compatible; Vagabondo/4.0; http://webagent.wise-guys.nl/; http://www.wise-guys.nl/)'
|
|
2977
3060
|
bot:
|
|
2978
3061
|
name: Vagabondo
|
|
@@ -2981,7 +3064,19 @@
|
|
|
2981
3064
|
producer:
|
|
2982
3065
|
name: WiseGuys
|
|
2983
3066
|
url: http://www.wise-guys.nl/
|
|
2984
|
-
-
|
|
3067
|
+
-
|
|
3068
|
+
user_agent: Mozilla/5.0 (compatible; VelenPublicWebCrawler/1.0; +https://velen.io)
|
|
3069
|
+
bot:
|
|
3070
|
+
name: Velen Public Web Crawler
|
|
3071
|
+
category: Crawler
|
|
3072
|
+
url: https://hunter.io/robot
|
|
3073
|
+
-
|
|
3074
|
+
user_agent: Vercelbot (+https://vercel.com)
|
|
3075
|
+
bot:
|
|
3076
|
+
name: Vercel Bot
|
|
3077
|
+
category: Service bot
|
|
3078
|
+
url: https://vercel.com
|
|
3079
|
+
-
|
|
2985
3080
|
user_agent: Mozilla/5.0 (compatible; VSMCrawler; http://www.visualsitemapper.com/crawler/)
|
|
2986
3081
|
bot:
|
|
2987
3082
|
name: Visual Site Mapper Crawler
|
|
@@ -2990,7 +3085,7 @@
|
|
|
2990
3085
|
producer:
|
|
2991
3086
|
name: Alentum Software Ltd.
|
|
2992
3087
|
url: http://www.alentum.com
|
|
2993
|
-
-
|
|
3088
|
+
-
|
|
2994
3089
|
user_agent: 'Jigsaw/2.3.0 W3C_CSS_Validator_JFouffa/2.0 (See <http://validator.w3.org/services>)'
|
|
2995
3090
|
bot:
|
|
2996
3091
|
name: W3C CSS Validator
|
|
@@ -2999,7 +3094,7 @@
|
|
|
2999
3094
|
producer:
|
|
3000
3095
|
name: W3C
|
|
3001
3096
|
url: http://www.w3.org
|
|
3002
|
-
-
|
|
3097
|
+
-
|
|
3003
3098
|
user_agent: W3C_I18n-Checker/1.0 (http://validator.w3.org/services)
|
|
3004
3099
|
bot:
|
|
3005
3100
|
name: W3C I18N Checker
|
|
@@ -3008,7 +3103,7 @@
|
|
|
3008
3103
|
producer:
|
|
3009
3104
|
name: W3C
|
|
3010
3105
|
url: http://www.w3.org
|
|
3011
|
-
-
|
|
3106
|
+
-
|
|
3012
3107
|
user_agent: 'W3C-checklink/4.0 [4.4] libwww-perl/5.803'
|
|
3013
3108
|
bot:
|
|
3014
3109
|
name: W3C Link Checker
|
|
@@ -3017,7 +3112,7 @@
|
|
|
3017
3112
|
producer:
|
|
3018
3113
|
name: W3C
|
|
3019
3114
|
url: http://www.w3.org
|
|
3020
|
-
-
|
|
3115
|
+
-
|
|
3021
3116
|
user_agent: W3C-checklink/4.81 libwww-perl/5.836
|
|
3022
3117
|
bot:
|
|
3023
3118
|
name: W3C Link Checker
|
|
@@ -3026,7 +3121,7 @@
|
|
|
3026
3121
|
producer:
|
|
3027
3122
|
name: W3C
|
|
3028
3123
|
url: http://www.w3.org
|
|
3029
|
-
-
|
|
3124
|
+
-
|
|
3030
3125
|
user_agent: Validator.nu/LV http://validator.w3.org/services
|
|
3031
3126
|
bot:
|
|
3032
3127
|
name: W3C Markup Validation Service
|
|
@@ -3035,7 +3130,7 @@
|
|
|
3035
3130
|
producer:
|
|
3036
3131
|
name: W3C
|
|
3037
3132
|
url: http://www.w3.org
|
|
3038
|
-
-
|
|
3133
|
+
-
|
|
3039
3134
|
user_agent: W3C_Validator/1.3 http://validator.w3.org/services
|
|
3040
3135
|
bot:
|
|
3041
3136
|
name: W3C Markup Validation Service
|
|
@@ -3044,7 +3139,7 @@
|
|
|
3044
3139
|
producer:
|
|
3045
3140
|
name: W3C
|
|
3046
3141
|
url: http://www.w3.org
|
|
3047
|
-
-
|
|
3142
|
+
-
|
|
3048
3143
|
user_agent: W3C_Validator/1.767
|
|
3049
3144
|
bot:
|
|
3050
3145
|
name: W3C Markup Validation Service
|
|
@@ -3053,7 +3148,7 @@
|
|
|
3053
3148
|
producer:
|
|
3054
3149
|
name: W3C
|
|
3055
3150
|
url: http://www.w3.org
|
|
3056
|
-
-
|
|
3151
|
+
-
|
|
3057
3152
|
user_agent: W3C-mobileOK/DDC-1.0 (see http://www.w3.org/2006/07/mobileok-ddc)
|
|
3058
3153
|
bot:
|
|
3059
3154
|
name: W3C MobileOK Checker
|
|
@@ -3062,7 +3157,7 @@
|
|
|
3062
3157
|
producer:
|
|
3063
3158
|
name: W3C
|
|
3064
3159
|
url: http://www.w3.org
|
|
3065
|
-
-
|
|
3160
|
+
-
|
|
3066
3161
|
user_agent: W3C_Unicorn/1.0 (http://validator.w3.org/services)
|
|
3067
3162
|
bot:
|
|
3068
3163
|
name: W3C Unified Validator
|
|
@@ -3071,7 +3166,7 @@
|
|
|
3071
3166
|
producer:
|
|
3072
3167
|
name: W3C
|
|
3073
3168
|
url: http://www.w3.org
|
|
3074
|
-
-
|
|
3169
|
+
-
|
|
3075
3170
|
user_agent: Mozilla/5.0 (compatible; Wappalyzer; +https://github.com/AliasIO/Wappalyzer)
|
|
3076
3171
|
bot:
|
|
3077
3172
|
name: Wappalyzer
|
|
@@ -3079,7 +3174,7 @@
|
|
|
3079
3174
|
producer:
|
|
3080
3175
|
name: AliasIO
|
|
3081
3176
|
url: https://github.com/AliasIO
|
|
3082
|
-
-
|
|
3177
|
+
-
|
|
3083
3178
|
user_agent: WeSEE:Search/0.1 (Alpha, http://www.wesee.com/en/support/bot/)
|
|
3084
3179
|
bot:
|
|
3085
3180
|
name: WeSEE:Search
|
|
@@ -3088,13 +3183,13 @@
|
|
|
3088
3183
|
producer:
|
|
3089
3184
|
name: WeSEE Ltd
|
|
3090
3185
|
url: http://www.wesee.com
|
|
3091
|
-
-
|
|
3186
|
+
-
|
|
3092
3187
|
user_agent: Mozilla/5.0 (Linux; Android 6.0.1; Moto G (4) Build/MPJ24.139-64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/65.0.3325.146 Mobile Safari/537.36 PTST/180829.190838
|
|
3093
3188
|
bot:
|
|
3094
3189
|
name: WebPageTest
|
|
3095
3190
|
category: Site Monitor
|
|
3096
3191
|
url: https://www.webpagetest.org
|
|
3097
|
-
-
|
|
3192
|
+
-
|
|
3098
3193
|
user_agent: websitepulse checker/1.1 (compatible; MSIE 5.5; Netscape 4.75; Linux)
|
|
3099
3194
|
bot:
|
|
3100
3195
|
name: WebSitePulse
|
|
@@ -3103,7 +3198,7 @@
|
|
|
3103
3198
|
producer:
|
|
3104
3199
|
name: WebSitePulse
|
|
3105
3200
|
url: http://www.websitepulse.com/
|
|
3106
|
-
-
|
|
3201
|
+
-
|
|
3107
3202
|
user_agent: WebbCrawler 1.0 ( http://badcheese.com/crawler.html )
|
|
3108
3203
|
bot:
|
|
3109
3204
|
name: WebbCrawler
|
|
@@ -3112,7 +3207,7 @@
|
|
|
3112
3207
|
producer:
|
|
3113
3208
|
name: Steve Webb
|
|
3114
3209
|
url: http://badcheese.com
|
|
3115
|
-
-
|
|
3210
|
+
-
|
|
3116
3211
|
user_agent: weborama-fetcher (+http://www.weborama.com)
|
|
3117
3212
|
bot:
|
|
3118
3213
|
name: Weborama
|
|
@@ -3121,7 +3216,7 @@
|
|
|
3121
3216
|
producer:
|
|
3122
3217
|
name: Weborama SA
|
|
3123
3218
|
url: https://weborama.com/
|
|
3124
|
-
-
|
|
3219
|
+
-
|
|
3125
3220
|
user_agent: WikiDo/1.1 (http://wikido.com; crawler@wikido.com)
|
|
3126
3221
|
bot:
|
|
3127
3222
|
name: WikiDo
|
|
@@ -3130,7 +3225,7 @@
|
|
|
3130
3225
|
producer:
|
|
3131
3226
|
name: Fotolitografie Fiorentine di Becchi Antonio s.n.c.
|
|
3132
3227
|
url: https://www.wikido.com/
|
|
3133
|
-
-
|
|
3228
|
+
-
|
|
3134
3229
|
user_agent: Mozilla/5.0 (compatible; woorankreview/2.0; +https://www.woorank.com/)
|
|
3135
3230
|
bot:
|
|
3136
3231
|
name: WooRank
|
|
@@ -3139,7 +3234,7 @@
|
|
|
3139
3234
|
producer:
|
|
3140
3235
|
name: WooRank sprl
|
|
3141
3236
|
url: https://www.woorank.com/
|
|
3142
|
-
-
|
|
3237
|
+
-
|
|
3143
3238
|
user_agent: Mozilla/5.0 (iPhone; CPU iPhone OS 11_0 like Mac OS X) AppleWebKit/604.1.38 (KHTML, like Gecko) Version/11.0 Mobile/15A372 Safari/604.1 (compatible; woorankreview/2.0; +https://www.woorank.com/)
|
|
3144
3239
|
bot:
|
|
3145
3240
|
name: WooRank
|
|
@@ -3148,7 +3243,7 @@
|
|
|
3148
3243
|
producer:
|
|
3149
3244
|
name: WooRank sprl
|
|
3150
3245
|
url: https://www.woorank.com/
|
|
3151
|
-
-
|
|
3246
|
+
-
|
|
3152
3247
|
user_agent: WordPress/4.7.2; https://example.com
|
|
3153
3248
|
bot:
|
|
3154
3249
|
name: WordPress
|
|
@@ -3157,7 +3252,7 @@
|
|
|
3157
3252
|
producer:
|
|
3158
3253
|
name: Wordpress.org
|
|
3159
3254
|
url: https://wordpress.org/
|
|
3160
|
-
-
|
|
3255
|
+
-
|
|
3161
3256
|
user_agent: Wotbox/2.01 (+http://www.wotbox.com/bot/)
|
|
3162
3257
|
bot:
|
|
3163
3258
|
name: Wotbox
|
|
@@ -3166,7 +3261,7 @@
|
|
|
3166
3261
|
producer:
|
|
3167
3262
|
name: Wotbox
|
|
3168
3263
|
url: http://www.wotbox.com
|
|
3169
|
-
-
|
|
3264
|
+
-
|
|
3170
3265
|
user_agent: XenForo/2.x (https://www.example.com)
|
|
3171
3266
|
bot:
|
|
3172
3267
|
name: XenForo
|
|
@@ -3175,7 +3270,7 @@
|
|
|
3175
3270
|
producer:
|
|
3176
3271
|
name: XenForo Ltd.
|
|
3177
3272
|
url: https://xenforo.com/
|
|
3178
|
-
-
|
|
3273
|
+
-
|
|
3179
3274
|
user_agent: yacybot (freeworld/global; amd64 Linux 3.2.0-4-amd64; java 1.7.0_25; Europe/en) http://yacy.net/bot.html
|
|
3180
3275
|
bot:
|
|
3181
3276
|
name: YaCy
|
|
@@ -3184,7 +3279,7 @@
|
|
|
3184
3279
|
producer:
|
|
3185
3280
|
name: YaCy
|
|
3186
3281
|
url: http://yacy.net
|
|
3187
|
-
-
|
|
3282
|
+
-
|
|
3188
3283
|
user_agent: yacybot (freeworld/global; x86 Windows XP 5.1; java 1.7.0_21; GMT+04:00/ru) http://yacy.net/bot.html
|
|
3189
3284
|
bot:
|
|
3190
3285
|
name: YaCy
|
|
@@ -3193,7 +3288,7 @@
|
|
|
3193
3288
|
producer:
|
|
3194
3289
|
name: YaCy
|
|
3195
3290
|
url: http://yacy.net
|
|
3196
|
-
-
|
|
3291
|
+
-
|
|
3197
3292
|
user_agent: Mozilla/5.0 (compatible; Yahoo Ad monitoring; https://help.yahoo.com/kb/yahoo-ad-monitoring-SLN24857.html)
|
|
3198
3293
|
bot:
|
|
3199
3294
|
name: Yahoo Gemini
|
|
@@ -3202,7 +3297,7 @@
|
|
|
3202
3297
|
producer:
|
|
3203
3298
|
name: Yahoo! Inc.
|
|
3204
3299
|
url: http://www.yahoo.com
|
|
3205
|
-
-
|
|
3300
|
+
-
|
|
3206
3301
|
user_agent: Y!J-BRW/1.0 (https://www.yahoo-help.jp/app/answers/detail/p/595/a_id/42716)
|
|
3207
3302
|
bot:
|
|
3208
3303
|
name: Yahoo! Japan BRW
|
|
@@ -3211,7 +3306,7 @@
|
|
|
3211
3306
|
producer:
|
|
3212
3307
|
name: Yahoo! Japan Corp.
|
|
3213
3308
|
url: https://www.yahoo.co.jp/
|
|
3214
|
-
-
|
|
3309
|
+
-
|
|
3215
3310
|
user_agent: Mozilla/5.0 (compatible; Yahoo Link Preview; https://help.yahoo.com/kb/mail/yahoo-link-preview-SLN23615.html)
|
|
3216
3311
|
bot:
|
|
3217
3312
|
name: Yahoo! Link Preview
|
|
@@ -3220,7 +3315,7 @@
|
|
|
3220
3315
|
producer:
|
|
3221
3316
|
name: Yahoo! Inc.
|
|
3222
3317
|
url: http://www.yahoo.com
|
|
3223
|
-
-
|
|
3318
|
+
-
|
|
3224
3319
|
user_agent: Yahoo:LinkExpander:Slingstone
|
|
3225
3320
|
bot:
|
|
3226
3321
|
name: Yahoo! Link Preview
|
|
@@ -3229,7 +3324,7 @@
|
|
|
3229
3324
|
producer:
|
|
3230
3325
|
name: Yahoo! Inc.
|
|
3231
3326
|
url: http://www.yahoo.com
|
|
3232
|
-
-
|
|
3327
|
+
-
|
|
3233
3328
|
user_agent: Mozilla/5.0 (compatible; Yahoo! Slurp/3.0; http://help.yahoo.com/help/us/ysearch/slurp) NOT Firefox/3.5
|
|
3234
3329
|
bot:
|
|
3235
3330
|
name: Yahoo! Slurp
|
|
@@ -3238,7 +3333,7 @@
|
|
|
3238
3333
|
producer:
|
|
3239
3334
|
name: Yahoo! Inc.
|
|
3240
3335
|
url: http://www.yahoo.com
|
|
3241
|
-
-
|
|
3336
|
+
-
|
|
3242
3337
|
user_agent: Mozilla/5.0 (compatible; Yahoo! Slurp; http://help.yahoo.com/help/us/ysearch/slurp)
|
|
3243
3338
|
bot:
|
|
3244
3339
|
name: Yahoo! Slurp
|
|
@@ -3247,7 +3342,7 @@
|
|
|
3247
3342
|
producer:
|
|
3248
3343
|
name: Yahoo! Inc.
|
|
3249
3344
|
url: http://www.yahoo.com
|
|
3250
|
-
-
|
|
3345
|
+
-
|
|
3251
3346
|
user_agent: Mozilla/5.0 (compatible; Linux i686; Yandex.Gazeta Bot/1.0; +http://gazeta.yandex.ru)
|
|
3252
3347
|
bot:
|
|
3253
3348
|
name: Yandex Bot
|
|
@@ -3256,7 +3351,7 @@
|
|
|
3256
3351
|
producer:
|
|
3257
3352
|
name: Yandex LLC
|
|
3258
3353
|
url: http://company.yandex.com
|
|
3259
|
-
-
|
|
3354
|
+
-
|
|
3260
3355
|
user_agent: Mozilla/5.0 (compatible; YaDirectFetcher/1.0; +http://yandex.com/bots)
|
|
3261
3356
|
bot:
|
|
3262
3357
|
name: Yandex Bot
|
|
@@ -3265,7 +3360,7 @@
|
|
|
3265
3360
|
producer:
|
|
3266
3361
|
name: Yandex LLC
|
|
3267
3362
|
url: http://company.yandex.com
|
|
3268
|
-
-
|
|
3363
|
+
-
|
|
3269
3364
|
user_agent: Mozilla/5.0 (compatible; YandexAntivirus/2.0; +http://yandex.com/bots)
|
|
3270
3365
|
bot:
|
|
3271
3366
|
name: Yandex Bot
|
|
@@ -3274,7 +3369,7 @@
|
|
|
3274
3369
|
producer:
|
|
3275
3370
|
name: Yandex LLC
|
|
3276
3371
|
url: http://company.yandex.com
|
|
3277
|
-
-
|
|
3372
|
+
-
|
|
3278
3373
|
user_agent: Mozilla/5.0 (compatible; YandexAntivirus/2.0; +http://yandex.com/bots)
|
|
3279
3374
|
bot:
|
|
3280
3375
|
name: Yandex Bot
|
|
@@ -3283,7 +3378,7 @@
|
|
|
3283
3378
|
producer:
|
|
3284
3379
|
name: Yandex LLC
|
|
3285
3380
|
url: http://company.yandex.com
|
|
3286
|
-
-
|
|
3381
|
+
-
|
|
3287
3382
|
user_agent: Mozilla/5.0 (compatible; YandexBlogs/0.99; robot; B; +http://yandex.com/bots)
|
|
3288
3383
|
bot:
|
|
3289
3384
|
name: Yandex Bot
|
|
@@ -3292,7 +3387,7 @@
|
|
|
3292
3387
|
producer:
|
|
3293
3388
|
name: Yandex LLC
|
|
3294
3389
|
url: http://company.yandex.com
|
|
3295
|
-
-
|
|
3390
|
+
-
|
|
3296
3391
|
user_agent: Mozilla/5.0 (compatible; YandexBlogs/0.99; robot; B; +http://yandex.com/bots)
|
|
3297
3392
|
bot:
|
|
3298
3393
|
name: Yandex Bot
|
|
@@ -3301,7 +3396,7 @@
|
|
|
3301
3396
|
producer:
|
|
3302
3397
|
name: Yandex LLC
|
|
3303
3398
|
url: http://company.yandex.com
|
|
3304
|
-
-
|
|
3399
|
+
-
|
|
3305
3400
|
user_agent: Mozilla/5.0 (compatible; YandexBot/3.0; +http://yandex.com/bots)
|
|
3306
3401
|
bot:
|
|
3307
3402
|
name: Yandex Bot
|
|
@@ -3310,7 +3405,7 @@
|
|
|
3310
3405
|
producer:
|
|
3311
3406
|
name: Yandex LLC
|
|
3312
3407
|
url: http://company.yandex.com
|
|
3313
|
-
-
|
|
3408
|
+
-
|
|
3314
3409
|
user_agent: Mozilla/5.0 (compatible; YandexDirect/3.0; +http://yandex.com/bots)
|
|
3315
3410
|
bot:
|
|
3316
3411
|
name: Yandex Bot
|
|
@@ -3319,7 +3414,7 @@
|
|
|
3319
3414
|
producer:
|
|
3320
3415
|
name: Yandex LLC
|
|
3321
3416
|
url: http://company.yandex.com
|
|
3322
|
-
-
|
|
3417
|
+
-
|
|
3323
3418
|
user_agent: Mozilla/5.0 (compatible; YandexFavicons/1.0; +http://yandex.com/bots)
|
|
3324
3419
|
bot:
|
|
3325
3420
|
name: Yandex Bot
|
|
@@ -3328,7 +3423,7 @@
|
|
|
3328
3423
|
producer:
|
|
3329
3424
|
name: Yandex LLC
|
|
3330
3425
|
url: http://company.yandex.com
|
|
3331
|
-
-
|
|
3426
|
+
-
|
|
3332
3427
|
user_agent: Mozilla/5.0 (compatible; YandexImageResizer/2.0; +http://yandex.com/bots)
|
|
3333
3428
|
bot:
|
|
3334
3429
|
name: Yandex Bot
|
|
@@ -3337,7 +3432,7 @@
|
|
|
3337
3432
|
producer:
|
|
3338
3433
|
name: Yandex LLC
|
|
3339
3434
|
url: http://company.yandex.com
|
|
3340
|
-
-
|
|
3435
|
+
-
|
|
3341
3436
|
user_agent: Mozilla/5.0 (compatible; YandexImages/3.0; +http://yandex.com/bots)
|
|
3342
3437
|
bot:
|
|
3343
3438
|
name: Yandex Bot
|
|
@@ -3346,7 +3441,7 @@
|
|
|
3346
3441
|
producer:
|
|
3347
3442
|
name: Yandex LLC
|
|
3348
3443
|
url: http://company.yandex.com
|
|
3349
|
-
-
|
|
3444
|
+
-
|
|
3350
3445
|
user_agent: Mozilla/5.0 (compatible; YandexMetrika/2.0; +http://yandex.com/bots)
|
|
3351
3446
|
bot:
|
|
3352
3447
|
name: Yandex Bot
|
|
@@ -3355,7 +3450,7 @@
|
|
|
3355
3450
|
producer:
|
|
3356
3451
|
name: Yandex LLC
|
|
3357
3452
|
url: http://company.yandex.com
|
|
3358
|
-
-
|
|
3453
|
+
-
|
|
3359
3454
|
user_agent: Mozilla/5.0 (compatible; YandexMobileScreenShotBot/1.0; +http://yandex.com/bots)
|
|
3360
3455
|
bot:
|
|
3361
3456
|
name: Yandex Bot
|
|
@@ -3364,7 +3459,7 @@
|
|
|
3364
3459
|
producer:
|
|
3365
3460
|
name: Yandex LLC
|
|
3366
3461
|
url: http://company.yandex.com
|
|
3367
|
-
-
|
|
3462
|
+
-
|
|
3368
3463
|
user_agent: Mozilla/5.0 (compatible; YandexNews/3.0; +http://yandex.com/bots)
|
|
3369
3464
|
bot:
|
|
3370
3465
|
name: Yandex Bot
|
|
@@ -3373,7 +3468,7 @@
|
|
|
3373
3468
|
producer:
|
|
3374
3469
|
name: Yandex LLC
|
|
3375
3470
|
url: http://company.yandex.com
|
|
3376
|
-
-
|
|
3471
|
+
-
|
|
3377
3472
|
user_agent: Mozilla/5.0 (compatible; YandexNewslinks; +http://yandex.com/bots)
|
|
3378
3473
|
bot:
|
|
3379
3474
|
name: Yandex Bot
|
|
@@ -3382,7 +3477,7 @@
|
|
|
3382
3477
|
producer:
|
|
3383
3478
|
name: Yandex LLC
|
|
3384
3479
|
url: http://company.yandex.com
|
|
3385
|
-
-
|
|
3480
|
+
-
|
|
3386
3481
|
user_agent: Mozilla/5.0 (compatible; YandexOntoDB/1.0; +http://yandex.com/bots)
|
|
3387
3482
|
bot:
|
|
3388
3483
|
name: Yandex Bot
|
|
@@ -3391,7 +3486,7 @@
|
|
|
3391
3486
|
producer:
|
|
3392
3487
|
name: Yandex LLC
|
|
3393
3488
|
url: http://company.yandex.com
|
|
3394
|
-
-
|
|
3489
|
+
-
|
|
3395
3490
|
user_agent: Mozilla/5.0 (compatible; YandexOntoDBAPI/1.0; +http://yandex.com/bots)
|
|
3396
3491
|
bot:
|
|
3397
3492
|
name: Yandex Bot
|
|
@@ -3400,7 +3495,7 @@
|
|
|
3400
3495
|
producer:
|
|
3401
3496
|
name: Yandex LLC
|
|
3402
3497
|
url: http://company.yandex.com
|
|
3403
|
-
-
|
|
3498
|
+
-
|
|
3404
3499
|
user_agent: Mozilla/5.0 (compatible; YandexPartner/3.0; +http://yandex.com/bots)
|
|
3405
3500
|
bot:
|
|
3406
3501
|
name: Yandex Bot
|
|
@@ -3409,7 +3504,7 @@
|
|
|
3409
3504
|
producer:
|
|
3410
3505
|
name: Yandex LLC
|
|
3411
3506
|
url: http://company.yandex.com
|
|
3412
|
-
-
|
|
3507
|
+
-
|
|
3413
3508
|
user_agent: Mozilla/5.0 (compatible; YandexRCA/1.0; +http://yandex.com/bots)
|
|
3414
3509
|
bot:
|
|
3415
3510
|
name: Yandex Bot
|
|
@@ -3418,7 +3513,7 @@
|
|
|
3418
3513
|
producer:
|
|
3419
3514
|
name: Yandex LLC
|
|
3420
3515
|
url: http://company.yandex.com
|
|
3421
|
-
-
|
|
3516
|
+
-
|
|
3422
3517
|
user_agent: Mozilla/5.0 (compatible; YandexSearchShop/1.0; +http://yandex.com/bots)
|
|
3423
3518
|
bot:
|
|
3424
3519
|
name: Yandex Bot
|
|
@@ -3427,7 +3522,7 @@
|
|
|
3427
3522
|
producer:
|
|
3428
3523
|
name: Yandex LLC
|
|
3429
3524
|
url: http://company.yandex.com
|
|
3430
|
-
-
|
|
3525
|
+
-
|
|
3431
3526
|
user_agent: Mozilla/5.0 (compatible; YandexTracker/1.0; +http://yandex.com/bots)
|
|
3432
3527
|
bot:
|
|
3433
3528
|
name: Yandex Bot
|
|
@@ -3436,7 +3531,7 @@
|
|
|
3436
3531
|
producer:
|
|
3437
3532
|
name: Yandex LLC
|
|
3438
3533
|
url: http://company.yandex.com
|
|
3439
|
-
-
|
|
3534
|
+
-
|
|
3440
3535
|
user_agent: Mozilla/5.0 (compatible; YandexTurbo/1.0; +http://yandex.com/bots)
|
|
3441
3536
|
bot:
|
|
3442
3537
|
name: Yandex Bot
|
|
@@ -3445,7 +3540,7 @@
|
|
|
3445
3540
|
producer:
|
|
3446
3541
|
name: Yandex LLC
|
|
3447
3542
|
url: http://company.yandex.com
|
|
3448
|
-
-
|
|
3543
|
+
-
|
|
3449
3544
|
user_agent: Mozilla/5.0 (compatible; YandexVerticals/1.0; http://yandex.com/bots)
|
|
3450
3545
|
bot:
|
|
3451
3546
|
name: Yandex Bot
|
|
@@ -3454,7 +3549,7 @@
|
|
|
3454
3549
|
producer:
|
|
3455
3550
|
name: Yandex LLC
|
|
3456
3551
|
url: http://company.yandex.com
|
|
3457
|
-
-
|
|
3552
|
+
-
|
|
3458
3553
|
user_agent: Mozilla/5.0 (compatible; NaverJapan/1.0; +http://corp.naver.jp/)
|
|
3459
3554
|
bot:
|
|
3460
3555
|
name: Yeti/Naverbot
|
|
@@ -3463,7 +3558,7 @@
|
|
|
3463
3558
|
producer:
|
|
3464
3559
|
name: Naver
|
|
3465
3560
|
url: http://www.naver.com
|
|
3466
|
-
-
|
|
3561
|
+
-
|
|
3467
3562
|
user_agent: Yeti/1.1 (Naver Corp.; http://help.naver.com/robots/)
|
|
3468
3563
|
bot:
|
|
3469
3564
|
name: Yeti/Naverbot
|
|
@@ -3472,7 +3567,7 @@
|
|
|
3472
3567
|
producer:
|
|
3473
3568
|
name: Naver
|
|
3474
3569
|
url: http://www.naver.com
|
|
3475
|
-
-
|
|
3570
|
+
-
|
|
3476
3571
|
user_agent: Mozilla/5.0 (compatible; YoudaoBot/1.0; http://www.youdao.com/help/webmaster/spider/; )
|
|
3477
3572
|
bot:
|
|
3478
3573
|
name: Youdao Bot
|
|
@@ -3481,13 +3576,13 @@
|
|
|
3481
3576
|
producer:
|
|
3482
3577
|
name: NetEase, Inc.
|
|
3483
3578
|
url: http://corp.163.com
|
|
3484
|
-
-
|
|
3579
|
+
-
|
|
3485
3580
|
user_agent: YOURLS v1.5.1 +http://yourls.org/ (running on http://fhort.com)
|
|
3486
3581
|
bot:
|
|
3487
3582
|
name: Yourls
|
|
3488
3583
|
category: Crawler
|
|
3489
3584
|
url: http://yourls.org
|
|
3490
|
-
-
|
|
3585
|
+
-
|
|
3491
3586
|
user_agent: Mozilla/5.0 (compatible; YRSpider; +http://www.yunrang.com/yrspider.html)
|
|
3492
3587
|
bot:
|
|
3493
3588
|
name: Yunyun Bot
|
|
@@ -3496,7 +3591,7 @@
|
|
|
3496
3591
|
producer:
|
|
3497
3592
|
name: YunYun
|
|
3498
3593
|
url: http://www.yunyun.com
|
|
3499
|
-
-
|
|
3594
|
+
-
|
|
3500
3595
|
user_agent: Mozilla/5.0 (compatible; YRSpider; +http://www.yunyun.com/SiteInfo.php?r=about)
|
|
3501
3596
|
bot:
|
|
3502
3597
|
name: Yunyun Bot
|
|
@@ -3505,7 +3600,7 @@
|
|
|
3505
3600
|
producer:
|
|
3506
3601
|
name: YunYun
|
|
3507
3602
|
url: http://www.yunyun.com
|
|
3508
|
-
-
|
|
3603
|
+
-
|
|
3509
3604
|
user_agent: Mozilla/5.0 (compatible; YYSpider; +http://www.yunyun.com/spider.html)
|
|
3510
3605
|
bot:
|
|
3511
3606
|
name: Yunyun Bot
|
|
@@ -3514,21 +3609,21 @@
|
|
|
3514
3609
|
producer:
|
|
3515
3610
|
name: YunYun
|
|
3516
3611
|
url: http://www.yunyun.com
|
|
3517
|
-
-
|
|
3612
|
+
-
|
|
3518
3613
|
user_agent: Zao/0.1 (http://www.kototol.org/zao)
|
|
3519
3614
|
bot:
|
|
3520
3615
|
name: Zao
|
|
3521
3616
|
category: Crawler
|
|
3522
|
-
-
|
|
3617
|
+
-
|
|
3523
3618
|
user_agent: zelist.ro feed parser (+http://www.zelist.ro)
|
|
3524
3619
|
bot:
|
|
3525
3620
|
name: Ze List
|
|
3526
|
-
category: Feed Fetcher
|
|
3527
3621
|
url: https://www.zelist.ro/
|
|
3622
|
+
category: Feed Fetcher
|
|
3528
3623
|
producer:
|
|
3529
3624
|
name: Treeworks SRL
|
|
3530
3625
|
url: https://www.tree.ro/
|
|
3531
|
-
-
|
|
3626
|
+
-
|
|
3532
3627
|
user_agent: Zookabot/2.5;++http://zookabot.com
|
|
3533
3628
|
bot:
|
|
3534
3629
|
name: Zookabot
|
|
@@ -3537,7 +3632,7 @@
|
|
|
3537
3632
|
producer:
|
|
3538
3633
|
name: Hwacha ApS
|
|
3539
3634
|
url: http://hwacha.dk
|
|
3540
|
-
-
|
|
3635
|
+
-
|
|
3541
3636
|
user_agent: Mozilla/5.0 (compatible; ZumBot/1.0; http://help.zum.com/inquiry)
|
|
3542
3637
|
bot:
|
|
3543
3638
|
name: ZumBot
|
|
@@ -3546,7 +3641,7 @@
|
|
|
3546
3641
|
producer:
|
|
3547
3642
|
name: ZUM internet
|
|
3548
3643
|
url: http://www.zuminternet.com/
|
|
3549
|
-
-
|
|
3644
|
+
-
|
|
3550
3645
|
user_agent: ZumBot/1.0 (ZUM Search; http://help.zum.com/inquiry)
|
|
3551
3646
|
bot:
|
|
3552
3647
|
name: ZumBot
|
|
@@ -3555,106 +3650,106 @@
|
|
|
3555
3650
|
producer:
|
|
3556
3651
|
name: ZUM internet
|
|
3557
3652
|
url: http://www.zuminternet.com/
|
|
3558
|
-
-
|
|
3653
|
+
-
|
|
3559
3654
|
user_agent: AhrefsBot.Feeds v0.1; http://ahrefs.com/
|
|
3560
3655
|
bot:
|
|
3561
3656
|
name: aHrefs Bot
|
|
3562
3657
|
category: Crawler
|
|
3563
|
-
url:
|
|
3658
|
+
url: https://ahrefs.com/robot
|
|
3564
3659
|
producer:
|
|
3565
3660
|
name: Ahrefs Pte Ltd
|
|
3566
|
-
url:
|
|
3567
|
-
-
|
|
3661
|
+
url: https://ahrefs.com/robot
|
|
3662
|
+
-
|
|
3568
3663
|
user_agent: Mozilla/5.0 (compatible; AhrefsBot/3.1; +http://ahrefs.com/robot/
|
|
3569
3664
|
bot:
|
|
3570
3665
|
name: aHrefs Bot
|
|
3571
3666
|
category: Crawler
|
|
3572
|
-
url:
|
|
3667
|
+
url: https://ahrefs.com/robot
|
|
3573
3668
|
producer:
|
|
3574
3669
|
name: Ahrefs Pte Ltd
|
|
3575
|
-
url:
|
|
3576
|
-
-
|
|
3670
|
+
url: https://ahrefs.com/robot
|
|
3671
|
+
-
|
|
3577
3672
|
user_agent: Mozilla/5.0 (compatible; AhrefsBot/5.0; +http://ahrefs.com/robot/)
|
|
3578
3673
|
bot:
|
|
3579
3674
|
name: aHrefs Bot
|
|
3580
3675
|
category: Crawler
|
|
3581
|
-
url:
|
|
3676
|
+
url: https://ahrefs.com/robot
|
|
3582
3677
|
producer:
|
|
3583
3678
|
name: Ahrefs Pte Ltd
|
|
3584
|
-
url:
|
|
3585
|
-
-
|
|
3679
|
+
url: https://ahrefs.com/robot
|
|
3680
|
+
-
|
|
3586
3681
|
user_agent: 'Mozilla/5.0 (compatible; AhrefsBot/5.0; +http://ahrefs.com/robot/) AppEngine-Google; (+http://code.google.com/appengine; appid: s~proxyfile1-hrd)'
|
|
3587
3682
|
bot:
|
|
3588
3683
|
name: aHrefs Bot
|
|
3589
3684
|
category: Crawler
|
|
3590
|
-
url:
|
|
3685
|
+
url: https://ahrefs.com/robot
|
|
3591
3686
|
producer:
|
|
3592
3687
|
name: Ahrefs Pte Ltd
|
|
3593
|
-
url:
|
|
3594
|
-
-
|
|
3688
|
+
url: https://ahrefs.com/robot
|
|
3689
|
+
-
|
|
3595
3690
|
user_agent: Mozilla/5.0 (compatible; archive.org_bot +http://www.archive.org/details/archive.org_bot)
|
|
3596
3691
|
bot:
|
|
3597
3692
|
name: archive.org bot
|
|
3598
3693
|
category: Crawler
|
|
3599
|
-
url:
|
|
3694
|
+
url: https://archive.org/details/archive.org_bot
|
|
3600
3695
|
producer:
|
|
3601
3696
|
name: The Internet Archive
|
|
3602
|
-
url:
|
|
3603
|
-
-
|
|
3697
|
+
url: https://archive.org
|
|
3698
|
+
-
|
|
3604
3699
|
user_agent: Mozilla/5.0 (compatible; archive.org_bot/3.3.0 +http://pandora.nla.gov.au/crawl.html)
|
|
3605
3700
|
bot:
|
|
3606
3701
|
name: archive.org bot
|
|
3607
3702
|
category: Crawler
|
|
3608
|
-
url:
|
|
3703
|
+
url: https://archive.org/details/archive.org_bot
|
|
3609
3704
|
producer:
|
|
3610
3705
|
name: The Internet Archive
|
|
3611
|
-
url:
|
|
3612
|
-
-
|
|
3706
|
+
url: https://archive.org
|
|
3707
|
+
-
|
|
3613
3708
|
user_agent: Mozilla/5.0 (compatible; archive.org_bot; Archive-It; +http://archive-it.org/files/site-owners.html)
|
|
3614
3709
|
bot:
|
|
3615
3710
|
name: archive.org bot
|
|
3616
3711
|
category: Crawler
|
|
3617
|
-
url:
|
|
3712
|
+
url: https://archive.org/details/archive.org_bot
|
|
3618
3713
|
producer:
|
|
3619
3714
|
name: The Internet Archive
|
|
3620
|
-
url:
|
|
3621
|
-
-
|
|
3715
|
+
url: https://archive.org
|
|
3716
|
+
-
|
|
3622
3717
|
user_agent: Mozilla/5.0 (compatible; archive.org_bot; Wayback Machine Live Record; +http://archive.org/details/archive.org_bot)
|
|
3623
3718
|
bot:
|
|
3624
3719
|
name: archive.org bot
|
|
3625
3720
|
category: Crawler
|
|
3626
|
-
url:
|
|
3721
|
+
url: https://archive.org/details/archive.org_bot
|
|
3627
3722
|
producer:
|
|
3628
3723
|
name: The Internet Archive
|
|
3629
|
-
url:
|
|
3630
|
-
-
|
|
3724
|
+
url: https://archive.org
|
|
3725
|
+
-
|
|
3631
3726
|
user_agent: Mozilla/5.0 (compatible; heritrix/3.1.2-SNAPSHOT-20131029-0036 +http://archive.org/details/archive.org_bot)
|
|
3632
3727
|
bot:
|
|
3633
3728
|
name: archive.org bot
|
|
3634
3729
|
category: Crawler
|
|
3635
|
-
url:
|
|
3730
|
+
url: https://archive.org/details/archive.org_bot
|
|
3636
3731
|
producer:
|
|
3637
3732
|
name: The Internet Archive
|
|
3638
|
-
url:
|
|
3639
|
-
-
|
|
3733
|
+
url: https://archive.org
|
|
3734
|
+
-
|
|
3640
3735
|
user_agent: Mozilla/5.0 (compatible; special_archiver/3.1.1 +http://www.archive.org/details/archive.org_bot)
|
|
3641
3736
|
bot:
|
|
3642
3737
|
name: archive.org bot
|
|
3643
3738
|
category: Crawler
|
|
3644
|
-
url:
|
|
3739
|
+
url: https://archive.org/details/archive.org_bot
|
|
3645
3740
|
producer:
|
|
3646
3741
|
name: The Internet Archive
|
|
3647
|
-
url:
|
|
3648
|
-
-
|
|
3742
|
+
url: https://archive.org
|
|
3743
|
+
-
|
|
3649
3744
|
user_agent: Mozilla/5.0 (compatible; special_archiver/3.2.0 +http://www.loc.gov/webarchiving/notice_to_webmasters.html)
|
|
3650
3745
|
bot:
|
|
3651
3746
|
name: archive.org bot
|
|
3652
3747
|
category: Crawler
|
|
3653
|
-
url:
|
|
3748
|
+
url: https://archive.org/details/archive.org_bot
|
|
3654
3749
|
producer:
|
|
3655
3750
|
name: The Internet Archive
|
|
3656
|
-
url:
|
|
3657
|
-
-
|
|
3751
|
+
url: https://archive.org
|
|
3752
|
+
-
|
|
3658
3753
|
user_agent: CCBot/2.0 (http://commoncrawl.org/faq/)
|
|
3659
3754
|
bot:
|
|
3660
3755
|
name: ccBot crawler
|
|
@@ -3663,7 +3758,7 @@
|
|
|
3663
3758
|
producer:
|
|
3664
3759
|
name: reddit inc.
|
|
3665
3760
|
url: http://www.reddit.com
|
|
3666
|
-
-
|
|
3761
|
+
-
|
|
3667
3762
|
user_agent: Mozilla/5.0 eCairn-Grabber/1.0 (+http://ecairn.com/grabber)
|
|
3668
3763
|
bot:
|
|
3669
3764
|
name: eCairn-Grabber
|
|
@@ -3671,7 +3766,7 @@
|
|
|
3671
3766
|
producer:
|
|
3672
3767
|
name: eCairn
|
|
3673
3768
|
url: https://ecairn.com
|
|
3674
|
-
-
|
|
3769
|
+
-
|
|
3675
3770
|
user_agent: eZ Publish Link Validator
|
|
3676
3771
|
bot:
|
|
3677
3772
|
name: eZ Publish Link Validator
|
|
@@ -3680,7 +3775,7 @@
|
|
|
3680
3775
|
producer:
|
|
3681
3776
|
name: eZ Systems AS
|
|
3682
3777
|
url: https://ez.no/
|
|
3683
|
-
-
|
|
3778
|
+
-
|
|
3684
3779
|
user_agent: Mozilla/5.0 (compatible; evc-batch/2.0)
|
|
3685
3780
|
bot:
|
|
3686
3781
|
name: evc-batch
|
|
@@ -3689,13 +3784,13 @@
|
|
|
3689
3784
|
producer:
|
|
3690
3785
|
name: eVenture Capital Partners II, LLC
|
|
3691
3786
|
url: http://www.eventures.vc/
|
|
3692
|
-
-
|
|
3787
|
+
-
|
|
3693
3788
|
user_agent: Mozilla/5.0 (compatible; inoreader.com; 2 subscribers)
|
|
3694
3789
|
bot:
|
|
3695
3790
|
name: inoreader
|
|
3696
3791
|
category: Feed Reader
|
|
3697
3792
|
url: https://www.inoreader.com
|
|
3698
|
-
-
|
|
3793
|
+
-
|
|
3699
3794
|
user_agent: masscan/1.0 (https://github.com/robertdavidgraham/masscan)
|
|
3700
3795
|
bot:
|
|
3701
3796
|
name: masscan
|
|
@@ -3704,21 +3799,21 @@
|
|
|
3704
3799
|
producer:
|
|
3705
3800
|
name: Robert Graham
|
|
3706
3801
|
url: https://github.com/robertdavidgraham
|
|
3707
|
-
-
|
|
3802
|
+
-
|
|
3708
3803
|
user_agent: 'Mozilla/5.0/Firefox/42.0 - nbertaupete95(at)gmail.com'
|
|
3709
3804
|
bot:
|
|
3710
3805
|
name: nbertaupete95
|
|
3711
3806
|
category: Crawler
|
|
3712
|
-
-
|
|
3807
|
+
-
|
|
3713
3808
|
user_agent: Mozilla/5.0 (compatible; oBot/2.3.1; http://www.xforce-security.com/crawler/)
|
|
3714
3809
|
bot:
|
|
3715
3810
|
name: oBot
|
|
3716
3811
|
category: Search bot
|
|
3717
|
-
url:
|
|
3812
|
+
url: https://www.xforce-security.com/crawler/
|
|
3718
3813
|
producer:
|
|
3719
3814
|
name: 'IBM Germany Research & Development GmbH'
|
|
3720
3815
|
url: https://exchange.xforce.ibmcloud.com/
|
|
3721
|
-
-
|
|
3816
|
+
-
|
|
3722
3817
|
user_agent: 'sqlmap/1.1.8.2#dev (http://sqlmap.org)'
|
|
3723
3818
|
bot:
|
|
3724
3819
|
name: sqlmap
|
|
@@ -3727,87 +3822,613 @@
|
|
|
3727
3822
|
producer:
|
|
3728
3823
|
name: sqlmap
|
|
3729
3824
|
url: http://sqlmap.org/
|
|
3730
|
-
-
|
|
3825
|
+
-
|
|
3731
3826
|
user_agent: Mozilla/5.0 (compatible; theoldreader.com; 1 subscribers; feed-id=aaa)
|
|
3732
3827
|
bot:
|
|
3733
3828
|
name: theoldreader
|
|
3734
3829
|
category: Feed Reader
|
|
3735
3830
|
url: https://theoldreader.com
|
|
3736
|
-
|
|
3737
3831
|
-
|
|
3738
|
-
user_agent:
|
|
3832
|
+
user_agent: Sprinklr 2.0
|
|
3739
3833
|
bot:
|
|
3740
|
-
name:
|
|
3834
|
+
name: Sprinklr
|
|
3741
3835
|
category: Crawler
|
|
3742
|
-
url:
|
|
3743
|
-
|
|
3836
|
+
url: ""
|
|
3837
|
+
producer:
|
|
3838
|
+
name: Sprinklr, Inc.
|
|
3839
|
+
url: https://www.sprinklr.com/
|
|
3744
3840
|
-
|
|
3745
|
-
user_agent:
|
|
3841
|
+
user_agent: Mozilla/5.0 (X11; Linux x86_64)AppleWebKit/537.36 (KHTML, like Gecko; Google-Ads-Qualify)Chrome/85.0.4183.140 Safari/537.36
|
|
3746
3842
|
bot:
|
|
3747
|
-
name:
|
|
3748
|
-
category:
|
|
3749
|
-
url:
|
|
3750
|
-
|
|
3843
|
+
name: Googlebot
|
|
3844
|
+
category: Search bot
|
|
3845
|
+
url: http://www.google.com/bot.html
|
|
3846
|
+
producer:
|
|
3847
|
+
name: Google Inc.
|
|
3848
|
+
url: http://www.google.com
|
|
3751
3849
|
-
|
|
3752
|
-
user_agent:
|
|
3850
|
+
user_agent: Mozilla/5.0 (Windows NT 10.0; Win64; x64; BDCbot/1.0; +http://bigweb.bigdatacorp.com.br/faq.aspx) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/69.0.3497.100 Safari/537.36
|
|
3753
3851
|
bot:
|
|
3754
|
-
name:
|
|
3755
|
-
category:
|
|
3756
|
-
url:
|
|
3757
|
-
|
|
3852
|
+
name: BDCbot
|
|
3853
|
+
category: Crawler
|
|
3854
|
+
url: https://bigweb.bigdatacorp.com.br/pages/faq.aspx
|
|
3855
|
+
producer:
|
|
3856
|
+
name: BIG Data Solucoes Em Tecnologia de Informatica LTDA
|
|
3857
|
+
url: https://bigdatacorp.com.br/
|
|
3758
3858
|
-
|
|
3759
|
-
user_agent:
|
|
3859
|
+
user_agent: Mozilla/5.0 (Macintosh; Intel Mac OS X 10_13_6) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/67.0.3396.99 Safari/537.36 CloudflareDiagnostics/1.0
|
|
3760
3860
|
bot:
|
|
3761
|
-
name:
|
|
3861
|
+
name: Cloudflare Diagnostics
|
|
3862
|
+
category: Site Monitor
|
|
3863
|
+
url: https://www.cloudflare.com/
|
|
3864
|
+
producer:
|
|
3865
|
+
name: Cloudflare
|
|
3866
|
+
url: https://www.cloudflare.com
|
|
3867
|
+
-
|
|
3868
|
+
user_agent: Mozilla/5.0 (iPhone; CPU iPhone OS 12_0 like Mac OS X) adbeat.com/policy AppleWebKit/605.1.15 (KHTML, like Gecko) CriOS/69.0.3497.105 Mobile/15E148 Safari/605.1
|
|
3869
|
+
bot:
|
|
3870
|
+
name: Adbeat
|
|
3762
3871
|
category: Crawler
|
|
3763
|
-
|
|
3872
|
+
url: https://www.adbeat.com/operation_policy
|
|
3873
|
+
producer:
|
|
3874
|
+
name: PPC Labs LLC
|
|
3875
|
+
url: https://www.adbeat.com/
|
|
3764
3876
|
-
|
|
3765
|
-
user_agent: Mozilla/5.0 (
|
|
3877
|
+
user_agent: Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko; compatible; BW/1.1; bit.ly/2W6Px8S) Chrome/84.0.4147.105 Safari/537.36
|
|
3766
3878
|
bot:
|
|
3767
|
-
name:
|
|
3879
|
+
name: BuiltWith
|
|
3768
3880
|
category: Crawler
|
|
3769
|
-
url: https://
|
|
3770
|
-
|
|
3881
|
+
url: https://builtwith.com/biup
|
|
3882
|
+
producer:
|
|
3883
|
+
name: BuiltWith Pty Ltd
|
|
3884
|
+
url: https://builtwith.com/
|
|
3771
3885
|
-
|
|
3772
|
-
user_agent: Mozilla/5.0 (
|
|
3886
|
+
user_agent: Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/60.0.3112.113 Safari/537.36 (+https://whatis.contentkingapp.com)
|
|
3773
3887
|
bot:
|
|
3774
|
-
name:
|
|
3888
|
+
name: ContentKing
|
|
3889
|
+
category: Site Monitor
|
|
3890
|
+
url: https://whatis.contentkingapp.com/
|
|
3891
|
+
producer:
|
|
3892
|
+
name: ContentKing BV
|
|
3893
|
+
url: https://www.contentkingapp.com/
|
|
3894
|
+
-
|
|
3895
|
+
user_agent: Mozilla/5.0 (Windows NT 6.1; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/84.0.4147.89 Safari/537.36 MicroAdBot/1.1 (https://www.microad.co.jp/contact/)
|
|
3896
|
+
bot:
|
|
3897
|
+
name: MicroAdBot
|
|
3775
3898
|
category: Crawler
|
|
3776
|
-
url: https://
|
|
3777
|
-
|
|
3899
|
+
url: https://www.microad.co.jp/
|
|
3900
|
+
producer:
|
|
3901
|
+
name: MicroAd, Inc.
|
|
3902
|
+
url: https://www.microad.co.jp/
|
|
3778
3903
|
-
|
|
3779
|
-
user_agent:
|
|
3904
|
+
user_agent: Mozilla/5.0 (compatible; PingAdmin.Ru/1.2; +http://pingadmin.ru/free_test/)
|
|
3780
3905
|
bot:
|
|
3781
|
-
name:
|
|
3906
|
+
name: PingAdmin.Ru
|
|
3907
|
+
category: Site Monitor
|
|
3908
|
+
url: https://ping-admin.ru/
|
|
3909
|
+
-
|
|
3910
|
+
user_agent: Mozilla/5.0 (compatible; WebDataStats/1.0 ; +https://webdatastats.com/policy.html)
|
|
3911
|
+
bot:
|
|
3912
|
+
name: WebDataStats
|
|
3782
3913
|
category: Crawler
|
|
3783
|
-
url:
|
|
3784
|
-
|
|
3914
|
+
url: https://webdatastats.com/policy.html
|
|
3915
|
+
producer:
|
|
3916
|
+
name: WebTehRazrabotka LLC
|
|
3917
|
+
url: https://webdatastats.com/
|
|
3785
3918
|
-
|
|
3786
|
-
user_agent:
|
|
3919
|
+
user_agent: Mozilla/5.0 (compatible; parse.ly scraper/0.14; +http://parsely.com)
|
|
3787
3920
|
bot:
|
|
3788
|
-
name:
|
|
3789
|
-
category:
|
|
3790
|
-
url: https://www.
|
|
3791
|
-
|
|
3921
|
+
name: parse.ly
|
|
3922
|
+
category: Crawler
|
|
3923
|
+
url: https://www.parse.ly/help/integration/crawler
|
|
3924
|
+
producer:
|
|
3925
|
+
name: Parsely, Inc.
|
|
3926
|
+
url: https://www.parse.ly/
|
|
3792
3927
|
-
|
|
3793
|
-
user_agent: Mozilla/5.0 (compatible
|
|
3928
|
+
user_agent: Mozilla/5.0 (compatible; Nimbostratus-Bot/v1.3.2; http://cloudsystemnetworks.com)
|
|
3794
3929
|
bot:
|
|
3795
|
-
name:
|
|
3930
|
+
name: Nimbostratus Bot
|
|
3931
|
+
category: Site Monitor
|
|
3932
|
+
url: http://cloudsystemnetworks.com
|
|
3933
|
+
-
|
|
3934
|
+
user_agent: Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.9.2.17) Gecko/20110515 HeartRails_Capture/1.0.4 (+http://capture.heartrails.com/) Namoroka/3.6.17
|
|
3935
|
+
bot:
|
|
3936
|
+
name: Heart Rails Capture
|
|
3937
|
+
category: Service Agent
|
|
3938
|
+
url: http://capture.heartrails.com
|
|
3939
|
+
-
|
|
3940
|
+
user_agent: Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/43.0.2357.134 Safari/537.36 http://notifyninja.com/monitoring
|
|
3941
|
+
bot:
|
|
3942
|
+
name: Notify Ninja
|
|
3943
|
+
category: Site Monitor
|
|
3944
|
+
url: http://notifyninja.com
|
|
3945
|
+
-
|
|
3946
|
+
user_agent: Mozilla/5.0 (Macintosh; Intel Mac OS X 10_14_6) Project-Resonance (http://project-resonance.com/) (KHTML, like Gecko) Chrome/83.0.4103.61 Safari/537.36
|
|
3947
|
+
bot:
|
|
3948
|
+
name: Project Resonance
|
|
3796
3949
|
category: Crawler
|
|
3797
|
-
url:
|
|
3798
|
-
|
|
3950
|
+
url: http://project-resonance.com
|
|
3799
3951
|
-
|
|
3800
|
-
user_agent: Mozilla/5.0 (compatible;
|
|
3952
|
+
user_agent: Mozilla/5.0 (compatible; DataXu/1.0; +http://dataxu.com)
|
|
3801
3953
|
bot:
|
|
3802
|
-
name:
|
|
3954
|
+
name: DataXu
|
|
3955
|
+
category: Service Agent
|
|
3956
|
+
url: https://advertising.roku.com/dataxu
|
|
3957
|
+
producer:
|
|
3958
|
+
name: Roku, Inc.
|
|
3959
|
+
url: https://roku.com
|
|
3960
|
+
-
|
|
3961
|
+
user_agent: Mozilla/5.0 (Unknown; Linux x86_64) AppleWebKit/534.34 (KHTML, like Gecko) PingdomTMS/0.8.5 Safari/534.34
|
|
3962
|
+
bot:
|
|
3963
|
+
name: Pingdom Bot
|
|
3964
|
+
category: Site Monitor
|
|
3965
|
+
url: ""
|
|
3966
|
+
producer:
|
|
3967
|
+
name: Pingdom AB
|
|
3968
|
+
url: https://www.pingdom.com
|
|
3969
|
+
-
|
|
3970
|
+
user_agent: Mozilla/5.0 (compatible; Cocolyzebot/1.0; https://cocolyze.com/bot)
|
|
3971
|
+
bot:
|
|
3972
|
+
name: Cocolyzebot
|
|
3803
3973
|
category: Crawler
|
|
3804
|
-
url: https://
|
|
3805
|
-
|
|
3974
|
+
url: https://cocolyze.com/en/cocolyzebot
|
|
3975
|
+
producer:
|
|
3976
|
+
name: VSI INNOVATION SAS
|
|
3977
|
+
url: https://vsi-innovation.com/
|
|
3806
3978
|
-
|
|
3807
|
-
user_agent:
|
|
3979
|
+
user_agent: veryhip (http://veryhip.com/)
|
|
3808
3980
|
bot:
|
|
3809
|
-
name:
|
|
3981
|
+
name: VeryHip
|
|
3810
3982
|
category: Crawler
|
|
3811
|
-
url:
|
|
3812
|
-
|
|
3813
|
-
|
|
3983
|
+
url: https://veryhip.com/
|
|
3984
|
+
producer:
|
|
3985
|
+
name: VeryHip
|
|
3986
|
+
url: https://veryhip.com/
|
|
3987
|
+
-
|
|
3988
|
+
user_agent: Mozilla/5.0 (compatible; LinkpadBot/2.3; +http://linkpad.org/robot/)
|
|
3989
|
+
bot:
|
|
3990
|
+
name: LinkpadBot
|
|
3991
|
+
category: Crawler
|
|
3992
|
+
url: https://www.linkpad.org/
|
|
3993
|
+
producer:
|
|
3994
|
+
name: Solomono LLC
|
|
3995
|
+
url: https://www.linkpad.org/
|
|
3996
|
+
-
|
|
3997
|
+
user_agent: Mozilla/4.0 (compatible; MuscatFerret/1.7; http://www.webtop.com/)
|
|
3998
|
+
bot:
|
|
3999
|
+
name: MuscatFerret
|
|
4000
|
+
category: Crawler
|
|
4001
|
+
url: http://www.webtop.com/
|
|
4002
|
+
-
|
|
4003
|
+
user_agent: Quora-Bot/1.0 (http://www.quora.com)
|
|
4004
|
+
bot:
|
|
4005
|
+
name: Quora Bot
|
|
4006
|
+
category: Crawler
|
|
4007
|
+
url: ""
|
|
4008
|
+
producer:
|
|
4009
|
+
name: Quora
|
|
4010
|
+
url: https://www.quora.com/
|
|
4011
|
+
-
|
|
4012
|
+
user_agent: PageThing.com
|
|
4013
|
+
bot:
|
|
4014
|
+
name: PageThing
|
|
4015
|
+
category: Crawler
|
|
4016
|
+
url: https://www.pagething.com/
|
|
4017
|
+
producer:
|
|
4018
|
+
name: SPECIALNOISE LTD
|
|
4019
|
+
url: https://www.specialnoise.com/
|
|
4020
|
+
-
|
|
4021
|
+
user_agent: ArchiveBox/0.5.3 (+https://github.com/ArchiveBox/ArchiveBox/)
|
|
4022
|
+
bot:
|
|
4023
|
+
name: ArchiveBox
|
|
4024
|
+
url: https://archivebox.io/
|
|
4025
|
+
category: Crawler
|
|
4026
|
+
producer:
|
|
4027
|
+
name: ""
|
|
4028
|
+
url: ""
|
|
4029
|
+
-
|
|
4030
|
+
user_agent: Choosito/1.0 +http://www.choosito.com/
|
|
4031
|
+
bot:
|
|
4032
|
+
name: Choosito
|
|
4033
|
+
url: https://www.choosito.com/
|
|
4034
|
+
category: Crawler
|
|
4035
|
+
producer:
|
|
4036
|
+
name: Choosito! Inc.
|
|
4037
|
+
url: https://www.choosito.com/
|
|
4038
|
+
-
|
|
4039
|
+
user_agent: datagnionbot (+http://www.datagnion.com/bot.html)
|
|
4040
|
+
bot:
|
|
4041
|
+
name: datagnionbot
|
|
4042
|
+
url: https://www.datagnion.com/bot.html
|
|
4043
|
+
category: Crawler
|
|
4044
|
+
producer:
|
|
4045
|
+
name: DATAGNION GMBH
|
|
4046
|
+
url: https://www.datagnion.com/
|
|
4047
|
+
-
|
|
4048
|
+
user_agent: InterNaetBoten/0.99 (http://www.xn--internt-bxa.nu)
|
|
4049
|
+
bot:
|
|
4050
|
+
name: Generic Bot
|
|
4051
|
+
-
|
|
4052
|
+
user_agent: EasyBib AutoCite (http://autocite-info.citation-api.com/)
|
|
4053
|
+
bot:
|
|
4054
|
+
name: Generic Bot
|
|
4055
|
+
-
|
|
4056
|
+
user_agent: Bidtellect/0.0.643.0
|
|
4057
|
+
bot:
|
|
4058
|
+
name: Generic Bot
|
|
4059
|
+
-
|
|
4060
|
+
user_agent: Mozilla/5.0 (compatible; meg/0.2; +https://github.com/tomnomnom/meg)
|
|
4061
|
+
bot:
|
|
4062
|
+
name: Generic Bot
|
|
4063
|
+
-
|
|
4064
|
+
user_agent: Mozilla/5.0 (X11; Ubuntu; Linux x86_64; rv:66.0) WhatCMS/1.0
|
|
4065
|
+
bot:
|
|
4066
|
+
name: WhatCMS
|
|
4067
|
+
url: https://whatcms.org/
|
|
4068
|
+
category: Crawler
|
|
4069
|
+
producer:
|
|
4070
|
+
name: "Nineteen Ten LLC"
|
|
4071
|
+
url: "https://whatcms.org/"
|
|
4072
|
+
-
|
|
4073
|
+
user_agent: httpx - Open-source project (github.com/projectdiscovery/httpx)
|
|
4074
|
+
bot:
|
|
4075
|
+
name: httpx
|
|
4076
|
+
url: https://github.com/projectdiscovery/httpx
|
|
4077
|
+
category: Crawler
|
|
4078
|
+
producer:
|
|
4079
|
+
name: ""
|
|
4080
|
+
url: ""
|
|
4081
|
+
-
|
|
4082
|
+
user_agent: 'Expanse indexes the network perimeters of our customers. If you have any questions or concerns, please reach out to: scaninfo@expanseinc.com'
|
|
4083
|
+
bot:
|
|
4084
|
+
name: Expanse
|
|
4085
|
+
category: Security Checker
|
|
4086
|
+
url: https://expanse.co/
|
|
4087
|
+
producer:
|
|
4088
|
+
name: Expanse Inc.
|
|
4089
|
+
url: https://expanse.co/
|
|
4090
|
+
-
|
|
4091
|
+
user_agent: 'HuaweiWebCatBot/6.0) (To acquire the allowed html pages as reliable information of URL categorization in the automatic process for Huawei Web Categorization.; https://isecurity.huawei.com/; sec at huawei dot com)'
|
|
4092
|
+
bot:
|
|
4093
|
+
name: HuaweiWebCatBot
|
|
4094
|
+
category: Crawler
|
|
4095
|
+
url: https://isecurity.huawei.com
|
|
4096
|
+
producer:
|
|
4097
|
+
name: Huawei Technologies Co., Ltd.
|
|
4098
|
+
url: https://huawei.com
|
|
4099
|
+
-
|
|
4100
|
+
user_agent: Mozilla/5.0 (compatible; SputnikFaviconBot/1.2; +http://corp.sputnik.ru/webmaster)
|
|
4101
|
+
bot:
|
|
4102
|
+
name: Sputnik Favicon Bot
|
|
4103
|
+
url: ""
|
|
4104
|
+
category: Crawler
|
|
4105
|
+
-
|
|
4106
|
+
user_agent: Hatena-Favicon2 (http://www.hatena.ne.jp/faq/)
|
|
4107
|
+
bot:
|
|
4108
|
+
name: Hatena Favicon
|
|
4109
|
+
category: Crawler
|
|
4110
|
+
url: https://www.hatena.ne.jp/faq/
|
|
4111
|
+
producer:
|
|
4112
|
+
name: Hatena Co., Ltd.
|
|
4113
|
+
url: https://www.hatena.ne.jp
|
|
4114
|
+
-
|
|
4115
|
+
user_agent: Mozilla/5.0 (compatible; RyowlEngine/1.0; +https://ryowl.org)
|
|
4116
|
+
bot:
|
|
4117
|
+
name: Ryowl
|
|
4118
|
+
category: Crawler
|
|
4119
|
+
url: https://ryowl.org
|
|
4120
|
+
-
|
|
4121
|
+
user_agent: Mozilla/5.0 (compatible; OdklBot/1.0 like Linux; klass@odnoklassniki.ru)
|
|
4122
|
+
bot:
|
|
4123
|
+
name: Odnoklassniki Bot
|
|
4124
|
+
category: Crawler
|
|
4125
|
+
url: https://odnoklassniki.ru
|
|
4126
|
+
-
|
|
4127
|
+
user_agent: Mediatoolkitbot (complaints@mediatoolkit.com)
|
|
4128
|
+
bot:
|
|
4129
|
+
name: Mediatoolkit Bot
|
|
4130
|
+
category: Crawler
|
|
4131
|
+
url: https://mediatoolkit.com
|
|
4132
|
+
-
|
|
4133
|
+
user_agent: ZoominfoBot (zoominfobot at zoominfo dot com)
|
|
4134
|
+
bot:
|
|
4135
|
+
name: ZoominfoBot
|
|
4136
|
+
category: Crawler
|
|
4137
|
+
url: https://www.zoominfo.com
|
|
4138
|
+
-
|
|
4139
|
+
user_agent: Mozilla/5.0 (compatible; WeViKaBot/1.0; +http://www.wevika.de/)
|
|
4140
|
+
bot:
|
|
4141
|
+
name: WeViKaBot
|
|
4142
|
+
category: Crawler
|
|
4143
|
+
url: http://www.wevika.de
|
|
4144
|
+
-
|
|
4145
|
+
user_agent: Mozilla/5.0 (compatible; SEOkicks; +https://www.seokicks.de/robot.html)
|
|
4146
|
+
bot:
|
|
4147
|
+
name: SEOkicks
|
|
4148
|
+
category: Crawler
|
|
4149
|
+
url: https://www.seokicks.de/robot.html
|
|
4150
|
+
-
|
|
4151
|
+
user_agent: Mozilla/5.0 (compatible; Plukkie/1.6; http://www.botje.com/plukkie.htm)
|
|
4152
|
+
bot:
|
|
4153
|
+
name: Plukkie
|
|
4154
|
+
category: Crawler
|
|
4155
|
+
url: http://www.botje.com/plukkie.htm
|
|
4156
|
+
-
|
|
4157
|
+
user_agent: Mozilla/5.0 (compatible; proximic; https://www.comscore.com/Web-Crawler)
|
|
4158
|
+
bot:
|
|
4159
|
+
name: Comscore
|
|
4160
|
+
category: Crawler
|
|
4161
|
+
url: https://www.comscore.com/Web-Crawler
|
|
4162
|
+
-
|
|
4163
|
+
user_agent: Mozilla/5.0 (compatible; SurdotlyBot/1.0; +http://sur.ly/bot.html)
|
|
4164
|
+
bot:
|
|
4165
|
+
name: SurdotlyBot
|
|
4166
|
+
category: Crawler
|
|
4167
|
+
url: http://sur.ly/bot.html
|
|
4168
|
+
-
|
|
4169
|
+
user_agent: Mozilla/5.0 (compatible; Gowikibot/1.0; +http://www.gowikibot.com)
|
|
4170
|
+
bot:
|
|
4171
|
+
name: Gowikibot
|
|
4172
|
+
category: Crawler
|
|
4173
|
+
url: http:/www.gowikibot.com
|
|
4174
|
+
-
|
|
4175
|
+
user_agent: Mozilla/5.0 (compatible; SabsimBot/3.0; +https://sabsim.com)
|
|
4176
|
+
bot:
|
|
4177
|
+
name: SabsimBot
|
|
4178
|
+
category: Crawler
|
|
4179
|
+
url: https://sabsim.com
|
|
4180
|
+
-
|
|
4181
|
+
user_agent: Mozilla/5.0 (compatible; LumtelBot/1.0; +http://lumtel.com)
|
|
4182
|
+
bot:
|
|
4183
|
+
name: LumtelBot
|
|
4184
|
+
category: Crawler
|
|
4185
|
+
url: https://umtel.com
|
|
4186
|
+
-
|
|
4187
|
+
user_agent: Mozilla/5.0+(compatible;+PiplBot;+http://www.pipl.com/bot/)
|
|
4188
|
+
bot:
|
|
4189
|
+
name: PiplBot
|
|
4190
|
+
category: Crawler
|
|
4191
|
+
url: http://www.pipl.com/bot
|
|
4192
|
+
-
|
|
4193
|
+
user_agent: Mozilla/5.0 (compatible; woobot/2.0; +https://www.woorank.com/bot)
|
|
4194
|
+
bot:
|
|
4195
|
+
name: WooRank
|
|
4196
|
+
category: Crawler
|
|
4197
|
+
url: https://www.woorank.com/bot
|
|
4198
|
+
-
|
|
4199
|
+
user_agent: YahooMailProxy; https://help.yahoo.com/kb/yahoo-mail-proxy-SLN28749.html
|
|
4200
|
+
bot:
|
|
4201
|
+
name: Yahoo! Mail Proxy
|
|
4202
|
+
category: Service Agent
|
|
4203
|
+
url: https://help.yahoo.com/kb/yahoo-mail-proxy-SLN28749.html
|
|
4204
|
+
producer:
|
|
4205
|
+
name: Yahoo! Inc.
|
|
4206
|
+
url: http://www.yahoo.com
|
|
4207
|
+
-
|
|
4208
|
+
user_agent: 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko; compatible; Cookiebot/1.0; http://cookiebot.com/) Chrome/79.0.3945.117 Safari/537.36'
|
|
4209
|
+
bot:
|
|
4210
|
+
name: Cookiebot
|
|
4211
|
+
category: Crawler
|
|
4212
|
+
url: https://support.cookiebot.com/hc/en-us/articles/360014264140-Scanner-User-Agent
|
|
4213
|
+
producer:
|
|
4214
|
+
name: Cybot A/S
|
|
4215
|
+
url: https://www.cybot.com/
|
|
4216
|
+
-
|
|
4217
|
+
user_agent: NetSystemsResearch studies the availability of various services across the internet. Our website is netsystemsresearch.com
|
|
4218
|
+
bot:
|
|
4219
|
+
name: NetSystemsResearch
|
|
4220
|
+
category: Security Checker
|
|
4221
|
+
url: https://www.netsystemsresearch.com/
|
|
4222
|
+
producer:
|
|
4223
|
+
name: NET SYSTEMS RESEARCH LLC
|
|
4224
|
+
url: https://www.netsystemsresearch.com/
|
|
4225
|
+
-
|
|
4226
|
+
user_agent: 'Mozilla/5.0 (compatible; CensysInspect/1.1; https://about.censys.io/)'
|
|
4227
|
+
bot:
|
|
4228
|
+
name: CensysInspect
|
|
4229
|
+
category: Security Checker
|
|
4230
|
+
url: https://about.censys.io/
|
|
4231
|
+
producer:
|
|
4232
|
+
name: Censys, Inc.
|
|
4233
|
+
url: https://censys.io/
|
|
4234
|
+
-
|
|
4235
|
+
user_agent: https://gdnplus.com:Gather Analyze Provide.
|
|
4236
|
+
bot:
|
|
4237
|
+
name: GDNP
|
|
4238
|
+
category: Crawler
|
|
4239
|
+
url: https://gdnplus.com/
|
|
4240
|
+
producer:
|
|
4241
|
+
name: Global Digital Network Plus, LLC
|
|
4242
|
+
url: https://gdnplus.com/
|
|
4243
|
+
-
|
|
4244
|
+
user_agent: WellKnownBot/0.1 (https://well-known.dev)
|
|
4245
|
+
bot:
|
|
4246
|
+
name: WellKnownBot
|
|
4247
|
+
category: Crawler
|
|
4248
|
+
url: https://well-known.dev
|
|
4249
|
+
-
|
|
4250
|
+
user_agent: Mozilla/5.0 (compatible; Adsbot/3.1; https://seostar.co/robot/)
|
|
4251
|
+
bot:
|
|
4252
|
+
name: Adsbot
|
|
4253
|
+
category: Crawler
|
|
4254
|
+
url: https://seostar.co/robot/
|
|
4255
|
+
-
|
|
4256
|
+
user_agent: MTRobot/0.2 (Metrics Tools Analytics Crawler; https://metrics-tools.de/robot.html; crawler@metrics-tools.de)
|
|
4257
|
+
bot:
|
|
4258
|
+
name: MTRobot
|
|
4259
|
+
category: Crawler
|
|
4260
|
+
url: https://metrics-tools.de/robot.html
|
|
4261
|
+
producer:
|
|
4262
|
+
name: Metrics Tools
|
|
4263
|
+
url: https://metrics-tools.de/
|
|
4264
|
+
-
|
|
4265
|
+
user_agent: My User Agent 1.0
|
|
4266
|
+
bot:
|
|
4267
|
+
name: Generic Bot
|
|
4268
|
+
-
|
|
4269
|
+
user_agent: serpstatbot/1.0 (advanced backlink tracking bot; curl/7.58.0; http://serpstatbot.com/; abuse@serpstatbot.com)
|
|
4270
|
+
bot:
|
|
4271
|
+
name: serpstatbot
|
|
4272
|
+
category: Crawler
|
|
4273
|
+
url: http://serpstatbot.com/
|
|
4274
|
+
producer:
|
|
4275
|
+
name: Netpeak Ltd
|
|
4276
|
+
url: https://netpeak.net/
|
|
4277
|
+
-
|
|
4278
|
+
user_agent: colly - https://github.com/gocolly/colly/v2
|
|
4279
|
+
bot:
|
|
4280
|
+
name: colly
|
|
4281
|
+
category: Crawler
|
|
4282
|
+
url: https://github.com/gocolly/colly/
|
|
4283
|
+
-
|
|
4284
|
+
user_agent: l9tcpid/v1.0.0
|
|
4285
|
+
bot:
|
|
4286
|
+
name: l9tcpid
|
|
4287
|
+
category: Security Checker
|
|
4288
|
+
url: https://github.com/LeakIX/l9tcpid
|
|
4289
|
+
-
|
|
4290
|
+
user_agent: Mozilla/5.0 (compatible; MegaIndex.ru/2.0; +http://megaindex.com/crawler)
|
|
4291
|
+
bot:
|
|
4292
|
+
name: MegaIndex
|
|
4293
|
+
category: Crawler
|
|
4294
|
+
url: https://megaindex.com/crawler
|
|
4295
|
+
-
|
|
4296
|
+
user_agent: Mozilla/5.0 (compatible; Seekport Crawler; http://seekport.com/)
|
|
4297
|
+
bot:
|
|
4298
|
+
name: Seekport
|
|
4299
|
+
category: Crawler
|
|
4300
|
+
url: http://www.seekport.com/
|
|
4301
|
+
producer:
|
|
4302
|
+
name: SISTRIX GmbH
|
|
4303
|
+
url: https://www.sistrix.de/
|
|
4304
|
+
-
|
|
4305
|
+
user_agent: Mozilla/5.0 (compatible; seolyt/1.1; +https://seolyt.com)
|
|
4306
|
+
bot:
|
|
4307
|
+
name: seolyt
|
|
4308
|
+
category: Crawler
|
|
4309
|
+
url: https://seolyt.com/
|
|
4310
|
+
-
|
|
4311
|
+
user_agent: Mozilla/5.0 (compatible; YaK/1.0; http://linkfluence.com/; bot@linkfluence.com)
|
|
4312
|
+
bot:
|
|
4313
|
+
name: YaK
|
|
4314
|
+
category: Crawler
|
|
4315
|
+
url: https://www.linkfluence.com/
|
|
4316
|
+
producer:
|
|
4317
|
+
name: Linkfluence SAS
|
|
4318
|
+
url: https://www.linkfluence.com/
|
|
4319
|
+
-
|
|
4320
|
+
user_agent: Mozilla/5.0 (Windows NT 6.1; Win64; x64; +http://www.komodia.com/newwiki/index.php/URL_server_crawler) KomodiaBot/1.0
|
|
4321
|
+
bot:
|
|
4322
|
+
name: KomodiaBot
|
|
4323
|
+
category: Crawler
|
|
4324
|
+
url: http://www.komodia.com/newwiki/index.php/URL_server_crawler
|
|
4325
|
+
producer:
|
|
4326
|
+
name: Komodia Inc.
|
|
4327
|
+
url: https://www.komodia.com/
|
|
4328
|
+
-
|
|
4329
|
+
user_agent: Mozilla/5.0 (Windows NT 6.3; WOW64; Trident/7.0; rv:11.0; Catchpoint) like Gecko
|
|
4330
|
+
bot:
|
|
4331
|
+
name: Catchpoint
|
|
4332
|
+
category: Site Monitor
|
|
4333
|
+
url: https://www.catchpoint.com/
|
|
4334
|
+
producer:
|
|
4335
|
+
name: Catchpoint Systems
|
|
4336
|
+
url: https://www.catchpoint.com/
|
|
4337
|
+
-
|
|
4338
|
+
user_agent: Better Uptime Bot Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/74.0.3729.169 Safari/537.36
|
|
4339
|
+
bot:
|
|
4340
|
+
name: Better Uptime Bot
|
|
4341
|
+
category: Site Monitor
|
|
4342
|
+
url: https://betteruptime.com/faq
|
|
4343
|
+
producer:
|
|
4344
|
+
name: Better Uptime
|
|
4345
|
+
url: https://betteruptime.com/
|
|
4346
|
+
-
|
|
4347
|
+
user_agent: gobuster/3.1.0
|
|
4348
|
+
bot:
|
|
4349
|
+
name: Gobuster
|
|
4350
|
+
url: https://github.com/OJ/gobuster
|
|
4351
|
+
-
|
|
4352
|
+
user_agent: k6/0.31.1 (https://k6.io/)
|
|
4353
|
+
bot:
|
|
4354
|
+
name: K6
|
|
4355
|
+
url: https://k6.io/
|
|
4356
|
+
-
|
|
4357
|
+
user_agent: Mozilla/5.0 (compatible; Neevabot/1.0; https://neeva.com/neevabot)
|
|
4358
|
+
bot:
|
|
4359
|
+
name: Neevabot
|
|
4360
|
+
category: Search bot
|
|
4361
|
+
url: https://neeva.com/neevabot
|
|
4362
|
+
producer:
|
|
4363
|
+
name: Neeva Inc.
|
|
4364
|
+
url: https://neeva.com/
|
|
4365
|
+
-
|
|
4366
|
+
user_agent: LinkPreview/1.5 (http://linkpreview.net)
|
|
4367
|
+
bot:
|
|
4368
|
+
name: LinkPreview
|
|
4369
|
+
category: Service Agent
|
|
4370
|
+
url: https://www.linkpreview.net/
|
|
4371
|
+
-
|
|
4372
|
+
user_agent: Mozilla/5.0 (compatible; JungleKeyThumbnail/1.1; +http://www.junglekey.fr/)
|
|
4373
|
+
bot:
|
|
4374
|
+
name: JungleKeyThumbnail
|
|
4375
|
+
category: Crawler
|
|
4376
|
+
url: https://junglekey.com/
|
|
4377
|
+
-
|
|
4378
|
+
user_agent: rocketmonitor 1.0
|
|
4379
|
+
bot:
|
|
4380
|
+
name: RocketMonitorBot
|
|
4381
|
+
category: Site Monitor
|
|
4382
|
+
url: https://www.radiomast.io/docs/stream-monitoring/technical_details.html
|
|
4383
|
+
producer:
|
|
4384
|
+
name: Radio Mast, Inc.
|
|
4385
|
+
url: https://www.radiomast.io/
|
|
4386
|
+
-
|
|
4387
|
+
user_agent: RocketMonitorBot/1.0 ( https://www.radiomast.io)
|
|
4388
|
+
bot:
|
|
4389
|
+
name: RocketMonitorBot
|
|
4390
|
+
category: Site Monitor
|
|
4391
|
+
url: https://www.radiomast.io/docs/stream-monitoring/technical_details.html
|
|
4392
|
+
producer:
|
|
4393
|
+
name: Radio Mast, Inc.
|
|
4394
|
+
url: https://www.radiomast.io/
|
|
4395
|
+
-
|
|
4396
|
+
user_agent: SitemapParser-VIPnytt/1.1 ( https://github.com/VIPnytt/SitemapParser/blob/master/README.md)
|
|
4397
|
+
bot:
|
|
4398
|
+
name: SitemapParser-VIPnytt
|
|
4399
|
+
category: Crawler
|
|
4400
|
+
url: https://github.com/VIPnytt/SitemapParser/
|
|
4401
|
+
-
|
|
4402
|
+
user_agent: Turnitin (https://bit.ly/2UvnfoQ)
|
|
4403
|
+
bot:
|
|
4404
|
+
name: Turnitin
|
|
4405
|
+
category: Crawler
|
|
4406
|
+
url: https://turnitin.com/robot/crawlerinfo.html
|
|
4407
|
+
-
|
|
4408
|
+
user_agent: Mozilla/5.0 (Linux; Android 8.0; Pixel 2 Build/OPD3.170816.012; Storebot-Google/1.0) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/81.0.4044.138 Mobile Safari/537.36
|
|
4409
|
+
bot:
|
|
4410
|
+
name: Google StoreBot
|
|
4411
|
+
category: Crawler
|
|
4412
|
+
-
|
|
4413
|
+
user_agent: Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/77.0.3865.56 Safari/537.36 DMBrowser/2.1 (UV)
|
|
4414
|
+
bot:
|
|
4415
|
+
name: Dotcom Monitor
|
|
4416
|
+
category: Site Monitor
|
|
4417
|
+
url: https://www.dotcom-monitor.com
|
|
4418
|
+
-
|
|
4419
|
+
user_agent: Mozilla/5.0 (Windows NT 6.2; WOW64; rv:29.0) Gecko/20100101 /29.0 DMBrowser-BV
|
|
4420
|
+
bot:
|
|
4421
|
+
name: Dotcom Monitor
|
|
4422
|
+
category: Site Monitor
|
|
4423
|
+
url: https://www.dotcom-monitor.com
|
|
4424
|
+
-
|
|
4425
|
+
user_agent: Mozilla/5.0 (compatible; ThinkChaos/0.3.0; +In_the_test_phase,_if_the_ThinkChaos_brings_you_trouble,_please_add_disallow_to_the_robots.txt._Thank_you.)
|
|
4426
|
+
bot:
|
|
4427
|
+
name: ThinkChaos
|
|
4428
|
+
category: Crawler
|
|
4429
|
+
-
|
|
4430
|
+
user_agent: Mozilla/5.0 (compatible; DataForSeoBot/1.0; +https://dataforseo.com/dataforseo-bot)
|
|
4431
|
+
bot:
|
|
4432
|
+
name: DataForSeoBot
|
|
4433
|
+
category: Crawler
|
|
4434
|
+
url: https://dataforseo.com/dataforseo-bot
|