device_detector 1.0.2 → 1.0.6
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +5 -5
- data/.rubocop.yml +49 -0
- data/.ruby-version +1 -0
- data/.travis.yml +5 -6
- data/CHANGELOG.md +11 -0
- data/README.md +8 -7
- data/Rakefile +7 -4
- data/device_detector.gemspec +1 -0
- data/lib/device_detector/bot.rb +2 -2
- data/lib/device_detector/browser.rb +364 -0
- data/lib/device_detector/client.rb +11 -2
- data/lib/device_detector/device.rb +1168 -22
- data/lib/device_detector/memory_cache.rb +5 -5
- data/lib/device_detector/metadata_extractor.rb +7 -8
- data/lib/device_detector/model_extractor.rb +3 -3
- data/lib/device_detector/name_extractor.rb +2 -2
- data/lib/device_detector/os.rb +148 -116
- data/lib/device_detector/parser.rb +22 -9
- data/lib/device_detector/version.rb +1 -1
- data/lib/device_detector/version_extractor.rb +10 -2
- data/lib/device_detector.rb +73 -40
- data/regexes/bots.yml +909 -59
- data/regexes/client/browser_engine.yml +14 -2
- data/regexes/client/browsers.yml +1356 -241
- data/regexes/client/feed_readers.yml +10 -10
- data/regexes/client/libraries.yml +75 -1
- data/regexes/client/mediaplayers.yml +39 -3
- data/regexes/client/mobile_apps.yml +524 -45
- data/regexes/client/pim.yml +55 -2
- data/regexes/device/cameras.yml +6 -6
- data/regexes/device/car_browsers.yml +23 -3
- data/regexes/device/consoles.yml +9 -3
- data/regexes/device/mobiles.yml +16903 -3199
- data/regexes/device/notebooks.yml +114 -0
- data/regexes/device/portable_media_player.yml +20 -3
- data/regexes/device/shell_tv.yml +117 -0
- data/regexes/device/televisions.yml +440 -35
- data/regexes/oss.yml +603 -165
- data/regexes/vendorfragments.yml +6 -2
- data/spec/device_detector/concrete_user_agent_spec.rb +38 -51
- data/spec/device_detector/detector_fixtures_spec.rb +36 -37
- data/spec/device_detector/device_spec.rb +52 -56
- data/spec/device_detector/memory_cache_spec.rb +19 -19
- data/spec/device_detector/model_extractor_spec.rb +3 -3
- data/spec/device_detector/version_extractor_spec.rb +5 -6
- data/spec/device_detector_spec.rb +26 -26
- data/spec/fixtures/client/browser.yml +2617 -555
- data/spec/fixtures/client/feed_reader.yml +34 -52
- data/spec/fixtures/client/library.yml +129 -38
- data/spec/fixtures/client/mediaplayer.yml +59 -28
- data/spec/fixtures/client/mobile_app.yml +589 -20
- data/spec/fixtures/client/pim.yml +92 -19
- data/spec/fixtures/detector/bots.yml +1749 -458
- data/spec/fixtures/detector/camera.yml +30 -24
- data/spec/fixtures/detector/car_browser.yml +199 -3
- data/spec/fixtures/detector/console.yml +107 -45
- data/spec/fixtures/detector/desktop.yml +3216 -758
- data/spec/fixtures/detector/feature_phone.yml +935 -181
- data/spec/fixtures/detector/feed_reader.yml +181 -193
- data/spec/fixtures/detector/mediaplayer.yml +157 -60
- data/spec/fixtures/detector/mobile_apps.yml +914 -136
- data/spec/fixtures/detector/peripheral.yml +271 -0
- data/spec/fixtures/detector/phablet.yml +5593 -1533
- data/spec/fixtures/detector/portable_media_player.yml +398 -32
- data/spec/fixtures/detector/smart_display.yml +183 -9
- data/spec/fixtures/detector/smart_speaker.yml +60 -0
- data/spec/fixtures/detector/smartphone-1.yml +3930 -4239
- data/spec/fixtures/detector/smartphone-10.yml +3985 -7366
- data/spec/fixtures/detector/smartphone-11.yml +5083 -3784
- data/spec/fixtures/detector/smartphone-12.yml +8989 -0
- data/spec/fixtures/detector/smartphone-13.yml +9412 -0
- data/spec/fixtures/detector/smartphone-14.yml +9477 -0
- data/spec/fixtures/detector/smartphone-15.yml +9281 -0
- data/spec/fixtures/detector/smartphone-16.yml +9678 -0
- data/spec/fixtures/detector/smartphone-17.yml +9965 -0
- data/spec/fixtures/detector/smartphone-18.yml +9806 -0
- data/spec/fixtures/detector/smartphone-19.yml +9965 -0
- data/spec/fixtures/detector/smartphone-2.yml +6670 -4375
- data/spec/fixtures/detector/smartphone-20.yml +9710 -0
- data/spec/fixtures/detector/smartphone-21.yml +8693 -0
- data/spec/fixtures/detector/smartphone-22.yml +10178 -0
- data/spec/fixtures/detector/smartphone-23.yml +9453 -0
- data/spec/fixtures/detector/smartphone-24.yml +9843 -0
- data/spec/fixtures/detector/smartphone-25.yml +9703 -0
- data/spec/fixtures/detector/smartphone-26.yml +10007 -0
- data/spec/fixtures/detector/smartphone-27.yml +4927 -0
- data/spec/fixtures/detector/smartphone-3.yml +4656 -4711
- data/spec/fixtures/detector/smartphone-4.yml +3518 -4479
- data/spec/fixtures/detector/smartphone-5.yml +3805 -4803
- data/spec/fixtures/detector/smartphone-6.yml +3745 -4693
- data/spec/fixtures/detector/smartphone-7.yml +3721 -4645
- data/spec/fixtures/detector/smartphone-8.yml +4564 -4699
- data/spec/fixtures/detector/smartphone-9.yml +3897 -4888
- data/spec/fixtures/detector/smartphone.yml +3154 -4141
- data/spec/fixtures/detector/tablet-1.yml +4742 -4576
- data/spec/fixtures/detector/tablet-2.yml +3803 -4731
- data/spec/fixtures/detector/tablet-3.yml +6210 -2309
- data/spec/fixtures/detector/tablet-4.yml +9062 -0
- data/spec/fixtures/detector/tablet-5.yml +9273 -0
- data/spec/fixtures/detector/tablet-6.yml +4588 -0
- data/spec/fixtures/detector/tablet.yml +3629 -4613
- data/spec/fixtures/detector/tv-1.yml +2501 -0
- data/spec/fixtures/detector/tv.yml +8856 -2064
- data/spec/fixtures/detector/unknown.yml +412 -587
- data/spec/fixtures/detector/wearable.yml +915 -0
- data/spec/fixtures/device/camera.yml +4 -3
- data/spec/fixtures/device/car_browser.yml +9 -2
- data/spec/fixtures/device/console.yml +15 -14
- data/spec/fixtures/device/notebook.yml +7 -0
- data/spec/fixtures/parser/oss.yml +1392 -21
- data/spec/fixtures/parser/vendorfragments.yml +57 -51
- metadata +70 -4
|
@@ -1,45 +1,51 @@
|
|
|
1
1
|
---
|
|
2
|
-
-
|
|
2
|
+
-
|
|
3
3
|
user_agent: 360spider-image
|
|
4
4
|
bot:
|
|
5
5
|
name: 360Spider
|
|
6
6
|
category: Search bot
|
|
7
|
-
url:
|
|
7
|
+
url: https://www.so.com/help/help_3_2.html
|
|
8
8
|
producer:
|
|
9
9
|
name: Online Media Group, Inc.
|
|
10
10
|
url: ""
|
|
11
|
-
-
|
|
11
|
+
-
|
|
12
12
|
user_agent: Mozilla/4.0 (compatible; MSIE 8.0; Windows NT 6.1; Trident/4.0; SLCC2; .NET CLR 2.0.50727; .NET CLR 3.5.30729; .NET CLR 3.0.30729; Media Center PC 6.0; MDDR; .NET4.0C; .NET4.0E; .NET CLR 1.1.4322; Tablet PC 2.0); 360Spider
|
|
13
13
|
bot:
|
|
14
14
|
name: 360Spider
|
|
15
15
|
category: Search bot
|
|
16
|
-
url:
|
|
16
|
+
url: https://www.so.com/help/help_3_2.html
|
|
17
17
|
producer:
|
|
18
18
|
name: Online Media Group, Inc.
|
|
19
19
|
url: ""
|
|
20
|
-
-
|
|
20
|
+
-
|
|
21
21
|
user_agent: Mozilla/5.0 (compatible; MSIE 9.0; Windows NT 6.1; Trident/5.0); 360Spider
|
|
22
22
|
bot:
|
|
23
23
|
name: 360Spider
|
|
24
24
|
category: Search bot
|
|
25
|
-
url:
|
|
25
|
+
url: https://www.so.com/help/help_3_2.html
|
|
26
26
|
producer:
|
|
27
27
|
name: Online Media Group, Inc.
|
|
28
28
|
url: ""
|
|
29
|
-
-
|
|
29
|
+
-
|
|
30
30
|
user_agent: Mozilla/5.0 (Windows NT 6.1) AppleWebKit/537.1 (KHTML, like Gecko) Chrome/21.0.1180.89 Safari/537.1; 360Spider
|
|
31
31
|
bot:
|
|
32
32
|
name: 360Spider
|
|
33
33
|
category: Search bot
|
|
34
|
-
url:
|
|
34
|
+
url: https://www.so.com/help/help_3_2.html
|
|
35
35
|
producer:
|
|
36
36
|
name: Online Media Group, Inc.
|
|
37
37
|
url: ""
|
|
38
|
-
-
|
|
38
|
+
-
|
|
39
39
|
user_agent: 'ADmantX Platform Semantic Analyzer - ADmantX Inc. - www.admantx.com - support@admantx.com'
|
|
40
40
|
bot:
|
|
41
41
|
name: ADMantX
|
|
42
|
-
-
|
|
42
|
+
-
|
|
43
|
+
user_agent: ias-va/3.1 (+https://www.admantx.com/service-fetcher.html)
|
|
44
|
+
bot:
|
|
45
|
+
name: ADmantX Service Fetcher
|
|
46
|
+
category: Service bot
|
|
47
|
+
url: https://www.admantx.com/service-fetcher.html
|
|
48
|
+
-
|
|
43
49
|
user_agent: Aboundex/0.3 (http://www.aboundex.com/crawler/)
|
|
44
50
|
bot:
|
|
45
51
|
name: Aboundexbot
|
|
@@ -48,7 +54,7 @@
|
|
|
48
54
|
producer:
|
|
49
55
|
name: Aboundex.com
|
|
50
56
|
url: http://www.aboundex.com
|
|
51
|
-
-
|
|
57
|
+
-
|
|
52
58
|
user_agent: Mozilla/5.0 (compatible; AcoonBot/4.11.1; +http://www.acoon.de/robot.asp)
|
|
53
59
|
bot:
|
|
54
60
|
name: Acoon
|
|
@@ -57,7 +63,7 @@
|
|
|
57
63
|
producer:
|
|
58
64
|
name: Acoon GmbH
|
|
59
65
|
url: http://www.acoon.de
|
|
60
|
-
-
|
|
66
|
+
-
|
|
61
67
|
user_agent: AddThis.com robot tech.support@clearspring.com
|
|
62
68
|
bot:
|
|
63
69
|
name: AddThis.com
|
|
@@ -66,25 +72,50 @@
|
|
|
66
72
|
producer:
|
|
67
73
|
name: Clearspring Technologies, Inc.
|
|
68
74
|
url: http://www.clearspring.com
|
|
69
|
-
-
|
|
75
|
+
-
|
|
70
76
|
user_agent: ia_archiver (+http://www.alexa.com/site/help/webmasters; crawler@alexa.com)
|
|
71
77
|
bot:
|
|
72
78
|
name: Alexa Crawler
|
|
73
79
|
category: Search bot
|
|
74
|
-
url: https://alexa.
|
|
80
|
+
url: https://support.alexa.com/hc/en-us/sections/200100794-Crawlers
|
|
75
81
|
producer:
|
|
76
82
|
name: Alexa Internet
|
|
77
|
-
url:
|
|
78
|
-
-
|
|
83
|
+
url: https://www.alexa.com
|
|
84
|
+
-
|
|
79
85
|
user_agent: Mozilla/5.0 (compatible; alexa site audit/1.0; http://www.alexa.com/help/webmasters; )
|
|
80
86
|
bot:
|
|
81
87
|
name: Alexa Site Audit
|
|
82
88
|
category: Site Monitor
|
|
83
|
-
url:
|
|
89
|
+
url: https://support.alexa.com/hc/en-us/articles/200450194
|
|
84
90
|
producer:
|
|
85
91
|
name: Alexa Internet
|
|
86
|
-
url:
|
|
87
|
-
-
|
|
92
|
+
url: https://www.alexa.com
|
|
93
|
+
-
|
|
94
|
+
user_agent: Mozilla/5.0 (Macintosh; Intel Mac OS X 10_10_1) AppleWebKit/600.2.5 (KHTML, like Gecko) Version/8.0.2 Safari/600.2.5 (Amazonbot/0.1; +https://developer.amazon.com/support/amazonbot)
|
|
95
|
+
bot:
|
|
96
|
+
name: Amazon Bot
|
|
97
|
+
category: Crawler
|
|
98
|
+
url: https://developer.amazon.com/support/amazonbot
|
|
99
|
+
producer:
|
|
100
|
+
name: Amazon.com, Inc.
|
|
101
|
+
url: https://www.amazon.com/
|
|
102
|
+
-
|
|
103
|
+
user_agent: Amazon Route 53 Health Check Service; ref:xxxxxxxx-xxxx-xxxxxxxxx-xxxxxxxxxxxx; report http://amzn.to/xxxxxxx
|
|
104
|
+
bot:
|
|
105
|
+
name: Amazon Route53 Health Check
|
|
106
|
+
category: Service Agent
|
|
107
|
+
producer:
|
|
108
|
+
name: Amazon Web Services
|
|
109
|
+
url: https://aws.amazon.com/
|
|
110
|
+
-
|
|
111
|
+
user_agent: Amazon-Route53-Health-Check-Service (ref b0eb04d5-cb5e-40e7-839b-558e52fc3f0d; report http://amzn.to/1vsZADi)
|
|
112
|
+
bot:
|
|
113
|
+
name: Amazon Route53 Health Check
|
|
114
|
+
category: Service Agent
|
|
115
|
+
producer:
|
|
116
|
+
name: Amazon Web Services
|
|
117
|
+
url: https://aws.amazon.com/
|
|
118
|
+
-
|
|
88
119
|
user_agent: AmorankSpider/0.1; +http://amorank.com/webcrawler.html
|
|
89
120
|
bot:
|
|
90
121
|
name: Amorank Spider
|
|
@@ -93,7 +124,7 @@
|
|
|
93
124
|
producer:
|
|
94
125
|
name: Amorank
|
|
95
126
|
url: http://www.amorank.com
|
|
96
|
-
-
|
|
127
|
+
-
|
|
97
128
|
user_agent: 'Curious George - www.analyticsseo.com/crawler'
|
|
98
129
|
bot:
|
|
99
130
|
name: Analytics SEO Crawler
|
|
@@ -102,7 +133,7 @@
|
|
|
102
133
|
producer:
|
|
103
134
|
name: Analytics SEO
|
|
104
135
|
url: http://www.analyticsseo.com
|
|
105
|
-
-
|
|
136
|
+
-
|
|
106
137
|
user_agent: ApacheBench/2.3
|
|
107
138
|
bot:
|
|
108
139
|
name: ApacheBench
|
|
@@ -110,35 +141,44 @@
|
|
|
110
141
|
url: https://httpd.apache.org/docs/2.4/programs/ab.html
|
|
111
142
|
producer:
|
|
112
143
|
name: The Apache Software Foundation
|
|
113
|
-
url:
|
|
114
|
-
-
|
|
144
|
+
url: https://www.apache.org/foundation/
|
|
145
|
+
-
|
|
115
146
|
user_agent: Mozilla/5.0 (Macintosh; Intel Mac OS X 10_10 _1) AppleWebKit/600.2.5 (KHTML, like Gecko) Version/8.0.2 Safari/600.2.5 (Applebot/0.1; +http://www.apple.com/go/applebot)
|
|
116
147
|
bot:
|
|
117
148
|
name: Applebot
|
|
118
149
|
category: Crawler
|
|
119
|
-
url:
|
|
150
|
+
url: https://support.apple.com/en-us/HT204683
|
|
120
151
|
producer:
|
|
121
152
|
name: Apple Inc
|
|
122
|
-
url:
|
|
123
|
-
-
|
|
153
|
+
url: https://www.apple.com
|
|
154
|
+
-
|
|
155
|
+
user_agent: AppSignalBot/1.0 (+https://appsignal.com)
|
|
156
|
+
bot:
|
|
157
|
+
name: AppSignalBot
|
|
158
|
+
category: Site Monitor
|
|
159
|
+
url: https://docs.appsignal.com/uptime-monitoring/
|
|
160
|
+
producer:
|
|
161
|
+
name: AppSignal
|
|
162
|
+
url: https://appsignal.com/
|
|
163
|
+
-
|
|
124
164
|
user_agent: Mozilla/5.0 (Macintosh; Intel Mac OS X 10_10_1) AppleWebKit/600.2.5 (KHTML, like Gecko) Version/8.0.2 Safari/600.2.5 (Applebot/0.1)
|
|
125
165
|
bot:
|
|
126
166
|
name: Applebot
|
|
127
167
|
category: Crawler
|
|
128
|
-
url:
|
|
168
|
+
url: https://support.apple.com/en-us/HT204683
|
|
129
169
|
producer:
|
|
130
170
|
name: Apple Inc
|
|
131
|
-
url:
|
|
132
|
-
-
|
|
171
|
+
url: https://www.apple.com
|
|
172
|
+
-
|
|
133
173
|
user_agent: Arachni/v1.5.1
|
|
134
174
|
bot:
|
|
135
175
|
name: Arachni
|
|
136
176
|
category: Security Checker
|
|
137
|
-
url:
|
|
177
|
+
url: https://www.arachni-scanner.com/
|
|
138
178
|
producer:
|
|
139
179
|
name: Sarosys LLC
|
|
140
|
-
url:
|
|
141
|
-
-
|
|
180
|
+
url: https://www.sarosys.com/
|
|
181
|
+
-
|
|
142
182
|
user_agent: Mozilla/2.0 (compatible; Ask Jeeves/Teoma)
|
|
143
183
|
bot:
|
|
144
184
|
name: Ask Jeeves
|
|
@@ -147,7 +187,43 @@
|
|
|
147
187
|
producer:
|
|
148
188
|
name: Ask Jeeves Inc.
|
|
149
189
|
url: http://www.ask.com
|
|
150
|
-
-
|
|
190
|
+
-
|
|
191
|
+
user_agent: Mozilla/5.0 (compatible;AspiegelBot)
|
|
192
|
+
bot:
|
|
193
|
+
name: AspiegelBot
|
|
194
|
+
category: Crawler
|
|
195
|
+
url: https://aspiegel.com/
|
|
196
|
+
producer:
|
|
197
|
+
name: Huawei
|
|
198
|
+
url: https://www.huawei.com/
|
|
199
|
+
-
|
|
200
|
+
user_agent: Mozilla/5.0 (Linux; Android 7.0;) AppleWebKit/537.36 (KHTML, like Gecko) Mobile Safari/537.36 (compatible; AspiegelBot)
|
|
201
|
+
bot:
|
|
202
|
+
name: AspiegelBot
|
|
203
|
+
category: Crawler
|
|
204
|
+
url: https://aspiegel.com/
|
|
205
|
+
producer:
|
|
206
|
+
name: Huawei
|
|
207
|
+
url: https://www.huawei.com/
|
|
208
|
+
-
|
|
209
|
+
user_agent: AwarioRssBot/1.0 (+https://awario.com/bots.html; bots@awario.com)
|
|
210
|
+
bot:
|
|
211
|
+
name: Awario
|
|
212
|
+
category: Feed Fetcher
|
|
213
|
+
url: https://awario.com/bots.html
|
|
214
|
+
producer:
|
|
215
|
+
name: Awario
|
|
216
|
+
url: https://awario.com/
|
|
217
|
+
-
|
|
218
|
+
user_agent: AwarioSmartBot/1.0 (+https://awario.com/bots.html; bots@awario.com)
|
|
219
|
+
bot:
|
|
220
|
+
name: Awario
|
|
221
|
+
category: Search bot
|
|
222
|
+
url: https://awario.com/bots.html
|
|
223
|
+
producer:
|
|
224
|
+
name: Awario
|
|
225
|
+
url: https://awario.com/
|
|
226
|
+
-
|
|
151
227
|
user_agent: Mozilla/5.0 (compatible; BLEXBot/1.0; +http://webmeup-crawler.com/)
|
|
152
228
|
bot:
|
|
153
229
|
name: BLEXBot Crawler
|
|
@@ -156,7 +232,7 @@
|
|
|
156
232
|
producer:
|
|
157
233
|
name: WebMeUp
|
|
158
234
|
url: http://webmeup.com
|
|
159
|
-
-
|
|
235
|
+
-
|
|
160
236
|
user_agent: BUbiNG (+http://law.di.unimi.it/BUbiNG.html)
|
|
161
237
|
bot:
|
|
162
238
|
name: BUbiNG
|
|
@@ -165,7 +241,7 @@
|
|
|
165
241
|
producer:
|
|
166
242
|
name: The Laboratory for Web Algorithmics (LAW)
|
|
167
243
|
url: 'http://law.di.unimi.it/software.php#buging'
|
|
168
|
-
-
|
|
244
|
+
-
|
|
169
245
|
user_agent: Backlink-Check.de (+http://www.backlink-check.de/bot.html)
|
|
170
246
|
bot:
|
|
171
247
|
name: Backlink-Check.de
|
|
@@ -174,7 +250,7 @@
|
|
|
174
250
|
producer:
|
|
175
251
|
name: Mediagreen Medienservice
|
|
176
252
|
url: http://www.backlink-check.de
|
|
177
|
-
-
|
|
253
|
+
-
|
|
178
254
|
user_agent: BacklinkCrawler (http://www.backlinktest.com/crawler.html)
|
|
179
255
|
bot:
|
|
180
256
|
name: BacklinkCrawler
|
|
@@ -183,7 +259,7 @@
|
|
|
183
259
|
producer:
|
|
184
260
|
name: 2.0Promotion GbR
|
|
185
261
|
url: http://www.backlinktest.com
|
|
186
|
-
-
|
|
262
|
+
-
|
|
187
263
|
user_agent: Baiduspider+(+http://www.baidu.com/search/spider.htm)
|
|
188
264
|
bot:
|
|
189
265
|
name: Baidu Spider
|
|
@@ -192,7 +268,7 @@
|
|
|
192
268
|
producer:
|
|
193
269
|
name: Baidu
|
|
194
270
|
url: http://www.baidu.com
|
|
195
|
-
-
|
|
271
|
+
-
|
|
196
272
|
user_agent: Baiduspider-image+(+http://www.baidu.com/search/spider.htm)
|
|
197
273
|
bot:
|
|
198
274
|
name: Baidu Spider
|
|
@@ -201,7 +277,7 @@
|
|
|
201
277
|
producer:
|
|
202
278
|
name: Baidu
|
|
203
279
|
url: http://www.baidu.com
|
|
204
|
-
-
|
|
280
|
+
-
|
|
205
281
|
user_agent: Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.0; baidu Transcoder;)
|
|
206
282
|
bot:
|
|
207
283
|
name: Baidu Spider
|
|
@@ -210,7 +286,7 @@
|
|
|
210
286
|
producer:
|
|
211
287
|
name: Baidu
|
|
212
288
|
url: http://www.baidu.com
|
|
213
|
-
-
|
|
289
|
+
-
|
|
214
290
|
user_agent: Mozilla/5.0 (compatible; Baiduspider/2.0; +http://www.baidu.com/search
|
|
215
291
|
bot:
|
|
216
292
|
name: Baidu Spider
|
|
@@ -219,7 +295,7 @@
|
|
|
219
295
|
producer:
|
|
220
296
|
name: Baidu
|
|
221
297
|
url: http://www.baidu.com
|
|
222
|
-
-
|
|
298
|
+
-
|
|
223
299
|
user_agent: Mozilla/5.0 (compatible; Baiduspider/2.0; +http://www.baidu.com/search/spider.html)
|
|
224
300
|
bot:
|
|
225
301
|
name: Baidu Spider
|
|
@@ -228,7 +304,7 @@
|
|
|
228
304
|
producer:
|
|
229
305
|
name: Baidu
|
|
230
306
|
url: http://www.baidu.com
|
|
231
|
-
-
|
|
307
|
+
-
|
|
232
308
|
user_agent: Mozilla/5.0 (Linux;u;Android 2.3.7;zh-cn;) AppleWebKit/533.1 (KHTML,like Gecko) Version/4.0 Mobile Safari/533.1 (compatible; +http://www.baidu.com/search/spider.html)
|
|
233
309
|
bot:
|
|
234
310
|
name: Baidu Spider
|
|
@@ -237,7 +313,7 @@
|
|
|
237
313
|
producer:
|
|
238
314
|
name: Baidu
|
|
239
315
|
url: http://www.baidu.com
|
|
240
|
-
-
|
|
316
|
+
-
|
|
241
317
|
user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1; zh-CN; rv:1.9.2.8;baidu Transcoder) Gecko/20100722 Firefox/3.6.8 ( .NET CLR 3.5.30729)
|
|
242
318
|
bot:
|
|
243
319
|
name: Baidu Spider
|
|
@@ -246,7 +322,13 @@
|
|
|
246
322
|
producer:
|
|
247
323
|
name: Baidu
|
|
248
324
|
url: http://www.baidu.com
|
|
249
|
-
-
|
|
325
|
+
-
|
|
326
|
+
user_agent: Barkrowler/0.9 (+http://www.exensa.com/crawl)
|
|
327
|
+
bot:
|
|
328
|
+
name: Barkrowler
|
|
329
|
+
category: Crawler
|
|
330
|
+
url: http://www.exensa.com/crawl
|
|
331
|
+
-
|
|
250
332
|
user_agent: Mozilla/5.0 (compatible; BazQux/2.4; +https://bazqux.com/fetcher; 2 subscribers)
|
|
251
333
|
bot:
|
|
252
334
|
name: BazQux Reader
|
|
@@ -255,7 +337,7 @@
|
|
|
255
337
|
producer:
|
|
256
338
|
name: ""
|
|
257
339
|
url: ""
|
|
258
|
-
-
|
|
340
|
+
-
|
|
259
341
|
user_agent: Mozilla/5.0 (compatible; bingbot/2.0; +http://www.bing.com/bingbot.htm)
|
|
260
342
|
bot:
|
|
261
343
|
name: BingBot
|
|
@@ -264,7 +346,7 @@
|
|
|
264
346
|
producer:
|
|
265
347
|
name: Microsoft Corporation
|
|
266
348
|
url: http://www.microsoft.com
|
|
267
|
-
-
|
|
349
|
+
-
|
|
268
350
|
user_agent: Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/534+ (KHTML, like Gecko) BingPreview/1.0b
|
|
269
351
|
bot:
|
|
270
352
|
name: BingBot
|
|
@@ -273,7 +355,7 @@
|
|
|
273
355
|
producer:
|
|
274
356
|
name: Microsoft Corporation
|
|
275
357
|
url: http://www.microsoft.com
|
|
276
|
-
-
|
|
358
|
+
-
|
|
277
359
|
user_agent: msnbot-media/1.1 (+http://search.msn.com/msnbot.htm)
|
|
278
360
|
bot:
|
|
279
361
|
name: BingBot
|
|
@@ -282,7 +364,7 @@
|
|
|
282
364
|
producer:
|
|
283
365
|
name: Microsoft Corporation
|
|
284
366
|
url: http://www.microsoft.com
|
|
285
|
-
-
|
|
367
|
+
-
|
|
286
368
|
user_agent: msnbot-NewsBlogs/2.0b (+http://search.msn.com/msnbot.htm)
|
|
287
369
|
bot:
|
|
288
370
|
name: BingBot
|
|
@@ -291,7 +373,7 @@
|
|
|
291
373
|
producer:
|
|
292
374
|
name: Microsoft Corporation
|
|
293
375
|
url: http://www.microsoft.com
|
|
294
|
-
-
|
|
376
|
+
-
|
|
295
377
|
user_agent: msnbot/1.1 (+http://search.msn.com/msnbot.htm)
|
|
296
378
|
bot:
|
|
297
379
|
name: BingBot
|
|
@@ -300,7 +382,7 @@
|
|
|
300
382
|
producer:
|
|
301
383
|
name: Microsoft Corporation
|
|
302
384
|
url: http://www.microsoft.com
|
|
303
|
-
-
|
|
385
|
+
-
|
|
304
386
|
user_agent: msnbot/2.0b (+http://search.msn.com/msnbot.htm)
|
|
305
387
|
bot:
|
|
306
388
|
name: BingBot
|
|
@@ -309,7 +391,7 @@
|
|
|
309
391
|
producer:
|
|
310
392
|
name: Microsoft Corporation
|
|
311
393
|
url: http://www.microsoft.com
|
|
312
|
-
-
|
|
394
|
+
-
|
|
313
395
|
user_agent: msnbot/2.0b v1394720947.6703
|
|
314
396
|
bot:
|
|
315
397
|
name: BingBot
|
|
@@ -318,7 +400,7 @@
|
|
|
318
400
|
producer:
|
|
319
401
|
name: Microsoft Corporation
|
|
320
402
|
url: http://www.microsoft.com
|
|
321
|
-
-
|
|
403
|
+
-
|
|
322
404
|
user_agent: MSNBot/Nutch-1.5.1
|
|
323
405
|
bot:
|
|
324
406
|
name: BingBot
|
|
@@ -327,7 +409,7 @@
|
|
|
327
409
|
producer:
|
|
328
410
|
name: Microsoft Corporation
|
|
329
411
|
url: http://www.microsoft.com
|
|
330
|
-
-
|
|
412
|
+
-
|
|
331
413
|
user_agent: bitlybot/3.0
|
|
332
414
|
bot:
|
|
333
415
|
name: BitlyBot
|
|
@@ -336,7 +418,7 @@
|
|
|
336
418
|
producer:
|
|
337
419
|
name: Bitly, Inc.
|
|
338
420
|
url: https://bitly.com
|
|
339
|
-
-
|
|
421
|
+
-
|
|
340
422
|
user_agent: Mozilla/5.0 (compatible; Blekkobot; ScoutJet; +http://blekko.com/about/blekkobot)
|
|
341
423
|
bot:
|
|
342
424
|
name: Blekkobot
|
|
@@ -345,7 +427,7 @@
|
|
|
345
427
|
producer:
|
|
346
428
|
name: Blekko
|
|
347
429
|
url: http://blekko.com
|
|
348
|
-
-
|
|
430
|
+
-
|
|
349
431
|
user_agent: Bloglovin/1.0 (http://www.bloglovin.com; 1 subscribers)
|
|
350
432
|
bot:
|
|
351
433
|
name: Bloglovin
|
|
@@ -354,7 +436,7 @@
|
|
|
354
436
|
producer:
|
|
355
437
|
name: ""
|
|
356
438
|
url: ""
|
|
357
|
-
-
|
|
439
|
+
-
|
|
358
440
|
user_agent: Blogtrottr/2.0
|
|
359
441
|
bot:
|
|
360
442
|
name: Blogtrottr
|
|
@@ -363,7 +445,24 @@
|
|
|
363
445
|
producer:
|
|
364
446
|
name: Blogtrottr Ltd
|
|
365
447
|
url: https://blogtrottr.com/
|
|
366
|
-
-
|
|
448
|
+
-
|
|
449
|
+
user_agent: BoardReader Favicon Fetcher /1.0 info@boardreader.com
|
|
450
|
+
bot:
|
|
451
|
+
name: BoardReader
|
|
452
|
+
category: Search bot
|
|
453
|
+
url: https://boardreader.com/
|
|
454
|
+
producer:
|
|
455
|
+
name: Effyis Inc
|
|
456
|
+
url: https://boardreader.com/
|
|
457
|
+
-
|
|
458
|
+
user_agent: BoardReader Blog Indexer(http://boardreader.com)
|
|
459
|
+
bot:
|
|
460
|
+
name: BoardReader Blog Indexer
|
|
461
|
+
category: Crawler
|
|
462
|
+
producer:
|
|
463
|
+
name: BoardReader
|
|
464
|
+
url: https://boardreader.com/
|
|
465
|
+
-
|
|
367
466
|
user_agent: Mozilla/5.0 (compatible; BountiiBot/1.1; +http://bountii.com/contact.php)
|
|
368
467
|
bot:
|
|
369
468
|
name: Bountii Bot
|
|
@@ -372,7 +471,16 @@
|
|
|
372
471
|
producer:
|
|
373
472
|
name: Bountii Inc.
|
|
374
473
|
url: http://bountii.com
|
|
375
|
-
-
|
|
474
|
+
-
|
|
475
|
+
user_agent: Mozilla/5.0 (Macintosh; Intel Mac OS X 10.10; rv:41.0) Gecko/20100101 Firefox/55.0 BrandVerity/1.0 (http://www.brandverity.com/why-is-brandverity-visiting-me)
|
|
476
|
+
bot:
|
|
477
|
+
name: BrandVerity
|
|
478
|
+
category: Crawler
|
|
479
|
+
url: https://www.brandverity.com/why-is-brandverity-visiting-me
|
|
480
|
+
producer:
|
|
481
|
+
name: BrandVerity, Inc.
|
|
482
|
+
url: https://www.brandverity.com/
|
|
483
|
+
-
|
|
376
484
|
user_agent: Browsershots
|
|
377
485
|
bot:
|
|
378
486
|
name: Browsershots
|
|
@@ -381,7 +489,16 @@
|
|
|
381
489
|
producer:
|
|
382
490
|
name: Browsershots.org
|
|
383
491
|
url: http://browsershots.org
|
|
384
|
-
-
|
|
492
|
+
-
|
|
493
|
+
user_agent: Buck/2.2; (+https://app.hypefactors.com/media-monitoring/about.html)
|
|
494
|
+
bot:
|
|
495
|
+
name: Buck
|
|
496
|
+
category: Search bot
|
|
497
|
+
url: https://hypefactors.com/
|
|
498
|
+
producer:
|
|
499
|
+
name: Hypefactors A/S
|
|
500
|
+
url: https://hypefactors.com/
|
|
501
|
+
-
|
|
385
502
|
user_agent: Mozilla/5.0 (compatible; Butterfly/1.0; +http://labs.topsy.com/butterfly/) Gecko/2009032608 Firefox/3.0.8
|
|
386
503
|
bot:
|
|
387
504
|
name: Butterfly Robot
|
|
@@ -390,7 +507,7 @@
|
|
|
390
507
|
producer:
|
|
391
508
|
name: Topsy Labs
|
|
392
509
|
url: http://labs.topsy.com
|
|
393
|
-
-
|
|
510
|
+
-
|
|
394
511
|
user_agent: Mozilla/5.0 (Macintosh; Butterfly/1.0; +http://labs.topsy.com/butterfly/) Gecko/2009032608 Firefox/3.0.8
|
|
395
512
|
bot:
|
|
396
513
|
name: Butterfly Robot
|
|
@@ -399,7 +516,25 @@
|
|
|
399
516
|
producer:
|
|
400
517
|
name: Topsy Labs
|
|
401
518
|
url: http://labs.topsy.com
|
|
402
|
-
-
|
|
519
|
+
-
|
|
520
|
+
user_agent: Mozilla/5.0 (Linux; Android 6.0; Nexus 5 Build/MRA58N) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/51.0.5668.1446 Mobile Safari/537.36; Bytespider;bytespider@bytedance.com
|
|
521
|
+
bot:
|
|
522
|
+
name: Bytespider
|
|
523
|
+
category: Search bot
|
|
524
|
+
url: https://bytedance.com/
|
|
525
|
+
producer:
|
|
526
|
+
name: ByteDance Ltd.
|
|
527
|
+
url: https://bytedance.com/
|
|
528
|
+
-
|
|
529
|
+
user_agent: CATExplorador/1.0beta (sistemes at domini dot cat; http://domini.cat/catexplorador.html)
|
|
530
|
+
bot:
|
|
531
|
+
name: CATExplorador
|
|
532
|
+
category: Search bot
|
|
533
|
+
url: https://fundacio.cat/ca/domini/
|
|
534
|
+
producer:
|
|
535
|
+
name: Fundació puntCAT
|
|
536
|
+
url: https://fundacio.cat/ca/domini/
|
|
537
|
+
-
|
|
403
538
|
user_agent: Mozilla/5.0 (compatible; CareerBot/1.1; +http://www.career-x.de/bot.html)
|
|
404
539
|
bot:
|
|
405
540
|
name: CareerBot
|
|
@@ -408,7 +543,7 @@
|
|
|
408
543
|
producer:
|
|
409
544
|
name: career-x GmbH
|
|
410
545
|
url: http://www.career-x.de
|
|
411
|
-
-
|
|
546
|
+
-
|
|
412
547
|
user_agent: Castro 2, Episode Duration Lookup
|
|
413
548
|
bot:
|
|
414
549
|
name: Castro 2
|
|
@@ -417,7 +552,7 @@
|
|
|
417
552
|
producer:
|
|
418
553
|
name: Supertop
|
|
419
554
|
url: http://supertop.co
|
|
420
|
-
-
|
|
555
|
+
-
|
|
421
556
|
user_agent: Cliqzbot/0.1 (+http://cliqz.com/company/cliqzbot)
|
|
422
557
|
bot:
|
|
423
558
|
name: Cliqzbot
|
|
@@ -426,7 +561,7 @@
|
|
|
426
561
|
producer:
|
|
427
562
|
name: 10betterpages GmbH
|
|
428
563
|
url: http://cliqz.com
|
|
429
|
-
-
|
|
564
|
+
-
|
|
430
565
|
user_agent: Mozilla/5.0 (compatible; Cloudflare-AMP/1.0; +https://amp.cloudflare.com/doc/fetcher.html) AppleWebKit/534.34
|
|
431
566
|
bot:
|
|
432
567
|
name: CloudFlare AMP Fetcher
|
|
@@ -435,7 +570,7 @@
|
|
|
435
570
|
producer:
|
|
436
571
|
name: CloudFlare
|
|
437
572
|
url: http://www.cloudflare.com
|
|
438
|
-
-
|
|
573
|
+
-
|
|
439
574
|
user_agent: Mozilla/5.0 (compatible; CloudFlare-AlwaysOnline/1.0; +http://www.cloudflare.com/always-online) AppleWebKit/534.34
|
|
440
575
|
bot:
|
|
441
576
|
name: CloudFlare Always Online
|
|
@@ -444,7 +579,7 @@
|
|
|
444
579
|
producer:
|
|
445
580
|
name: CloudFlare
|
|
446
581
|
url: http://www.cloudflare.com
|
|
447
|
-
-
|
|
582
|
+
-
|
|
448
583
|
user_agent: collectd/5.5.1
|
|
449
584
|
bot:
|
|
450
585
|
name: Collectd
|
|
@@ -453,7 +588,7 @@
|
|
|
453
588
|
producer:
|
|
454
589
|
name: Collectd
|
|
455
590
|
url: https://collectd.org/
|
|
456
|
-
-
|
|
591
|
+
-
|
|
457
592
|
user_agent: CommaFeed/1.0 (http://www.commafeed.com)
|
|
458
593
|
bot:
|
|
459
594
|
name: CommaFeed
|
|
@@ -462,16 +597,79 @@
|
|
|
462
597
|
producer:
|
|
463
598
|
name: ""
|
|
464
599
|
url: ""
|
|
465
|
-
-
|
|
600
|
+
-
|
|
601
|
+
user_agent: coccocbot-web/1.0 (+http://help.coccoc.com/searchengine)
|
|
602
|
+
bot:
|
|
603
|
+
name: Cốc Cốc Bot
|
|
604
|
+
url: https://help.coccoc.com/en/search-engine/coccoc-robots
|
|
605
|
+
category: Search bot
|
|
606
|
+
producer:
|
|
607
|
+
name: Cốc Cốc
|
|
608
|
+
url: https://coccoc.com/
|
|
609
|
+
-
|
|
466
610
|
user_agent: Mozilla/5.0 (compatible; coccoc/1.0; +http://help.coccoc.com/)
|
|
467
611
|
bot:
|
|
468
612
|
name: Cốc Cốc Bot
|
|
469
|
-
url:
|
|
613
|
+
url: https://help.coccoc.com/en/search-engine/coccoc-robots
|
|
614
|
+
category: Search bot
|
|
615
|
+
producer:
|
|
616
|
+
name: Cốc Cốc
|
|
617
|
+
url: https://coccoc.com/
|
|
618
|
+
-
|
|
619
|
+
user_agent: Mozilla/5.0 (compatible; coccocbot-ads/1.0; +http://help.coccoc.com/searchengine)
|
|
620
|
+
bot:
|
|
621
|
+
name: Cốc Cốc Bot
|
|
622
|
+
url: https://help.coccoc.com/en/search-engine/coccoc-robots
|
|
623
|
+
category: Search bot
|
|
624
|
+
producer:
|
|
625
|
+
name: Cốc Cốc
|
|
626
|
+
url: https://coccoc.com/
|
|
627
|
+
-
|
|
628
|
+
user_agent: Mozilla/5.0 (compatible; coccocbot-fast/1.0; +http://help.coccoc.com/searchengine)
|
|
629
|
+
bot:
|
|
630
|
+
name: Cốc Cốc Bot
|
|
631
|
+
url: https://help.coccoc.com/en/search-engine/coccoc-robots
|
|
632
|
+
category: Search bot
|
|
633
|
+
producer:
|
|
634
|
+
name: Cốc Cốc
|
|
635
|
+
url: https://coccoc.com/
|
|
636
|
+
-
|
|
637
|
+
user_agent: Mozilla/5.0 (compatible; coccocbot-image/1.0; +http://help.coccoc.com/searchengine)
|
|
638
|
+
bot:
|
|
639
|
+
name: Cốc Cốc Bot
|
|
640
|
+
url: https://help.coccoc.com/en/search-engine/coccoc-robots
|
|
641
|
+
category: Search bot
|
|
642
|
+
producer:
|
|
643
|
+
name: Cốc Cốc
|
|
644
|
+
url: https://coccoc.com/
|
|
645
|
+
-
|
|
646
|
+
user_agent: Mozilla/5.0 (compatible; coccocbot-shopping/1.0; +http://help.coccoc.com/searchengine)
|
|
647
|
+
bot:
|
|
648
|
+
name: Cốc Cốc Bot
|
|
649
|
+
url: https://help.coccoc.com/en/search-engine/coccoc-robots
|
|
650
|
+
category: Search bot
|
|
651
|
+
producer:
|
|
652
|
+
name: Cốc Cốc
|
|
653
|
+
url: https://coccoc.com/
|
|
654
|
+
-
|
|
655
|
+
user_agent: Mozilla/5.0 (compatible; coccocbot-web/1.0; +http://help.coccoc.com/searchengine)
|
|
656
|
+
bot:
|
|
657
|
+
name: Cốc Cốc Bot
|
|
658
|
+
url: https://help.coccoc.com/en/search-engine/coccoc-robots
|
|
659
|
+
category: Search bot
|
|
660
|
+
producer:
|
|
661
|
+
name: Cốc Cốc
|
|
662
|
+
url: https://coccoc.com/
|
|
663
|
+
-
|
|
664
|
+
user_agent: Mozilla/5.0 (compatible; coccocbot/1.0; +http://help.coccoc.com/searchengine)
|
|
665
|
+
bot:
|
|
666
|
+
name: Cốc Cốc Bot
|
|
667
|
+
url: https://help.coccoc.com/en/search-engine/coccoc-robots
|
|
470
668
|
category: Search bot
|
|
471
669
|
producer:
|
|
472
670
|
name: Cốc Cốc
|
|
473
|
-
url:
|
|
474
|
-
-
|
|
671
|
+
url: https://coccoc.com/
|
|
672
|
+
-
|
|
475
673
|
user_agent: Datadog Agent/5.10.1
|
|
476
674
|
bot:
|
|
477
675
|
name: Datadog Agent
|
|
@@ -480,7 +678,16 @@
|
|
|
480
678
|
producer:
|
|
481
679
|
name: Datadog
|
|
482
680
|
url: https://www.datadoghq.com/
|
|
483
|
-
-
|
|
681
|
+
-
|
|
682
|
+
user_agent: Mozilla/5.0 (X11; Datanyze; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/65.0.3325.181 Safari/537.36
|
|
683
|
+
bot:
|
|
684
|
+
name: Datanyze
|
|
685
|
+
url: ""
|
|
686
|
+
category: Crawler
|
|
687
|
+
producer:
|
|
688
|
+
name: Datanyze
|
|
689
|
+
url: https://www.datanyze.com
|
|
690
|
+
-
|
|
484
691
|
user_agent: Mozilla/5.0 (compatible; Dataprovider/6.92; +https://www.dataprovider.com/)
|
|
485
692
|
bot:
|
|
486
693
|
name: Dataprovider
|
|
@@ -489,7 +696,7 @@
|
|
|
489
696
|
producer:
|
|
490
697
|
name: Dataprovider B.V.
|
|
491
698
|
url: https://www.dataprovider.com/
|
|
492
|
-
-
|
|
699
|
+
-
|
|
493
700
|
user_agent: Mozilla/5.0 (compatible; MSIE or Firefox mutant; not on Windows server;) Daumoa/4.0;
|
|
494
701
|
bot:
|
|
495
702
|
name: Daum
|
|
@@ -498,7 +705,7 @@
|
|
|
498
705
|
producer:
|
|
499
706
|
name: Daum Communications Corp.
|
|
500
707
|
url: http://www.kakaocorp.com/main
|
|
501
|
-
-
|
|
708
|
+
-
|
|
502
709
|
user_agent: Mozilla/5.0 (compatible; MSIE or Firefox mutant;) Daum 4.1
|
|
503
710
|
bot:
|
|
504
711
|
name: Daum
|
|
@@ -507,7 +714,7 @@
|
|
|
507
714
|
producer:
|
|
508
715
|
name: Daum Communications Corp.
|
|
509
716
|
url: http://www.kakaocorp.com/main
|
|
510
|
-
-
|
|
717
|
+
-
|
|
511
718
|
user_agent: Mozilla/5.0 (compatible; Dazoobot/0.1; +http://dazoo.fr)
|
|
512
719
|
bot:
|
|
513
720
|
name: Dazoobot
|
|
@@ -516,7 +723,7 @@
|
|
|
516
723
|
producer:
|
|
517
724
|
name: DAZOO.FR
|
|
518
725
|
url: http://dazoo.fr
|
|
519
|
-
-
|
|
726
|
+
-
|
|
520
727
|
user_agent: Mozilla/5.0 (compatible; discobot/1.0; +http://discoveryengine.com/discobot.html)
|
|
521
728
|
bot:
|
|
522
729
|
name: Discobot
|
|
@@ -525,7 +732,7 @@
|
|
|
525
732
|
producer:
|
|
526
733
|
name: Discovery Engine
|
|
527
734
|
url: http://discoveryengine.com
|
|
528
|
-
-
|
|
735
|
+
-
|
|
529
736
|
user_agent: 'Domain Re-Animator Bot (http://domainreanimator.com) - support@domainreanimator.com'
|
|
530
737
|
bot:
|
|
531
738
|
name: Domain Re-Animator Bot
|
|
@@ -534,7 +741,7 @@
|
|
|
534
741
|
producer:
|
|
535
742
|
name: Domain Re-Animator, LLC
|
|
536
743
|
url: http://domainreanimator.com
|
|
537
|
-
-
|
|
744
|
+
-
|
|
538
745
|
user_agent: support@domainreanimator.com
|
|
539
746
|
bot:
|
|
540
747
|
name: Domain Re-Animator Bot
|
|
@@ -543,7 +750,13 @@
|
|
|
543
750
|
producer:
|
|
544
751
|
name: Domain Re-Animator, LLC
|
|
545
752
|
url: http://domainreanimator.com
|
|
546
|
-
-
|
|
753
|
+
-
|
|
754
|
+
user_agent: Mozilla/5.0 (compatible; Domains Project/1.1.0; +https://domainsproject.org)
|
|
755
|
+
bot:
|
|
756
|
+
name: Domains Project
|
|
757
|
+
category: Crawler
|
|
758
|
+
url: https://domainsproject.org
|
|
759
|
+
-
|
|
547
760
|
user_agent: dotbot
|
|
548
761
|
bot:
|
|
549
762
|
name: DotBot
|
|
@@ -552,7 +765,16 @@
|
|
|
552
765
|
producer:
|
|
553
766
|
name: SEOmoz, Inc.
|
|
554
767
|
url: http://moz.com/
|
|
555
|
-
-
|
|
768
|
+
-
|
|
769
|
+
user_agent: DuckDuckBot/1.0; (+http://duckduckgo.com/duckduckbot.html)
|
|
770
|
+
bot:
|
|
771
|
+
name: DuckDuckGo Bot
|
|
772
|
+
category: Search bot
|
|
773
|
+
url: https://duckduckgo.com/duckduckbot
|
|
774
|
+
producer:
|
|
775
|
+
name: DuckDuckGo
|
|
776
|
+
url: https://duckduckgo.com/
|
|
777
|
+
-
|
|
556
778
|
user_agent: Mozilla/5.0 (compatible; DuckDuckGo-Favicons-Bot/1.0; +http://duckduckgo.com)
|
|
557
779
|
bot:
|
|
558
780
|
name: DuckDuckGo Bot
|
|
@@ -561,7 +783,7 @@
|
|
|
561
783
|
producer:
|
|
562
784
|
name: DuckDuckGo
|
|
563
785
|
url: https://duckduckgo.com/
|
|
564
|
-
-
|
|
786
|
+
-
|
|
565
787
|
user_agent: EMail Exractor
|
|
566
788
|
bot:
|
|
567
789
|
name: EMail Exractor
|
|
@@ -570,7 +792,7 @@
|
|
|
570
792
|
producer:
|
|
571
793
|
name: ""
|
|
572
794
|
url: ""
|
|
573
|
-
-
|
|
795
|
+
-
|
|
574
796
|
user_agent: Mozilla/5.0 (compatible; EasouSpider; +http://www.easou.com/search/spider.html)
|
|
575
797
|
bot:
|
|
576
798
|
name: Easou Spider
|
|
@@ -579,7 +801,7 @@
|
|
|
579
801
|
producer:
|
|
580
802
|
name: easou ICP
|
|
581
803
|
url: http://www.easou.com
|
|
582
|
-
-
|
|
804
|
+
-
|
|
583
805
|
user_agent: Mozilla/5.0 (iPhone; U; CPU iPhone OS 3_0 like Mac OS X; en-us; EasouSpider; +http://www.easou.com/search/spider.html)
|
|
584
806
|
bot:
|
|
585
807
|
name: Easou Spider
|
|
@@ -588,7 +810,16 @@
|
|
|
588
810
|
producer:
|
|
589
811
|
name: easou ICP
|
|
590
812
|
url: http://www.easou.com
|
|
591
|
-
-
|
|
813
|
+
-
|
|
814
|
+
user_agent: Mozilla/5.0 (compatible; Embedly/0.2; +http://support.embed.ly/)
|
|
815
|
+
bot:
|
|
816
|
+
name: Embedly
|
|
817
|
+
category: Crawler
|
|
818
|
+
url: https://support.embed.ly/hc/en-us
|
|
819
|
+
producer:
|
|
820
|
+
name: A Medium, Corp.
|
|
821
|
+
url: https://medium.com/
|
|
822
|
+
-
|
|
592
823
|
user_agent: Mozilla/5.0 (compatible; Exabot/3.0 (BiggerBetter); +http://www.exabot.com/go/robot)
|
|
593
824
|
bot:
|
|
594
825
|
name: ExaBot
|
|
@@ -597,7 +828,7 @@
|
|
|
597
828
|
producer:
|
|
598
829
|
name: Dassault Systèmes
|
|
599
830
|
url: http://www.3ds.com
|
|
600
|
-
-
|
|
831
|
+
-
|
|
601
832
|
user_agent: Mozilla/5.0 (compatible; Exabot/3.0; +http://www.exabot.com/go/robot)
|
|
602
833
|
bot:
|
|
603
834
|
name: ExaBot
|
|
@@ -606,7 +837,7 @@
|
|
|
606
837
|
producer:
|
|
607
838
|
name: Dassault Systèmes
|
|
608
839
|
url: http://www.3ds.com
|
|
609
|
-
-
|
|
840
|
+
-
|
|
610
841
|
user_agent: Mozilla/5.0 (compatible; Konqueror/3.5; Linux) KHTML/3.5.5 (like Gecko) (Exabot-Thumbnails)
|
|
611
842
|
bot:
|
|
612
843
|
name: ExaBot
|
|
@@ -615,7 +846,7 @@
|
|
|
615
846
|
producer:
|
|
616
847
|
name: Dassault Systèmes
|
|
617
848
|
url: http://www.3ds.com
|
|
618
|
-
-
|
|
849
|
+
-
|
|
619
850
|
user_agent: ExactSeek Crawler (nutch 1.4)/Nutch-1.4 (ExactSeek Crawler; http://www.exactseek.com)
|
|
620
851
|
bot:
|
|
621
852
|
name: ExactSeek Crawler
|
|
@@ -624,7 +855,7 @@
|
|
|
624
855
|
producer:
|
|
625
856
|
name: Jayde Online, Inc.
|
|
626
857
|
url: http://www.jaydeonlineinc.com
|
|
627
|
-
-
|
|
858
|
+
-
|
|
628
859
|
user_agent: Mozilla/5.0 (compatible; Ezooms/1.0; help@moz.com)
|
|
629
860
|
bot:
|
|
630
861
|
name: Ezooms
|
|
@@ -633,7 +864,7 @@
|
|
|
633
864
|
producer:
|
|
634
865
|
name: SEOmoz, Inc.
|
|
635
866
|
url: http://moz.com/
|
|
636
|
-
-
|
|
867
|
+
-
|
|
637
868
|
user_agent: facebookexternalhit/1.1 (+http://www.facebook.com/externalhit_uatext.php)
|
|
638
869
|
bot:
|
|
639
870
|
name: Facebook External Hit
|
|
@@ -642,7 +873,16 @@
|
|
|
642
873
|
producer:
|
|
643
874
|
name: Facebook
|
|
644
875
|
url: http://www.facebook.com
|
|
645
|
-
-
|
|
876
|
+
-
|
|
877
|
+
user_agent: facebookexternalua
|
|
878
|
+
bot:
|
|
879
|
+
name: Facebook External Hit
|
|
880
|
+
category: Social Media Agent
|
|
881
|
+
url: https://www.facebook.com/externalhit_uatext.php
|
|
882
|
+
producer:
|
|
883
|
+
name: Facebook
|
|
884
|
+
url: http://www.facebook.com
|
|
885
|
+
-
|
|
646
886
|
user_agent: facebookplatform/1.0 (+http://developers.facebook.com)
|
|
647
887
|
bot:
|
|
648
888
|
name: Facebook External Hit
|
|
@@ -651,7 +891,7 @@
|
|
|
651
891
|
producer:
|
|
652
892
|
name: Facebook
|
|
653
893
|
url: http://www.facebook.com
|
|
654
|
-
-
|
|
894
|
+
-
|
|
655
895
|
user_agent: Feed Wrangler/1.0 (3 subscribers; feed-id=248559; http://feedwrangler.net; Allow like Gecko)
|
|
656
896
|
bot:
|
|
657
897
|
name: Feed Wrangler
|
|
@@ -660,7 +900,7 @@
|
|
|
660
900
|
producer:
|
|
661
901
|
name: 'David Smith & Developing Perspective, LLC'
|
|
662
902
|
url: https://david-smith.org
|
|
663
|
-
-
|
|
903
|
+
-
|
|
664
904
|
user_agent: FeedBurner/1.0 (http://www.FeedBurner.com)
|
|
665
905
|
bot:
|
|
666
906
|
name: FeedBurner
|
|
@@ -669,7 +909,7 @@
|
|
|
669
909
|
producer:
|
|
670
910
|
name: ""
|
|
671
911
|
url: ""
|
|
672
|
-
-
|
|
912
|
+
-
|
|
673
913
|
user_agent: 'Feedbin - 9 subscribers'
|
|
674
914
|
bot:
|
|
675
915
|
name: Feedbin
|
|
@@ -678,7 +918,7 @@
|
|
|
678
918
|
producer:
|
|
679
919
|
name: ""
|
|
680
920
|
url: ""
|
|
681
|
-
-
|
|
921
|
+
-
|
|
682
922
|
user_agent: Feedly/1.0 (+http://www.feedly.com/fetcher.html; like FeedFetcher-Google)
|
|
683
923
|
bot:
|
|
684
924
|
name: Feedly
|
|
@@ -687,7 +927,7 @@
|
|
|
687
927
|
producer:
|
|
688
928
|
name: ""
|
|
689
929
|
url: ""
|
|
690
|
-
-
|
|
930
|
+
-
|
|
691
931
|
user_agent: FeedlyApp/1.0 (http://www.feedly.com)
|
|
692
932
|
bot:
|
|
693
933
|
name: Feedly
|
|
@@ -696,7 +936,7 @@
|
|
|
696
936
|
producer:
|
|
697
937
|
name: ""
|
|
698
938
|
url: ""
|
|
699
|
-
-
|
|
939
|
+
-
|
|
700
940
|
user_agent: FeedlyBot/1.0 (http://feedly.com)
|
|
701
941
|
bot:
|
|
702
942
|
name: Feedly
|
|
@@ -705,7 +945,7 @@
|
|
|
705
945
|
producer:
|
|
706
946
|
name: ""
|
|
707
947
|
url: ""
|
|
708
|
-
-
|
|
948
|
+
-
|
|
709
949
|
user_agent: MetaFeedly/1.0 (http://www.feedly.com)
|
|
710
950
|
bot:
|
|
711
951
|
name: Feedly
|
|
@@ -714,7 +954,7 @@
|
|
|
714
954
|
producer:
|
|
715
955
|
name: ""
|
|
716
956
|
url: ""
|
|
717
|
-
-
|
|
957
|
+
-
|
|
718
958
|
user_agent: Feedspot http://www.feedspot.com
|
|
719
959
|
bot:
|
|
720
960
|
name: Feedspot
|
|
@@ -723,7 +963,7 @@
|
|
|
723
963
|
producer:
|
|
724
964
|
name: ""
|
|
725
965
|
url: ""
|
|
726
|
-
-
|
|
966
|
+
-
|
|
727
967
|
user_agent: Fever/1.38 (Feed Parser; http://feedafever.com; Allow like Gecko)
|
|
728
968
|
bot:
|
|
729
969
|
name: Fever
|
|
@@ -732,13 +972,13 @@
|
|
|
732
972
|
producer:
|
|
733
973
|
name: ""
|
|
734
974
|
url: ""
|
|
735
|
-
-
|
|
975
|
+
-
|
|
736
976
|
user_agent: Mozilla/5.0 (compatible; Findxbot/1.0; +http://www.findxbot.com)
|
|
737
977
|
bot:
|
|
738
978
|
name: Findxbot
|
|
739
979
|
category: Crawler
|
|
740
980
|
url: http://www.findxbot.com
|
|
741
|
-
-
|
|
981
|
+
-
|
|
742
982
|
user_agent: Mozilla/5.0 (compatible; FlipboardProxy/1.2; +http://flipboard.com/browserproxy)
|
|
743
983
|
bot:
|
|
744
984
|
name: Flipboard
|
|
@@ -747,7 +987,7 @@
|
|
|
747
987
|
producer:
|
|
748
988
|
name: Flipboard
|
|
749
989
|
url: http://flipboard.com/
|
|
750
|
-
-
|
|
990
|
+
-
|
|
751
991
|
user_agent: Mozilla/5.0 (compatible; FlipboardRSS/1.2; +http://flipboard.com/browserproxy)
|
|
752
992
|
bot:
|
|
753
993
|
name: Flipboard
|
|
@@ -756,39 +996,76 @@
|
|
|
756
996
|
producer:
|
|
757
997
|
name: Flipboard
|
|
758
998
|
url: http://flipboard.com/
|
|
759
|
-
-
|
|
999
|
+
-
|
|
1000
|
+
user_agent: freshrss/0.8-dev (Linux; http://freshrss.org) SimplePie/1.4-dev-FreshRSS
|
|
1001
|
+
bot:
|
|
1002
|
+
name: FreshRSS
|
|
1003
|
+
category: Feed Fetcher
|
|
1004
|
+
url: https://freshrss.org/
|
|
1005
|
+
-
|
|
1006
|
+
user_agent: FreshRSS/1.12.0 (Linux; https://freshrss.org)
|
|
1007
|
+
bot:
|
|
1008
|
+
name: FreshRSS
|
|
1009
|
+
category: Feed Fetcher
|
|
1010
|
+
url: https://freshrss.org/
|
|
1011
|
+
-
|
|
1012
|
+
user_agent: Mozilla/5.0 (X11; Linux x86_64; GTmetrix https://gtmetrix.com/) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/75.0.3770.100 Safari/537.36
|
|
1013
|
+
bot:
|
|
1014
|
+
name: GTmetrix
|
|
1015
|
+
category: Crawler
|
|
1016
|
+
url: https://gtmetrix.com/
|
|
1017
|
+
producer:
|
|
1018
|
+
name: Carbon60 Operating Co. Ltd.
|
|
1019
|
+
url: https://www.carbon60.com/
|
|
1020
|
+
-
|
|
1021
|
+
user_agent: 7Siters/1.07 (+https://7ooo.ru/siters/)
|
|
1022
|
+
bot:
|
|
1023
|
+
name: Generic Bot
|
|
1024
|
+
-
|
|
760
1025
|
user_agent: COMODO SSL Checker
|
|
761
1026
|
bot:
|
|
762
1027
|
name: Generic Bot
|
|
763
|
-
-
|
|
1028
|
+
-
|
|
764
1029
|
user_agent: help@dataminr.com
|
|
765
1030
|
bot:
|
|
766
1031
|
name: Generic Bot
|
|
767
|
-
-
|
|
1032
|
+
-
|
|
768
1033
|
user_agent: 'HybridBot (hybrid.ru/about. If our bot caused problems please contact us. Contact email: m.lyashkov@targetix.net)'
|
|
769
1034
|
bot:
|
|
770
1035
|
name: Generic Bot
|
|
771
|
-
-
|
|
1036
|
+
-
|
|
1037
|
+
user_agent: 'Mozilla/5.0 (compatible; +centuryb.o.t9[at]gmail.com)'
|
|
1038
|
+
bot:
|
|
1039
|
+
name: Generic Bot
|
|
1040
|
+
-
|
|
772
1041
|
user_agent: Mozilla/5.0 (compatible; +http://tweetedtimes.com)
|
|
773
1042
|
bot:
|
|
774
1043
|
name: Generic Bot
|
|
775
|
-
-
|
|
1044
|
+
-
|
|
776
1045
|
user_agent: Mozilla/5.0 (compatible; Shareaholicbot/2.0; +http://www.shareaholic.com/bot)
|
|
777
1046
|
bot:
|
|
778
1047
|
name: Generic Bot
|
|
779
|
-
-
|
|
1048
|
+
-
|
|
780
1049
|
user_agent: Mozilla/5.0 (compatible; TrendsmapResolver/0.1)
|
|
781
1050
|
bot:
|
|
782
1051
|
name: Generic Bot
|
|
783
|
-
-
|
|
1052
|
+
-
|
|
784
1053
|
user_agent: niki-bot
|
|
785
1054
|
bot:
|
|
786
1055
|
name: Generic Bot
|
|
787
|
-
-
|
|
1056
|
+
-
|
|
788
1057
|
user_agent: PHPCrawl
|
|
789
1058
|
bot:
|
|
790
1059
|
name: Generic Bot
|
|
791
|
-
-
|
|
1060
|
+
-
|
|
1061
|
+
user_agent: robots
|
|
1062
|
+
bot:
|
|
1063
|
+
name: Generic Bot
|
|
1064
|
+
-
|
|
1065
|
+
user_agent: SeopultContentAnalyzer/1.0
|
|
1066
|
+
bot:
|
|
1067
|
+
name: Generic Bot
|
|
1068
|
+
-
|
|
792
1069
|
user_agent: Mozilla/5.0 (compatible; Genieo/1.0 http://www.genieo.com/webfilter.html)
|
|
793
1070
|
bot:
|
|
794
1071
|
name: Genieo Web filter
|
|
@@ -797,7 +1074,7 @@
|
|
|
797
1074
|
producer:
|
|
798
1075
|
name: Genieo
|
|
799
1076
|
url: http://www.genieo.com
|
|
800
|
-
-
|
|
1077
|
+
-
|
|
801
1078
|
user_agent: GigablastOpenSource/1.0
|
|
802
1079
|
bot:
|
|
803
1080
|
name: Gigablast
|
|
@@ -806,7 +1083,7 @@
|
|
|
806
1083
|
producer:
|
|
807
1084
|
name: Matt Wells
|
|
808
1085
|
url: http://www.gigablast.com/faq.html
|
|
809
|
-
-
|
|
1086
|
+
-
|
|
810
1087
|
user_agent: Mozilla/5.0 (compatible; Gluten Free Crawler/1.0; +http://glutenfreepleasure.com/)
|
|
811
1088
|
bot:
|
|
812
1089
|
name: Gluten Free Crawler
|
|
@@ -815,7 +1092,7 @@
|
|
|
815
1092
|
producer:
|
|
816
1093
|
name: ""
|
|
817
1094
|
url: ""
|
|
818
|
-
-
|
|
1095
|
+
-
|
|
819
1096
|
user_agent: Mozilla/5.0 (Windows NT 5.1; rv:11.0) Gecko Firefox/11.0 (via ggpht.com GoogleImageProxy)
|
|
820
1097
|
bot:
|
|
821
1098
|
name: Gmail Image Proxy
|
|
@@ -824,7 +1101,7 @@
|
|
|
824
1101
|
producer:
|
|
825
1102
|
name: Google Inc.
|
|
826
1103
|
url: http://www.google.com
|
|
827
|
-
-
|
|
1104
|
+
-
|
|
828
1105
|
user_agent: DoCoMo/2.0 P900i(c100;TB;W24H11) (compatible; ichiro/mobile goo; +http://search.goo.ne.jp/option/use/sub4/sub4-1/)
|
|
829
1106
|
bot:
|
|
830
1107
|
name: Goo
|
|
@@ -833,7 +1110,12 @@
|
|
|
833
1110
|
producer:
|
|
834
1111
|
name: NTT Resonant
|
|
835
1112
|
url: http://goo.ne.jp
|
|
836
|
-
-
|
|
1113
|
+
-
|
|
1114
|
+
user_agent: Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/49.0.2623.75 Safari/537.36 Google Favicon
|
|
1115
|
+
bot:
|
|
1116
|
+
name: Google Favicon
|
|
1117
|
+
category: Crawler
|
|
1118
|
+
-
|
|
837
1119
|
user_agent: Mozilla/5.0 (iPhone; U; CPU iPhone OS 4_0_1 like Mac OS X; en-us) AppleWebKit/537.4 (KHTML, like Gecko; Google Page Speed Insights) Version/4.0.5 Mobile/8A306 Safari/6531.22.7
|
|
838
1120
|
bot:
|
|
839
1121
|
name: Google PageSpeed Insights
|
|
@@ -842,7 +1124,7 @@
|
|
|
842
1124
|
producer:
|
|
843
1125
|
name: Google Inc.
|
|
844
1126
|
url: http://www.google.com
|
|
845
|
-
-
|
|
1127
|
+
-
|
|
846
1128
|
user_agent: Mozilla/5.0 (Windows NT 5.1) AppleWebKit/535.1 (KHTML, like Gecko) Chrome/14.0.835.202 Safari/535.1 google_partner_monitoring FWSzVTDDBz14547302713138T
|
|
847
1129
|
bot:
|
|
848
1130
|
name: Google Partner Monitoring
|
|
@@ -851,7 +1133,7 @@
|
|
|
851
1133
|
producer:
|
|
852
1134
|
name: Google Inc.
|
|
853
1135
|
url: http://www.google.com
|
|
854
|
-
-
|
|
1136
|
+
-
|
|
855
1137
|
user_agent: Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko; Google Search Console) Chrome/41.0.2272.118 Safari/537.36
|
|
856
1138
|
bot:
|
|
857
1139
|
name: Google Search Console
|
|
@@ -860,7 +1142,7 @@
|
|
|
860
1142
|
producer:
|
|
861
1143
|
name: Google Inc.
|
|
862
1144
|
url: http://www.google.com
|
|
863
|
-
-
|
|
1145
|
+
-
|
|
864
1146
|
user_agent: Google-Structured-Data-Testing-Tool +https://search.google.com/structured-data/testing-tool)
|
|
865
1147
|
bot:
|
|
866
1148
|
name: Google Structured Data Testing Tool
|
|
@@ -869,7 +1151,7 @@
|
|
|
869
1151
|
producer:
|
|
870
1152
|
name: Google Inc.
|
|
871
1153
|
url: http://www.google.com
|
|
872
|
-
-
|
|
1154
|
+
-
|
|
873
1155
|
user_agent: AdsBot-Google (+http://www.google.com/adsbot.html)
|
|
874
1156
|
bot:
|
|
875
1157
|
name: Googlebot
|
|
@@ -878,7 +1160,7 @@
|
|
|
878
1160
|
producer:
|
|
879
1161
|
name: Google Inc.
|
|
880
1162
|
url: http://www.google.com
|
|
881
|
-
-
|
|
1163
|
+
-
|
|
882
1164
|
user_agent: AdsBot-Google-Mobile (+http://www.google.com/mobile/adsbot.html) Mozilla (iPhone; U; CPU iPhone OS 3 0 like Mac OS X) AppleWebKit (KHTML, like Gecko) Mobile Safari
|
|
883
1165
|
bot:
|
|
884
1166
|
name: Googlebot
|
|
@@ -887,7 +1169,7 @@
|
|
|
887
1169
|
producer:
|
|
888
1170
|
name: Google Inc.
|
|
889
1171
|
url: http://www.google.com
|
|
890
|
-
-
|
|
1172
|
+
-
|
|
891
1173
|
user_agent: APIs-Google (+https://developers.google.com/webmasters/APIs-Google.html)
|
|
892
1174
|
bot:
|
|
893
1175
|
name: Googlebot
|
|
@@ -896,7 +1178,7 @@
|
|
|
896
1178
|
producer:
|
|
897
1179
|
name: Google Inc.
|
|
898
1180
|
url: http://www.google.com
|
|
899
|
-
-
|
|
1181
|
+
-
|
|
900
1182
|
user_agent: DoCoMo/2.0 N905i(c100;TB;W24H16) (compatible; Googlebot-Mobile/2.1; +http://www.google.com/bot.html)
|
|
901
1183
|
bot:
|
|
902
1184
|
name: Googlebot
|
|
@@ -905,7 +1187,7 @@
|
|
|
905
1187
|
producer:
|
|
906
1188
|
name: Google Inc.
|
|
907
1189
|
url: http://www.google.com
|
|
908
|
-
-
|
|
1190
|
+
-
|
|
909
1191
|
user_agent: Feedfetcher-Google; (+http://www.google.com/feedfetcher.html; 19 subscribers; feed-id=13965549748850348809)
|
|
910
1192
|
bot:
|
|
911
1193
|
name: Googlebot
|
|
@@ -914,7 +1196,7 @@
|
|
|
914
1196
|
producer:
|
|
915
1197
|
name: Google Inc.
|
|
916
1198
|
url: http://www.google.com
|
|
917
|
-
-
|
|
1199
|
+
-
|
|
918
1200
|
user_agent: Feedfetcher-Google; (+http://www.google.com/feedfetcher.html; 2 subscribers; feed-id=17860707833818568603)
|
|
919
1201
|
bot:
|
|
920
1202
|
name: Googlebot
|
|
@@ -923,7 +1205,7 @@
|
|
|
923
1205
|
producer:
|
|
924
1206
|
name: Google Inc.
|
|
925
1207
|
url: http://www.google.com
|
|
926
|
-
-
|
|
1208
|
+
-
|
|
927
1209
|
user_agent: Feedfetcher-Google; (+http://www.google.com/feedfetcher.html; 375 subscribers; feed-id=15381863289700640853)
|
|
928
1210
|
bot:
|
|
929
1211
|
name: Googlebot
|
|
@@ -932,7 +1214,7 @@
|
|
|
932
1214
|
producer:
|
|
933
1215
|
name: Google Inc.
|
|
934
1216
|
url: http://www.google.com
|
|
935
|
-
-
|
|
1217
|
+
-
|
|
936
1218
|
user_agent: Google-AdWords-Express
|
|
937
1219
|
bot:
|
|
938
1220
|
name: Googlebot
|
|
@@ -941,7 +1223,7 @@
|
|
|
941
1223
|
producer:
|
|
942
1224
|
name: Google Inc.
|
|
943
1225
|
url: http://www.google.com
|
|
944
|
-
-
|
|
1226
|
+
-
|
|
945
1227
|
user_agent: Google-Adwords-Instant (+http://www.google.com/adsbot.html)
|
|
946
1228
|
bot:
|
|
947
1229
|
name: Googlebot
|
|
@@ -950,7 +1232,7 @@
|
|
|
950
1232
|
producer:
|
|
951
1233
|
name: Google Inc.
|
|
952
1234
|
url: http://www.google.com
|
|
953
|
-
-
|
|
1235
|
+
-
|
|
954
1236
|
user_agent: Google-speakr
|
|
955
1237
|
bot:
|
|
956
1238
|
name: Googlebot
|
|
@@ -959,7 +1241,7 @@
|
|
|
959
1241
|
producer:
|
|
960
1242
|
name: Google Inc.
|
|
961
1243
|
url: http://www.google.com
|
|
962
|
-
-
|
|
1244
|
+
-
|
|
963
1245
|
user_agent: Googlebot (gocrawl v0.4)
|
|
964
1246
|
bot:
|
|
965
1247
|
name: Googlebot
|
|
@@ -968,7 +1250,7 @@
|
|
|
968
1250
|
producer:
|
|
969
1251
|
name: Google Inc.
|
|
970
1252
|
url: http://www.google.com
|
|
971
|
-
-
|
|
1253
|
+
-
|
|
972
1254
|
user_agent: Googlebot-Image/1.0
|
|
973
1255
|
bot:
|
|
974
1256
|
name: Googlebot
|
|
@@ -977,7 +1259,7 @@
|
|
|
977
1259
|
producer:
|
|
978
1260
|
name: Google Inc.
|
|
979
1261
|
url: http://www.google.com
|
|
980
|
-
-
|
|
1262
|
+
-
|
|
981
1263
|
user_agent: Googlebot-News (2.3.3, ruby 1.9.3 (2013-11-22))
|
|
982
1264
|
bot:
|
|
983
1265
|
name: Googlebot
|
|
@@ -986,7 +1268,7 @@
|
|
|
986
1268
|
producer:
|
|
987
1269
|
name: Google Inc.
|
|
988
1270
|
url: http://www.google.com
|
|
989
|
-
-
|
|
1271
|
+
-
|
|
990
1272
|
user_agent: Googlebot-Video/1.0
|
|
991
1273
|
bot:
|
|
992
1274
|
name: Googlebot
|
|
@@ -995,7 +1277,7 @@
|
|
|
995
1277
|
producer:
|
|
996
1278
|
name: Google Inc.
|
|
997
1279
|
url: http://www.google.com
|
|
998
|
-
-
|
|
1280
|
+
-
|
|
999
1281
|
user_agent: Googlebot/2.1 (http://www.googlebot.com/bot.html)
|
|
1000
1282
|
bot:
|
|
1001
1283
|
name: Googlebot
|
|
@@ -1004,7 +1286,7 @@
|
|
|
1004
1286
|
producer:
|
|
1005
1287
|
name: Google Inc.
|
|
1006
1288
|
url: http://www.google.com
|
|
1007
|
-
-
|
|
1289
|
+
-
|
|
1008
1290
|
user_agent: Googlebot/Nutch-1.7
|
|
1009
1291
|
bot:
|
|
1010
1292
|
name: Googlebot
|
|
@@ -1013,7 +1295,7 @@
|
|
|
1013
1295
|
producer:
|
|
1014
1296
|
name: Google Inc.
|
|
1015
1297
|
url: http://www.google.com
|
|
1016
|
-
-
|
|
1298
|
+
-
|
|
1017
1299
|
user_agent: GoogleProducer; (+http://goo.gl/7y4SX)
|
|
1018
1300
|
bot:
|
|
1019
1301
|
name: Googlebot
|
|
@@ -1022,7 +1304,7 @@
|
|
|
1022
1304
|
producer:
|
|
1023
1305
|
name: Google Inc.
|
|
1024
1306
|
url: http://www.google.com
|
|
1025
|
-
-
|
|
1307
|
+
-
|
|
1026
1308
|
user_agent: Mediapartners-Google
|
|
1027
1309
|
bot:
|
|
1028
1310
|
name: Googlebot
|
|
@@ -1031,7 +1313,7 @@
|
|
|
1031
1313
|
producer:
|
|
1032
1314
|
name: Google Inc.
|
|
1033
1315
|
url: http://www.google.com
|
|
1034
|
-
-
|
|
1316
|
+
-
|
|
1035
1317
|
user_agent: Mozilla/5.0 (compatible) Feedfetcher-Google;(+http://www.google.com/feedfetcher.html)
|
|
1036
1318
|
bot:
|
|
1037
1319
|
name: Googlebot
|
|
@@ -1040,7 +1322,16 @@
|
|
|
1040
1322
|
producer:
|
|
1041
1323
|
name: Google Inc.
|
|
1042
1324
|
url: http://www.google.com
|
|
1043
|
-
-
|
|
1325
|
+
-
|
|
1326
|
+
user_agent: Mozilla/5.0 (compatible; Google-Youtube-Links)
|
|
1327
|
+
bot:
|
|
1328
|
+
name: Googlebot
|
|
1329
|
+
category: Search bot
|
|
1330
|
+
url: http://www.google.com/bot.html
|
|
1331
|
+
producer:
|
|
1332
|
+
name: Google Inc.
|
|
1333
|
+
url: http://www.google.com
|
|
1334
|
+
-
|
|
1044
1335
|
user_agent: Mozilla/5.0 (compatible; Googlebot/2.1; +http://www.google.com/bot.html)
|
|
1045
1336
|
bot:
|
|
1046
1337
|
name: Googlebot
|
|
@@ -1049,7 +1340,7 @@
|
|
|
1049
1340
|
producer:
|
|
1050
1341
|
name: Google Inc.
|
|
1051
1342
|
url: http://www.google.com
|
|
1052
|
-
-
|
|
1343
|
+
-
|
|
1053
1344
|
user_agent: Mozilla/5.0 (en-US) AppleWebKit/537.36 (KHTML, like Gecko; Google-Assess) Chrome/34.0.1847.116 Safari/537.36
|
|
1054
1345
|
bot:
|
|
1055
1346
|
name: Googlebot
|
|
@@ -1058,7 +1349,7 @@
|
|
|
1058
1349
|
producer:
|
|
1059
1350
|
name: Google Inc.
|
|
1060
1351
|
url: http://www.google.com
|
|
1061
|
-
-
|
|
1352
|
+
-
|
|
1062
1353
|
user_agent: Mozilla/5.0 (en-us) AppleWebKit/537.36(KHTML, like Gecko; Google-Adwords-DisplayAds-WebRender;) Chrome/41.0.2272.118Safari/537.36
|
|
1063
1354
|
bot:
|
|
1064
1355
|
name: Googlebot
|
|
@@ -1067,7 +1358,7 @@
|
|
|
1067
1358
|
producer:
|
|
1068
1359
|
name: Google Inc.
|
|
1069
1360
|
url: http://www.google.com
|
|
1070
|
-
-
|
|
1361
|
+
-
|
|
1071
1362
|
user_agent: Mozilla/5.0 (iPhone; CPU iPhone OS 6_0 like Mac OS X) AppleWebKit/536.26 (KHTML, like Gecko) Version/6.0 Mobile/10A5376e Safari/8536.25 (compatible; Googlebot-Mobile/2.1; +http://www.google.com/bot.html)
|
|
1072
1363
|
bot:
|
|
1073
1364
|
name: Googlebot
|
|
@@ -1076,7 +1367,7 @@
|
|
|
1076
1367
|
producer:
|
|
1077
1368
|
name: Google Inc.
|
|
1078
1369
|
url: http://www.google.com
|
|
1079
|
-
-
|
|
1370
|
+
-
|
|
1080
1371
|
user_agent: Mozilla/5.0 (Linux; Android 4.0.4; Galaxy Nexus Build/IMM76B) AppleWebKit/537.36 (KHTML, like Gecko; Google-Publisher-Plugin) Chrome/27.0.1453 Mobile Safari/537.36
|
|
1081
1372
|
bot:
|
|
1082
1373
|
name: Googlebot
|
|
@@ -1085,7 +1376,16 @@
|
|
|
1085
1376
|
producer:
|
|
1086
1377
|
name: Google Inc.
|
|
1087
1378
|
url: http://www.google.com
|
|
1088
|
-
-
|
|
1379
|
+
-
|
|
1380
|
+
user_agent: Mozilla/5.0 (Linux; Android 6.0.1; Nexus 5X Build/MMB29P) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/41.0.2272.96 Mobile Safari/537.36 (compatible; Google-AMPHTML)
|
|
1381
|
+
bot:
|
|
1382
|
+
name: Googlebot
|
|
1383
|
+
category: Search bot
|
|
1384
|
+
url: http://www.google.com/bot.html
|
|
1385
|
+
producer:
|
|
1386
|
+
name: Google Inc.
|
|
1387
|
+
url: http://www.google.com
|
|
1388
|
+
-
|
|
1089
1389
|
user_agent: Mozilla/5.0 (Linux; Android 6.0.1; Nexus 5X Build/MMB29P) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/41.0.2272.96 Mobile Safari/537.36 (compatible; Google-Read-Aloud; +https://support.google.com/webmasters/answer/1061943)
|
|
1090
1390
|
bot:
|
|
1091
1391
|
name: Googlebot
|
|
@@ -1094,7 +1394,16 @@
|
|
|
1094
1394
|
producer:
|
|
1095
1395
|
name: Google Inc.
|
|
1096
1396
|
url: http://www.google.com
|
|
1097
|
-
-
|
|
1397
|
+
-
|
|
1398
|
+
user_agent: Mozilla/5.0 (Linux; Android 8.0; Pixel 2 Build/OPD3.170816.012; DuplexWeb-Google/1.0) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/74.0.3729.131 Mobile Safari/537.36
|
|
1399
|
+
bot:
|
|
1400
|
+
name: Googlebot
|
|
1401
|
+
category: Search bot
|
|
1402
|
+
url: http://www.google.com/bot.html
|
|
1403
|
+
producer:
|
|
1404
|
+
name: Google Inc.
|
|
1405
|
+
url: http://www.google.com
|
|
1406
|
+
-
|
|
1098
1407
|
user_agent: Mozilla/5.0 (Windows NT 6.1; rv:6.0) Gecko/20110814 Firefox/6.0 Google (+https://developers.google.com/+/web/snippet/)
|
|
1099
1408
|
bot:
|
|
1100
1409
|
name: Googlebot
|
|
@@ -1103,7 +1412,16 @@
|
|
|
1103
1412
|
producer:
|
|
1104
1413
|
name: Google Inc.
|
|
1105
1414
|
url: http://www.google.com
|
|
1106
|
-
-
|
|
1415
|
+
-
|
|
1416
|
+
user_agent: Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/27.0.1453 Safari/537.36 (compatible; Google-HotelAdsVerifier/2.0)
|
|
1417
|
+
bot:
|
|
1418
|
+
name: Googlebot
|
|
1419
|
+
category: Search bot
|
|
1420
|
+
url: http://www.google.com/bot.html
|
|
1421
|
+
producer:
|
|
1422
|
+
name: Google Inc.
|
|
1423
|
+
url: http://www.google.com
|
|
1424
|
+
-
|
|
1107
1425
|
user_agent: Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko; Google Web Preview) Chrome/27.0.1453 Safari/537.36
|
|
1108
1426
|
bot:
|
|
1109
1427
|
name: Googlebot
|
|
@@ -1112,7 +1430,7 @@
|
|
|
1112
1430
|
producer:
|
|
1113
1431
|
name: Google Inc.
|
|
1114
1432
|
url: http://www.google.com
|
|
1115
|
-
-
|
|
1433
|
+
-
|
|
1116
1434
|
user_agent: Mozilla/5.0 AppleWebKit/537.36 (KHTML, like Gecko) Chrome/41.0.2272.118 Safari/537.36 (compatible; Google-Shopping-Quality +http://www.google.com/merchants/tos/extend/DE/tos.html)
|
|
1117
1435
|
bot:
|
|
1118
1436
|
name: Googlebot
|
|
@@ -1121,7 +1439,7 @@
|
|
|
1121
1439
|
producer:
|
|
1122
1440
|
name: Google Inc.
|
|
1123
1441
|
url: http://www.google.com
|
|
1124
|
-
-
|
|
1442
|
+
-
|
|
1125
1443
|
user_agent: Mozilla/5.0 AppleWebKit/537.36 (KHTML, like Gecko; compatible; Googlebot/2.1; +http://www.google.com/bot.html) Safari/537.36
|
|
1126
1444
|
bot:
|
|
1127
1445
|
name: Googlebot
|
|
@@ -1130,7 +1448,7 @@
|
|
|
1130
1448
|
producer:
|
|
1131
1449
|
name: Google Inc.
|
|
1132
1450
|
url: http://www.google.com
|
|
1133
|
-
-
|
|
1451
|
+
-
|
|
1134
1452
|
user_agent: SAMSUNG-SGH-E250/1.0 Profile/MIDP-2.0 Configuration/CLDC-1.1 UP.Browser/6.2.3.3.c.1.101 (GUI) MMP/2.0 (compatible; Googlebot-Mobile/2.1; +http://www.google.com/bot.html)
|
|
1135
1453
|
bot:
|
|
1136
1454
|
name: Googlebot
|
|
@@ -1139,7 +1457,13 @@
|
|
|
1139
1457
|
producer:
|
|
1140
1458
|
name: Google Inc.
|
|
1141
1459
|
url: http://www.google.com
|
|
1142
|
-
-
|
|
1460
|
+
-
|
|
1461
|
+
user_agent: Grammarly/1.0 (http://www.grammarly.com)
|
|
1462
|
+
bot:
|
|
1463
|
+
name: Grammarly
|
|
1464
|
+
category: Service bot
|
|
1465
|
+
url: https://www.grammarly.com
|
|
1466
|
+
-
|
|
1143
1467
|
user_agent: Mozilla/5.0 (compatible; GrapeshotCrawler/2.0; +https://www.grapeshot.com/crawler/)
|
|
1144
1468
|
bot:
|
|
1145
1469
|
name: Grapeshot
|
|
@@ -1148,7 +1472,7 @@
|
|
|
1148
1472
|
producer:
|
|
1149
1473
|
name: Grapeshot
|
|
1150
1474
|
url: https://www.grapeshot.com
|
|
1151
|
-
-
|
|
1475
|
+
-
|
|
1152
1476
|
user_agent: Mozilla/5.0 (iPhone; CPU iPhone OS 8_3 like Mac OS X) AppleWebKit/600.1.4 (KHTML, like Gecko) Version/8.0 Mobile/12F70 Safari/600.1. 4 (compatible; GrapeshotCrawler/2.0; +https://www.grapeshot.com/crawler/)
|
|
1153
1477
|
bot:
|
|
1154
1478
|
name: Grapeshot
|
|
@@ -1157,7 +1481,7 @@
|
|
|
1157
1481
|
producer:
|
|
1158
1482
|
name: Grapeshot
|
|
1159
1483
|
url: https://www.grapeshot.com
|
|
1160
|
-
-
|
|
1484
|
+
-
|
|
1161
1485
|
user_agent: HTTPMon/1.0b (http://www.httpmon.com)
|
|
1162
1486
|
bot:
|
|
1163
1487
|
name: HTTPMon
|
|
@@ -1166,7 +1490,7 @@
|
|
|
1166
1490
|
producer:
|
|
1167
1491
|
name: towards GmbH
|
|
1168
1492
|
url: http://www.towards.ch/
|
|
1169
|
-
-
|
|
1493
|
+
-
|
|
1170
1494
|
user_agent: 'flieder - neofonie heritrix/1.14.3 (+http://spider.neofonie.de)'
|
|
1171
1495
|
bot:
|
|
1172
1496
|
name: Heritrix
|
|
@@ -1174,8 +1498,8 @@
|
|
|
1174
1498
|
url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
|
|
1175
1499
|
producer:
|
|
1176
1500
|
name: The Internet Archive
|
|
1177
|
-
url:
|
|
1178
|
-
-
|
|
1501
|
+
url: https://archive.org
|
|
1502
|
+
-
|
|
1179
1503
|
user_agent: Mozilla/5.0 (compatible; heritrix/1.14.4 +http://webarhive.nlc.gov.cn)
|
|
1180
1504
|
bot:
|
|
1181
1505
|
name: Heritrix
|
|
@@ -1183,8 +1507,8 @@
|
|
|
1183
1507
|
url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
|
|
1184
1508
|
producer:
|
|
1185
1509
|
name: The Internet Archive
|
|
1186
|
-
url:
|
|
1187
|
-
-
|
|
1510
|
+
url: https://archive.org
|
|
1511
|
+
-
|
|
1188
1512
|
user_agent: Mozilla/5.0 (compatible; heritrix/1.14.4 +http://www.dla-marbach.de)
|
|
1189
1513
|
bot:
|
|
1190
1514
|
name: Heritrix
|
|
@@ -1192,8 +1516,8 @@
|
|
|
1192
1516
|
url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
|
|
1193
1517
|
producer:
|
|
1194
1518
|
name: The Internet Archive
|
|
1195
|
-
url:
|
|
1196
|
-
-
|
|
1519
|
+
url: https://archive.org
|
|
1520
|
+
-
|
|
1197
1521
|
user_agent: mozilla/5.0 (compatible; heritrix/1.3.0 http://archive.crawler.org)
|
|
1198
1522
|
bot:
|
|
1199
1523
|
name: Heritrix
|
|
@@ -1201,8 +1525,8 @@
|
|
|
1201
1525
|
url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
|
|
1202
1526
|
producer:
|
|
1203
1527
|
name: The Internet Archive
|
|
1204
|
-
url:
|
|
1205
|
-
-
|
|
1528
|
+
url: https://archive.org
|
|
1529
|
+
-
|
|
1206
1530
|
user_agent: Mozilla/5.0 (compatible; heritrix/3.1.1 +http://www.baidu.com)
|
|
1207
1531
|
bot:
|
|
1208
1532
|
name: Heritrix
|
|
@@ -1210,8 +1534,8 @@
|
|
|
1210
1534
|
url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
|
|
1211
1535
|
producer:
|
|
1212
1536
|
name: The Internet Archive
|
|
1213
|
-
url:
|
|
1214
|
-
-
|
|
1537
|
+
url: https://archive.org
|
|
1538
|
+
-
|
|
1215
1539
|
user_agent: Mozilla/5.0 (compatible; heritrix/3.1.1 +http://www.run4dom.com)
|
|
1216
1540
|
bot:
|
|
1217
1541
|
name: Heritrix
|
|
@@ -1219,8 +1543,8 @@
|
|
|
1219
1543
|
url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
|
|
1220
1544
|
producer:
|
|
1221
1545
|
name: The Internet Archive
|
|
1222
|
-
url:
|
|
1223
|
-
-
|
|
1546
|
+
url: https://archive.org
|
|
1547
|
+
-
|
|
1224
1548
|
user_agent: Mozilla/5.0 (compatible; heritrix/3.1.2-SNAPSHOT-20130207.001528 +http://webarchiv.cz/kontakty/)
|
|
1225
1549
|
bot:
|
|
1226
1550
|
name: Heritrix
|
|
@@ -1228,8 +1552,8 @@
|
|
|
1228
1552
|
url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
|
|
1229
1553
|
producer:
|
|
1230
1554
|
name: The Internet Archive
|
|
1231
|
-
url:
|
|
1232
|
-
-
|
|
1555
|
+
url: https://archive.org
|
|
1556
|
+
-
|
|
1233
1557
|
user_agent: Mozilla/5.0 (compatible; worio bot heritrix/1.10.0 +http://worio.com)
|
|
1234
1558
|
bot:
|
|
1235
1559
|
name: Heritrix
|
|
@@ -1237,8 +1561,8 @@
|
|
|
1237
1561
|
url: https://webarchive.jira.com/wiki/display/Heritrix/Heritrix
|
|
1238
1562
|
producer:
|
|
1239
1563
|
name: The Internet Archive
|
|
1240
|
-
url:
|
|
1241
|
-
-
|
|
1564
|
+
url: https://archive.org
|
|
1565
|
+
-
|
|
1242
1566
|
user_agent: Heurekabot-Feed/1.0 (+https://sluzby.heureka.cz/napoveda/heurekabot/)
|
|
1243
1567
|
bot:
|
|
1244
1568
|
name: Heureka Feed
|
|
@@ -1247,16 +1571,16 @@
|
|
|
1247
1571
|
producer:
|
|
1248
1572
|
name: Heureka.cz, a.s.
|
|
1249
1573
|
url: https://www.heureka.cz/
|
|
1250
|
-
-
|
|
1574
|
+
-
|
|
1251
1575
|
user_agent: HubPages V0.2.2 (http://hubpages.com/help/crawlingpolicy)
|
|
1252
1576
|
bot:
|
|
1253
1577
|
name: HubPages
|
|
1254
1578
|
category: Crawler
|
|
1255
|
-
url:
|
|
1579
|
+
url: https://hubpages.com/help/crawlingpolicy
|
|
1256
1580
|
producer:
|
|
1257
|
-
name: HubPages
|
|
1258
|
-
url:
|
|
1259
|
-
-
|
|
1581
|
+
name: HubPages, Inc.
|
|
1582
|
+
url: https://discover.hubpages.com/
|
|
1583
|
+
-
|
|
1260
1584
|
user_agent: HubSpot Website Grader (web-crawlers@hubspot.com)
|
|
1261
1585
|
bot:
|
|
1262
1586
|
name: HubSpot
|
|
@@ -1264,7 +1588,7 @@
|
|
|
1264
1588
|
producer:
|
|
1265
1589
|
name: HubSpot Inc.
|
|
1266
1590
|
url: https://www.hubspot.com
|
|
1267
|
-
-
|
|
1591
|
+
-
|
|
1268
1592
|
user_agent: ICC-Crawler/2.0 (Mozilla-compatible; ; http://www.nict.go.jp/en/univ-com/plan/crawl.html)
|
|
1269
1593
|
bot:
|
|
1270
1594
|
name: ICC-Crawler
|
|
@@ -1273,7 +1597,16 @@
|
|
|
1273
1597
|
producer:
|
|
1274
1598
|
name: ""
|
|
1275
1599
|
url: ""
|
|
1276
|
-
-
|
|
1600
|
+
-
|
|
1601
|
+
user_agent: IDG/IT (http://spaziodati.eu/)
|
|
1602
|
+
bot:
|
|
1603
|
+
name: IDG/IT
|
|
1604
|
+
category: Search bot
|
|
1605
|
+
url: https://spaziodati.eu/
|
|
1606
|
+
producer:
|
|
1607
|
+
name: SpazioDati S.r.l.
|
|
1608
|
+
url: https://spaziodati.eu/
|
|
1609
|
+
-
|
|
1277
1610
|
user_agent: iisbot/1.0 (+http://www.iis.net/iisbot.html)
|
|
1278
1611
|
bot:
|
|
1279
1612
|
name: IIS Site Analysis
|
|
@@ -1282,7 +1615,7 @@
|
|
|
1282
1615
|
producer:
|
|
1283
1616
|
name: Microsoft Corporation
|
|
1284
1617
|
url: http://www.microsoft.com
|
|
1285
|
-
-
|
|
1618
|
+
-
|
|
1286
1619
|
user_agent: IP-Guide.com Crawler/1.0 (https://ip-guide.com)
|
|
1287
1620
|
bot:
|
|
1288
1621
|
name: IP-Guide Crawler
|
|
@@ -1291,15 +1624,24 @@
|
|
|
1291
1624
|
producer:
|
|
1292
1625
|
name: ""
|
|
1293
1626
|
url: https://ip-guide.com
|
|
1294
|
-
-
|
|
1627
|
+
-
|
|
1295
1628
|
user_agent: Mozilla/5.0 (compatible; ips-agent)
|
|
1296
1629
|
bot:
|
|
1297
1630
|
name: IPS Agent
|
|
1298
|
-
category:
|
|
1631
|
+
category: Crawler
|
|
1299
1632
|
producer:
|
|
1300
1633
|
name: VeriSign, Inc
|
|
1301
1634
|
url: http://www.verisign.com/
|
|
1302
|
-
-
|
|
1635
|
+
-
|
|
1636
|
+
user_agent: Kaspersky Lab CFR link resolver cfradmins@kaspersky.com
|
|
1637
|
+
bot:
|
|
1638
|
+
name: Kaspersky
|
|
1639
|
+
category: Security Checker
|
|
1640
|
+
url: https://www.kaspersky.com/
|
|
1641
|
+
producer:
|
|
1642
|
+
name: AO Kaspersky Lab
|
|
1643
|
+
url: https://www.kaspersky.com/
|
|
1644
|
+
-
|
|
1303
1645
|
user_agent: kouio.com RSS reader
|
|
1304
1646
|
bot:
|
|
1305
1647
|
name: Kouio
|
|
@@ -1308,7 +1650,7 @@
|
|
|
1308
1650
|
producer:
|
|
1309
1651
|
name: ""
|
|
1310
1652
|
url: ""
|
|
1311
|
-
-
|
|
1653
|
+
-
|
|
1312
1654
|
user_agent: 'kouio.com RSS reader - 6 subscribers'
|
|
1313
1655
|
bot:
|
|
1314
1656
|
name: Kouio
|
|
@@ -1317,7 +1659,16 @@
|
|
|
1317
1659
|
producer:
|
|
1318
1660
|
name: ""
|
|
1319
1661
|
url: ""
|
|
1320
|
-
-
|
|
1662
|
+
-
|
|
1663
|
+
user_agent: LCC (+http://corpora.informatik.uni-leipzig.de/crawler_faq.html)
|
|
1664
|
+
bot:
|
|
1665
|
+
name: LCC
|
|
1666
|
+
category: Search bot
|
|
1667
|
+
url: https://corpora.uni-leipzig.de/crawler_faq.html
|
|
1668
|
+
producer:
|
|
1669
|
+
name: Universität Leipzig
|
|
1670
|
+
url: https://www.uni-leipzig.de/
|
|
1671
|
+
-
|
|
1321
1672
|
user_agent: 'ltx71 - (http://ltx71.com/)'
|
|
1322
1673
|
bot:
|
|
1323
1674
|
name: LTX71
|
|
@@ -1325,7 +1676,7 @@
|
|
|
1325
1676
|
producer:
|
|
1326
1677
|
name: ""
|
|
1327
1678
|
url: ""
|
|
1328
|
-
-
|
|
1679
|
+
-
|
|
1329
1680
|
user_agent: larbin_2.6.3 larbin2.6.3@unspecified.mail
|
|
1330
1681
|
bot:
|
|
1331
1682
|
name: Larbin web crawler
|
|
@@ -1334,7 +1685,7 @@
|
|
|
1334
1685
|
producer:
|
|
1335
1686
|
name: ""
|
|
1336
1687
|
url: ""
|
|
1337
|
-
-
|
|
1688
|
+
-
|
|
1338
1689
|
user_agent: "Mozilla/5.0 (compatible; Let's Encrypt validation server; +https://www.letsencrypt.org)"
|
|
1339
1690
|
bot:
|
|
1340
1691
|
name: "Let's Encrypt Validation"
|
|
@@ -1343,7 +1694,7 @@
|
|
|
1343
1694
|
producer:
|
|
1344
1695
|
name: "Let's Encrypt"
|
|
1345
1696
|
url: https://letsencrypt.org
|
|
1346
|
-
-
|
|
1697
|
+
-
|
|
1347
1698
|
user_agent: Mozilla/5.0 (Linux; Android 6.0.1; Nexus 5 Build/MRA58N) AppleWebKit/537.36(KHTML, like Gecko) Chrome/61.0.3116.0 Mobile Safari/537.36 Chrome-Lighthouse
|
|
1348
1699
|
bot:
|
|
1349
1700
|
name: Lighthouse
|
|
@@ -1352,7 +1703,7 @@
|
|
|
1352
1703
|
producer:
|
|
1353
1704
|
name: Lighthouse
|
|
1354
1705
|
url: https://developers.google.com/web/tools/lighthouse
|
|
1355
|
-
-
|
|
1706
|
+
-
|
|
1356
1707
|
user_agent: linkdex.com/v2.0 and linkdex.com/v2.1
|
|
1357
1708
|
bot:
|
|
1358
1709
|
name: Linkdex Bot
|
|
@@ -1361,7 +1712,7 @@
|
|
|
1361
1712
|
producer:
|
|
1362
1713
|
name: Mojeek Ltd.
|
|
1363
1714
|
url: http://www.mojeek.com
|
|
1364
|
-
-
|
|
1715
|
+
-
|
|
1365
1716
|
user_agent: Mozilla/5.0 (compatible; linkdexbot/2.0; +http://www.linkdex.com/about/bots/)
|
|
1366
1717
|
bot:
|
|
1367
1718
|
name: Linkdex Bot
|
|
@@ -1370,7 +1721,7 @@
|
|
|
1370
1721
|
producer:
|
|
1371
1722
|
name: Mojeek Ltd.
|
|
1372
1723
|
url: http://www.mojeek.com
|
|
1373
|
-
-
|
|
1724
|
+
-
|
|
1374
1725
|
user_agent: Mozilla/5.0 (iPhone; U; CPU iPhone OS 4_1 like Mac OS X; en-us) AppleWebKit/532.9 (KHTML, like Gecko) Version/4.0.5 Mobile/8B117 Safari/6531.22.7 (compatible; linkdexbot-mobile/2.1; +http://www.linkdex.com/about/bots/)
|
|
1375
1726
|
bot:
|
|
1376
1727
|
name: Linkdex Bot
|
|
@@ -1379,7 +1730,7 @@
|
|
|
1379
1730
|
producer:
|
|
1380
1731
|
name: Mojeek Ltd.
|
|
1381
1732
|
url: http://www.mojeek.com
|
|
1382
|
-
-
|
|
1733
|
+
-
|
|
1383
1734
|
user_agent: LinkedInBot/1.0 (compatible; Mozilla/5.0; Jakarta Commons-HttpClient/3.1 +http://www.linkedin.com)
|
|
1384
1735
|
bot:
|
|
1385
1736
|
name: LinkedIn Bot
|
|
@@ -1388,7 +1739,7 @@
|
|
|
1388
1739
|
producer:
|
|
1389
1740
|
name: LinkedIn
|
|
1390
1741
|
url: http://www.linkedin.com
|
|
1391
|
-
-
|
|
1742
|
+
-
|
|
1392
1743
|
user_agent: Mozilla/5.0 (compatible; MJ12bot/v1.4.4; http://www.majestic12.co.uk/bot.php?+)
|
|
1393
1744
|
bot:
|
|
1394
1745
|
name: MJ12 Bot
|
|
@@ -1397,7 +1748,7 @@
|
|
|
1397
1748
|
producer:
|
|
1398
1749
|
name: Majestic-12
|
|
1399
1750
|
url: http://majestic12.co.uk
|
|
1400
|
-
-
|
|
1751
|
+
-
|
|
1401
1752
|
user_agent: magpie-crawler/1.1 (U; Linux amd64; en-GB; +http://www.brandwatch.net)
|
|
1402
1753
|
bot:
|
|
1403
1754
|
name: Magpie-Crawler
|
|
@@ -1406,7 +1757,7 @@
|
|
|
1406
1757
|
producer:
|
|
1407
1758
|
name: Brandwatch
|
|
1408
1759
|
url: http://www.brandwatch.com
|
|
1409
|
-
-
|
|
1760
|
+
-
|
|
1410
1761
|
user_agent: MagpieRSS/0.72 (+http://magpierss.sf.net)
|
|
1411
1762
|
bot:
|
|
1412
1763
|
name: MagpieRSS
|
|
@@ -1415,7 +1766,7 @@
|
|
|
1415
1766
|
producer:
|
|
1416
1767
|
name: ""
|
|
1417
1768
|
url: ""
|
|
1418
|
-
-
|
|
1769
|
+
-
|
|
1419
1770
|
user_agent: Mozilla/5.0 (compatible; Linux x86_64; Mail.RU_Bot/2.0; +http://go.mail.ru/help/robots)
|
|
1420
1771
|
bot:
|
|
1421
1772
|
name: Mail.Ru Bot
|
|
@@ -1424,7 +1775,7 @@
|
|
|
1424
1775
|
producer:
|
|
1425
1776
|
name: Mail.Ru Group
|
|
1426
1777
|
url: http://corp.mail.ru
|
|
1427
|
-
-
|
|
1778
|
+
-
|
|
1428
1779
|
user_agent: Mozilla/5.0 (compatible; Linux x86_64; Mail.RU_Bot/Fast/2.0; +http://go.mail.ru/help/robots)
|
|
1429
1780
|
bot:
|
|
1430
1781
|
name: Mail.Ru Bot
|
|
@@ -1433,17 +1784,17 @@
|
|
|
1433
1784
|
producer:
|
|
1434
1785
|
name: Mail.Ru Group
|
|
1435
1786
|
url: http://corp.mail.ru
|
|
1436
|
-
-
|
|
1787
|
+
-
|
|
1437
1788
|
user_agent: http.rb/2.2.2 (Mastodon/1.6.1; +https://mathtod.online/)
|
|
1438
1789
|
bot:
|
|
1439
1790
|
name: Mastodon Bot
|
|
1440
1791
|
category: Social Media Agent
|
|
1441
|
-
-
|
|
1792
|
+
-
|
|
1442
1793
|
user_agent: http.rb/3.2.0 (Mastodon/2.4.3; +https://uwu.social/)
|
|
1443
1794
|
bot:
|
|
1444
1795
|
name: Mastodon Bot
|
|
1445
1796
|
category: Social Media Agent
|
|
1446
|
-
-
|
|
1797
|
+
-
|
|
1447
1798
|
user_agent: Mozilla/5.0 (compatible; meanpathbot/1.0; +http://www.meanpath.com/meanpathbot.html)
|
|
1448
1799
|
bot:
|
|
1449
1800
|
name: Meanpath Bot
|
|
@@ -1452,13 +1803,13 @@
|
|
|
1452
1803
|
producer:
|
|
1453
1804
|
name: Meanpath
|
|
1454
1805
|
url: http://www.meanpath.com
|
|
1455
|
-
-
|
|
1806
|
+
-
|
|
1456
1807
|
user_agent: MetaInspector/5.4.0 (+https://github.com/jaimeiniesta/metainspector)
|
|
1457
1808
|
bot:
|
|
1458
1809
|
name: MetaInspector
|
|
1459
1810
|
category: Crawler
|
|
1460
1811
|
url: https://github.com/jaimeiniesta/metainspector
|
|
1461
|
-
-
|
|
1812
|
+
-
|
|
1462
1813
|
user_agent: Mozilla/5.0 (compatible; MetaJobBot; http://www.metajob.de/crawler)
|
|
1463
1814
|
bot:
|
|
1464
1815
|
name: MetaJobBot
|
|
@@ -1467,7 +1818,7 @@
|
|
|
1467
1818
|
producer:
|
|
1468
1819
|
name: MetaJob
|
|
1469
1820
|
url: http://www.metajob.at
|
|
1470
|
-
-
|
|
1821
|
+
-
|
|
1471
1822
|
user_agent: Mozilla/5.0 (compatible; MixrankBot; crawler@mixrank.com)
|
|
1472
1823
|
bot:
|
|
1473
1824
|
name: Mixrank Bot
|
|
@@ -1476,7 +1827,7 @@
|
|
|
1476
1827
|
producer:
|
|
1477
1828
|
name: Online Media Group, Inc.
|
|
1478
1829
|
url: ""
|
|
1479
|
-
-
|
|
1830
|
+
-
|
|
1480
1831
|
user_agent: Mnogosearch-3.1.21
|
|
1481
1832
|
bot:
|
|
1482
1833
|
name: Mnogosearch
|
|
@@ -1485,7 +1836,7 @@
|
|
|
1485
1836
|
producer:
|
|
1486
1837
|
name: Lavtech.Com Corp.
|
|
1487
1838
|
url: ""
|
|
1488
|
-
-
|
|
1839
|
+
-
|
|
1489
1840
|
user_agent: Mozilla/5.0 (compatible; MojeekBot/0.6; http://www.mojeek.com/bot.html)
|
|
1490
1841
|
bot:
|
|
1491
1842
|
name: MojeekBot
|
|
@@ -1494,7 +1845,7 @@
|
|
|
1494
1845
|
producer:
|
|
1495
1846
|
name: Mojeek Ltd.
|
|
1496
1847
|
url: http://www.mojeek.com
|
|
1497
|
-
-
|
|
1848
|
+
-
|
|
1498
1849
|
user_agent: 'Mozilla/5.0 (compatible; www.monitor.us - free monitoring service; http://www.monitor.us)'
|
|
1499
1850
|
bot:
|
|
1500
1851
|
name: Monitor.Us
|
|
@@ -1503,7 +1854,7 @@
|
|
|
1503
1854
|
producer:
|
|
1504
1855
|
name: Monitor.Us
|
|
1505
1856
|
url: http://www.monitor.us
|
|
1506
|
-
-
|
|
1857
|
+
-
|
|
1507
1858
|
user_agent: munin/2.0.30-1 (libwww-perl/6.15)
|
|
1508
1859
|
bot:
|
|
1509
1860
|
name: Munin
|
|
@@ -1512,7 +1863,7 @@
|
|
|
1512
1863
|
producer:
|
|
1513
1864
|
name: Munin
|
|
1514
1865
|
url: http://munin-monitoring.org/
|
|
1515
|
-
-
|
|
1866
|
+
-
|
|
1516
1867
|
user_agent: munin/http_loadtime
|
|
1517
1868
|
bot:
|
|
1518
1869
|
name: Munin
|
|
@@ -1521,7 +1872,7 @@
|
|
|
1521
1872
|
producer:
|
|
1522
1873
|
name: Munin
|
|
1523
1874
|
url: http://munin-monitoring.org/
|
|
1524
|
-
-
|
|
1875
|
+
-
|
|
1525
1876
|
user_agent: nlcrawler/1.0 (+http://northernlight.com/)
|
|
1526
1877
|
bot:
|
|
1527
1878
|
name: NLCrawler
|
|
@@ -1530,7 +1881,7 @@
|
|
|
1530
1881
|
producer:
|
|
1531
1882
|
name: Northern Light
|
|
1532
1883
|
url: http://northernlight.com
|
|
1533
|
-
-
|
|
1884
|
+
-
|
|
1534
1885
|
user_agent: check_http/v1.5 (nagios-plugins 1.5)
|
|
1535
1886
|
bot:
|
|
1536
1887
|
name: Nagios check_http
|
|
@@ -1539,7 +1890,7 @@
|
|
|
1539
1890
|
producer:
|
|
1540
1891
|
name: Nagios Plugins Development Team
|
|
1541
1892
|
url: https://nagios.org
|
|
1542
|
-
-
|
|
1893
|
+
-
|
|
1543
1894
|
user_agent: NalezenCzBot/1.0 (http://www.nalezen.cz/about-crawler)
|
|
1544
1895
|
bot:
|
|
1545
1896
|
name: NalezenCzBot
|
|
@@ -1548,11 +1899,11 @@
|
|
|
1548
1899
|
producer:
|
|
1549
1900
|
name: Jaroslav Kuboš
|
|
1550
1901
|
url: ""
|
|
1551
|
-
-
|
|
1902
|
+
-
|
|
1552
1903
|
user_agent: NetLyzer FastProbe
|
|
1553
1904
|
bot:
|
|
1554
1905
|
name: NetLyzer FastProbe
|
|
1555
|
-
-
|
|
1906
|
+
-
|
|
1556
1907
|
user_agent: Mozilla/4.0 (compatible; Netcraft Web Server Survey)
|
|
1557
1908
|
bot:
|
|
1558
1909
|
name: Netcraft Survey Bot
|
|
@@ -1561,7 +1912,7 @@
|
|
|
1561
1912
|
producer:
|
|
1562
1913
|
name: Netcraft
|
|
1563
1914
|
url: http://www.netcraft.com
|
|
1564
|
-
-
|
|
1915
|
+
-
|
|
1565
1916
|
user_agent: Mozilla/5.0 (compatible; NetcraftSurveyAgent/1.0; +info@netcraft.com)
|
|
1566
1917
|
bot:
|
|
1567
1918
|
name: Netcraft Survey Bot
|
|
@@ -1570,7 +1921,7 @@
|
|
|
1570
1921
|
producer:
|
|
1571
1922
|
name: Netcraft
|
|
1572
1923
|
url: http://www.netcraft.com
|
|
1573
|
-
-
|
|
1924
|
+
-
|
|
1574
1925
|
user_agent: 'Netcraft SSL Server Survey - contact info@netcraft.com'
|
|
1575
1926
|
bot:
|
|
1576
1927
|
name: Netcraft Survey Bot
|
|
@@ -1579,7 +1930,7 @@
|
|
|
1579
1930
|
producer:
|
|
1580
1931
|
name: Netcraft
|
|
1581
1932
|
url: http://www.netcraft.com
|
|
1582
|
-
-
|
|
1933
|
+
-
|
|
1583
1934
|
user_agent: Netvibes (http://www.netvibes.com)
|
|
1584
1935
|
bot:
|
|
1585
1936
|
name: Netvibes
|
|
@@ -1588,7 +1939,7 @@
|
|
|
1588
1939
|
producer:
|
|
1589
1940
|
name: ""
|
|
1590
1941
|
url: ""
|
|
1591
|
-
-
|
|
1942
|
+
-
|
|
1592
1943
|
user_agent: 'Netvibes (http://www.netvibes.com/; 8 subscribers; feedID: 2244192)'
|
|
1593
1944
|
bot:
|
|
1594
1945
|
name: Netvibes
|
|
@@ -1597,7 +1948,7 @@
|
|
|
1597
1948
|
producer:
|
|
1598
1949
|
name: ""
|
|
1599
1950
|
url: ""
|
|
1600
|
-
-
|
|
1951
|
+
-
|
|
1601
1952
|
user_agent: 'NewsBlur Favicon Fetcher - 7 subscribers - http://www.newsblur.com/site/1948420/analytics-piwik (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)'
|
|
1602
1953
|
bot:
|
|
1603
1954
|
name: NewsBlur
|
|
@@ -1606,7 +1957,7 @@
|
|
|
1606
1957
|
producer:
|
|
1607
1958
|
name: ""
|
|
1608
1959
|
url: ""
|
|
1609
|
-
-
|
|
1960
|
+
-
|
|
1610
1961
|
user_agent: 'NewsBlur Feed Fetcher - 7 subscribers - http://www.newsblur.com/site/1948420/analytics-piwik (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)'
|
|
1611
1962
|
bot:
|
|
1612
1963
|
name: NewsBlur
|
|
@@ -1615,7 +1966,7 @@
|
|
|
1615
1966
|
producer:
|
|
1616
1967
|
name: ""
|
|
1617
1968
|
url: ""
|
|
1618
|
-
-
|
|
1969
|
+
-
|
|
1619
1970
|
user_agent: NewsBlur Feed Finder (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)
|
|
1620
1971
|
bot:
|
|
1621
1972
|
name: NewsBlur
|
|
@@ -1624,7 +1975,7 @@
|
|
|
1624
1975
|
producer:
|
|
1625
1976
|
name: ""
|
|
1626
1977
|
url: ""
|
|
1627
|
-
-
|
|
1978
|
+
-
|
|
1628
1979
|
user_agent: 'NewsBlur Page Fetcher - 7 subscribers - http://www.newsblur.com/site/3966817/analytics-piwik (Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_1) AppleWebKit/534.48.3 (KHTML, like Gecko) Version/5.1 Safari/534.48.3)'
|
|
1629
1980
|
bot:
|
|
1630
1981
|
name: NewsBlur
|
|
@@ -1633,7 +1984,7 @@
|
|
|
1633
1984
|
producer:
|
|
1634
1985
|
name: ""
|
|
1635
1986
|
url: ""
|
|
1636
|
-
-
|
|
1987
|
+
-
|
|
1637
1988
|
user_agent: NewsGatorOnline/2.0 (http://www.newsgator.com; 2 subscribers)
|
|
1638
1989
|
bot:
|
|
1639
1990
|
name: NewsGator
|
|
@@ -1642,7 +1993,7 @@
|
|
|
1642
1993
|
producer:
|
|
1643
1994
|
name: ""
|
|
1644
1995
|
url: ""
|
|
1645
|
-
-
|
|
1996
|
+
-
|
|
1646
1997
|
user_agent: Mozilla/5.0 (compatible; Nmap Scripting Engine; https://nmap.org/book/nse.html)
|
|
1647
1998
|
bot:
|
|
1648
1999
|
name: Nmap
|
|
@@ -1651,7 +2002,7 @@
|
|
|
1651
2002
|
producer:
|
|
1652
2003
|
name: Nmap
|
|
1653
2004
|
url: https://nmap.org/
|
|
1654
|
-
-
|
|
2005
|
+
-
|
|
1655
2006
|
user_agent: 5acd734a-1ed3-4a17-ad9d-0b09ae7bc2d2/Nutch-1.7
|
|
1656
2007
|
bot:
|
|
1657
2008
|
name: Nutch-based Bot
|
|
@@ -1659,8 +2010,8 @@
|
|
|
1659
2010
|
url: https://nutch.apache.org
|
|
1660
2011
|
producer:
|
|
1661
2012
|
name: The Apache Software Foundation
|
|
1662
|
-
url:
|
|
1663
|
-
-
|
|
2013
|
+
url: https://www.apache.org/foundation/
|
|
2014
|
+
-
|
|
1664
2015
|
user_agent: CB/Nutch-1.7
|
|
1665
2016
|
bot:
|
|
1666
2017
|
name: Nutch-based Bot
|
|
@@ -1668,8 +2019,8 @@
|
|
|
1668
2019
|
url: https://nutch.apache.org
|
|
1669
2020
|
producer:
|
|
1670
2021
|
name: The Apache Software Foundation
|
|
1671
|
-
url:
|
|
1672
|
-
-
|
|
2022
|
+
url: https://www.apache.org/foundation/
|
|
2023
|
+
-
|
|
1673
2024
|
user_agent: Mozilla/5.0 (compatible; summers;)/Nutch-1.7
|
|
1674
2025
|
bot:
|
|
1675
2026
|
name: Nutch-based Bot
|
|
@@ -1677,8 +2028,8 @@
|
|
|
1677
2028
|
url: https://nutch.apache.org
|
|
1678
2029
|
producer:
|
|
1679
2030
|
name: The Apache Software Foundation
|
|
1680
|
-
url:
|
|
1681
|
-
-
|
|
2031
|
+
url: https://www.apache.org/foundation/
|
|
2032
|
+
-
|
|
1682
2033
|
user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1; zh-CN; rv:1.9.2.8) Firefox/3.6.8/Nutch-1.7
|
|
1683
2034
|
bot:
|
|
1684
2035
|
name: Nutch-based Bot
|
|
@@ -1686,8 +2037,8 @@
|
|
|
1686
2037
|
url: https://nutch.apache.org
|
|
1687
2038
|
producer:
|
|
1688
2039
|
name: The Apache Software Foundation
|
|
1689
|
-
url:
|
|
1690
|
-
-
|
|
2040
|
+
url: https://www.apache.org/foundation/
|
|
2041
|
+
-
|
|
1691
2042
|
user_agent: My Nutch Spider/Nutch-1.6
|
|
1692
2043
|
bot:
|
|
1693
2044
|
name: Nutch-based Bot
|
|
@@ -1695,8 +2046,8 @@
|
|
|
1695
2046
|
url: https://nutch.apache.org
|
|
1696
2047
|
producer:
|
|
1697
2048
|
name: The Apache Software Foundation
|
|
1698
|
-
url:
|
|
1699
|
-
-
|
|
2049
|
+
url: https://www.apache.org/foundation/
|
|
2050
|
+
-
|
|
1700
2051
|
user_agent: MySpider/Nutch-2.2
|
|
1701
2052
|
bot:
|
|
1702
2053
|
name: Nutch-based Bot
|
|
@@ -1704,8 +2055,8 @@
|
|
|
1704
2055
|
url: https://nutch.apache.org
|
|
1705
2056
|
producer:
|
|
1706
2057
|
name: The Apache Software Foundation
|
|
1707
|
-
url:
|
|
1708
|
-
-
|
|
2058
|
+
url: https://www.apache.org/foundation/
|
|
2059
|
+
-
|
|
1709
2060
|
user_agent: Nutch12/Nutch-1.2
|
|
1710
2061
|
bot:
|
|
1711
2062
|
name: Nutch-based Bot
|
|
@@ -1713,8 +2064,8 @@
|
|
|
1713
2064
|
url: https://nutch.apache.org
|
|
1714
2065
|
producer:
|
|
1715
2066
|
name: The Apache Software Foundation
|
|
1716
|
-
url:
|
|
1717
|
-
-
|
|
2067
|
+
url: https://www.apache.org/foundation/
|
|
2068
|
+
-
|
|
1718
2069
|
user_agent: NutchSpider/Nutch-1.4
|
|
1719
2070
|
bot:
|
|
1720
2071
|
name: Nutch-based Bot
|
|
@@ -1722,8 +2073,8 @@
|
|
|
1722
2073
|
url: https://nutch.apache.org
|
|
1723
2074
|
producer:
|
|
1724
2075
|
name: The Apache Software Foundation
|
|
1725
|
-
url:
|
|
1726
|
-
-
|
|
2076
|
+
url: https://www.apache.org/foundation/
|
|
2077
|
+
-
|
|
1727
2078
|
user_agent: spider/Nutch-1.5.1 (spider; http://www.xxx.com)
|
|
1728
2079
|
bot:
|
|
1729
2080
|
name: Nutch-based Bot
|
|
@@ -1731,8 +2082,8 @@
|
|
|
1731
2082
|
url: https://nutch.apache.org
|
|
1732
2083
|
producer:
|
|
1733
2084
|
name: The Apache Software Foundation
|
|
1734
|
-
url:
|
|
1735
|
-
-
|
|
2085
|
+
url: https://www.apache.org/foundation/
|
|
2086
|
+
-
|
|
1736
2087
|
user_agent: Spider/Nutch-2.3-SNAPSHOT (Webcrawler)
|
|
1737
2088
|
bot:
|
|
1738
2089
|
name: Nutch-based Bot
|
|
@@ -1740,8 +2091,8 @@
|
|
|
1740
2091
|
url: https://nutch.apache.org
|
|
1741
2092
|
producer:
|
|
1742
2093
|
name: The Apache Software Foundation
|
|
1743
|
-
url:
|
|
1744
|
-
-
|
|
2094
|
+
url: https://www.apache.org/foundation/
|
|
2095
|
+
-
|
|
1745
2096
|
user_agent: testnutch/Nutch-1.8
|
|
1746
2097
|
bot:
|
|
1747
2098
|
name: Nutch-based Bot
|
|
@@ -1749,8 +2100,8 @@
|
|
|
1749
2100
|
url: https://nutch.apache.org
|
|
1750
2101
|
producer:
|
|
1751
2102
|
name: The Apache Software Foundation
|
|
1752
|
-
url:
|
|
1753
|
-
-
|
|
2103
|
+
url: https://www.apache.org/foundation/
|
|
2104
|
+
-
|
|
1754
2105
|
user_agent: Your Nutch Spider/Nutch-2.2.1
|
|
1755
2106
|
bot:
|
|
1756
2107
|
name: Nutch-based Bot
|
|
@@ -1758,8 +2109,8 @@
|
|
|
1758
2109
|
url: https://nutch.apache.org
|
|
1759
2110
|
producer:
|
|
1760
2111
|
name: The Apache Software Foundation
|
|
1761
|
-
url:
|
|
1762
|
-
-
|
|
2112
|
+
url: https://www.apache.org/foundation/
|
|
2113
|
+
-
|
|
1763
2114
|
user_agent: your sipder name/Nutch-1.7
|
|
1764
2115
|
bot:
|
|
1765
2116
|
name: Nutch-based Bot
|
|
@@ -1767,12 +2118,20 @@
|
|
|
1767
2118
|
url: https://nutch.apache.org
|
|
1768
2119
|
producer:
|
|
1769
2120
|
name: The Apache Software Foundation
|
|
1770
|
-
url:
|
|
1771
|
-
-
|
|
2121
|
+
url: https://www.apache.org/foundation/
|
|
2122
|
+
-
|
|
2123
|
+
user_agent: Nuzzel
|
|
2124
|
+
bot:
|
|
2125
|
+
name: Nuzzel
|
|
2126
|
+
category: Crawler
|
|
2127
|
+
producer:
|
|
2128
|
+
name: Nuzzel
|
|
2129
|
+
url: https://www.nuzzel.com/
|
|
2130
|
+
-
|
|
1772
2131
|
user_agent: Octopus 1.0.2
|
|
1773
2132
|
bot:
|
|
1774
2133
|
name: Octopus
|
|
1775
|
-
-
|
|
2134
|
+
-
|
|
1776
2135
|
user_agent: omgili/0.5 +http://omgili.com
|
|
1777
2136
|
bot:
|
|
1778
2137
|
name: Omgili bot
|
|
@@ -1781,7 +2140,7 @@
|
|
|
1781
2140
|
producer:
|
|
1782
2141
|
name: Omgili
|
|
1783
2142
|
url: http://www.omgili.com
|
|
1784
|
-
-
|
|
2143
|
+
-
|
|
1785
2144
|
user_agent: omgilibot/0.3 +http://www.omgili.com/Crawler.html
|
|
1786
2145
|
bot:
|
|
1787
2146
|
name: Omgili bot
|
|
@@ -1790,7 +2149,7 @@
|
|
|
1790
2149
|
producer:
|
|
1791
2150
|
name: Omgili
|
|
1792
2151
|
url: http://www.omgili.com
|
|
1793
|
-
-
|
|
2152
|
+
-
|
|
1794
2153
|
user_agent: Mozilla/5.0 (compatible; spbot/4.0.9; +http://OpenLinkProfiler.org/bot )
|
|
1795
2154
|
bot:
|
|
1796
2155
|
name: OpenLinkProfiler
|
|
@@ -1799,7 +2158,7 @@
|
|
|
1799
2158
|
producer:
|
|
1800
2159
|
name: Axandra GmbH
|
|
1801
2160
|
url: http://www.axandra.com
|
|
1802
|
-
-
|
|
2161
|
+
-
|
|
1803
2162
|
user_agent: OpenWebSpider v0.1.4 (http://www.openwebspider.org/)
|
|
1804
2163
|
bot:
|
|
1805
2164
|
name: OpenWebSpider
|
|
@@ -1808,7 +2167,7 @@
|
|
|
1808
2167
|
producer:
|
|
1809
2168
|
name: OpenWebSpider Lab
|
|
1810
2169
|
url: http://lab.openwebspider.org
|
|
1811
|
-
-
|
|
2170
|
+
-
|
|
1812
2171
|
user_agent: Mozilla/5.0 (compatible; OpenindexSpider; +http://www.openindex.io/en/webmasters/spider.html)
|
|
1813
2172
|
bot:
|
|
1814
2173
|
name: Openindex Spider
|
|
@@ -1817,7 +2176,7 @@
|
|
|
1817
2176
|
producer:
|
|
1818
2177
|
name: Openindex B.V.
|
|
1819
2178
|
url: http://www.openindex.io
|
|
1820
|
-
-
|
|
2179
|
+
-
|
|
1821
2180
|
user_agent: Mozilla/5.0 (compatible; OrangeBot-Collector/2.0; support.orangebot@orange.com)
|
|
1822
2181
|
bot:
|
|
1823
2182
|
name: Orange Bot
|
|
@@ -1826,7 +2185,7 @@
|
|
|
1826
2185
|
producer:
|
|
1827
2186
|
name: Orange
|
|
1828
2187
|
url: http://www.orange.fr
|
|
1829
|
-
-
|
|
2188
|
+
-
|
|
1830
2189
|
user_agent: Mozilla/5.0 (compatible; OrangeBot/2.0; support.orangebot@orange.com)
|
|
1831
2190
|
bot:
|
|
1832
2191
|
name: Orange Bot
|
|
@@ -1835,7 +2194,7 @@
|
|
|
1835
2194
|
producer:
|
|
1836
2195
|
name: Orange
|
|
1837
2196
|
url: http://www.orange.fr
|
|
1838
|
-
-
|
|
2197
|
+
-
|
|
1839
2198
|
user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1; fr; rv:1.8.1) VoilaBot BETA 1.2 (support.voilabot@orange-ftgroup.com)
|
|
1840
2199
|
bot:
|
|
1841
2200
|
name: Orange Bot
|
|
@@ -1844,7 +2203,7 @@
|
|
|
1844
2203
|
producer:
|
|
1845
2204
|
name: Orange
|
|
1846
2205
|
url: http://www.orange.fr
|
|
1847
|
-
-
|
|
2206
|
+
-
|
|
1848
2207
|
user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1;fr;rv:1.8.1) VoilaBotCollector BETA 0.1 (http://www.voila.com/)
|
|
1849
2208
|
bot:
|
|
1850
2209
|
name: Orange Bot
|
|
@@ -1853,7 +2212,7 @@
|
|
|
1853
2212
|
producer:
|
|
1854
2213
|
name: Orange
|
|
1855
2214
|
url: http://www.orange.fr
|
|
1856
|
-
-
|
|
2215
|
+
-
|
|
1857
2216
|
user_agent: Mozilla/5.0 (Java) outbrain
|
|
1858
2217
|
bot:
|
|
1859
2218
|
name: Outbrain
|
|
@@ -1862,7 +2221,7 @@
|
|
|
1862
2221
|
producer:
|
|
1863
2222
|
name: Outbrain
|
|
1864
2223
|
url: http://www.outbrain.com/
|
|
1865
|
-
-
|
|
2224
|
+
-
|
|
1866
2225
|
user_agent: Mozilla/5.0 (compatible; phpservermon/3.1.1; +http://www.phpservermonitor.org)
|
|
1867
2226
|
bot:
|
|
1868
2227
|
name: PHP Server Monitor
|
|
@@ -1871,7 +2230,16 @@
|
|
|
1871
2230
|
producer:
|
|
1872
2231
|
name: PHP Server Monitor
|
|
1873
2232
|
url: http://www.phpservermonitor.org/
|
|
1874
|
-
-
|
|
2233
|
+
-
|
|
2234
|
+
user_agent: Mozilla/5.0 (compatible; PRTG Network Monitor (www.paessler.com); Windows)
|
|
2235
|
+
bot:
|
|
2236
|
+
name: PRTG Network Monitor
|
|
2237
|
+
category: Network Monitor
|
|
2238
|
+
url: https://www.paessler.com/prtg
|
|
2239
|
+
producer:
|
|
2240
|
+
name: Paessler AG
|
|
2241
|
+
url: https://www.paessler.com
|
|
2242
|
+
-
|
|
1875
2243
|
user_agent: Mozilla/5.0 (compatible; PaperLiBot/2.1; http://support.paper.li/entries/20023257-what-is-paper-li)
|
|
1876
2244
|
bot:
|
|
1877
2245
|
name: PaperLiBot
|
|
@@ -1880,13 +2248,19 @@
|
|
|
1880
2248
|
producer:
|
|
1881
2249
|
name: Smallrivers SA
|
|
1882
2250
|
url: http://www.paper.li
|
|
1883
|
-
-
|
|
2251
|
+
-
|
|
2252
|
+
user_agent: Mozilla/5.0 (Linux; Android 7.0;) AppleWebKit/537.36 (KHTML, like Gecko) Mobile Safari/537.36 (compatible; PetalBot;+https://aspiegel.com/petalbot)
|
|
2253
|
+
bot:
|
|
2254
|
+
name: Petal Bot
|
|
2255
|
+
category: Crawler
|
|
2256
|
+
url: https://aspiegel.com/petalbot
|
|
2257
|
+
-
|
|
1884
2258
|
user_agent: phantomas/1.11.0 (PhantomJS/1.9.8; linux x64)
|
|
1885
2259
|
bot:
|
|
1886
2260
|
name: Phantomas
|
|
1887
2261
|
category: Site Monitor
|
|
1888
2262
|
url: https://github.com/macbre/phantomas
|
|
1889
|
-
-
|
|
2263
|
+
-
|
|
1890
2264
|
user_agent: psbot-page (+http://www.picsearch.com/bot.html)
|
|
1891
2265
|
bot:
|
|
1892
2266
|
name: Picsearch bot
|
|
@@ -1895,7 +2269,7 @@
|
|
|
1895
2269
|
producer:
|
|
1896
2270
|
name: Picsearch
|
|
1897
2271
|
url: http://www.picsearch.com
|
|
1898
|
-
-
|
|
2272
|
+
-
|
|
1899
2273
|
user_agent: psbot/0.1 (+http://www.picsearch.com/bot.html)
|
|
1900
2274
|
bot:
|
|
1901
2275
|
name: Picsearch bot
|
|
@@ -1904,7 +2278,7 @@
|
|
|
1904
2278
|
producer:
|
|
1905
2279
|
name: Picsearch
|
|
1906
2280
|
url: http://www.picsearch.com
|
|
1907
|
-
-
|
|
2281
|
+
-
|
|
1908
2282
|
user_agent: Pingdom.com_bot_version_1.4_(http://www.pingdom.com/)
|
|
1909
2283
|
bot:
|
|
1910
2284
|
name: Pingdom Bot
|
|
@@ -1913,16 +2287,34 @@
|
|
|
1913
2287
|
producer:
|
|
1914
2288
|
name: Pingdom AB
|
|
1915
2289
|
url: https://www.pingdom.com
|
|
1916
|
-
-
|
|
2290
|
+
-
|
|
2291
|
+
user_agent: Mozilla/5.0 (compatible; Pinterestbot/1.0; http://www.pinterest.com/bot.html)
|
|
2292
|
+
bot:
|
|
2293
|
+
name: Pinterest
|
|
2294
|
+
url: https://help.pinterest.com/en/business/article/pinterest-crawler
|
|
2295
|
+
category: Crawler
|
|
2296
|
+
producer:
|
|
2297
|
+
name: Pinterest
|
|
2298
|
+
url: https://www.pinterest.com/
|
|
2299
|
+
-
|
|
1917
2300
|
user_agent: Pinterest/0.2 (+http://www.pinterest.com/)
|
|
1918
2301
|
bot:
|
|
1919
2302
|
name: Pinterest
|
|
1920
|
-
url:
|
|
2303
|
+
url: https://help.pinterest.com/en/business/article/pinterest-crawler
|
|
2304
|
+
category: Crawler
|
|
2305
|
+
producer:
|
|
2306
|
+
name: Pinterest
|
|
2307
|
+
url: https://www.pinterest.com/
|
|
2308
|
+
-
|
|
2309
|
+
user_agent: Mozilla/5.0 (Linux; Android 6.0.1; Nexus 5X Build/MMB29P) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/41.0.2272.96 Mobile Safari/537.36 (compatible; Pinterestbot/1.0; https://www.pinterest.com/bot.html)
|
|
2310
|
+
bot:
|
|
2311
|
+
name: Pinterest
|
|
2312
|
+
url: https://help.pinterest.com/en/business/article/pinterest-crawler
|
|
1921
2313
|
category: Crawler
|
|
1922
2314
|
producer:
|
|
1923
2315
|
name: Pinterest
|
|
1924
|
-
url:
|
|
1925
|
-
-
|
|
2316
|
+
url: https://www.pinterest.com/
|
|
2317
|
+
-
|
|
1926
2318
|
user_agent: PocketParser/2.0 (+https://getpocket.com/pocketparser_ua)
|
|
1927
2319
|
bot:
|
|
1928
2320
|
name: PocketParser
|
|
@@ -1931,7 +2323,7 @@
|
|
|
1931
2323
|
producer:
|
|
1932
2324
|
name: Pocket
|
|
1933
2325
|
url: https://getpocket.com/
|
|
1934
|
-
-
|
|
2326
|
+
-
|
|
1935
2327
|
user_agent: PritTorrent/1.0
|
|
1936
2328
|
bot:
|
|
1937
2329
|
name: PritTorrent
|
|
@@ -1940,7 +2332,7 @@
|
|
|
1940
2332
|
producer:
|
|
1941
2333
|
name: Bitlove
|
|
1942
2334
|
url: http://bitlove.org/
|
|
1943
|
-
-
|
|
2335
|
+
-
|
|
1944
2336
|
user_agent: QuerySeekerSpider ( http://queryseeker.com/bot.html )
|
|
1945
2337
|
bot:
|
|
1946
2338
|
name: QuerySeekerSpider
|
|
@@ -1949,7 +2341,7 @@
|
|
|
1949
2341
|
producer:
|
|
1950
2342
|
name: QueryEye Inc.
|
|
1951
2343
|
url: http://queryeye.com
|
|
1952
|
-
-
|
|
2344
|
+
-
|
|
1953
2345
|
user_agent: Quora Link Preview/1.0 (http://www.quora.com)
|
|
1954
2346
|
bot:
|
|
1955
2347
|
name: Quora Link Preview
|
|
@@ -1958,7 +2350,7 @@
|
|
|
1958
2350
|
producer:
|
|
1959
2351
|
name: Quora
|
|
1960
2352
|
url: http://www.quora.com
|
|
1961
|
-
-
|
|
2353
|
+
-
|
|
1962
2354
|
user_agent: 'Mozilla/5.0 (compatible; Qwantify/2.2w; +https://www.qwant.com/)/*'
|
|
1963
2355
|
bot:
|
|
1964
2356
|
name: Qwantify
|
|
@@ -1967,7 +2359,7 @@
|
|
|
1967
2359
|
producer:
|
|
1968
2360
|
name: Qwant Corporation
|
|
1969
2361
|
url: https://www.qwant.com/
|
|
1970
|
-
-
|
|
2362
|
+
-
|
|
1971
2363
|
user_agent: ROI Hunter; https://api-dev.roihunter.com
|
|
1972
2364
|
bot:
|
|
1973
2365
|
name: ROI Hunter
|
|
@@ -1976,13 +2368,17 @@
|
|
|
1976
2368
|
producer:
|
|
1977
2369
|
name: Roihunter a.s.
|
|
1978
2370
|
url: http://roihunter.com/
|
|
1979
|
-
-
|
|
2371
|
+
-
|
|
2372
|
+
user_agent: RSSRadio (Push Notification Scanner;support@dorada.co.uk)
|
|
2373
|
+
bot:
|
|
2374
|
+
name: RSSRadio Bot
|
|
2375
|
+
-
|
|
1980
2376
|
user_agent: Rainmeter WebParser plugin
|
|
1981
2377
|
bot:
|
|
1982
2378
|
name: Rainmeter
|
|
1983
2379
|
category: Crawler
|
|
1984
2380
|
url: https://www.rainmeter.net
|
|
1985
|
-
-
|
|
2381
|
+
-
|
|
1986
2382
|
user_agent: RamblerMail/6.0 (incompatible; ImageProxy/6.0)
|
|
1987
2383
|
bot:
|
|
1988
2384
|
name: RamblerMail Image Proxy
|
|
@@ -1991,7 +2387,7 @@
|
|
|
1991
2387
|
producer:
|
|
1992
2388
|
name: 'Rambler&Co'
|
|
1993
2389
|
url: https://rambler-co.ru/
|
|
1994
|
-
-
|
|
2390
|
+
-
|
|
1995
2391
|
user_agent: Mozilla/5.0 (compatible; redditbot/1.0; +http://www.reddit.com/feedback)
|
|
1996
2392
|
bot:
|
|
1997
2393
|
name: Reddit Bot
|
|
@@ -2000,7 +2396,12 @@
|
|
|
2000
2396
|
producer:
|
|
2001
2397
|
name: reddit inc.
|
|
2002
2398
|
url: http://www.reddit.com
|
|
2003
|
-
-
|
|
2399
|
+
-
|
|
2400
|
+
user_agent: Robozilla/1.0
|
|
2401
|
+
bot:
|
|
2402
|
+
name: Robozilla
|
|
2403
|
+
category: Crawler
|
|
2404
|
+
-
|
|
2004
2405
|
user_agent: Mozilla/5.0 (compatible; rogerBot/1.0; UrlCrawler; http://www.seomoz.org/dp/rogerbot)
|
|
2005
2406
|
bot:
|
|
2006
2407
|
name: Rogerbot
|
|
@@ -2009,7 +2410,7 @@
|
|
|
2009
2410
|
producer:
|
|
2010
2411
|
name: SEOmoz, Inc.
|
|
2011
2412
|
url: http://moz.com/
|
|
2012
|
-
-
|
|
2413
|
+
-
|
|
2013
2414
|
user_agent: rogerbot/1.0 (http://moz.com/help/pro/what-is-rogerbot-, rogerbot-crawler+shiny@moz.com)
|
|
2014
2415
|
bot:
|
|
2015
2416
|
name: Rogerbot
|
|
@@ -2018,7 +2419,7 @@
|
|
|
2018
2419
|
producer:
|
|
2019
2420
|
name: SEOmoz, Inc.
|
|
2020
2421
|
url: http://moz.com/
|
|
2021
|
-
-
|
|
2422
|
+
-
|
|
2022
2423
|
user_agent: rogerbot/1.0 (http://www.moz.com/dp/rogerbot, rogerbot-crawler@moz.com)
|
|
2023
2424
|
bot:
|
|
2024
2425
|
name: Rogerbot
|
|
@@ -2027,7 +2428,7 @@
|
|
|
2027
2428
|
producer:
|
|
2028
2429
|
name: SEOmoz, Inc.
|
|
2029
2430
|
url: http://moz.com/
|
|
2030
|
-
-
|
|
2431
|
+
-
|
|
2031
2432
|
user_agent: SEOENGWorldBot/1.0 (+http://www.seoengine.com/seoengbot.htm)
|
|
2032
2433
|
bot:
|
|
2033
2434
|
name: SEOENGBot
|
|
@@ -2036,7 +2437,7 @@
|
|
|
2036
2437
|
producer:
|
|
2037
2438
|
name: SEO Engine
|
|
2038
2439
|
url: http://www.seoengine.com
|
|
2039
|
-
-
|
|
2440
|
+
-
|
|
2040
2441
|
user_agent: Mozilla/5.0 (compatible; SEOkicks-Robot; +http://www.seokicks.de/robot.html)
|
|
2041
2442
|
bot:
|
|
2042
2443
|
name: SEOkicks-Robot
|
|
@@ -2045,7 +2446,7 @@
|
|
|
2045
2446
|
producer:
|
|
2046
2447
|
name: SEOkicks
|
|
2047
2448
|
url: https://www.seokicks.de/
|
|
2048
|
-
-
|
|
2449
|
+
-
|
|
2049
2450
|
user_agent: Mozilla/5.0 (compatible; SISTRIX Crawler; http://crawler.sistrix.net/)
|
|
2050
2451
|
bot:
|
|
2051
2452
|
name: SISTRIX Crawler
|
|
@@ -2054,7 +2455,43 @@
|
|
|
2054
2455
|
producer:
|
|
2055
2456
|
name: SISTRIX GmbH
|
|
2056
2457
|
url: http://www.sistrix.de
|
|
2057
|
-
-
|
|
2458
|
+
-
|
|
2459
|
+
user_agent: Mozilla/5.0 (compatible; Optimizer)
|
|
2460
|
+
bot:
|
|
2461
|
+
name: SISTRIX Optimizer
|
|
2462
|
+
category: Crawler
|
|
2463
|
+
url: https://optimizer.sistrix.com
|
|
2464
|
+
producer:
|
|
2465
|
+
name: SISTRIX GmbH
|
|
2466
|
+
url: http://www.sistrix.de
|
|
2467
|
+
-
|
|
2468
|
+
user_agent: Mozilla/5.0 (compatible; SISTRIX Optimizer)
|
|
2469
|
+
bot:
|
|
2470
|
+
name: SISTRIX Optimizer
|
|
2471
|
+
category: Crawler
|
|
2472
|
+
url: https://optimizer.sistrix.com
|
|
2473
|
+
producer:
|
|
2474
|
+
name: SISTRIX GmbH
|
|
2475
|
+
url: http://www.sistrix.de
|
|
2476
|
+
-
|
|
2477
|
+
user_agent: Mozilla/5.0 (compatible; SISTRIX Optimizer; Uptime; +https://www.sistrix.com/faq/uptime)
|
|
2478
|
+
bot:
|
|
2479
|
+
name: SISTRIX Optimizer
|
|
2480
|
+
category: Crawler
|
|
2481
|
+
url: https://optimizer.sistrix.com
|
|
2482
|
+
producer:
|
|
2483
|
+
name: SISTRIX GmbH
|
|
2484
|
+
url: http://www.sistrix.de
|
|
2485
|
+
-
|
|
2486
|
+
user_agent: Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/68.0.3440.75 Safari/537.36 (compatible; SMTBot/1.0; +http://www.similartech.com/smtbot)
|
|
2487
|
+
bot:
|
|
2488
|
+
name: SMTBot
|
|
2489
|
+
category: Search bot
|
|
2490
|
+
url: https://www.similartech.com/smtbot
|
|
2491
|
+
producer:
|
|
2492
|
+
name: SimilarTech Ltd.
|
|
2493
|
+
url: https://www.similartech.com/
|
|
2494
|
+
-
|
|
2058
2495
|
user_agent: SSL Labs (https://www.ssllabs.com/about/assessment.html)
|
|
2059
2496
|
bot:
|
|
2060
2497
|
name: SSL Labs
|
|
@@ -2063,7 +2500,7 @@
|
|
|
2063
2500
|
producer:
|
|
2064
2501
|
name: SSL Labs
|
|
2065
2502
|
url: https://www.ssllabs.com/about/assessment.html
|
|
2066
|
-
-
|
|
2503
|
+
-
|
|
2067
2504
|
user_agent: SafeDNSBot (https://www.safedns.com/searchbot)
|
|
2068
2505
|
bot:
|
|
2069
2506
|
name: SafeDNSBot
|
|
@@ -2072,13 +2509,13 @@
|
|
|
2072
2509
|
producer:
|
|
2073
2510
|
name: SafeDNS, Inc.
|
|
2074
2511
|
url: https://www.safedns.com/
|
|
2075
|
-
-
|
|
2512
|
+
-
|
|
2076
2513
|
user_agent: Scrapy/1.0.3.post6+g2d688cd (+http://scrapy.org)
|
|
2077
2514
|
bot:
|
|
2078
2515
|
name: Scrapy
|
|
2079
2516
|
category: Crawler
|
|
2080
2517
|
url: http://scrapy.org
|
|
2081
|
-
-
|
|
2518
|
+
-
|
|
2082
2519
|
user_agent: Screaming Frog SEO Spider/2.22
|
|
2083
2520
|
bot:
|
|
2084
2521
|
name: Screaming Frog SEO Spider
|
|
@@ -2087,7 +2524,7 @@
|
|
|
2087
2524
|
producer:
|
|
2088
2525
|
name: Screaming Frog Ltd
|
|
2089
2526
|
url: http://www.screamingfrog.co.uk
|
|
2090
|
-
-
|
|
2527
|
+
-
|
|
2091
2528
|
user_agent: ScreenerBot Crawler Beta 2.0 (+http://www.ScreenerBot.com)
|
|
2092
2529
|
bot:
|
|
2093
2530
|
name: ScreenerBot
|
|
@@ -2096,7 +2533,13 @@
|
|
|
2096
2533
|
producer:
|
|
2097
2534
|
name: ""
|
|
2098
2535
|
url: ""
|
|
2099
|
-
-
|
|
2536
|
+
-
|
|
2537
|
+
user_agent: Mozilla/5.0 (compatible) SemanticScholarBot (+https://www.semanticscholar.org/crawler)
|
|
2538
|
+
bot:
|
|
2539
|
+
name: Semantic Scholar Bot
|
|
2540
|
+
category: Crawler
|
|
2541
|
+
url: https://www.semanticscholar.org/crawler
|
|
2542
|
+
-
|
|
2100
2543
|
user_agent: Mozilla/5.0 (compatible; SemrushBot/0.97; +http://www.semrush.com/bot.html)
|
|
2101
2544
|
bot:
|
|
2102
2545
|
name: Semrush Bot
|
|
@@ -2105,7 +2548,7 @@
|
|
|
2105
2548
|
producer:
|
|
2106
2549
|
name: SEMrush
|
|
2107
2550
|
url: http://www.semrush.com
|
|
2108
|
-
-
|
|
2551
|
+
-
|
|
2109
2552
|
user_agent: SensikaBot/x.33 (+http://sensika.com)
|
|
2110
2553
|
bot:
|
|
2111
2554
|
name: Sensika Bot
|
|
@@ -2114,28 +2557,36 @@
|
|
|
2114
2557
|
producer:
|
|
2115
2558
|
name: Sensika
|
|
2116
2559
|
url: http://sensika.com
|
|
2117
|
-
-
|
|
2560
|
+
-
|
|
2118
2561
|
user_agent: sentry/8.6.0 (https://getsentry.com)
|
|
2119
2562
|
bot:
|
|
2120
2563
|
name: Sentry Bot
|
|
2121
2564
|
producer:
|
|
2122
2565
|
name: Sentry
|
|
2123
2566
|
url: https://sentry.io
|
|
2124
|
-
-
|
|
2567
|
+
-
|
|
2568
|
+
user_agent: Seobility
|
|
2569
|
+
bot:
|
|
2570
|
+
name: Seobility
|
|
2571
|
+
category: Crawler
|
|
2572
|
+
url: 'https://www.seobility.net/en/faq/?category=crawling#!aboutourbot'
|
|
2573
|
+
-
|
|
2125
2574
|
user_agent: Mozilla/5.0 (compatible; seoscanners.net/1; +spider@seoscanners.net)
|
|
2126
2575
|
bot:
|
|
2127
2576
|
name: Seoscanners.net
|
|
2128
2577
|
category: Crawler
|
|
2129
2578
|
url: ""
|
|
2130
|
-
-
|
|
2579
|
+
-
|
|
2580
|
+
user_agent: SerendeputyBot/0.8.6 (http://serendeputy.com/about/serendeputy-bot)
|
|
2581
|
+
bot:
|
|
2582
|
+
name: Serendeputy Bot
|
|
2583
|
+
category: Crawler
|
|
2584
|
+
url: https://serendeputy.com/about/serendeputy-bot
|
|
2585
|
+
-
|
|
2131
2586
|
user_agent: Server Density Service Monitoring v2
|
|
2132
2587
|
bot:
|
|
2133
2588
|
name: Server Density
|
|
2134
|
-
-
|
|
2135
|
-
user_agent: RSSRadio (Push Notification Scanner;support@dorada.co.uk)
|
|
2136
|
-
bot:
|
|
2137
|
-
name: RSSRadio Bot
|
|
2138
|
-
-
|
|
2589
|
+
-
|
|
2139
2590
|
user_agent: Mozilla/5.0 (compatible; SeznamBot/3.1-test1; +http://fulltext.sblog.cz/)
|
|
2140
2591
|
bot:
|
|
2141
2592
|
name: Seznam Bot
|
|
@@ -2144,7 +2595,7 @@
|
|
|
2144
2595
|
producer:
|
|
2145
2596
|
name: Seznam.cz, a.s.
|
|
2146
2597
|
url: http://www.seznam.cz/
|
|
2147
|
-
-
|
|
2598
|
+
-
|
|
2148
2599
|
user_agent: Mozilla/5.0 (compatible; SeznamBot/3.2-test1; +http://fulltext.sblog.cz/)
|
|
2149
2600
|
bot:
|
|
2150
2601
|
name: Seznam Bot
|
|
@@ -2153,7 +2604,7 @@
|
|
|
2153
2604
|
producer:
|
|
2154
2605
|
name: Seznam.cz, a.s.
|
|
2155
2606
|
url: http://www.seznam.cz/
|
|
2156
|
-
-
|
|
2607
|
+
-
|
|
2157
2608
|
user_agent: Mozilla/5.0 (compatible; SeznamBot/3.2; +http://fulltext.sblog.cz/)
|
|
2158
2609
|
bot:
|
|
2159
2610
|
name: Seznam Bot
|
|
@@ -2162,7 +2613,7 @@
|
|
|
2162
2613
|
producer:
|
|
2163
2614
|
name: Seznam.cz, a.s.
|
|
2164
2615
|
url: http://www.seznam.cz/
|
|
2165
|
-
-
|
|
2616
|
+
-
|
|
2166
2617
|
user_agent: SeznamBot/3.0 (+http://fulltext.sblog.cz/)
|
|
2167
2618
|
bot:
|
|
2168
2619
|
name: Seznam Bot
|
|
@@ -2171,7 +2622,7 @@
|
|
|
2171
2622
|
producer:
|
|
2172
2623
|
name: Seznam.cz, a.s.
|
|
2173
2624
|
url: http://www.seznam.cz/
|
|
2174
|
-
-
|
|
2625
|
+
-
|
|
2175
2626
|
user_agent: Mozilla/5.0 SeznamEmailProxy/2.0.174
|
|
2176
2627
|
bot:
|
|
2177
2628
|
name: Seznam Email Proxy
|
|
@@ -2180,7 +2631,7 @@
|
|
|
2180
2631
|
producer:
|
|
2181
2632
|
name: Seznam.cz, a.s.
|
|
2182
2633
|
url: http://www.seznam.cz/
|
|
2183
|
-
-
|
|
2634
|
+
-
|
|
2184
2635
|
user_agent: Seznam-Zbozi-robot/3.0
|
|
2185
2636
|
bot:
|
|
2186
2637
|
name: Seznam Zbozi.cz
|
|
@@ -2189,7 +2640,7 @@
|
|
|
2189
2640
|
producer:
|
|
2190
2641
|
name: Seznam.cz, a.s.
|
|
2191
2642
|
url: https://www.zbozi.cz/
|
|
2192
|
-
-
|
|
2643
|
+
-
|
|
2193
2644
|
user_agent: Mozilla/5.0 (ShopAlike; LadenZeile) FeedBot
|
|
2194
2645
|
bot:
|
|
2195
2646
|
name: ShopAlike
|
|
@@ -2198,7 +2649,7 @@
|
|
|
2198
2649
|
producer:
|
|
2199
2650
|
name: Visual Meta
|
|
2200
2651
|
url: https://www.shopalike.cz/
|
|
2201
|
-
-
|
|
2652
|
+
-
|
|
2202
2653
|
user_agent: ShopWiki/1.0 ( +http://www.shopwiki.com/wiki/Help:Bot)
|
|
2203
2654
|
bot:
|
|
2204
2655
|
name: ShopWiki
|
|
@@ -2207,7 +2658,16 @@
|
|
|
2207
2658
|
producer:
|
|
2208
2659
|
name: ShopWiki Corp.
|
|
2209
2660
|
url: http://www.shopwiki.com
|
|
2210
|
-
-
|
|
2661
|
+
-
|
|
2662
|
+
user_agent: shopify-partner-homepage-scraper
|
|
2663
|
+
bot:
|
|
2664
|
+
name: Shopify Partner
|
|
2665
|
+
category: Crawler
|
|
2666
|
+
url: https://www.shopify.com/partners
|
|
2667
|
+
producer:
|
|
2668
|
+
name: Shopify
|
|
2669
|
+
url: https://www.shopify.com/
|
|
2670
|
+
-
|
|
2211
2671
|
user_agent: SilverReader/1.0; http://silverreader.com
|
|
2212
2672
|
bot:
|
|
2213
2673
|
name: SilverReader
|
|
@@ -2216,16 +2676,7 @@
|
|
|
2216
2676
|
producer:
|
|
2217
2677
|
name: ""
|
|
2218
2678
|
url: ""
|
|
2219
|
-
-
|
|
2220
|
-
user_agent: freshrss/0.8-dev (Linux; http://freshrss.org) SimplePie/1.4-dev-FreshRSS
|
|
2221
|
-
bot:
|
|
2222
|
-
name: SimplePie
|
|
2223
|
-
url: http://www.simplepie.org
|
|
2224
|
-
category: Feed Parser
|
|
2225
|
-
producer:
|
|
2226
|
-
name: ""
|
|
2227
|
-
url: ""
|
|
2228
|
-
-
|
|
2679
|
+
-
|
|
2229
2680
|
user_agent: SimplePie/1.2.1-dev (Feed Parser; http://simplepie.org; Allow like Gecko) Build/20130514092120
|
|
2230
2681
|
bot:
|
|
2231
2682
|
name: SimplePie
|
|
@@ -2234,7 +2685,7 @@
|
|
|
2234
2685
|
producer:
|
|
2235
2686
|
name: ""
|
|
2236
2687
|
url: ""
|
|
2237
|
-
-
|
|
2688
|
+
-
|
|
2238
2689
|
user_agent: SimplePie/1.3.1 (Feed Parser; http://simplepie.org; Allow like Gecko) Build/20121030175911
|
|
2239
2690
|
bot:
|
|
2240
2691
|
name: SimplePie
|
|
@@ -2243,7 +2694,7 @@
|
|
|
2243
2694
|
producer:
|
|
2244
2695
|
name: ""
|
|
2245
2696
|
url: ""
|
|
2246
|
-
-
|
|
2697
|
+
-
|
|
2247
2698
|
user_agent: Site24x7
|
|
2248
2699
|
bot:
|
|
2249
2700
|
name: Site24x7 Website Monitoring
|
|
@@ -2252,13 +2703,31 @@
|
|
|
2252
2703
|
producer:
|
|
2253
2704
|
name: Site24x7
|
|
2254
2705
|
url: https://www.site24x7.com
|
|
2255
|
-
-
|
|
2706
|
+
-
|
|
2256
2707
|
user_agent: SiteSucker for macOS/2.10.5
|
|
2257
2708
|
bot:
|
|
2258
2709
|
name: SiteSucker
|
|
2259
2710
|
category: Crawler
|
|
2260
2711
|
url: http://ricks-apps.com/osx/sitesucker/
|
|
2261
|
-
-
|
|
2712
|
+
-
|
|
2713
|
+
user_agent: Mozilla/4.0 (compatible; MSIE 7.0; Windows NT 5.0) Match by Siteimprove.com
|
|
2714
|
+
bot:
|
|
2715
|
+
name: Siteimprove
|
|
2716
|
+
category: Search bot
|
|
2717
|
+
url: https://siteimprove.com/
|
|
2718
|
+
producer:
|
|
2719
|
+
name: Siteimprove GmbH
|
|
2720
|
+
url: https://siteimprove.com/
|
|
2721
|
+
-
|
|
2722
|
+
user_agent: Mozilla/5.0 (compatible; MSIE 10.0; Windows NT 6.1; Trident/6.0) LinkCheck by Siteimprove.com
|
|
2723
|
+
bot:
|
|
2724
|
+
name: Siteimprove
|
|
2725
|
+
category: Search bot
|
|
2726
|
+
url: https://siteimprove.com/
|
|
2727
|
+
producer:
|
|
2728
|
+
name: Siteimprove GmbH
|
|
2729
|
+
url: https://siteimprove.com/
|
|
2730
|
+
-
|
|
2262
2731
|
user_agent: sixy.ch/1.0
|
|
2263
2732
|
bot:
|
|
2264
2733
|
name: Sixy.ch
|
|
@@ -2267,7 +2736,7 @@
|
|
|
2267
2736
|
producer:
|
|
2268
2737
|
name: Manuel Kasper
|
|
2269
2738
|
url: https://neon1.net/
|
|
2270
|
-
-
|
|
2739
|
+
-
|
|
2271
2740
|
user_agent: Mozilla/5.0 (Windows NT 6.1; WOW64) SkypeUriPreview Preview/0.5
|
|
2272
2741
|
bot:
|
|
2273
2742
|
name: Skype URI Preview
|
|
@@ -2276,7 +2745,7 @@
|
|
|
2276
2745
|
producer:
|
|
2277
2746
|
name: Skype Communications S.à.r.l.
|
|
2278
2747
|
url: https://www.skype.com
|
|
2279
|
-
-
|
|
2748
|
+
-
|
|
2280
2749
|
user_agent: Slackbot-LinkExpanding 1.0 (+https://api.slack.com/robots)
|
|
2281
2750
|
bot:
|
|
2282
2751
|
name: Slackbot
|
|
@@ -2285,7 +2754,7 @@
|
|
|
2285
2754
|
producer:
|
|
2286
2755
|
name: Slack Technologies
|
|
2287
2756
|
url: http://slack.com
|
|
2288
|
-
-
|
|
2757
|
+
-
|
|
2289
2758
|
user_agent: 'AppEngine-Google; (+http://code.google.com/appengine; appid: s~snapchat-proxy)'
|
|
2290
2759
|
bot:
|
|
2291
2760
|
name: Snapchat Proxy
|
|
@@ -2294,7 +2763,7 @@
|
|
|
2294
2763
|
producer:
|
|
2295
2764
|
name: Snapchat Inc.
|
|
2296
2765
|
url: https://www.snapchat.com
|
|
2297
|
-
-
|
|
2766
|
+
-
|
|
2298
2767
|
user_agent: New-Sogou-Spider/1.0 (compatible; MSIE 5.5; Windows 98)
|
|
2299
2768
|
bot:
|
|
2300
2769
|
name: Sogou Spider
|
|
@@ -2303,7 +2772,7 @@
|
|
|
2303
2772
|
producer:
|
|
2304
2773
|
name: Sohu, Inc.
|
|
2305
2774
|
url: http://www.sogou.com
|
|
2306
|
-
-
|
|
2775
|
+
-
|
|
2307
2776
|
user_agent: Sogou inst spider/4.0(+http://www.sogou.com/docs/help/webmasters.htm
|
|
2308
2777
|
bot:
|
|
2309
2778
|
name: Sogou Spider
|
|
@@ -2312,7 +2781,7 @@
|
|
|
2312
2781
|
producer:
|
|
2313
2782
|
name: Sohu, Inc.
|
|
2314
2783
|
url: http://www.sogou.com
|
|
2315
|
-
-
|
|
2784
|
+
-
|
|
2316
2785
|
user_agent: Sogou Pic Spider/3.0(+http://www.sogou.com/docs/help/webmasters.htm
|
|
2317
2786
|
bot:
|
|
2318
2787
|
name: Sogou Spider
|
|
@@ -2321,7 +2790,7 @@
|
|
|
2321
2790
|
producer:
|
|
2322
2791
|
name: Sohu, Inc.
|
|
2323
2792
|
url: http://www.sogou.com
|
|
2324
|
-
-
|
|
2793
|
+
-
|
|
2325
2794
|
user_agent: Sogou web spider/4.0(+http://www.sogou.com/docs/help/webmasters.htm
|
|
2326
2795
|
bot:
|
|
2327
2796
|
name: Sogou Spider
|
|
@@ -2330,7 +2799,7 @@
|
|
|
2330
2799
|
producer:
|
|
2331
2800
|
name: Sohu, Inc.
|
|
2332
2801
|
url: http://www.sogou.com
|
|
2333
|
-
-
|
|
2802
|
+
-
|
|
2334
2803
|
user_agent: Sosospider+(+http://help.soso.com/webspider.htm)
|
|
2335
2804
|
bot:
|
|
2336
2805
|
name: Soso Spider
|
|
@@ -2339,13 +2808,13 @@
|
|
|
2339
2808
|
producer:
|
|
2340
2809
|
name: Tencent Holdings
|
|
2341
2810
|
url: http://www.soso.com
|
|
2342
|
-
-
|
|
2811
|
+
-
|
|
2343
2812
|
user_agent: Mozilla/5.0 (Macintosh; Intel Mac OS X 10_11_6) AppleWebKit/537.36 (KHTML, like Gecko) Sparkler/0.2.0-SNAPSHOT
|
|
2344
2813
|
bot:
|
|
2345
2814
|
name: Sparkler
|
|
2346
2815
|
category: Crawler
|
|
2347
2816
|
url: https://github.com/USCDataScience/sparkler
|
|
2348
|
-
-
|
|
2817
|
+
-
|
|
2349
2818
|
user_agent: Mozilla/5.0 (X11; U; Linux x86_64; en-US; rv:1.9.0.19; aggregator:Spinn3r (Spinn3r 3.1); http://spinn3r.com/robot) Gecko/2010040121 Firefox/3.0.19
|
|
2350
2819
|
bot:
|
|
2351
2820
|
name: Spinn3r
|
|
@@ -2354,25 +2823,35 @@
|
|
|
2354
2823
|
producer:
|
|
2355
2824
|
name: Tailrank Inc
|
|
2356
2825
|
url: http://spinn3r.com
|
|
2357
|
-
-
|
|
2826
|
+
-
|
|
2827
|
+
user_agent: Spotify/1.0
|
|
2828
|
+
bot:
|
|
2829
|
+
name: Spotify
|
|
2830
|
+
producer:
|
|
2831
|
+
name: Spotify
|
|
2832
|
+
url: https://www.spotify.com
|
|
2833
|
+
-
|
|
2358
2834
|
user_agent: Mozilla/5.0 (compatible; SputnikBot/2.2)
|
|
2359
2835
|
bot:
|
|
2360
2836
|
name: Sputnik Bot
|
|
2361
|
-
category: ""
|
|
2837
|
+
category: "Crawler"
|
|
2362
2838
|
url: ""
|
|
2363
|
-
|
|
2364
|
-
name: ""
|
|
2365
|
-
url: ""
|
|
2366
|
-
-
|
|
2839
|
+
-
|
|
2367
2840
|
user_agent: Mozilla/5.0 (compatible; SputnikImageBot/2.2)
|
|
2368
2841
|
bot:
|
|
2369
|
-
name: Sputnik Bot
|
|
2370
|
-
category: ""
|
|
2842
|
+
name: Sputnik Image Bot
|
|
2843
|
+
category: "Crawler"
|
|
2371
2844
|
url: ""
|
|
2845
|
+
-
|
|
2846
|
+
user_agent: Mozilla/5.0 (Macintosh; Intel Mac OS X 10_8_5) AppleWebKit/536.30.1 (KHTML, like Gecko) (compatible; Startpagina-Linkchecker/1.0; +https://www.startpagina.nl/linkchecker)
|
|
2847
|
+
bot:
|
|
2848
|
+
name: Startpagina Linkchecker
|
|
2849
|
+
category: Search bot
|
|
2850
|
+
url: https://www.startpagina.nl/linkchecker
|
|
2372
2851
|
producer:
|
|
2373
|
-
name:
|
|
2374
|
-
url:
|
|
2375
|
-
-
|
|
2852
|
+
name: Startpagina B.V.
|
|
2853
|
+
url: https://www.startpagina.nl/
|
|
2854
|
+
-
|
|
2376
2855
|
user_agent: Mozilla/5.0 (Windows NT 6.2; WOW64) AppleWebKit/537.4 (KHTML, like Gecko) Chrome/98 Safari/537.4 (StatusCake)
|
|
2377
2856
|
bot:
|
|
2378
2857
|
name: StatusCake
|
|
@@ -2381,7 +2860,7 @@
|
|
|
2381
2860
|
producer:
|
|
2382
2861
|
name: StatusCake
|
|
2383
2862
|
url: https://www.statuscake.com
|
|
2384
|
-
-
|
|
2863
|
+
-
|
|
2385
2864
|
user_agent: 'Superfeedr bot/2.0 http://superfeedr.com - Make your feeds realtime: get in touch!'
|
|
2386
2865
|
bot:
|
|
2387
2866
|
name: Superfeedr Bot
|
|
@@ -2390,7 +2869,7 @@
|
|
|
2390
2869
|
producer:
|
|
2391
2870
|
name: Superfeedr
|
|
2392
2871
|
url: https://superfeedr.com/
|
|
2393
|
-
-
|
|
2872
|
+
-
|
|
2394
2873
|
user_agent: Mozilla/5.0 (Windows; U; Windows NT 5.1; en; rv:1.9.0.13) Gecko/2009073022 Firefox/3.5.2 (.NET CLR 3.5.30729) SurveyBot/2.3 (DomainTools)
|
|
2395
2874
|
bot:
|
|
2396
2875
|
name: Survey Bot
|
|
@@ -2399,7 +2878,7 @@
|
|
|
2399
2878
|
producer:
|
|
2400
2879
|
name: Domain Tools
|
|
2401
2880
|
url: http://www.domaintools.com
|
|
2402
|
-
-
|
|
2881
|
+
-
|
|
2403
2882
|
user_agent: TLSProbe/1.0 (+https://scan.trustnet.venafi.com/)
|
|
2404
2883
|
bot:
|
|
2405
2884
|
name: TLSProbe
|
|
@@ -2408,18 +2887,23 @@
|
|
|
2408
2887
|
producer:
|
|
2409
2888
|
name: Venafi TrustNet
|
|
2410
2889
|
url: https://www.venafi.com
|
|
2411
|
-
-
|
|
2890
|
+
-
|
|
2412
2891
|
user_agent: Tarmot Gezgin/1.0 (compatible; TarmotGezgin/1.1; +http://www.tarmot.com/gezgin)
|
|
2413
2892
|
bot:
|
|
2414
2893
|
name: Tarmot Gezgin
|
|
2415
2894
|
url: http://www.tarmot.com/gezgin/
|
|
2416
2895
|
category: Search bot
|
|
2417
|
-
-
|
|
2896
|
+
-
|
|
2418
2897
|
user_agent: TelegramBot (like TwitterBot)
|
|
2419
2898
|
bot:
|
|
2420
2899
|
name: TelegramBot
|
|
2421
2900
|
url: https://telegram.org/blog/bot-revolution
|
|
2422
|
-
-
|
|
2901
|
+
-
|
|
2902
|
+
user_agent: The Knowledge AI
|
|
2903
|
+
bot:
|
|
2904
|
+
name: The Knowledge AI
|
|
2905
|
+
category: Crawler
|
|
2906
|
+
-
|
|
2423
2907
|
user_agent: TinEye-bot/0.02 (see http://www.tineye.com/crawler.html)
|
|
2424
2908
|
bot:
|
|
2425
2909
|
name: TinEye Crawler
|
|
@@ -2428,7 +2912,7 @@
|
|
|
2428
2912
|
producer:
|
|
2429
2913
|
name: Idée Inc.
|
|
2430
2914
|
url: http://ideeinc.com
|
|
2431
|
-
-
|
|
2915
|
+
-
|
|
2432
2916
|
user_agent: Tiny Tiny RSS/1.10 (http://tt-rss.org/)
|
|
2433
2917
|
bot:
|
|
2434
2918
|
name: Tiny Tiny RSS
|
|
@@ -2437,7 +2921,7 @@
|
|
|
2437
2921
|
producer:
|
|
2438
2922
|
name: ""
|
|
2439
2923
|
url: ""
|
|
2440
|
-
-
|
|
2924
|
+
-
|
|
2441
2925
|
user_agent: Tiny Tiny RSS/1.11.4c63934 (http://tt-rss.org/)
|
|
2442
2926
|
bot:
|
|
2443
2927
|
name: Tiny Tiny RSS
|
|
@@ -2446,7 +2930,16 @@
|
|
|
2446
2930
|
producer:
|
|
2447
2931
|
name: ""
|
|
2448
2932
|
url: ""
|
|
2449
|
-
-
|
|
2933
|
+
-
|
|
2934
|
+
user_agent: Mozilla/5.0 (compatible; tracemyfile/1.0)
|
|
2935
|
+
bot:
|
|
2936
|
+
name: TraceMyFile
|
|
2937
|
+
category: Search bot
|
|
2938
|
+
url: https://www.tracemyfile.com/
|
|
2939
|
+
producer:
|
|
2940
|
+
name: Idee Inc.
|
|
2941
|
+
url: http://ideeinc.com/
|
|
2942
|
+
-
|
|
2450
2943
|
user_agent: Mozilla/5.0 (Windows; U; Windows NT 6.0; en-GB; rv:1.0; trendictionbot0.5.0; trendiction search; http://www.trendiction.de/bot; please let us know of any problems; web at trendiction.com) Gecko/20071127 Firefox/3.0.0.11
|
|
2451
2944
|
bot:
|
|
2452
2945
|
name: Trendiction Bot
|
|
@@ -2455,7 +2948,7 @@
|
|
|
2455
2948
|
producer:
|
|
2456
2949
|
name: Talkwalker Inc.
|
|
2457
2950
|
url: http://www.talkwalker.com
|
|
2458
|
-
-
|
|
2951
|
+
-
|
|
2459
2952
|
user_agent: TurnitinBot/3.0 (http://www.turnitin.com/robot/crawlerinfo.html)
|
|
2460
2953
|
bot:
|
|
2461
2954
|
name: TurnitinBot
|
|
@@ -2464,7 +2957,7 @@
|
|
|
2464
2957
|
producer:
|
|
2465
2958
|
name: iParadigms, LLC.
|
|
2466
2959
|
url: http://www.turnitin.com
|
|
2467
|
-
-
|
|
2960
|
+
-
|
|
2468
2961
|
user_agent: Mozilla/5.0 (compatible; TweetedTimes Bot/1.0; +http://tweetedtimes.com)
|
|
2469
2962
|
bot:
|
|
2470
2963
|
name: TweetedTimes Bot
|
|
@@ -2473,7 +2966,7 @@
|
|
|
2473
2966
|
producer:
|
|
2474
2967
|
name: TweetedTimes
|
|
2475
2968
|
url: http://tweetedtimes.com/
|
|
2476
|
-
-
|
|
2969
|
+
-
|
|
2477
2970
|
user_agent: TweetedTimes Bot/1.0 (Mozilla/5.0 Compatible, +http://tweetedtimes.com)
|
|
2478
2971
|
bot:
|
|
2479
2972
|
name: TweetedTimes Bot
|
|
@@ -2482,7 +2975,7 @@
|
|
|
2482
2975
|
producer:
|
|
2483
2976
|
name: TweetedTimes
|
|
2484
2977
|
url: http://tweetedtimes.com/
|
|
2485
|
-
-
|
|
2978
|
+
-
|
|
2486
2979
|
user_agent: Mozilla/5.0 (compatible; TweetmemeBot/3.0; +http://tweetmeme.com/)
|
|
2487
2980
|
bot:
|
|
2488
2981
|
name: Tweetmeme Bot
|
|
@@ -2491,7 +2984,15 @@
|
|
|
2491
2984
|
producer:
|
|
2492
2985
|
name: Mediasift
|
|
2493
2986
|
url: ""
|
|
2494
|
-
-
|
|
2987
|
+
-
|
|
2988
|
+
user_agent: Mozilla/5.0 (compatible; Twingly Recon; twingly.com)
|
|
2989
|
+
bot:
|
|
2990
|
+
name: Twingly Recon
|
|
2991
|
+
category: Crawler
|
|
2992
|
+
producer:
|
|
2993
|
+
name: Twingly
|
|
2994
|
+
url: https://www.twingly.com
|
|
2995
|
+
-
|
|
2495
2996
|
user_agent: Twitterbot/1.0
|
|
2496
2997
|
bot:
|
|
2497
2998
|
name: Twitterbot
|
|
@@ -2500,7 +3001,7 @@
|
|
|
2500
3001
|
producer:
|
|
2501
3002
|
name: Twitter
|
|
2502
3003
|
url: http://www.twitter.com
|
|
2503
|
-
-
|
|
3004
|
+
-
|
|
2504
3005
|
user_agent: Mozilla/5.0 (compatible; URLAppendBot/1.0; +http://www.profound.net/urlappendbot.html)
|
|
2505
3006
|
bot:
|
|
2506
3007
|
name: URLAppendBot
|
|
@@ -2509,7 +3010,7 @@
|
|
|
2509
3010
|
producer:
|
|
2510
3011
|
name: Profound Networks
|
|
2511
3012
|
url: http://www.profound.net
|
|
2512
|
-
-
|
|
3013
|
+
-
|
|
2513
3014
|
user_agent: 'Mozilla/5.0 (Windows NT 10.0) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/55.0.2883.87 Safari/537.36 (via secureurl.fwdcdn.com - mail.ukr.net proxy)'
|
|
2514
3015
|
bot:
|
|
2515
3016
|
name: UkrNet Mail Proxy
|
|
@@ -2518,7 +3019,7 @@
|
|
|
2518
3019
|
producer:
|
|
2519
3020
|
name: UkrNet Ltd
|
|
2520
3021
|
url: https://www.ukr.net/
|
|
2521
|
-
-
|
|
3022
|
+
-
|
|
2522
3023
|
user_agent: UniversalFeedParser/5.2.1 +https://code.google.com/p/feedparser/
|
|
2523
3024
|
bot:
|
|
2524
3025
|
name: UniversalFeedParser
|
|
@@ -2527,7 +3028,7 @@
|
|
|
2527
3028
|
producer:
|
|
2528
3029
|
name: Kurt McKee
|
|
2529
3030
|
url: https://github.com/kurtmckee
|
|
2530
|
-
-
|
|
3031
|
+
-
|
|
2531
3032
|
user_agent: Mozilla/5.0+(compatible; UptimeRobot/2.0; http://www.uptimerobot.com/)
|
|
2532
3033
|
bot:
|
|
2533
3034
|
name: Uptime Robot
|
|
@@ -2536,7 +3037,7 @@
|
|
|
2536
3037
|
producer:
|
|
2537
3038
|
name: Uptime Robot
|
|
2538
3039
|
url: http://uptimerobot.com
|
|
2539
|
-
-
|
|
3040
|
+
-
|
|
2540
3041
|
user_agent: Mozilla/5.0 (compatible; Uptimebot/1.0; +http://www.uptime.com/uptimebot)
|
|
2541
3042
|
bot:
|
|
2542
3043
|
name: Uptimebot
|
|
@@ -2545,7 +3046,7 @@
|
|
|
2545
3046
|
producer:
|
|
2546
3047
|
name: Uptime
|
|
2547
3048
|
url: https://uptime.com
|
|
2548
|
-
-
|
|
3049
|
+
-
|
|
2549
3050
|
user_agent: Mozilla/5.0 (compatible; vkShare; +http://vk.com/dev/Share)
|
|
2550
3051
|
bot:
|
|
2551
3052
|
name: VK Share Button
|
|
@@ -2554,7 +3055,7 @@
|
|
|
2554
3055
|
producer:
|
|
2555
3056
|
name: VK
|
|
2556
3057
|
url: http://vk.com/
|
|
2557
|
-
-
|
|
3058
|
+
-
|
|
2558
3059
|
user_agent: 'Mozilla/4.0 (compatible; Vagabondo/4.0; http://webagent.wise-guys.nl/; http://www.wise-guys.nl/)'
|
|
2559
3060
|
bot:
|
|
2560
3061
|
name: Vagabondo
|
|
@@ -2563,7 +3064,19 @@
|
|
|
2563
3064
|
producer:
|
|
2564
3065
|
name: WiseGuys
|
|
2565
3066
|
url: http://www.wise-guys.nl/
|
|
2566
|
-
-
|
|
3067
|
+
-
|
|
3068
|
+
user_agent: Mozilla/5.0 (compatible; VelenPublicWebCrawler/1.0; +https://velen.io)
|
|
3069
|
+
bot:
|
|
3070
|
+
name: Velen Public Web Crawler
|
|
3071
|
+
category: Crawler
|
|
3072
|
+
url: https://hunter.io/robot
|
|
3073
|
+
-
|
|
3074
|
+
user_agent: Vercelbot (+https://vercel.com)
|
|
3075
|
+
bot:
|
|
3076
|
+
name: Vercel Bot
|
|
3077
|
+
category: Service bot
|
|
3078
|
+
url: https://vercel.com
|
|
3079
|
+
-
|
|
2567
3080
|
user_agent: Mozilla/5.0 (compatible; VSMCrawler; http://www.visualsitemapper.com/crawler/)
|
|
2568
3081
|
bot:
|
|
2569
3082
|
name: Visual Site Mapper Crawler
|
|
@@ -2572,7 +3085,7 @@
|
|
|
2572
3085
|
producer:
|
|
2573
3086
|
name: Alentum Software Ltd.
|
|
2574
3087
|
url: http://www.alentum.com
|
|
2575
|
-
-
|
|
3088
|
+
-
|
|
2576
3089
|
user_agent: 'Jigsaw/2.3.0 W3C_CSS_Validator_JFouffa/2.0 (See <http://validator.w3.org/services>)'
|
|
2577
3090
|
bot:
|
|
2578
3091
|
name: W3C CSS Validator
|
|
@@ -2581,7 +3094,7 @@
|
|
|
2581
3094
|
producer:
|
|
2582
3095
|
name: W3C
|
|
2583
3096
|
url: http://www.w3.org
|
|
2584
|
-
-
|
|
3097
|
+
-
|
|
2585
3098
|
user_agent: W3C_I18n-Checker/1.0 (http://validator.w3.org/services)
|
|
2586
3099
|
bot:
|
|
2587
3100
|
name: W3C I18N Checker
|
|
@@ -2590,7 +3103,7 @@
|
|
|
2590
3103
|
producer:
|
|
2591
3104
|
name: W3C
|
|
2592
3105
|
url: http://www.w3.org
|
|
2593
|
-
-
|
|
3106
|
+
-
|
|
2594
3107
|
user_agent: 'W3C-checklink/4.0 [4.4] libwww-perl/5.803'
|
|
2595
3108
|
bot:
|
|
2596
3109
|
name: W3C Link Checker
|
|
@@ -2599,7 +3112,7 @@
|
|
|
2599
3112
|
producer:
|
|
2600
3113
|
name: W3C
|
|
2601
3114
|
url: http://www.w3.org
|
|
2602
|
-
-
|
|
3115
|
+
-
|
|
2603
3116
|
user_agent: W3C-checklink/4.81 libwww-perl/5.836
|
|
2604
3117
|
bot:
|
|
2605
3118
|
name: W3C Link Checker
|
|
@@ -2608,7 +3121,7 @@
|
|
|
2608
3121
|
producer:
|
|
2609
3122
|
name: W3C
|
|
2610
3123
|
url: http://www.w3.org
|
|
2611
|
-
-
|
|
3124
|
+
-
|
|
2612
3125
|
user_agent: Validator.nu/LV http://validator.w3.org/services
|
|
2613
3126
|
bot:
|
|
2614
3127
|
name: W3C Markup Validation Service
|
|
@@ -2617,7 +3130,7 @@
|
|
|
2617
3130
|
producer:
|
|
2618
3131
|
name: W3C
|
|
2619
3132
|
url: http://www.w3.org
|
|
2620
|
-
-
|
|
3133
|
+
-
|
|
2621
3134
|
user_agent: W3C_Validator/1.3 http://validator.w3.org/services
|
|
2622
3135
|
bot:
|
|
2623
3136
|
name: W3C Markup Validation Service
|
|
@@ -2626,7 +3139,7 @@
|
|
|
2626
3139
|
producer:
|
|
2627
3140
|
name: W3C
|
|
2628
3141
|
url: http://www.w3.org
|
|
2629
|
-
-
|
|
3142
|
+
-
|
|
2630
3143
|
user_agent: W3C_Validator/1.767
|
|
2631
3144
|
bot:
|
|
2632
3145
|
name: W3C Markup Validation Service
|
|
@@ -2635,7 +3148,7 @@
|
|
|
2635
3148
|
producer:
|
|
2636
3149
|
name: W3C
|
|
2637
3150
|
url: http://www.w3.org
|
|
2638
|
-
-
|
|
3151
|
+
-
|
|
2639
3152
|
user_agent: W3C-mobileOK/DDC-1.0 (see http://www.w3.org/2006/07/mobileok-ddc)
|
|
2640
3153
|
bot:
|
|
2641
3154
|
name: W3C MobileOK Checker
|
|
@@ -2644,7 +3157,7 @@
|
|
|
2644
3157
|
producer:
|
|
2645
3158
|
name: W3C
|
|
2646
3159
|
url: http://www.w3.org
|
|
2647
|
-
-
|
|
3160
|
+
-
|
|
2648
3161
|
user_agent: W3C_Unicorn/1.0 (http://validator.w3.org/services)
|
|
2649
3162
|
bot:
|
|
2650
3163
|
name: W3C Unified Validator
|
|
@@ -2653,7 +3166,7 @@
|
|
|
2653
3166
|
producer:
|
|
2654
3167
|
name: W3C
|
|
2655
3168
|
url: http://www.w3.org
|
|
2656
|
-
-
|
|
3169
|
+
-
|
|
2657
3170
|
user_agent: Mozilla/5.0 (compatible; Wappalyzer; +https://github.com/AliasIO/Wappalyzer)
|
|
2658
3171
|
bot:
|
|
2659
3172
|
name: Wappalyzer
|
|
@@ -2661,7 +3174,7 @@
|
|
|
2661
3174
|
producer:
|
|
2662
3175
|
name: AliasIO
|
|
2663
3176
|
url: https://github.com/AliasIO
|
|
2664
|
-
-
|
|
3177
|
+
-
|
|
2665
3178
|
user_agent: WeSEE:Search/0.1 (Alpha, http://www.wesee.com/en/support/bot/)
|
|
2666
3179
|
bot:
|
|
2667
3180
|
name: WeSEE:Search
|
|
@@ -2670,13 +3183,13 @@
|
|
|
2670
3183
|
producer:
|
|
2671
3184
|
name: WeSEE Ltd
|
|
2672
3185
|
url: http://www.wesee.com
|
|
2673
|
-
-
|
|
3186
|
+
-
|
|
2674
3187
|
user_agent: Mozilla/5.0 (Linux; Android 6.0.1; Moto G (4) Build/MPJ24.139-64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/65.0.3325.146 Mobile Safari/537.36 PTST/180829.190838
|
|
2675
3188
|
bot:
|
|
2676
3189
|
name: WebPageTest
|
|
2677
3190
|
category: Site Monitor
|
|
2678
3191
|
url: https://www.webpagetest.org
|
|
2679
|
-
-
|
|
3192
|
+
-
|
|
2680
3193
|
user_agent: websitepulse checker/1.1 (compatible; MSIE 5.5; Netscape 4.75; Linux)
|
|
2681
3194
|
bot:
|
|
2682
3195
|
name: WebSitePulse
|
|
@@ -2685,7 +3198,7 @@
|
|
|
2685
3198
|
producer:
|
|
2686
3199
|
name: WebSitePulse
|
|
2687
3200
|
url: http://www.websitepulse.com/
|
|
2688
|
-
-
|
|
3201
|
+
-
|
|
2689
3202
|
user_agent: WebbCrawler 1.0 ( http://badcheese.com/crawler.html )
|
|
2690
3203
|
bot:
|
|
2691
3204
|
name: WebbCrawler
|
|
@@ -2694,16 +3207,52 @@
|
|
|
2694
3207
|
producer:
|
|
2695
3208
|
name: Steve Webb
|
|
2696
3209
|
url: http://badcheese.com
|
|
2697
|
-
-
|
|
2698
|
-
user_agent:
|
|
3210
|
+
-
|
|
3211
|
+
user_agent: weborama-fetcher (+http://www.weborama.com)
|
|
2699
3212
|
bot:
|
|
2700
|
-
name:
|
|
2701
|
-
category:
|
|
3213
|
+
name: Weborama
|
|
3214
|
+
category: Search bot
|
|
3215
|
+
url: https://weborama.com/
|
|
3216
|
+
producer:
|
|
3217
|
+
name: Weborama SA
|
|
3218
|
+
url: https://weborama.com/
|
|
3219
|
+
-
|
|
3220
|
+
user_agent: WikiDo/1.1 (http://wikido.com; crawler@wikido.com)
|
|
3221
|
+
bot:
|
|
3222
|
+
name: WikiDo
|
|
3223
|
+
category: Search bot
|
|
3224
|
+
url: https://www.wikido.com/
|
|
3225
|
+
producer:
|
|
3226
|
+
name: Fotolitografie Fiorentine di Becchi Antonio s.n.c.
|
|
3227
|
+
url: https://www.wikido.com/
|
|
3228
|
+
-
|
|
3229
|
+
user_agent: Mozilla/5.0 (compatible; woorankreview/2.0; +https://www.woorank.com/)
|
|
3230
|
+
bot:
|
|
3231
|
+
name: WooRank
|
|
3232
|
+
category: Search bot
|
|
3233
|
+
url: https://www.woorank.com/
|
|
3234
|
+
producer:
|
|
3235
|
+
name: WooRank sprl
|
|
3236
|
+
url: https://www.woorank.com/
|
|
3237
|
+
-
|
|
3238
|
+
user_agent: Mozilla/5.0 (iPhone; CPU iPhone OS 11_0 like Mac OS X) AppleWebKit/604.1.38 (KHTML, like Gecko) Version/11.0 Mobile/15A372 Safari/604.1 (compatible; woorankreview/2.0; +https://www.woorank.com/)
|
|
3239
|
+
bot:
|
|
3240
|
+
name: WooRank
|
|
3241
|
+
category: Search bot
|
|
3242
|
+
url: https://www.woorank.com/
|
|
3243
|
+
producer:
|
|
3244
|
+
name: WooRank sprl
|
|
3245
|
+
url: https://www.woorank.com/
|
|
3246
|
+
-
|
|
3247
|
+
user_agent: WordPress/4.7.2; https://example.com
|
|
3248
|
+
bot:
|
|
3249
|
+
name: WordPress
|
|
3250
|
+
category: Service Agent
|
|
2702
3251
|
url: https://wordpress.org/
|
|
2703
3252
|
producer:
|
|
2704
3253
|
name: Wordpress.org
|
|
2705
3254
|
url: https://wordpress.org/
|
|
2706
|
-
-
|
|
3255
|
+
-
|
|
2707
3256
|
user_agent: Wotbox/2.01 (+http://www.wotbox.com/bot/)
|
|
2708
3257
|
bot:
|
|
2709
3258
|
name: Wotbox
|
|
@@ -2712,7 +3261,16 @@
|
|
|
2712
3261
|
producer:
|
|
2713
3262
|
name: Wotbox
|
|
2714
3263
|
url: http://www.wotbox.com
|
|
2715
|
-
-
|
|
3264
|
+
-
|
|
3265
|
+
user_agent: XenForo/2.x (https://www.example.com)
|
|
3266
|
+
bot:
|
|
3267
|
+
name: XenForo
|
|
3268
|
+
category: Service Agent
|
|
3269
|
+
url: https://xenforo.com/
|
|
3270
|
+
producer:
|
|
3271
|
+
name: XenForo Ltd.
|
|
3272
|
+
url: https://xenforo.com/
|
|
3273
|
+
-
|
|
2716
3274
|
user_agent: yacybot (freeworld/global; amd64 Linux 3.2.0-4-amd64; java 1.7.0_25; Europe/en) http://yacy.net/bot.html
|
|
2717
3275
|
bot:
|
|
2718
3276
|
name: YaCy
|
|
@@ -2721,7 +3279,7 @@
|
|
|
2721
3279
|
producer:
|
|
2722
3280
|
name: YaCy
|
|
2723
3281
|
url: http://yacy.net
|
|
2724
|
-
-
|
|
3282
|
+
-
|
|
2725
3283
|
user_agent: yacybot (freeworld/global; x86 Windows XP 5.1; java 1.7.0_21; GMT+04:00/ru) http://yacy.net/bot.html
|
|
2726
3284
|
bot:
|
|
2727
3285
|
name: YaCy
|
|
@@ -2730,7 +3288,7 @@
|
|
|
2730
3288
|
producer:
|
|
2731
3289
|
name: YaCy
|
|
2732
3290
|
url: http://yacy.net
|
|
2733
|
-
-
|
|
3291
|
+
-
|
|
2734
3292
|
user_agent: Mozilla/5.0 (compatible; Yahoo Ad monitoring; https://help.yahoo.com/kb/yahoo-ad-monitoring-SLN24857.html)
|
|
2735
3293
|
bot:
|
|
2736
3294
|
name: Yahoo Gemini
|
|
@@ -2739,7 +3297,16 @@
|
|
|
2739
3297
|
producer:
|
|
2740
3298
|
name: Yahoo! Inc.
|
|
2741
3299
|
url: http://www.yahoo.com
|
|
2742
|
-
-
|
|
3300
|
+
-
|
|
3301
|
+
user_agent: Y!J-BRW/1.0 (https://www.yahoo-help.jp/app/answers/detail/p/595/a_id/42716)
|
|
3302
|
+
bot:
|
|
3303
|
+
name: Yahoo! Japan BRW
|
|
3304
|
+
category: Crawler
|
|
3305
|
+
url: https://www.yahoo-help.jp/app/answers/detail/p/595/a_id/42716/~/ウェブページにアクセスするシステムのユーザーエージェントについて
|
|
3306
|
+
producer:
|
|
3307
|
+
name: Yahoo! Japan Corp.
|
|
3308
|
+
url: https://www.yahoo.co.jp/
|
|
3309
|
+
-
|
|
2743
3310
|
user_agent: Mozilla/5.0 (compatible; Yahoo Link Preview; https://help.yahoo.com/kb/mail/yahoo-link-preview-SLN23615.html)
|
|
2744
3311
|
bot:
|
|
2745
3312
|
name: Yahoo! Link Preview
|
|
@@ -2748,7 +3315,7 @@
|
|
|
2748
3315
|
producer:
|
|
2749
3316
|
name: Yahoo! Inc.
|
|
2750
3317
|
url: http://www.yahoo.com
|
|
2751
|
-
-
|
|
3318
|
+
-
|
|
2752
3319
|
user_agent: Yahoo:LinkExpander:Slingstone
|
|
2753
3320
|
bot:
|
|
2754
3321
|
name: Yahoo! Link Preview
|
|
@@ -2757,7 +3324,7 @@
|
|
|
2757
3324
|
producer:
|
|
2758
3325
|
name: Yahoo! Inc.
|
|
2759
3326
|
url: http://www.yahoo.com
|
|
2760
|
-
-
|
|
3327
|
+
-
|
|
2761
3328
|
user_agent: Mozilla/5.0 (compatible; Yahoo! Slurp/3.0; http://help.yahoo.com/help/us/ysearch/slurp) NOT Firefox/3.5
|
|
2762
3329
|
bot:
|
|
2763
3330
|
name: Yahoo! Slurp
|
|
@@ -2766,7 +3333,7 @@
|
|
|
2766
3333
|
producer:
|
|
2767
3334
|
name: Yahoo! Inc.
|
|
2768
3335
|
url: http://www.yahoo.com
|
|
2769
|
-
-
|
|
3336
|
+
-
|
|
2770
3337
|
user_agent: Mozilla/5.0 (compatible; Yahoo! Slurp; http://help.yahoo.com/help/us/ysearch/slurp)
|
|
2771
3338
|
bot:
|
|
2772
3339
|
name: Yahoo! Slurp
|
|
@@ -2775,7 +3342,7 @@
|
|
|
2775
3342
|
producer:
|
|
2776
3343
|
name: Yahoo! Inc.
|
|
2777
3344
|
url: http://www.yahoo.com
|
|
2778
|
-
-
|
|
3345
|
+
-
|
|
2779
3346
|
user_agent: Mozilla/5.0 (compatible; Linux i686; Yandex.Gazeta Bot/1.0; +http://gazeta.yandex.ru)
|
|
2780
3347
|
bot:
|
|
2781
3348
|
name: Yandex Bot
|
|
@@ -2784,7 +3351,7 @@
|
|
|
2784
3351
|
producer:
|
|
2785
3352
|
name: Yandex LLC
|
|
2786
3353
|
url: http://company.yandex.com
|
|
2787
|
-
-
|
|
3354
|
+
-
|
|
2788
3355
|
user_agent: Mozilla/5.0 (compatible; YaDirectFetcher/1.0; +http://yandex.com/bots)
|
|
2789
3356
|
bot:
|
|
2790
3357
|
name: Yandex Bot
|
|
@@ -2793,7 +3360,7 @@
|
|
|
2793
3360
|
producer:
|
|
2794
3361
|
name: Yandex LLC
|
|
2795
3362
|
url: http://company.yandex.com
|
|
2796
|
-
-
|
|
3363
|
+
-
|
|
2797
3364
|
user_agent: Mozilla/5.0 (compatible; YandexAntivirus/2.0; +http://yandex.com/bots)
|
|
2798
3365
|
bot:
|
|
2799
3366
|
name: Yandex Bot
|
|
@@ -2802,7 +3369,7 @@
|
|
|
2802
3369
|
producer:
|
|
2803
3370
|
name: Yandex LLC
|
|
2804
3371
|
url: http://company.yandex.com
|
|
2805
|
-
-
|
|
3372
|
+
-
|
|
2806
3373
|
user_agent: Mozilla/5.0 (compatible; YandexAntivirus/2.0; +http://yandex.com/bots)
|
|
2807
3374
|
bot:
|
|
2808
3375
|
name: Yandex Bot
|
|
@@ -2811,7 +3378,7 @@
|
|
|
2811
3378
|
producer:
|
|
2812
3379
|
name: Yandex LLC
|
|
2813
3380
|
url: http://company.yandex.com
|
|
2814
|
-
-
|
|
3381
|
+
-
|
|
2815
3382
|
user_agent: Mozilla/5.0 (compatible; YandexBlogs/0.99; robot; B; +http://yandex.com/bots)
|
|
2816
3383
|
bot:
|
|
2817
3384
|
name: Yandex Bot
|
|
@@ -2820,7 +3387,7 @@
|
|
|
2820
3387
|
producer:
|
|
2821
3388
|
name: Yandex LLC
|
|
2822
3389
|
url: http://company.yandex.com
|
|
2823
|
-
-
|
|
3390
|
+
-
|
|
2824
3391
|
user_agent: Mozilla/5.0 (compatible; YandexBlogs/0.99; robot; B; +http://yandex.com/bots)
|
|
2825
3392
|
bot:
|
|
2826
3393
|
name: Yandex Bot
|
|
@@ -2829,7 +3396,7 @@
|
|
|
2829
3396
|
producer:
|
|
2830
3397
|
name: Yandex LLC
|
|
2831
3398
|
url: http://company.yandex.com
|
|
2832
|
-
-
|
|
3399
|
+
-
|
|
2833
3400
|
user_agent: Mozilla/5.0 (compatible; YandexBot/3.0; +http://yandex.com/bots)
|
|
2834
3401
|
bot:
|
|
2835
3402
|
name: Yandex Bot
|
|
@@ -2838,7 +3405,7 @@
|
|
|
2838
3405
|
producer:
|
|
2839
3406
|
name: Yandex LLC
|
|
2840
3407
|
url: http://company.yandex.com
|
|
2841
|
-
-
|
|
3408
|
+
-
|
|
2842
3409
|
user_agent: Mozilla/5.0 (compatible; YandexDirect/3.0; +http://yandex.com/bots)
|
|
2843
3410
|
bot:
|
|
2844
3411
|
name: Yandex Bot
|
|
@@ -2847,7 +3414,7 @@
|
|
|
2847
3414
|
producer:
|
|
2848
3415
|
name: Yandex LLC
|
|
2849
3416
|
url: http://company.yandex.com
|
|
2850
|
-
-
|
|
3417
|
+
-
|
|
2851
3418
|
user_agent: Mozilla/5.0 (compatible; YandexFavicons/1.0; +http://yandex.com/bots)
|
|
2852
3419
|
bot:
|
|
2853
3420
|
name: Yandex Bot
|
|
@@ -2856,7 +3423,7 @@
|
|
|
2856
3423
|
producer:
|
|
2857
3424
|
name: Yandex LLC
|
|
2858
3425
|
url: http://company.yandex.com
|
|
2859
|
-
-
|
|
3426
|
+
-
|
|
2860
3427
|
user_agent: Mozilla/5.0 (compatible; YandexImageResizer/2.0; +http://yandex.com/bots)
|
|
2861
3428
|
bot:
|
|
2862
3429
|
name: Yandex Bot
|
|
@@ -2865,7 +3432,7 @@
|
|
|
2865
3432
|
producer:
|
|
2866
3433
|
name: Yandex LLC
|
|
2867
3434
|
url: http://company.yandex.com
|
|
2868
|
-
-
|
|
3435
|
+
-
|
|
2869
3436
|
user_agent: Mozilla/5.0 (compatible; YandexImages/3.0; +http://yandex.com/bots)
|
|
2870
3437
|
bot:
|
|
2871
3438
|
name: Yandex Bot
|
|
@@ -2874,7 +3441,7 @@
|
|
|
2874
3441
|
producer:
|
|
2875
3442
|
name: Yandex LLC
|
|
2876
3443
|
url: http://company.yandex.com
|
|
2877
|
-
-
|
|
3444
|
+
-
|
|
2878
3445
|
user_agent: Mozilla/5.0 (compatible; YandexMetrika/2.0; +http://yandex.com/bots)
|
|
2879
3446
|
bot:
|
|
2880
3447
|
name: Yandex Bot
|
|
@@ -2883,7 +3450,16 @@
|
|
|
2883
3450
|
producer:
|
|
2884
3451
|
name: Yandex LLC
|
|
2885
3452
|
url: http://company.yandex.com
|
|
2886
|
-
-
|
|
3453
|
+
-
|
|
3454
|
+
user_agent: Mozilla/5.0 (compatible; YandexMobileScreenShotBot/1.0; +http://yandex.com/bots)
|
|
3455
|
+
bot:
|
|
3456
|
+
name: Yandex Bot
|
|
3457
|
+
category: Search bot
|
|
3458
|
+
url: http://www.yandex.com/bots
|
|
3459
|
+
producer:
|
|
3460
|
+
name: Yandex LLC
|
|
3461
|
+
url: http://company.yandex.com
|
|
3462
|
+
-
|
|
2887
3463
|
user_agent: Mozilla/5.0 (compatible; YandexNews/3.0; +http://yandex.com/bots)
|
|
2888
3464
|
bot:
|
|
2889
3465
|
name: Yandex Bot
|
|
@@ -2892,7 +3468,7 @@
|
|
|
2892
3468
|
producer:
|
|
2893
3469
|
name: Yandex LLC
|
|
2894
3470
|
url: http://company.yandex.com
|
|
2895
|
-
-
|
|
3471
|
+
-
|
|
2896
3472
|
user_agent: Mozilla/5.0 (compatible; YandexNewslinks; +http://yandex.com/bots)
|
|
2897
3473
|
bot:
|
|
2898
3474
|
name: Yandex Bot
|
|
@@ -2901,7 +3477,70 @@
|
|
|
2901
3477
|
producer:
|
|
2902
3478
|
name: Yandex LLC
|
|
2903
3479
|
url: http://company.yandex.com
|
|
2904
|
-
-
|
|
3480
|
+
-
|
|
3481
|
+
user_agent: Mozilla/5.0 (compatible; YandexOntoDB/1.0; +http://yandex.com/bots)
|
|
3482
|
+
bot:
|
|
3483
|
+
name: Yandex Bot
|
|
3484
|
+
category: Search bot
|
|
3485
|
+
url: http://www.yandex.com/bots
|
|
3486
|
+
producer:
|
|
3487
|
+
name: Yandex LLC
|
|
3488
|
+
url: http://company.yandex.com
|
|
3489
|
+
-
|
|
3490
|
+
user_agent: Mozilla/5.0 (compatible; YandexOntoDBAPI/1.0; +http://yandex.com/bots)
|
|
3491
|
+
bot:
|
|
3492
|
+
name: Yandex Bot
|
|
3493
|
+
category: Search bot
|
|
3494
|
+
url: http://www.yandex.com/bots
|
|
3495
|
+
producer:
|
|
3496
|
+
name: Yandex LLC
|
|
3497
|
+
url: http://company.yandex.com
|
|
3498
|
+
-
|
|
3499
|
+
user_agent: Mozilla/5.0 (compatible; YandexPartner/3.0; +http://yandex.com/bots)
|
|
3500
|
+
bot:
|
|
3501
|
+
name: Yandex Bot
|
|
3502
|
+
category: Search bot
|
|
3503
|
+
url: http://www.yandex.com/bots
|
|
3504
|
+
producer:
|
|
3505
|
+
name: Yandex LLC
|
|
3506
|
+
url: http://company.yandex.com
|
|
3507
|
+
-
|
|
3508
|
+
user_agent: Mozilla/5.0 (compatible; YandexRCA/1.0; +http://yandex.com/bots)
|
|
3509
|
+
bot:
|
|
3510
|
+
name: Yandex Bot
|
|
3511
|
+
category: Search bot
|
|
3512
|
+
url: http://www.yandex.com/bots
|
|
3513
|
+
producer:
|
|
3514
|
+
name: Yandex LLC
|
|
3515
|
+
url: http://company.yandex.com
|
|
3516
|
+
-
|
|
3517
|
+
user_agent: Mozilla/5.0 (compatible; YandexSearchShop/1.0; +http://yandex.com/bots)
|
|
3518
|
+
bot:
|
|
3519
|
+
name: Yandex Bot
|
|
3520
|
+
category: Search bot
|
|
3521
|
+
url: http://www.yandex.com/bots
|
|
3522
|
+
producer:
|
|
3523
|
+
name: Yandex LLC
|
|
3524
|
+
url: http://company.yandex.com
|
|
3525
|
+
-
|
|
3526
|
+
user_agent: Mozilla/5.0 (compatible; YandexTracker/1.0; +http://yandex.com/bots)
|
|
3527
|
+
bot:
|
|
3528
|
+
name: Yandex Bot
|
|
3529
|
+
category: Search bot
|
|
3530
|
+
url: http://www.yandex.com/bots
|
|
3531
|
+
producer:
|
|
3532
|
+
name: Yandex LLC
|
|
3533
|
+
url: http://company.yandex.com
|
|
3534
|
+
-
|
|
3535
|
+
user_agent: Mozilla/5.0 (compatible; YandexTurbo/1.0; +http://yandex.com/bots)
|
|
3536
|
+
bot:
|
|
3537
|
+
name: Yandex Bot
|
|
3538
|
+
category: Search bot
|
|
3539
|
+
url: http://www.yandex.com/bots
|
|
3540
|
+
producer:
|
|
3541
|
+
name: Yandex LLC
|
|
3542
|
+
url: http://company.yandex.com
|
|
3543
|
+
-
|
|
2905
3544
|
user_agent: Mozilla/5.0 (compatible; YandexVerticals/1.0; http://yandex.com/bots)
|
|
2906
3545
|
bot:
|
|
2907
3546
|
name: Yandex Bot
|
|
@@ -2910,7 +3549,16 @@
|
|
|
2910
3549
|
producer:
|
|
2911
3550
|
name: Yandex LLC
|
|
2912
3551
|
url: http://company.yandex.com
|
|
2913
|
-
-
|
|
3552
|
+
-
|
|
3553
|
+
user_agent: Mozilla/5.0 (compatible; NaverJapan/1.0; +http://corp.naver.jp/)
|
|
3554
|
+
bot:
|
|
3555
|
+
name: Yeti/Naverbot
|
|
3556
|
+
category: Search bot
|
|
3557
|
+
url: http://help.naver.com/robots/
|
|
3558
|
+
producer:
|
|
3559
|
+
name: Naver
|
|
3560
|
+
url: http://www.naver.com
|
|
3561
|
+
-
|
|
2914
3562
|
user_agent: Yeti/1.1 (Naver Corp.; http://help.naver.com/robots/)
|
|
2915
3563
|
bot:
|
|
2916
3564
|
name: Yeti/Naverbot
|
|
@@ -2919,7 +3567,7 @@
|
|
|
2919
3567
|
producer:
|
|
2920
3568
|
name: Naver
|
|
2921
3569
|
url: http://www.naver.com
|
|
2922
|
-
-
|
|
3570
|
+
-
|
|
2923
3571
|
user_agent: Mozilla/5.0 (compatible; YoudaoBot/1.0; http://www.youdao.com/help/webmaster/spider/; )
|
|
2924
3572
|
bot:
|
|
2925
3573
|
name: Youdao Bot
|
|
@@ -2928,13 +3576,13 @@
|
|
|
2928
3576
|
producer:
|
|
2929
3577
|
name: NetEase, Inc.
|
|
2930
3578
|
url: http://corp.163.com
|
|
2931
|
-
-
|
|
3579
|
+
-
|
|
2932
3580
|
user_agent: YOURLS v1.5.1 +http://yourls.org/ (running on http://fhort.com)
|
|
2933
3581
|
bot:
|
|
2934
3582
|
name: Yourls
|
|
2935
3583
|
category: Crawler
|
|
2936
3584
|
url: http://yourls.org
|
|
2937
|
-
-
|
|
3585
|
+
-
|
|
2938
3586
|
user_agent: Mozilla/5.0 (compatible; YRSpider; +http://www.yunrang.com/yrspider.html)
|
|
2939
3587
|
bot:
|
|
2940
3588
|
name: Yunyun Bot
|
|
@@ -2943,7 +3591,7 @@
|
|
|
2943
3591
|
producer:
|
|
2944
3592
|
name: YunYun
|
|
2945
3593
|
url: http://www.yunyun.com
|
|
2946
|
-
-
|
|
3594
|
+
-
|
|
2947
3595
|
user_agent: Mozilla/5.0 (compatible; YRSpider; +http://www.yunyun.com/SiteInfo.php?r=about)
|
|
2948
3596
|
bot:
|
|
2949
3597
|
name: Yunyun Bot
|
|
@@ -2952,7 +3600,7 @@
|
|
|
2952
3600
|
producer:
|
|
2953
3601
|
name: YunYun
|
|
2954
3602
|
url: http://www.yunyun.com
|
|
2955
|
-
-
|
|
3603
|
+
-
|
|
2956
3604
|
user_agent: Mozilla/5.0 (compatible; YYSpider; +http://www.yunyun.com/spider.html)
|
|
2957
3605
|
bot:
|
|
2958
3606
|
name: Yunyun Bot
|
|
@@ -2961,12 +3609,21 @@
|
|
|
2961
3609
|
producer:
|
|
2962
3610
|
name: YunYun
|
|
2963
3611
|
url: http://www.yunyun.com
|
|
2964
|
-
-
|
|
3612
|
+
-
|
|
2965
3613
|
user_agent: Zao/0.1 (http://www.kototol.org/zao)
|
|
2966
3614
|
bot:
|
|
2967
3615
|
name: Zao
|
|
2968
3616
|
category: Crawler
|
|
2969
|
-
-
|
|
3617
|
+
-
|
|
3618
|
+
user_agent: zelist.ro feed parser (+http://www.zelist.ro)
|
|
3619
|
+
bot:
|
|
3620
|
+
name: Ze List
|
|
3621
|
+
url: https://www.zelist.ro/
|
|
3622
|
+
category: Feed Fetcher
|
|
3623
|
+
producer:
|
|
3624
|
+
name: Treeworks SRL
|
|
3625
|
+
url: https://www.tree.ro/
|
|
3626
|
+
-
|
|
2970
3627
|
user_agent: Zookabot/2.5;++http://zookabot.com
|
|
2971
3628
|
bot:
|
|
2972
3629
|
name: Zookabot
|
|
@@ -2975,7 +3632,7 @@
|
|
|
2975
3632
|
producer:
|
|
2976
3633
|
name: Hwacha ApS
|
|
2977
3634
|
url: http://hwacha.dk
|
|
2978
|
-
-
|
|
3635
|
+
-
|
|
2979
3636
|
user_agent: Mozilla/5.0 (compatible; ZumBot/1.0; http://help.zum.com/inquiry)
|
|
2980
3637
|
bot:
|
|
2981
3638
|
name: ZumBot
|
|
@@ -2984,7 +3641,7 @@
|
|
|
2984
3641
|
producer:
|
|
2985
3642
|
name: ZUM internet
|
|
2986
3643
|
url: http://www.zuminternet.com/
|
|
2987
|
-
-
|
|
3644
|
+
-
|
|
2988
3645
|
user_agent: ZumBot/1.0 (ZUM Search; http://help.zum.com/inquiry)
|
|
2989
3646
|
bot:
|
|
2990
3647
|
name: ZumBot
|
|
@@ -2993,106 +3650,106 @@
|
|
|
2993
3650
|
producer:
|
|
2994
3651
|
name: ZUM internet
|
|
2995
3652
|
url: http://www.zuminternet.com/
|
|
2996
|
-
-
|
|
3653
|
+
-
|
|
2997
3654
|
user_agent: AhrefsBot.Feeds v0.1; http://ahrefs.com/
|
|
2998
3655
|
bot:
|
|
2999
3656
|
name: aHrefs Bot
|
|
3000
3657
|
category: Crawler
|
|
3001
|
-
url:
|
|
3658
|
+
url: https://ahrefs.com/robot
|
|
3002
3659
|
producer:
|
|
3003
3660
|
name: Ahrefs Pte Ltd
|
|
3004
|
-
url:
|
|
3005
|
-
-
|
|
3661
|
+
url: https://ahrefs.com/robot
|
|
3662
|
+
-
|
|
3006
3663
|
user_agent: Mozilla/5.0 (compatible; AhrefsBot/3.1; +http://ahrefs.com/robot/
|
|
3007
3664
|
bot:
|
|
3008
3665
|
name: aHrefs Bot
|
|
3009
3666
|
category: Crawler
|
|
3010
|
-
url:
|
|
3667
|
+
url: https://ahrefs.com/robot
|
|
3011
3668
|
producer:
|
|
3012
3669
|
name: Ahrefs Pte Ltd
|
|
3013
|
-
url:
|
|
3014
|
-
-
|
|
3670
|
+
url: https://ahrefs.com/robot
|
|
3671
|
+
-
|
|
3015
3672
|
user_agent: Mozilla/5.0 (compatible; AhrefsBot/5.0; +http://ahrefs.com/robot/)
|
|
3016
3673
|
bot:
|
|
3017
3674
|
name: aHrefs Bot
|
|
3018
3675
|
category: Crawler
|
|
3019
|
-
url:
|
|
3676
|
+
url: https://ahrefs.com/robot
|
|
3020
3677
|
producer:
|
|
3021
3678
|
name: Ahrefs Pte Ltd
|
|
3022
|
-
url:
|
|
3023
|
-
-
|
|
3679
|
+
url: https://ahrefs.com/robot
|
|
3680
|
+
-
|
|
3024
3681
|
user_agent: 'Mozilla/5.0 (compatible; AhrefsBot/5.0; +http://ahrefs.com/robot/) AppEngine-Google; (+http://code.google.com/appengine; appid: s~proxyfile1-hrd)'
|
|
3025
3682
|
bot:
|
|
3026
3683
|
name: aHrefs Bot
|
|
3027
3684
|
category: Crawler
|
|
3028
|
-
url:
|
|
3685
|
+
url: https://ahrefs.com/robot
|
|
3029
3686
|
producer:
|
|
3030
3687
|
name: Ahrefs Pte Ltd
|
|
3031
|
-
url:
|
|
3032
|
-
-
|
|
3688
|
+
url: https://ahrefs.com/robot
|
|
3689
|
+
-
|
|
3033
3690
|
user_agent: Mozilla/5.0 (compatible; archive.org_bot +http://www.archive.org/details/archive.org_bot)
|
|
3034
3691
|
bot:
|
|
3035
3692
|
name: archive.org bot
|
|
3036
3693
|
category: Crawler
|
|
3037
|
-
url:
|
|
3694
|
+
url: https://archive.org/details/archive.org_bot
|
|
3038
3695
|
producer:
|
|
3039
3696
|
name: The Internet Archive
|
|
3040
|
-
url:
|
|
3041
|
-
-
|
|
3697
|
+
url: https://archive.org
|
|
3698
|
+
-
|
|
3042
3699
|
user_agent: Mozilla/5.0 (compatible; archive.org_bot/3.3.0 +http://pandora.nla.gov.au/crawl.html)
|
|
3043
3700
|
bot:
|
|
3044
3701
|
name: archive.org bot
|
|
3045
3702
|
category: Crawler
|
|
3046
|
-
url:
|
|
3703
|
+
url: https://archive.org/details/archive.org_bot
|
|
3047
3704
|
producer:
|
|
3048
3705
|
name: The Internet Archive
|
|
3049
|
-
url:
|
|
3050
|
-
-
|
|
3706
|
+
url: https://archive.org
|
|
3707
|
+
-
|
|
3051
3708
|
user_agent: Mozilla/5.0 (compatible; archive.org_bot; Archive-It; +http://archive-it.org/files/site-owners.html)
|
|
3052
3709
|
bot:
|
|
3053
3710
|
name: archive.org bot
|
|
3054
3711
|
category: Crawler
|
|
3055
|
-
url:
|
|
3712
|
+
url: https://archive.org/details/archive.org_bot
|
|
3056
3713
|
producer:
|
|
3057
3714
|
name: The Internet Archive
|
|
3058
|
-
url:
|
|
3059
|
-
-
|
|
3715
|
+
url: https://archive.org
|
|
3716
|
+
-
|
|
3060
3717
|
user_agent: Mozilla/5.0 (compatible; archive.org_bot; Wayback Machine Live Record; +http://archive.org/details/archive.org_bot)
|
|
3061
3718
|
bot:
|
|
3062
3719
|
name: archive.org bot
|
|
3063
3720
|
category: Crawler
|
|
3064
|
-
url:
|
|
3721
|
+
url: https://archive.org/details/archive.org_bot
|
|
3065
3722
|
producer:
|
|
3066
3723
|
name: The Internet Archive
|
|
3067
|
-
url:
|
|
3068
|
-
-
|
|
3724
|
+
url: https://archive.org
|
|
3725
|
+
-
|
|
3069
3726
|
user_agent: Mozilla/5.0 (compatible; heritrix/3.1.2-SNAPSHOT-20131029-0036 +http://archive.org/details/archive.org_bot)
|
|
3070
3727
|
bot:
|
|
3071
3728
|
name: archive.org bot
|
|
3072
3729
|
category: Crawler
|
|
3073
|
-
url:
|
|
3730
|
+
url: https://archive.org/details/archive.org_bot
|
|
3074
3731
|
producer:
|
|
3075
3732
|
name: The Internet Archive
|
|
3076
|
-
url:
|
|
3077
|
-
-
|
|
3733
|
+
url: https://archive.org
|
|
3734
|
+
-
|
|
3078
3735
|
user_agent: Mozilla/5.0 (compatible; special_archiver/3.1.1 +http://www.archive.org/details/archive.org_bot)
|
|
3079
3736
|
bot:
|
|
3080
3737
|
name: archive.org bot
|
|
3081
3738
|
category: Crawler
|
|
3082
|
-
url:
|
|
3739
|
+
url: https://archive.org/details/archive.org_bot
|
|
3083
3740
|
producer:
|
|
3084
3741
|
name: The Internet Archive
|
|
3085
|
-
url:
|
|
3086
|
-
-
|
|
3742
|
+
url: https://archive.org
|
|
3743
|
+
-
|
|
3087
3744
|
user_agent: Mozilla/5.0 (compatible; special_archiver/3.2.0 +http://www.loc.gov/webarchiving/notice_to_webmasters.html)
|
|
3088
3745
|
bot:
|
|
3089
3746
|
name: archive.org bot
|
|
3090
3747
|
category: Crawler
|
|
3091
|
-
url:
|
|
3748
|
+
url: https://archive.org/details/archive.org_bot
|
|
3092
3749
|
producer:
|
|
3093
3750
|
name: The Internet Archive
|
|
3094
|
-
url:
|
|
3095
|
-
-
|
|
3751
|
+
url: https://archive.org
|
|
3752
|
+
-
|
|
3096
3753
|
user_agent: CCBot/2.0 (http://commoncrawl.org/faq/)
|
|
3097
3754
|
bot:
|
|
3098
3755
|
name: ccBot crawler
|
|
@@ -3101,7 +3758,24 @@
|
|
|
3101
3758
|
producer:
|
|
3102
3759
|
name: reddit inc.
|
|
3103
3760
|
url: http://www.reddit.com
|
|
3104
|
-
-
|
|
3761
|
+
-
|
|
3762
|
+
user_agent: Mozilla/5.0 eCairn-Grabber/1.0 (+http://ecairn.com/grabber)
|
|
3763
|
+
bot:
|
|
3764
|
+
name: eCairn-Grabber
|
|
3765
|
+
category: Crawler
|
|
3766
|
+
producer:
|
|
3767
|
+
name: eCairn
|
|
3768
|
+
url: https://ecairn.com
|
|
3769
|
+
-
|
|
3770
|
+
user_agent: eZ Publish Link Validator
|
|
3771
|
+
bot:
|
|
3772
|
+
name: eZ Publish Link Validator
|
|
3773
|
+
category: Crawler
|
|
3774
|
+
url: https://ez.no/
|
|
3775
|
+
producer:
|
|
3776
|
+
name: eZ Systems AS
|
|
3777
|
+
url: https://ez.no/
|
|
3778
|
+
-
|
|
3105
3779
|
user_agent: Mozilla/5.0 (compatible; evc-batch/2.0)
|
|
3106
3780
|
bot:
|
|
3107
3781
|
name: evc-batch
|
|
@@ -3110,7 +3784,13 @@
|
|
|
3110
3784
|
producer:
|
|
3111
3785
|
name: eVenture Capital Partners II, LLC
|
|
3112
3786
|
url: http://www.eventures.vc/
|
|
3113
|
-
-
|
|
3787
|
+
-
|
|
3788
|
+
user_agent: Mozilla/5.0 (compatible; inoreader.com; 2 subscribers)
|
|
3789
|
+
bot:
|
|
3790
|
+
name: inoreader
|
|
3791
|
+
category: Feed Reader
|
|
3792
|
+
url: https://www.inoreader.com
|
|
3793
|
+
-
|
|
3114
3794
|
user_agent: masscan/1.0 (https://github.com/robertdavidgraham/masscan)
|
|
3115
3795
|
bot:
|
|
3116
3796
|
name: masscan
|
|
@@ -3119,7 +3799,21 @@
|
|
|
3119
3799
|
producer:
|
|
3120
3800
|
name: Robert Graham
|
|
3121
3801
|
url: https://github.com/robertdavidgraham
|
|
3122
|
-
-
|
|
3802
|
+
-
|
|
3803
|
+
user_agent: 'Mozilla/5.0/Firefox/42.0 - nbertaupete95(at)gmail.com'
|
|
3804
|
+
bot:
|
|
3805
|
+
name: nbertaupete95
|
|
3806
|
+
category: Crawler
|
|
3807
|
+
-
|
|
3808
|
+
user_agent: Mozilla/5.0 (compatible; oBot/2.3.1; http://www.xforce-security.com/crawler/)
|
|
3809
|
+
bot:
|
|
3810
|
+
name: oBot
|
|
3811
|
+
category: Search bot
|
|
3812
|
+
url: https://www.xforce-security.com/crawler/
|
|
3813
|
+
producer:
|
|
3814
|
+
name: 'IBM Germany Research & Development GmbH'
|
|
3815
|
+
url: https://exchange.xforce.ibmcloud.com/
|
|
3816
|
+
-
|
|
3123
3817
|
user_agent: 'sqlmap/1.1.8.2#dev (http://sqlmap.org)'
|
|
3124
3818
|
bot:
|
|
3125
3819
|
name: sqlmap
|
|
@@ -3128,16 +3822,613 @@
|
|
|
3128
3822
|
producer:
|
|
3129
3823
|
name: sqlmap
|
|
3130
3824
|
url: http://sqlmap.org/
|
|
3131
|
-
-
|
|
3132
|
-
user_agent: Mozilla/5.0
|
|
3825
|
+
-
|
|
3826
|
+
user_agent: Mozilla/5.0 (compatible; theoldreader.com; 1 subscribers; feed-id=aaa)
|
|
3827
|
+
bot:
|
|
3828
|
+
name: theoldreader
|
|
3829
|
+
category: Feed Reader
|
|
3830
|
+
url: https://theoldreader.com
|
|
3831
|
+
-
|
|
3832
|
+
user_agent: Sprinklr 2.0
|
|
3133
3833
|
bot:
|
|
3134
|
-
name:
|
|
3834
|
+
name: Sprinklr
|
|
3835
|
+
category: Crawler
|
|
3836
|
+
url: ""
|
|
3837
|
+
producer:
|
|
3838
|
+
name: Sprinklr, Inc.
|
|
3839
|
+
url: https://www.sprinklr.com/
|
|
3840
|
+
-
|
|
3841
|
+
user_agent: Mozilla/5.0 (X11; Linux x86_64)AppleWebKit/537.36 (KHTML, like Gecko; Google-Ads-Qualify)Chrome/85.0.4183.140 Safari/537.36
|
|
3842
|
+
bot:
|
|
3843
|
+
name: Googlebot
|
|
3844
|
+
category: Search bot
|
|
3845
|
+
url: http://www.google.com/bot.html
|
|
3846
|
+
producer:
|
|
3847
|
+
name: Google Inc.
|
|
3848
|
+
url: http://www.google.com
|
|
3849
|
+
-
|
|
3850
|
+
user_agent: Mozilla/5.0 (Windows NT 10.0; Win64; x64; BDCbot/1.0; +http://bigweb.bigdatacorp.com.br/faq.aspx) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/69.0.3497.100 Safari/537.36
|
|
3851
|
+
bot:
|
|
3852
|
+
name: BDCbot
|
|
3853
|
+
category: Crawler
|
|
3854
|
+
url: https://bigweb.bigdatacorp.com.br/pages/faq.aspx
|
|
3855
|
+
producer:
|
|
3856
|
+
name: BIG Data Solucoes Em Tecnologia de Informatica LTDA
|
|
3857
|
+
url: https://bigdatacorp.com.br/
|
|
3858
|
+
-
|
|
3859
|
+
user_agent: Mozilla/5.0 (Macintosh; Intel Mac OS X 10_13_6) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/67.0.3396.99 Safari/537.36 CloudflareDiagnostics/1.0
|
|
3860
|
+
bot:
|
|
3861
|
+
name: Cloudflare Diagnostics
|
|
3862
|
+
category: Site Monitor
|
|
3863
|
+
url: https://www.cloudflare.com/
|
|
3864
|
+
producer:
|
|
3865
|
+
name: Cloudflare
|
|
3866
|
+
url: https://www.cloudflare.com
|
|
3867
|
+
-
|
|
3868
|
+
user_agent: Mozilla/5.0 (iPhone; CPU iPhone OS 12_0 like Mac OS X) adbeat.com/policy AppleWebKit/605.1.15 (KHTML, like Gecko) CriOS/69.0.3497.105 Mobile/15E148 Safari/605.1
|
|
3869
|
+
bot:
|
|
3870
|
+
name: Adbeat
|
|
3871
|
+
category: Crawler
|
|
3872
|
+
url: https://www.adbeat.com/operation_policy
|
|
3873
|
+
producer:
|
|
3874
|
+
name: PPC Labs LLC
|
|
3875
|
+
url: https://www.adbeat.com/
|
|
3876
|
+
-
|
|
3877
|
+
user_agent: Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko; compatible; BW/1.1; bit.ly/2W6Px8S) Chrome/84.0.4147.105 Safari/537.36
|
|
3878
|
+
bot:
|
|
3879
|
+
name: BuiltWith
|
|
3880
|
+
category: Crawler
|
|
3881
|
+
url: https://builtwith.com/biup
|
|
3882
|
+
producer:
|
|
3883
|
+
name: BuiltWith Pty Ltd
|
|
3884
|
+
url: https://builtwith.com/
|
|
3885
|
+
-
|
|
3886
|
+
user_agent: Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/60.0.3112.113 Safari/537.36 (+https://whatis.contentkingapp.com)
|
|
3887
|
+
bot:
|
|
3888
|
+
name: ContentKing
|
|
3889
|
+
category: Site Monitor
|
|
3890
|
+
url: https://whatis.contentkingapp.com/
|
|
3891
|
+
producer:
|
|
3892
|
+
name: ContentKing BV
|
|
3893
|
+
url: https://www.contentkingapp.com/
|
|
3894
|
+
-
|
|
3895
|
+
user_agent: Mozilla/5.0 (Windows NT 6.1; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/84.0.4147.89 Safari/537.36 MicroAdBot/1.1 (https://www.microad.co.jp/contact/)
|
|
3896
|
+
bot:
|
|
3897
|
+
name: MicroAdBot
|
|
3898
|
+
category: Crawler
|
|
3899
|
+
url: https://www.microad.co.jp/
|
|
3900
|
+
producer:
|
|
3901
|
+
name: MicroAd, Inc.
|
|
3902
|
+
url: https://www.microad.co.jp/
|
|
3903
|
+
-
|
|
3904
|
+
user_agent: Mozilla/5.0 (compatible; PingAdmin.Ru/1.2; +http://pingadmin.ru/free_test/)
|
|
3905
|
+
bot:
|
|
3906
|
+
name: PingAdmin.Ru
|
|
3907
|
+
category: Site Monitor
|
|
3908
|
+
url: https://ping-admin.ru/
|
|
3909
|
+
-
|
|
3910
|
+
user_agent: Mozilla/5.0 (compatible; WebDataStats/1.0 ; +https://webdatastats.com/policy.html)
|
|
3911
|
+
bot:
|
|
3912
|
+
name: WebDataStats
|
|
3913
|
+
category: Crawler
|
|
3914
|
+
url: https://webdatastats.com/policy.html
|
|
3915
|
+
producer:
|
|
3916
|
+
name: WebTehRazrabotka LLC
|
|
3917
|
+
url: https://webdatastats.com/
|
|
3918
|
+
-
|
|
3919
|
+
user_agent: Mozilla/5.0 (compatible; parse.ly scraper/0.14; +http://parsely.com)
|
|
3920
|
+
bot:
|
|
3921
|
+
name: parse.ly
|
|
3922
|
+
category: Crawler
|
|
3923
|
+
url: https://www.parse.ly/help/integration/crawler
|
|
3924
|
+
producer:
|
|
3925
|
+
name: Parsely, Inc.
|
|
3926
|
+
url: https://www.parse.ly/
|
|
3927
|
+
-
|
|
3928
|
+
user_agent: Mozilla/5.0 (compatible; Nimbostratus-Bot/v1.3.2; http://cloudsystemnetworks.com)
|
|
3929
|
+
bot:
|
|
3930
|
+
name: Nimbostratus Bot
|
|
3931
|
+
category: Site Monitor
|
|
3932
|
+
url: http://cloudsystemnetworks.com
|
|
3933
|
+
-
|
|
3934
|
+
user_agent: Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.9.2.17) Gecko/20110515 HeartRails_Capture/1.0.4 (+http://capture.heartrails.com/) Namoroka/3.6.17
|
|
3935
|
+
bot:
|
|
3936
|
+
name: Heart Rails Capture
|
|
3937
|
+
category: Service Agent
|
|
3938
|
+
url: http://capture.heartrails.com
|
|
3939
|
+
-
|
|
3940
|
+
user_agent: Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/43.0.2357.134 Safari/537.36 http://notifyninja.com/monitoring
|
|
3941
|
+
bot:
|
|
3942
|
+
name: Notify Ninja
|
|
3943
|
+
category: Site Monitor
|
|
3944
|
+
url: http://notifyninja.com
|
|
3945
|
+
-
|
|
3946
|
+
user_agent: Mozilla/5.0 (Macintosh; Intel Mac OS X 10_14_6) Project-Resonance (http://project-resonance.com/) (KHTML, like Gecko) Chrome/83.0.4103.61 Safari/537.36
|
|
3947
|
+
bot:
|
|
3948
|
+
name: Project Resonance
|
|
3949
|
+
category: Crawler
|
|
3950
|
+
url: http://project-resonance.com
|
|
3951
|
+
-
|
|
3952
|
+
user_agent: Mozilla/5.0 (compatible; DataXu/1.0; +http://dataxu.com)
|
|
3953
|
+
bot:
|
|
3954
|
+
name: DataXu
|
|
3955
|
+
category: Service Agent
|
|
3956
|
+
url: https://advertising.roku.com/dataxu
|
|
3957
|
+
producer:
|
|
3958
|
+
name: Roku, Inc.
|
|
3959
|
+
url: https://roku.com
|
|
3960
|
+
-
|
|
3961
|
+
user_agent: Mozilla/5.0 (Unknown; Linux x86_64) AppleWebKit/534.34 (KHTML, like Gecko) PingdomTMS/0.8.5 Safari/534.34
|
|
3962
|
+
bot:
|
|
3963
|
+
name: Pingdom Bot
|
|
3964
|
+
category: Site Monitor
|
|
3965
|
+
url: ""
|
|
3966
|
+
producer:
|
|
3967
|
+
name: Pingdom AB
|
|
3968
|
+
url: https://www.pingdom.com
|
|
3969
|
+
-
|
|
3970
|
+
user_agent: Mozilla/5.0 (compatible; Cocolyzebot/1.0; https://cocolyze.com/bot)
|
|
3971
|
+
bot:
|
|
3972
|
+
name: Cocolyzebot
|
|
3973
|
+
category: Crawler
|
|
3974
|
+
url: https://cocolyze.com/en/cocolyzebot
|
|
3975
|
+
producer:
|
|
3976
|
+
name: VSI INNOVATION SAS
|
|
3977
|
+
url: https://vsi-innovation.com/
|
|
3978
|
+
-
|
|
3979
|
+
user_agent: veryhip (http://veryhip.com/)
|
|
3980
|
+
bot:
|
|
3981
|
+
name: VeryHip
|
|
3982
|
+
category: Crawler
|
|
3983
|
+
url: https://veryhip.com/
|
|
3984
|
+
producer:
|
|
3985
|
+
name: VeryHip
|
|
3986
|
+
url: https://veryhip.com/
|
|
3987
|
+
-
|
|
3988
|
+
user_agent: Mozilla/5.0 (compatible; LinkpadBot/2.3; +http://linkpad.org/robot/)
|
|
3989
|
+
bot:
|
|
3990
|
+
name: LinkpadBot
|
|
3991
|
+
category: Crawler
|
|
3992
|
+
url: https://www.linkpad.org/
|
|
3993
|
+
producer:
|
|
3994
|
+
name: Solomono LLC
|
|
3995
|
+
url: https://www.linkpad.org/
|
|
3996
|
+
-
|
|
3997
|
+
user_agent: Mozilla/4.0 (compatible; MuscatFerret/1.7; http://www.webtop.com/)
|
|
3998
|
+
bot:
|
|
3999
|
+
name: MuscatFerret
|
|
4000
|
+
category: Crawler
|
|
4001
|
+
url: http://www.webtop.com/
|
|
4002
|
+
-
|
|
4003
|
+
user_agent: Quora-Bot/1.0 (http://www.quora.com)
|
|
4004
|
+
bot:
|
|
4005
|
+
name: Quora Bot
|
|
4006
|
+
category: Crawler
|
|
4007
|
+
url: ""
|
|
4008
|
+
producer:
|
|
4009
|
+
name: Quora
|
|
4010
|
+
url: https://www.quora.com/
|
|
4011
|
+
-
|
|
4012
|
+
user_agent: PageThing.com
|
|
4013
|
+
bot:
|
|
4014
|
+
name: PageThing
|
|
4015
|
+
category: Crawler
|
|
4016
|
+
url: https://www.pagething.com/
|
|
4017
|
+
producer:
|
|
4018
|
+
name: SPECIALNOISE LTD
|
|
4019
|
+
url: https://www.specialnoise.com/
|
|
4020
|
+
-
|
|
4021
|
+
user_agent: ArchiveBox/0.5.3 (+https://github.com/ArchiveBox/ArchiveBox/)
|
|
4022
|
+
bot:
|
|
4023
|
+
name: ArchiveBox
|
|
4024
|
+
url: https://archivebox.io/
|
|
4025
|
+
category: Crawler
|
|
4026
|
+
producer:
|
|
4027
|
+
name: ""
|
|
4028
|
+
url: ""
|
|
4029
|
+
-
|
|
4030
|
+
user_agent: Choosito/1.0 +http://www.choosito.com/
|
|
4031
|
+
bot:
|
|
4032
|
+
name: Choosito
|
|
4033
|
+
url: https://www.choosito.com/
|
|
4034
|
+
category: Crawler
|
|
4035
|
+
producer:
|
|
4036
|
+
name: Choosito! Inc.
|
|
4037
|
+
url: https://www.choosito.com/
|
|
4038
|
+
-
|
|
4039
|
+
user_agent: datagnionbot (+http://www.datagnion.com/bot.html)
|
|
4040
|
+
bot:
|
|
4041
|
+
name: datagnionbot
|
|
4042
|
+
url: https://www.datagnion.com/bot.html
|
|
4043
|
+
category: Crawler
|
|
4044
|
+
producer:
|
|
4045
|
+
name: DATAGNION GMBH
|
|
4046
|
+
url: https://www.datagnion.com/
|
|
4047
|
+
-
|
|
4048
|
+
user_agent: InterNaetBoten/0.99 (http://www.xn--internt-bxa.nu)
|
|
4049
|
+
bot:
|
|
4050
|
+
name: Generic Bot
|
|
4051
|
+
-
|
|
4052
|
+
user_agent: EasyBib AutoCite (http://autocite-info.citation-api.com/)
|
|
4053
|
+
bot:
|
|
4054
|
+
name: Generic Bot
|
|
4055
|
+
-
|
|
4056
|
+
user_agent: Bidtellect/0.0.643.0
|
|
4057
|
+
bot:
|
|
4058
|
+
name: Generic Bot
|
|
4059
|
+
-
|
|
4060
|
+
user_agent: Mozilla/5.0 (compatible; meg/0.2; +https://github.com/tomnomnom/meg)
|
|
4061
|
+
bot:
|
|
4062
|
+
name: Generic Bot
|
|
4063
|
+
-
|
|
4064
|
+
user_agent: Mozilla/5.0 (X11; Ubuntu; Linux x86_64; rv:66.0) WhatCMS/1.0
|
|
4065
|
+
bot:
|
|
4066
|
+
name: WhatCMS
|
|
4067
|
+
url: https://whatcms.org/
|
|
4068
|
+
category: Crawler
|
|
4069
|
+
producer:
|
|
4070
|
+
name: "Nineteen Ten LLC"
|
|
4071
|
+
url: "https://whatcms.org/"
|
|
4072
|
+
-
|
|
4073
|
+
user_agent: httpx - Open-source project (github.com/projectdiscovery/httpx)
|
|
4074
|
+
bot:
|
|
4075
|
+
name: httpx
|
|
4076
|
+
url: https://github.com/projectdiscovery/httpx
|
|
4077
|
+
category: Crawler
|
|
4078
|
+
producer:
|
|
4079
|
+
name: ""
|
|
4080
|
+
url: ""
|
|
4081
|
+
-
|
|
4082
|
+
user_agent: 'Expanse indexes the network perimeters of our customers. If you have any questions or concerns, please reach out to: scaninfo@expanseinc.com'
|
|
4083
|
+
bot:
|
|
4084
|
+
name: Expanse
|
|
3135
4085
|
category: Security Checker
|
|
3136
|
-
url: https://
|
|
3137
|
-
|
|
3138
|
-
|
|
4086
|
+
url: https://expanse.co/
|
|
4087
|
+
producer:
|
|
4088
|
+
name: Expanse Inc.
|
|
4089
|
+
url: https://expanse.co/
|
|
4090
|
+
-
|
|
4091
|
+
user_agent: 'HuaweiWebCatBot/6.0) (To acquire the allowed html pages as reliable information of URL categorization in the automatic process for Huawei Web Categorization.; https://isecurity.huawei.com/; sec at huawei dot com)'
|
|
3139
4092
|
bot:
|
|
3140
|
-
name:
|
|
4093
|
+
name: HuaweiWebCatBot
|
|
4094
|
+
category: Crawler
|
|
4095
|
+
url: https://isecurity.huawei.com
|
|
3141
4096
|
producer:
|
|
3142
|
-
name:
|
|
3143
|
-
url: https://
|
|
4097
|
+
name: Huawei Technologies Co., Ltd.
|
|
4098
|
+
url: https://huawei.com
|
|
4099
|
+
-
|
|
4100
|
+
user_agent: Mozilla/5.0 (compatible; SputnikFaviconBot/1.2; +http://corp.sputnik.ru/webmaster)
|
|
4101
|
+
bot:
|
|
4102
|
+
name: Sputnik Favicon Bot
|
|
4103
|
+
url: ""
|
|
4104
|
+
category: Crawler
|
|
4105
|
+
-
|
|
4106
|
+
user_agent: Hatena-Favicon2 (http://www.hatena.ne.jp/faq/)
|
|
4107
|
+
bot:
|
|
4108
|
+
name: Hatena Favicon
|
|
4109
|
+
category: Crawler
|
|
4110
|
+
url: https://www.hatena.ne.jp/faq/
|
|
4111
|
+
producer:
|
|
4112
|
+
name: Hatena Co., Ltd.
|
|
4113
|
+
url: https://www.hatena.ne.jp
|
|
4114
|
+
-
|
|
4115
|
+
user_agent: Mozilla/5.0 (compatible; RyowlEngine/1.0; +https://ryowl.org)
|
|
4116
|
+
bot:
|
|
4117
|
+
name: Ryowl
|
|
4118
|
+
category: Crawler
|
|
4119
|
+
url: https://ryowl.org
|
|
4120
|
+
-
|
|
4121
|
+
user_agent: Mozilla/5.0 (compatible; OdklBot/1.0 like Linux; klass@odnoklassniki.ru)
|
|
4122
|
+
bot:
|
|
4123
|
+
name: Odnoklassniki Bot
|
|
4124
|
+
category: Crawler
|
|
4125
|
+
url: https://odnoklassniki.ru
|
|
4126
|
+
-
|
|
4127
|
+
user_agent: Mediatoolkitbot (complaints@mediatoolkit.com)
|
|
4128
|
+
bot:
|
|
4129
|
+
name: Mediatoolkit Bot
|
|
4130
|
+
category: Crawler
|
|
4131
|
+
url: https://mediatoolkit.com
|
|
4132
|
+
-
|
|
4133
|
+
user_agent: ZoominfoBot (zoominfobot at zoominfo dot com)
|
|
4134
|
+
bot:
|
|
4135
|
+
name: ZoominfoBot
|
|
4136
|
+
category: Crawler
|
|
4137
|
+
url: https://www.zoominfo.com
|
|
4138
|
+
-
|
|
4139
|
+
user_agent: Mozilla/5.0 (compatible; WeViKaBot/1.0; +http://www.wevika.de/)
|
|
4140
|
+
bot:
|
|
4141
|
+
name: WeViKaBot
|
|
4142
|
+
category: Crawler
|
|
4143
|
+
url: http://www.wevika.de
|
|
4144
|
+
-
|
|
4145
|
+
user_agent: Mozilla/5.0 (compatible; SEOkicks; +https://www.seokicks.de/robot.html)
|
|
4146
|
+
bot:
|
|
4147
|
+
name: SEOkicks
|
|
4148
|
+
category: Crawler
|
|
4149
|
+
url: https://www.seokicks.de/robot.html
|
|
4150
|
+
-
|
|
4151
|
+
user_agent: Mozilla/5.0 (compatible; Plukkie/1.6; http://www.botje.com/plukkie.htm)
|
|
4152
|
+
bot:
|
|
4153
|
+
name: Plukkie
|
|
4154
|
+
category: Crawler
|
|
4155
|
+
url: http://www.botje.com/plukkie.htm
|
|
4156
|
+
-
|
|
4157
|
+
user_agent: Mozilla/5.0 (compatible; proximic; https://www.comscore.com/Web-Crawler)
|
|
4158
|
+
bot:
|
|
4159
|
+
name: Comscore
|
|
4160
|
+
category: Crawler
|
|
4161
|
+
url: https://www.comscore.com/Web-Crawler
|
|
4162
|
+
-
|
|
4163
|
+
user_agent: Mozilla/5.0 (compatible; SurdotlyBot/1.0; +http://sur.ly/bot.html)
|
|
4164
|
+
bot:
|
|
4165
|
+
name: SurdotlyBot
|
|
4166
|
+
category: Crawler
|
|
4167
|
+
url: http://sur.ly/bot.html
|
|
4168
|
+
-
|
|
4169
|
+
user_agent: Mozilla/5.0 (compatible; Gowikibot/1.0; +http://www.gowikibot.com)
|
|
4170
|
+
bot:
|
|
4171
|
+
name: Gowikibot
|
|
4172
|
+
category: Crawler
|
|
4173
|
+
url: http:/www.gowikibot.com
|
|
4174
|
+
-
|
|
4175
|
+
user_agent: Mozilla/5.0 (compatible; SabsimBot/3.0; +https://sabsim.com)
|
|
4176
|
+
bot:
|
|
4177
|
+
name: SabsimBot
|
|
4178
|
+
category: Crawler
|
|
4179
|
+
url: https://sabsim.com
|
|
4180
|
+
-
|
|
4181
|
+
user_agent: Mozilla/5.0 (compatible; LumtelBot/1.0; +http://lumtel.com)
|
|
4182
|
+
bot:
|
|
4183
|
+
name: LumtelBot
|
|
4184
|
+
category: Crawler
|
|
4185
|
+
url: https://umtel.com
|
|
4186
|
+
-
|
|
4187
|
+
user_agent: Mozilla/5.0+(compatible;+PiplBot;+http://www.pipl.com/bot/)
|
|
4188
|
+
bot:
|
|
4189
|
+
name: PiplBot
|
|
4190
|
+
category: Crawler
|
|
4191
|
+
url: http://www.pipl.com/bot
|
|
4192
|
+
-
|
|
4193
|
+
user_agent: Mozilla/5.0 (compatible; woobot/2.0; +https://www.woorank.com/bot)
|
|
4194
|
+
bot:
|
|
4195
|
+
name: WooRank
|
|
4196
|
+
category: Crawler
|
|
4197
|
+
url: https://www.woorank.com/bot
|
|
4198
|
+
-
|
|
4199
|
+
user_agent: YahooMailProxy; https://help.yahoo.com/kb/yahoo-mail-proxy-SLN28749.html
|
|
4200
|
+
bot:
|
|
4201
|
+
name: Yahoo! Mail Proxy
|
|
4202
|
+
category: Service Agent
|
|
4203
|
+
url: https://help.yahoo.com/kb/yahoo-mail-proxy-SLN28749.html
|
|
4204
|
+
producer:
|
|
4205
|
+
name: Yahoo! Inc.
|
|
4206
|
+
url: http://www.yahoo.com
|
|
4207
|
+
-
|
|
4208
|
+
user_agent: 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko; compatible; Cookiebot/1.0; http://cookiebot.com/) Chrome/79.0.3945.117 Safari/537.36'
|
|
4209
|
+
bot:
|
|
4210
|
+
name: Cookiebot
|
|
4211
|
+
category: Crawler
|
|
4212
|
+
url: https://support.cookiebot.com/hc/en-us/articles/360014264140-Scanner-User-Agent
|
|
4213
|
+
producer:
|
|
4214
|
+
name: Cybot A/S
|
|
4215
|
+
url: https://www.cybot.com/
|
|
4216
|
+
-
|
|
4217
|
+
user_agent: NetSystemsResearch studies the availability of various services across the internet. Our website is netsystemsresearch.com
|
|
4218
|
+
bot:
|
|
4219
|
+
name: NetSystemsResearch
|
|
4220
|
+
category: Security Checker
|
|
4221
|
+
url: https://www.netsystemsresearch.com/
|
|
4222
|
+
producer:
|
|
4223
|
+
name: NET SYSTEMS RESEARCH LLC
|
|
4224
|
+
url: https://www.netsystemsresearch.com/
|
|
4225
|
+
-
|
|
4226
|
+
user_agent: 'Mozilla/5.0 (compatible; CensysInspect/1.1; https://about.censys.io/)'
|
|
4227
|
+
bot:
|
|
4228
|
+
name: CensysInspect
|
|
4229
|
+
category: Security Checker
|
|
4230
|
+
url: https://about.censys.io/
|
|
4231
|
+
producer:
|
|
4232
|
+
name: Censys, Inc.
|
|
4233
|
+
url: https://censys.io/
|
|
4234
|
+
-
|
|
4235
|
+
user_agent: https://gdnplus.com:Gather Analyze Provide.
|
|
4236
|
+
bot:
|
|
4237
|
+
name: GDNP
|
|
4238
|
+
category: Crawler
|
|
4239
|
+
url: https://gdnplus.com/
|
|
4240
|
+
producer:
|
|
4241
|
+
name: Global Digital Network Plus, LLC
|
|
4242
|
+
url: https://gdnplus.com/
|
|
4243
|
+
-
|
|
4244
|
+
user_agent: WellKnownBot/0.1 (https://well-known.dev)
|
|
4245
|
+
bot:
|
|
4246
|
+
name: WellKnownBot
|
|
4247
|
+
category: Crawler
|
|
4248
|
+
url: https://well-known.dev
|
|
4249
|
+
-
|
|
4250
|
+
user_agent: Mozilla/5.0 (compatible; Adsbot/3.1; https://seostar.co/robot/)
|
|
4251
|
+
bot:
|
|
4252
|
+
name: Adsbot
|
|
4253
|
+
category: Crawler
|
|
4254
|
+
url: https://seostar.co/robot/
|
|
4255
|
+
-
|
|
4256
|
+
user_agent: MTRobot/0.2 (Metrics Tools Analytics Crawler; https://metrics-tools.de/robot.html; crawler@metrics-tools.de)
|
|
4257
|
+
bot:
|
|
4258
|
+
name: MTRobot
|
|
4259
|
+
category: Crawler
|
|
4260
|
+
url: https://metrics-tools.de/robot.html
|
|
4261
|
+
producer:
|
|
4262
|
+
name: Metrics Tools
|
|
4263
|
+
url: https://metrics-tools.de/
|
|
4264
|
+
-
|
|
4265
|
+
user_agent: My User Agent 1.0
|
|
4266
|
+
bot:
|
|
4267
|
+
name: Generic Bot
|
|
4268
|
+
-
|
|
4269
|
+
user_agent: serpstatbot/1.0 (advanced backlink tracking bot; curl/7.58.0; http://serpstatbot.com/; abuse@serpstatbot.com)
|
|
4270
|
+
bot:
|
|
4271
|
+
name: serpstatbot
|
|
4272
|
+
category: Crawler
|
|
4273
|
+
url: http://serpstatbot.com/
|
|
4274
|
+
producer:
|
|
4275
|
+
name: Netpeak Ltd
|
|
4276
|
+
url: https://netpeak.net/
|
|
4277
|
+
-
|
|
4278
|
+
user_agent: colly - https://github.com/gocolly/colly/v2
|
|
4279
|
+
bot:
|
|
4280
|
+
name: colly
|
|
4281
|
+
category: Crawler
|
|
4282
|
+
url: https://github.com/gocolly/colly/
|
|
4283
|
+
-
|
|
4284
|
+
user_agent: l9tcpid/v1.0.0
|
|
4285
|
+
bot:
|
|
4286
|
+
name: l9tcpid
|
|
4287
|
+
category: Security Checker
|
|
4288
|
+
url: https://github.com/LeakIX/l9tcpid
|
|
4289
|
+
-
|
|
4290
|
+
user_agent: Mozilla/5.0 (compatible; MegaIndex.ru/2.0; +http://megaindex.com/crawler)
|
|
4291
|
+
bot:
|
|
4292
|
+
name: MegaIndex
|
|
4293
|
+
category: Crawler
|
|
4294
|
+
url: https://megaindex.com/crawler
|
|
4295
|
+
-
|
|
4296
|
+
user_agent: Mozilla/5.0 (compatible; Seekport Crawler; http://seekport.com/)
|
|
4297
|
+
bot:
|
|
4298
|
+
name: Seekport
|
|
4299
|
+
category: Crawler
|
|
4300
|
+
url: http://www.seekport.com/
|
|
4301
|
+
producer:
|
|
4302
|
+
name: SISTRIX GmbH
|
|
4303
|
+
url: https://www.sistrix.de/
|
|
4304
|
+
-
|
|
4305
|
+
user_agent: Mozilla/5.0 (compatible; seolyt/1.1; +https://seolyt.com)
|
|
4306
|
+
bot:
|
|
4307
|
+
name: seolyt
|
|
4308
|
+
category: Crawler
|
|
4309
|
+
url: https://seolyt.com/
|
|
4310
|
+
-
|
|
4311
|
+
user_agent: Mozilla/5.0 (compatible; YaK/1.0; http://linkfluence.com/; bot@linkfluence.com)
|
|
4312
|
+
bot:
|
|
4313
|
+
name: YaK
|
|
4314
|
+
category: Crawler
|
|
4315
|
+
url: https://www.linkfluence.com/
|
|
4316
|
+
producer:
|
|
4317
|
+
name: Linkfluence SAS
|
|
4318
|
+
url: https://www.linkfluence.com/
|
|
4319
|
+
-
|
|
4320
|
+
user_agent: Mozilla/5.0 (Windows NT 6.1; Win64; x64; +http://www.komodia.com/newwiki/index.php/URL_server_crawler) KomodiaBot/1.0
|
|
4321
|
+
bot:
|
|
4322
|
+
name: KomodiaBot
|
|
4323
|
+
category: Crawler
|
|
4324
|
+
url: http://www.komodia.com/newwiki/index.php/URL_server_crawler
|
|
4325
|
+
producer:
|
|
4326
|
+
name: Komodia Inc.
|
|
4327
|
+
url: https://www.komodia.com/
|
|
4328
|
+
-
|
|
4329
|
+
user_agent: Mozilla/5.0 (Windows NT 6.3; WOW64; Trident/7.0; rv:11.0; Catchpoint) like Gecko
|
|
4330
|
+
bot:
|
|
4331
|
+
name: Catchpoint
|
|
4332
|
+
category: Site Monitor
|
|
4333
|
+
url: https://www.catchpoint.com/
|
|
4334
|
+
producer:
|
|
4335
|
+
name: Catchpoint Systems
|
|
4336
|
+
url: https://www.catchpoint.com/
|
|
4337
|
+
-
|
|
4338
|
+
user_agent: Better Uptime Bot Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/74.0.3729.169 Safari/537.36
|
|
4339
|
+
bot:
|
|
4340
|
+
name: Better Uptime Bot
|
|
4341
|
+
category: Site Monitor
|
|
4342
|
+
url: https://betteruptime.com/faq
|
|
4343
|
+
producer:
|
|
4344
|
+
name: Better Uptime
|
|
4345
|
+
url: https://betteruptime.com/
|
|
4346
|
+
-
|
|
4347
|
+
user_agent: gobuster/3.1.0
|
|
4348
|
+
bot:
|
|
4349
|
+
name: Gobuster
|
|
4350
|
+
url: https://github.com/OJ/gobuster
|
|
4351
|
+
-
|
|
4352
|
+
user_agent: k6/0.31.1 (https://k6.io/)
|
|
4353
|
+
bot:
|
|
4354
|
+
name: K6
|
|
4355
|
+
url: https://k6.io/
|
|
4356
|
+
-
|
|
4357
|
+
user_agent: Mozilla/5.0 (compatible; Neevabot/1.0; https://neeva.com/neevabot)
|
|
4358
|
+
bot:
|
|
4359
|
+
name: Neevabot
|
|
4360
|
+
category: Search bot
|
|
4361
|
+
url: https://neeva.com/neevabot
|
|
4362
|
+
producer:
|
|
4363
|
+
name: Neeva Inc.
|
|
4364
|
+
url: https://neeva.com/
|
|
4365
|
+
-
|
|
4366
|
+
user_agent: LinkPreview/1.5 (http://linkpreview.net)
|
|
4367
|
+
bot:
|
|
4368
|
+
name: LinkPreview
|
|
4369
|
+
category: Service Agent
|
|
4370
|
+
url: https://www.linkpreview.net/
|
|
4371
|
+
-
|
|
4372
|
+
user_agent: Mozilla/5.0 (compatible; JungleKeyThumbnail/1.1; +http://www.junglekey.fr/)
|
|
4373
|
+
bot:
|
|
4374
|
+
name: JungleKeyThumbnail
|
|
4375
|
+
category: Crawler
|
|
4376
|
+
url: https://junglekey.com/
|
|
4377
|
+
-
|
|
4378
|
+
user_agent: rocketmonitor 1.0
|
|
4379
|
+
bot:
|
|
4380
|
+
name: RocketMonitorBot
|
|
4381
|
+
category: Site Monitor
|
|
4382
|
+
url: https://www.radiomast.io/docs/stream-monitoring/technical_details.html
|
|
4383
|
+
producer:
|
|
4384
|
+
name: Radio Mast, Inc.
|
|
4385
|
+
url: https://www.radiomast.io/
|
|
4386
|
+
-
|
|
4387
|
+
user_agent: RocketMonitorBot/1.0 ( https://www.radiomast.io)
|
|
4388
|
+
bot:
|
|
4389
|
+
name: RocketMonitorBot
|
|
4390
|
+
category: Site Monitor
|
|
4391
|
+
url: https://www.radiomast.io/docs/stream-monitoring/technical_details.html
|
|
4392
|
+
producer:
|
|
4393
|
+
name: Radio Mast, Inc.
|
|
4394
|
+
url: https://www.radiomast.io/
|
|
4395
|
+
-
|
|
4396
|
+
user_agent: SitemapParser-VIPnytt/1.1 ( https://github.com/VIPnytt/SitemapParser/blob/master/README.md)
|
|
4397
|
+
bot:
|
|
4398
|
+
name: SitemapParser-VIPnytt
|
|
4399
|
+
category: Crawler
|
|
4400
|
+
url: https://github.com/VIPnytt/SitemapParser/
|
|
4401
|
+
-
|
|
4402
|
+
user_agent: Turnitin (https://bit.ly/2UvnfoQ)
|
|
4403
|
+
bot:
|
|
4404
|
+
name: Turnitin
|
|
4405
|
+
category: Crawler
|
|
4406
|
+
url: https://turnitin.com/robot/crawlerinfo.html
|
|
4407
|
+
-
|
|
4408
|
+
user_agent: Mozilla/5.0 (Linux; Android 8.0; Pixel 2 Build/OPD3.170816.012; Storebot-Google/1.0) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/81.0.4044.138 Mobile Safari/537.36
|
|
4409
|
+
bot:
|
|
4410
|
+
name: Google StoreBot
|
|
4411
|
+
category: Crawler
|
|
4412
|
+
-
|
|
4413
|
+
user_agent: Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/77.0.3865.56 Safari/537.36 DMBrowser/2.1 (UV)
|
|
4414
|
+
bot:
|
|
4415
|
+
name: Dotcom Monitor
|
|
4416
|
+
category: Site Monitor
|
|
4417
|
+
url: https://www.dotcom-monitor.com
|
|
4418
|
+
-
|
|
4419
|
+
user_agent: Mozilla/5.0 (Windows NT 6.2; WOW64; rv:29.0) Gecko/20100101 /29.0 DMBrowser-BV
|
|
4420
|
+
bot:
|
|
4421
|
+
name: Dotcom Monitor
|
|
4422
|
+
category: Site Monitor
|
|
4423
|
+
url: https://www.dotcom-monitor.com
|
|
4424
|
+
-
|
|
4425
|
+
user_agent: Mozilla/5.0 (compatible; ThinkChaos/0.3.0; +In_the_test_phase,_if_the_ThinkChaos_brings_you_trouble,_please_add_disallow_to_the_robots.txt._Thank_you.)
|
|
4426
|
+
bot:
|
|
4427
|
+
name: ThinkChaos
|
|
4428
|
+
category: Crawler
|
|
4429
|
+
-
|
|
4430
|
+
user_agent: Mozilla/5.0 (compatible; DataForSeoBot/1.0; +https://dataforseo.com/dataforseo-bot)
|
|
4431
|
+
bot:
|
|
4432
|
+
name: DataForSeoBot
|
|
4433
|
+
category: Crawler
|
|
4434
|
+
url: https://dataforseo.com/dataforseo-bot
|