@alitu/user-agents-v2-api 0.1.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +3 -0
- package/dist/index.js +65 -0
- package/dist/index.test.js +24 -0
- package/dist/user-agents-v2/apps.json +4061 -0
- package/dist/user-agents-v2/bots.json +1307 -0
- package/dist/user-agents-v2/browsers.json +94 -0
- package/dist/user-agents-v2/devices.json +198 -0
- package/dist/user-agents-v2/index.js +38 -0
- package/dist/user-agents-v2/libraries.json +521 -0
- package/dist/user-agents-v2/referrers.json +556 -0
- package/package.json +41 -0
|
@@ -0,0 +1,1307 @@
|
|
|
1
|
+
{
|
|
2
|
+
"comments": [
|
|
3
|
+
"Look for User-Agent matches in this file order: 'bots', 'apps', 'libraries', 'browsers', and return the first entry matched, processing each entry in order in which they appear in the file."
|
|
4
|
+
],
|
|
5
|
+
"$schema": "https://raw.githubusercontent.com/opawg/user-agents-v2/master/schemas/patterns.schema.json",
|
|
6
|
+
"entries": [
|
|
7
|
+
{
|
|
8
|
+
"name": "AAABot - unknown bot",
|
|
9
|
+
"pattern": "AAABot",
|
|
10
|
+
"examples": [
|
|
11
|
+
"AAABot"
|
|
12
|
+
]
|
|
13
|
+
},
|
|
14
|
+
{
|
|
15
|
+
"name": "Adswizz",
|
|
16
|
+
"pattern": "^AIS VirtualListener",
|
|
17
|
+
"urls": [
|
|
18
|
+
"https://www.adswizz.com/publishers/insertion-suite/"
|
|
19
|
+
],
|
|
20
|
+
"examples": [
|
|
21
|
+
"AIS VirtualListener"
|
|
22
|
+
]
|
|
23
|
+
},
|
|
24
|
+
{
|
|
25
|
+
"name": "AhrefsBot",
|
|
26
|
+
"pattern": "AhrefsBot/",
|
|
27
|
+
"urls": [
|
|
28
|
+
"http://ahrefs.com/robot/"
|
|
29
|
+
],
|
|
30
|
+
"examples": [
|
|
31
|
+
"Mozilla/5.0 (compatible; AhrefsBot/7.0; http://ahrefs.com/robot/)",
|
|
32
|
+
"Mozilla/5.0 (compatible; AhrefsBot/6.1; +http://ahrefs.com/robot/)"
|
|
33
|
+
]
|
|
34
|
+
},
|
|
35
|
+
{
|
|
36
|
+
"name": "AirableBot",
|
|
37
|
+
"pattern": "AirableBot-Podcast/",
|
|
38
|
+
"description": "An aggregator of internet radio and podcasts, for connected devices.",
|
|
39
|
+
"urls": [
|
|
40
|
+
"https://www.airablenow.com"
|
|
41
|
+
],
|
|
42
|
+
"examples": [
|
|
43
|
+
"AirableBot-Podcast/1.0 (+https//www.airablenow.com)",
|
|
44
|
+
"AirableBot-Podcast/1.0 ( https//www.airablenow.com)"
|
|
45
|
+
]
|
|
46
|
+
},
|
|
47
|
+
{
|
|
48
|
+
"name": "Alexa Flash Briefing cache",
|
|
49
|
+
"pattern": "^AmazonNewsContentService",
|
|
50
|
+
"description": "A service which downloads, caches and normalises audio for the Flash Briefing service on Alexa-enabled devices",
|
|
51
|
+
"svg": "amazon.svg",
|
|
52
|
+
"urls": [
|
|
53
|
+
"https://developer.amazon.com/docs/flashbriefing/flash-briefing-skill-api-feed-reference.html#performance-requirements"
|
|
54
|
+
],
|
|
55
|
+
"comments": "Stats are available within the Alexa skills dashboard."
|
|
56
|
+
},
|
|
57
|
+
{
|
|
58
|
+
"name": "AlignaBot",
|
|
59
|
+
"pattern": "^Alignabot",
|
|
60
|
+
"examples": [
|
|
61
|
+
"Alignabot 1.0 (https://www.alignable.com/)"
|
|
62
|
+
]
|
|
63
|
+
},
|
|
64
|
+
{
|
|
65
|
+
"name": "All Ears",
|
|
66
|
+
"pattern": "^AllEars/",
|
|
67
|
+
"examples": [
|
|
68
|
+
"AllEars/1.0; (+www.allears.ai)"
|
|
69
|
+
],
|
|
70
|
+
"urls": [
|
|
71
|
+
"https://allears.ai"
|
|
72
|
+
]
|
|
73
|
+
},
|
|
74
|
+
{
|
|
75
|
+
"name": "Amazon Music Podcasts Bot",
|
|
76
|
+
"pattern": "^Amazon Music Podcast",
|
|
77
|
+
"description": "A music and podcasts streaming app",
|
|
78
|
+
"svg": "amazon.svg",
|
|
79
|
+
"comments": "Backend ingestion service"
|
|
80
|
+
},
|
|
81
|
+
{
|
|
82
|
+
"name": "Anchor Importer",
|
|
83
|
+
"pattern": "AnchorImport",
|
|
84
|
+
"description": "Anchor's tool for importing podcasts",
|
|
85
|
+
"comments": "This useragent is used during a user importing a podcast to the Anchor platform",
|
|
86
|
+
"examples": [
|
|
87
|
+
"AnchorImport/1.0"
|
|
88
|
+
]
|
|
89
|
+
},
|
|
90
|
+
{
|
|
91
|
+
"name": "Apple Notes share extension",
|
|
92
|
+
"pattern": "^com.apple.(mobilenotes.SharingExtension|Notes.SharingExtension)/",
|
|
93
|
+
"examples": [
|
|
94
|
+
"com.apple.mobilenotes.SharingExtension/2511 CFNetwork/1494.0.7 Darwin/23.4.0",
|
|
95
|
+
"com.apple.Notes.SharingExtension/2812 CFNetwork/1494.0.7 Darwin/23.4.0"
|
|
96
|
+
]
|
|
97
|
+
},
|
|
98
|
+
{
|
|
99
|
+
"name": "Apple Podcasts (Watch)",
|
|
100
|
+
"pattern": "^atc/|\\(null\\) watchOS/",
|
|
101
|
+
"comments": "Verified (via stamping the audio URL with the RSS useragent) as being sourced from Apple Podcasts; and accordingly this is marked as a bot since these downloads are duplicated with the phone.",
|
|
102
|
+
"examples": [
|
|
103
|
+
"atc/1.0",
|
|
104
|
+
"atc/1.0 watchOS/6.2 model/Watch3,3 hwp/t8004 build/17T529 (6; dt:155)",
|
|
105
|
+
"atc/1.0 watchOS/6.2.8 model/Watch2,3 hwp/t8002 build/17U63 (6; dt:133)",
|
|
106
|
+
"atc/1.0 watchOS/6.2.8 model/Watch3,3 hwp/t8004 build/17U63 (6; dt:155)",
|
|
107
|
+
"atc/1.0 watchOS/6.2.8 model/Watch4,2 hwp/t8006 build/17U63 (6; dt:191)",
|
|
108
|
+
"atc/1.0 watchOS/7.0.2 model/Watch5,10 hwp/t8006 build/18R402 (6; dt:233)",
|
|
109
|
+
"atc/1.0 watchOS/7.0.2 model/Watch5,11 hwp/t8006 build/18R402 (6; dt:234)",
|
|
110
|
+
"atc/1.0 watchOS/7.1 model/Watch4,2 hwp/t8006 build/18R590 (6; dt:191)",
|
|
111
|
+
"atc/1.0 watchOS/7.1 model/Watch4,3 hwp/t8006 build/18R590 (6; dt:192)",
|
|
112
|
+
"atc/1.0 watchOS/7.1 model/Watch4,4 hwp/t8006 build/18R590 (6; dt:193)",
|
|
113
|
+
"atc/1.0 watchOS/7.1 model/Watch5,1 hwp/t8006 build/18R590 (6; dt:201)",
|
|
114
|
+
"atc/1.0 watchOS/7.1 model/Watch5,3 hwp/t8006 build/18R590 (6; dt:202)",
|
|
115
|
+
"atc/1.0 watchOS/7.1 model/Watch5,4 hwp/t8006 build/18R590 (6; dt:202)",
|
|
116
|
+
"(null)/(null) watchOS/5.0.1 model/Watch3,3 hwp/t8004 build/16R381 (6; dt:155)"
|
|
117
|
+
]
|
|
118
|
+
},
|
|
119
|
+
{
|
|
120
|
+
"name": "Apple Podcasts automated checks",
|
|
121
|
+
"pattern": "(iTMS|itunesstored|itms)"
|
|
122
|
+
},
|
|
123
|
+
{
|
|
124
|
+
"name": "Applebot",
|
|
125
|
+
"pattern": "^Applebot/",
|
|
126
|
+
"description": "Applebot is the web crawler for Apple. Products like Siri and Spotlight Suggestions use Applebot.",
|
|
127
|
+
"urls": [
|
|
128
|
+
"http://www.apple.com/go/applebot"
|
|
129
|
+
]
|
|
130
|
+
},
|
|
131
|
+
{
|
|
132
|
+
"name": "Archive.org",
|
|
133
|
+
"pattern": "archive\\.org_bot",
|
|
134
|
+
"description": "The Internet Archive is a nonprofit digital library that preserves web data and makes it available for research purposes through the Wayback Machine.",
|
|
135
|
+
"urls": [
|
|
136
|
+
"https://archive.org/details/archive.org_bot"
|
|
137
|
+
],
|
|
138
|
+
"examples": [
|
|
139
|
+
"Mozilla/5.0 (compatible; archive.org_bot http://archive.org/details/archive.org_bot)"
|
|
140
|
+
]
|
|
141
|
+
},
|
|
142
|
+
{
|
|
143
|
+
"name": "atheerfm",
|
|
144
|
+
"pattern": "^atheerfm/",
|
|
145
|
+
"examples": [
|
|
146
|
+
"atheerfm/1 CFNetwork/758.3.15 Darwin/15.3.0"
|
|
147
|
+
]
|
|
148
|
+
},
|
|
149
|
+
{
|
|
150
|
+
"name": "Audiomack",
|
|
151
|
+
"pattern": "^Audiomack Podcast Processor/",
|
|
152
|
+
"examples": [
|
|
153
|
+
"Audiomack Podcast Processor/1.0 (https://audiomack.com/)"
|
|
154
|
+
]
|
|
155
|
+
},
|
|
156
|
+
{
|
|
157
|
+
"name": "AudioWave feed parser",
|
|
158
|
+
"pattern": "^AudioWaveBot/1\\.0",
|
|
159
|
+
"urls": [
|
|
160
|
+
"https://audiowave.io"
|
|
161
|
+
],
|
|
162
|
+
"examples": [
|
|
163
|
+
"AudioWaveBot/1.0"
|
|
164
|
+
]
|
|
165
|
+
},
|
|
166
|
+
{
|
|
167
|
+
"name": "AwarioSmartBot",
|
|
168
|
+
"pattern": "^AwarioSmartBot/",
|
|
169
|
+
"examples": [
|
|
170
|
+
"AwarioSmartBot/1.0 (+https://awario.com/bots.html; bots@awario.com)"
|
|
171
|
+
]
|
|
172
|
+
},
|
|
173
|
+
{
|
|
174
|
+
"name": "Babbar",
|
|
175
|
+
"pattern": "Barkrowler/",
|
|
176
|
+
"urls": [
|
|
177
|
+
"https://beta.babbar.tech/crawler"
|
|
178
|
+
]
|
|
179
|
+
},
|
|
180
|
+
{
|
|
181
|
+
"name": "Baidu",
|
|
182
|
+
"pattern": "\\(ce\\.baidu\\.com",
|
|
183
|
+
"examples": [
|
|
184
|
+
"Baidu-YunGuanCe-SLABot(ce.baidu.com)"
|
|
185
|
+
]
|
|
186
|
+
},
|
|
187
|
+
{
|
|
188
|
+
"name": "bbot",
|
|
189
|
+
"pattern": "^bbot/",
|
|
190
|
+
"examples": [
|
|
191
|
+
"bbot/0.1"
|
|
192
|
+
]
|
|
193
|
+
},
|
|
194
|
+
{
|
|
195
|
+
"name": "Beacon Podcast Sync",
|
|
196
|
+
"pattern": "^Beacon/\\d",
|
|
197
|
+
"examples": [
|
|
198
|
+
"Beacon/1.0 Podcast Sync +https://getbeacons.com/"
|
|
199
|
+
],
|
|
200
|
+
"urls": [
|
|
201
|
+
"https://getbeacons.com/"
|
|
202
|
+
]
|
|
203
|
+
},
|
|
204
|
+
{
|
|
205
|
+
"name": "British Library",
|
|
206
|
+
"pattern": "^bl\\.uk_ldfc_bot",
|
|
207
|
+
"description": "British Library's legal deposit web crawler",
|
|
208
|
+
"urls": [
|
|
209
|
+
"http://www.bl.uk/aboutus/legaldeposit/websites/websites/faqswebmaster/index.html"
|
|
210
|
+
],
|
|
211
|
+
"examples": [
|
|
212
|
+
"bl.uk_ldfc_bot/3.4.0-20200518 ( http://www.bl.uk/aboutus/legaldeposit/websites/websites/faqswebmaster/index.html)"
|
|
213
|
+
]
|
|
214
|
+
},
|
|
215
|
+
{
|
|
216
|
+
"name": "Blubrry Migration Service",
|
|
217
|
+
"pattern": "^Blubrry Migration Service",
|
|
218
|
+
"examples": [
|
|
219
|
+
"Blubrry Migration Service"
|
|
220
|
+
]
|
|
221
|
+
},
|
|
222
|
+
{
|
|
223
|
+
"name": "Bullhorn Crawler",
|
|
224
|
+
"pattern": "^BullhornCrawler/",
|
|
225
|
+
"examples": [
|
|
226
|
+
"BullhornCrawler/unknown-version(+http://bullhorn.fm/)"
|
|
227
|
+
],
|
|
228
|
+
"urls": [
|
|
229
|
+
"https://bullhorn.fm/"
|
|
230
|
+
]
|
|
231
|
+
},
|
|
232
|
+
{
|
|
233
|
+
"name": "Buzzsprout Importer",
|
|
234
|
+
"pattern": "^Buzzsprout Importer",
|
|
235
|
+
"examples": [
|
|
236
|
+
"Buzzsprout Importer"
|
|
237
|
+
]
|
|
238
|
+
},
|
|
239
|
+
{
|
|
240
|
+
"name": "Bytespider.*bytedance",
|
|
241
|
+
"pattern": "Bytespider",
|
|
242
|
+
"examples": [
|
|
243
|
+
"Mozilla/5.0 (Linux; Android 5.0) AppleWebKit/537.36 (KHTML, like Gecko) Mobile Safari/537.36 (compatible; Bytespider; spider-feedback@bytedance.com)"
|
|
244
|
+
]
|
|
245
|
+
},
|
|
246
|
+
{
|
|
247
|
+
"name": "CastFeedValidator",
|
|
248
|
+
"pattern": "^CastFeedValidator/",
|
|
249
|
+
"examples": [
|
|
250
|
+
"CastFeedValidator/3.0.5 (https://castfeedvalidator.com)"
|
|
251
|
+
]
|
|
252
|
+
},
|
|
253
|
+
{
|
|
254
|
+
"name": "Castopod",
|
|
255
|
+
"pattern": "Castopod/\\d",
|
|
256
|
+
"examples": [
|
|
257
|
+
"Castopod/1.0",
|
|
258
|
+
"Castopod/1.1.2"
|
|
259
|
+
]
|
|
260
|
+
},
|
|
261
|
+
{
|
|
262
|
+
"name": "Chartable",
|
|
263
|
+
"pattern": "^Trackable/",
|
|
264
|
+
"urls": [
|
|
265
|
+
"https://chartable.com/"
|
|
266
|
+
]
|
|
267
|
+
},
|
|
268
|
+
{
|
|
269
|
+
"name": "Clark-Crawler, unknown",
|
|
270
|
+
"pattern": "^clark-crawler2"
|
|
271
|
+
},
|
|
272
|
+
{
|
|
273
|
+
"name": "Claudebot",
|
|
274
|
+
"pattern": "ClaudeBot/",
|
|
275
|
+
"description": "Claude is a family of large language models developed by Anthropic and designed to revolutionize the way you interact with AI",
|
|
276
|
+
"urls": [
|
|
277
|
+
"https://docs.anthropic.com/claude/docs/intro-to-claude"
|
|
278
|
+
],
|
|
279
|
+
"examples": [
|
|
280
|
+
"Mozilla/5.0 AppleWebKit/537.36 (KHTML, like Gecko; compatible; ClaudeBot/1.0; +claudebot@anthropic.com)"
|
|
281
|
+
]
|
|
282
|
+
},
|
|
283
|
+
{
|
|
284
|
+
"name": "Critical Mention",
|
|
285
|
+
"pattern": "^Podcast-CriticalMention/",
|
|
286
|
+
"description": "Critical Mention is a business intelligence company, monitoring podcasts on the web for their clients",
|
|
287
|
+
"examples": [
|
|
288
|
+
"Podcast-CriticalMention/1.0"
|
|
289
|
+
]
|
|
290
|
+
},
|
|
291
|
+
{
|
|
292
|
+
"name": "curl",
|
|
293
|
+
"pattern": "^curl|^libcurl/|^PycURL/| curl/",
|
|
294
|
+
"examples": [
|
|
295
|
+
"libcurl/7.65.1",
|
|
296
|
+
"PycURL/7.43.0 libcurl/7.47.0 GnuTLS/3.4.10 zlib/1.2.8 libidn/1.32 librtmp/2.3",
|
|
297
|
+
"GuzzleHttp/6.1.0 curl/7.50.1 PHP/7.0.13-0ubuntu0.16.10.1"
|
|
298
|
+
]
|
|
299
|
+
},
|
|
300
|
+
{
|
|
301
|
+
"name": "DataforSEO",
|
|
302
|
+
"pattern": "DataForSeoBot/",
|
|
303
|
+
"description": "Working on the biggest available backlink database on the web that every single member of the community, including you, can use and benefit from.",
|
|
304
|
+
"urls": [
|
|
305
|
+
"https://dataforseo.com/dataforseo-bot"
|
|
306
|
+
],
|
|
307
|
+
"examples": [
|
|
308
|
+
"Mozilla/5.0 (compatible; DataForSeoBot/1.0; +https://dataforseo.com/dataforseo-bot)"
|
|
309
|
+
]
|
|
310
|
+
},
|
|
311
|
+
{
|
|
312
|
+
"name": "Datagnion Bot",
|
|
313
|
+
"pattern": "^datagnionbot"
|
|
314
|
+
},
|
|
315
|
+
{
|
|
316
|
+
"name": "dataprovider.com",
|
|
317
|
+
"pattern": "Dataprovider\\.com",
|
|
318
|
+
"examples": [
|
|
319
|
+
"Mozilla/5.0 (compatible; Dataprovider.com)"
|
|
320
|
+
]
|
|
321
|
+
},
|
|
322
|
+
{
|
|
323
|
+
"name": "Daum",
|
|
324
|
+
"pattern": "http://cs\\.daum\\.net",
|
|
325
|
+
"examples": [
|
|
326
|
+
"Mozilla/5.0 (compatible; Daum/4.1; +http://cs.daum.net/faq/15/4118.html?faqId=28966)"
|
|
327
|
+
]
|
|
328
|
+
},
|
|
329
|
+
{
|
|
330
|
+
"name": "Deezer Podcasters",
|
|
331
|
+
"pattern": "^Deezer Podcasters/1\\.0"
|
|
332
|
+
},
|
|
333
|
+
{
|
|
334
|
+
"name": "Digg",
|
|
335
|
+
"pattern": "^Digg ",
|
|
336
|
+
"examples": [
|
|
337
|
+
"Digg Mozilla/5.0 (Digg/1.0; support@digg.com)"
|
|
338
|
+
]
|
|
339
|
+
},
|
|
340
|
+
{
|
|
341
|
+
"name": "dorada",
|
|
342
|
+
"pattern": "support@dorada\\.co\\.uk"
|
|
343
|
+
},
|
|
344
|
+
{
|
|
345
|
+
"name": "DotBot",
|
|
346
|
+
"pattern": "DotBot",
|
|
347
|
+
"examples": [
|
|
348
|
+
"Mozilla/5.0 (compatible; DotBot/1.1; http://www.opensiteexplorer.org/dotbot, help@moz.com)",
|
|
349
|
+
"Mozilla/5.0 (compatible; DotBot/1.2; https://opensiteexplorer.org/dotbot; help@moz.com)"
|
|
350
|
+
]
|
|
351
|
+
},
|
|
352
|
+
{
|
|
353
|
+
"name": "Downcast Bot",
|
|
354
|
+
"pattern": "downcast feed consumer/",
|
|
355
|
+
"examples": [
|
|
356
|
+
"downcast feed consumer/0.0.175; (mode=dev; id=u2NgjBSPM6; downcast.fm)"
|
|
357
|
+
]
|
|
358
|
+
},
|
|
359
|
+
{
|
|
360
|
+
"name": "DuckDuckBot",
|
|
361
|
+
"pattern": "DuckDuckBot",
|
|
362
|
+
"examples": [
|
|
363
|
+
"Mozilla/5.0 (compatible; DuckDuckBot-Https/1.1; https://duckduckgo.com/duckduckbot)"
|
|
364
|
+
]
|
|
365
|
+
},
|
|
366
|
+
{
|
|
367
|
+
"name": "F-Secure Riddler",
|
|
368
|
+
"pattern": "^Riddler ",
|
|
369
|
+
"description": "an online research project which investigates algorithms for mapping the topology of the Internet",
|
|
370
|
+
"examples": [
|
|
371
|
+
"Riddler (http://riddler.io/about)"
|
|
372
|
+
]
|
|
373
|
+
},
|
|
374
|
+
{
|
|
375
|
+
"name": "Facebook Bot",
|
|
376
|
+
"pattern": "FacebookBot|f?acebookexternalhit/?|^podcastbot$|Facebot|facebookexternalua|^facebookplatform/",
|
|
377
|
+
"urls": [
|
|
378
|
+
"https://www.facebook.com/externalhit_uatext.php"
|
|
379
|
+
],
|
|
380
|
+
"comments": "The podcastbot UA appears to be part of Facebook Podcasts onboarding",
|
|
381
|
+
"examples": [
|
|
382
|
+
"facebookexternalhit/1.1 ( http://www.facebook.com/externalhit_uatext.php)",
|
|
383
|
+
"podcastbot",
|
|
384
|
+
"facebookexternalhit",
|
|
385
|
+
"Facebot",
|
|
386
|
+
"facebookexternalua",
|
|
387
|
+
"facebookplatform/1.0 (+http://developers.facebook.com)",
|
|
388
|
+
"acebookexternalhit/1.0 (+http://www.facebook.com/externalhit_uatext.php)"
|
|
389
|
+
]
|
|
390
|
+
},
|
|
391
|
+
{
|
|
392
|
+
"name": "Feedly",
|
|
393
|
+
"pattern": "^Feedly/",
|
|
394
|
+
"examples": [
|
|
395
|
+
"Feedly/1.0 (+http://www.feedly.com/fetcher.html; like FeedFetcher-Google)"
|
|
396
|
+
]
|
|
397
|
+
},
|
|
398
|
+
{
|
|
399
|
+
"name": "Feedspot Fetcher",
|
|
400
|
+
"pattern": "https://www\\.feedspot\\.com/fs/fetcher",
|
|
401
|
+
"description": "Feedspot Fetcher is how Feedspot fetches RSS/Atom feed when users add the feed to their Feedspot account.",
|
|
402
|
+
"urls": [
|
|
403
|
+
"https://www.feedspot.com/fs/fetcher"
|
|
404
|
+
],
|
|
405
|
+
"examples": [
|
|
406
|
+
"Mozilla/5.0 (compatible; Feedspot/1.0 (+https://www.feedspot.com/fs/fetcher; like FeedFetcher-Google)"
|
|
407
|
+
]
|
|
408
|
+
},
|
|
409
|
+
{
|
|
410
|
+
"name": "FlexGet",
|
|
411
|
+
"pattern": "^FlexGet/",
|
|
412
|
+
"examples": [
|
|
413
|
+
"FlexGet/3.3.4 (www.flexget.com)"
|
|
414
|
+
]
|
|
415
|
+
},
|
|
416
|
+
{
|
|
417
|
+
"name": "Flipboard Proxy",
|
|
418
|
+
"pattern": "FlipboardProxy/",
|
|
419
|
+
"examples": [
|
|
420
|
+
"Mozilla/5.0 (compatible; FlipboardProxy/1.1; +http://flipboard.com/browserproxy)"
|
|
421
|
+
]
|
|
422
|
+
},
|
|
423
|
+
{
|
|
424
|
+
"name": "Fyyd",
|
|
425
|
+
"pattern": "^fyyd-poll"
|
|
426
|
+
},
|
|
427
|
+
{
|
|
428
|
+
"name": "Go Storage Gateway V1",
|
|
429
|
+
"pattern": "^storagegw-v1-go$",
|
|
430
|
+
"comments": "Found coming from TikTok/ByteDance ASNs, along with Go Http Client.",
|
|
431
|
+
"examples": [
|
|
432
|
+
"storagegw-v1-go"
|
|
433
|
+
]
|
|
434
|
+
},
|
|
435
|
+
{
|
|
436
|
+
"name": "Goodpods Bot",
|
|
437
|
+
"pattern": "Goodpods/\\d+\\.\\d+",
|
|
438
|
+
"description": "The social podcasting app",
|
|
439
|
+
"svg": "goodpods.svg",
|
|
440
|
+
"urls": [
|
|
441
|
+
"https://www.goodpods.com/"
|
|
442
|
+
],
|
|
443
|
+
"comments": "RSS scraper / podcast verifier. Contact hello at goodpods dot com.",
|
|
444
|
+
"examples": [
|
|
445
|
+
"Goodpods/2.2"
|
|
446
|
+
]
|
|
447
|
+
},
|
|
448
|
+
{
|
|
449
|
+
"name": "Google Adsense Bot",
|
|
450
|
+
"pattern": "Mediapartners-Google",
|
|
451
|
+
"examples": [
|
|
452
|
+
"Mediapartners-Google"
|
|
453
|
+
],
|
|
454
|
+
"urls": [
|
|
455
|
+
"https://developers.google.com/search/docs/crawling-indexing/overview-google-crawlers"
|
|
456
|
+
]
|
|
457
|
+
},
|
|
458
|
+
{
|
|
459
|
+
"name": "Google AdsBot",
|
|
460
|
+
"pattern": "AdsBot-Google",
|
|
461
|
+
"urls": [
|
|
462
|
+
"http://www.google.com/adsbot.html"
|
|
463
|
+
]
|
|
464
|
+
},
|
|
465
|
+
{
|
|
466
|
+
"name": "Google Podcasts Manager",
|
|
467
|
+
"pattern": "Google-Podcast"
|
|
468
|
+
},
|
|
469
|
+
{
|
|
470
|
+
"name": "Googlebot",
|
|
471
|
+
"pattern": "Googlebot/|Googlebot-Video/|Googlebot-Image/|^Feedfetcher-Google|google-xrawler|^Googlebot-News|^Google-Safety$",
|
|
472
|
+
"description": "Google's search bots",
|
|
473
|
+
"urls": [
|
|
474
|
+
"http://www.google.com/bot.html"
|
|
475
|
+
],
|
|
476
|
+
"examples": [
|
|
477
|
+
"Mozilla/5.0 (Linux; Android 6.0.1; Nexus 5X Build/MMB29P) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/86.0.4240.96 Mobile Safari/537.36 (compatible; Googlebot/2.1; http://www.google.com/bot.html)",
|
|
478
|
+
"Googlebot-Image/1.0",
|
|
479
|
+
"Feedfetcher-Google; (+http://www.google.com/feedfetcher.html; 1 subscribers; feed-id=4653447469100830145)",
|
|
480
|
+
"google-xrawler",
|
|
481
|
+
"Googlebot-News Audio",
|
|
482
|
+
"Google-Safety"
|
|
483
|
+
]
|
|
484
|
+
},
|
|
485
|
+
{
|
|
486
|
+
"name": "Gumball",
|
|
487
|
+
"pattern": "^Gumball",
|
|
488
|
+
"description": "An attribution service (known as Gumshoe) from the Gumball network",
|
|
489
|
+
"examples": [
|
|
490
|
+
"Gumball.fm Analytics Prefix Checker"
|
|
491
|
+
]
|
|
492
|
+
},
|
|
493
|
+
{
|
|
494
|
+
"name": "Headliner",
|
|
495
|
+
"pattern": "^Headliner/.*\\+https://headliner\\.app$",
|
|
496
|
+
"comments": "Variety of tools to help promote and drive listens to a podcast.",
|
|
497
|
+
"examples": [
|
|
498
|
+
"Headliner/1.0.0 +https://headliner.app"
|
|
499
|
+
]
|
|
500
|
+
},
|
|
501
|
+
{
|
|
502
|
+
"name": "HubSpot Crawler",
|
|
503
|
+
"pattern": "HubSpot Crawler",
|
|
504
|
+
"examples": [
|
|
505
|
+
"Mozilla/5.0 (compatible; HubSpot Crawler; +https://www.hubspot.com)"
|
|
506
|
+
]
|
|
507
|
+
},
|
|
508
|
+
{
|
|
509
|
+
"name": "Internet Archive",
|
|
510
|
+
"pattern": "Archive-It;|web\\.archive\\.org",
|
|
511
|
+
"description": "Archive-It is a web archiving service that allows institutions to build and preserve collections of born digital content saving this content for future generations.",
|
|
512
|
+
"urls": [
|
|
513
|
+
"https://archive-it.org/files/site-owners-special.html"
|
|
514
|
+
],
|
|
515
|
+
"examples": [
|
|
516
|
+
"Mozilla/5.0 (compatible; special_archiver; Archive-It; http://archive-it.org/files/site-owners-special.html)",
|
|
517
|
+
"ia_archiver-web.archive.org"
|
|
518
|
+
]
|
|
519
|
+
},
|
|
520
|
+
{
|
|
521
|
+
"name": "iOS share menu",
|
|
522
|
+
"pattern": "^SharingUIService/",
|
|
523
|
+
"examples": [
|
|
524
|
+
"SharingUIService/1 CFNetwork/1467.1 Darwin/23.0.0",
|
|
525
|
+
"SharingUIService/1 CFNetwork/1490.0.4 Darwin/23.2.0"
|
|
526
|
+
],
|
|
527
|
+
"comments": "Found on iOS 17 e.g. when long-pressing an enclosure link from Safari and choosing Share..."
|
|
528
|
+
},
|
|
529
|
+
{
|
|
530
|
+
"name": "IPFS Podcasting Node",
|
|
531
|
+
"description": "Nodes downloading from the original source (before pinning to IPFS)",
|
|
532
|
+
"pattern": "^IPFS Podcasting Node/",
|
|
533
|
+
"examples": [
|
|
534
|
+
"IPFS Podcasting Node/0.6n (+https://ipfspodcasting.net)",
|
|
535
|
+
"IPFS Podcasting Node/0.7p,u,s (+https://ipfspodcasting.net)"
|
|
536
|
+
],
|
|
537
|
+
"urls": [
|
|
538
|
+
"https://ipfspodcasting.net"
|
|
539
|
+
]
|
|
540
|
+
},
|
|
541
|
+
{
|
|
542
|
+
"name": "Jaunt",
|
|
543
|
+
"pattern": "^Jaunt/",
|
|
544
|
+
"examples": [
|
|
545
|
+
"Jaunt/1.5"
|
|
546
|
+
]
|
|
547
|
+
},
|
|
548
|
+
{
|
|
549
|
+
"name": "l'Institut national de l'audiovisuel",
|
|
550
|
+
"pattern": "INA dlweb",
|
|
551
|
+
"urls": [
|
|
552
|
+
"https://institut.ina.fr/collecte-du-depot-legal-web"
|
|
553
|
+
],
|
|
554
|
+
"comments": "Institut National de l'Audiovisuel is a repository of all French radio and television audiovisual archives."
|
|
555
|
+
},
|
|
556
|
+
{
|
|
557
|
+
"name": "Library and Archives Canada",
|
|
558
|
+
"description": "The Web and Social Media Preservation Program at Library and Archives Canada (LAC) acquires Canadian web resources for the purposes of digital preservation and makes them available to the public via the Government of Canada Web Archive (GCWA) for future research.",
|
|
559
|
+
"pattern": "LAC_IAHarvester/",
|
|
560
|
+
"examples": [
|
|
561
|
+
"Mozilla/5.0 (compatible; LAC_IAHarvester/3.3.0; +https://library-archives.canada.ca/eng/services/government-canada/web-social-media-preservation-program/Pages/web-archive.aspx)"
|
|
562
|
+
],
|
|
563
|
+
"urls": [
|
|
564
|
+
"https://library-archives.canada.ca/eng/services/government-canada/web-social-media-preservation-program/Pages/web-archive.aspx"
|
|
565
|
+
]
|
|
566
|
+
},
|
|
567
|
+
{
|
|
568
|
+
"name": "Libsyn",
|
|
569
|
+
"pattern": "^Libsyn4",
|
|
570
|
+
"examples": [
|
|
571
|
+
"Libsyn4-Download"
|
|
572
|
+
]
|
|
573
|
+
},
|
|
574
|
+
{
|
|
575
|
+
"name": "libwww-perl",
|
|
576
|
+
"pattern": "^libwww-perl| libwww-perl",
|
|
577
|
+
"examples": [
|
|
578
|
+
"LWP::Simple/6.34 libwww-perl/6.34"
|
|
579
|
+
]
|
|
580
|
+
},
|
|
581
|
+
{
|
|
582
|
+
"name": "Livelap Crawler",
|
|
583
|
+
"pattern": "LivelapBot"
|
|
584
|
+
},
|
|
585
|
+
{
|
|
586
|
+
"name": "ListenNotes",
|
|
587
|
+
"pattern": "^ListenNotes/3\\.0 \\(",
|
|
588
|
+
"examples": [
|
|
589
|
+
"ListenNotes/3.0 (id=c1ef144e30174bf6ba1fedf9174ed908; +https://www.listennotes.com/about/)"
|
|
590
|
+
],
|
|
591
|
+
"urls": [
|
|
592
|
+
"https://www.listennotes.com/about/"
|
|
593
|
+
]
|
|
594
|
+
},
|
|
595
|
+
{
|
|
596
|
+
"name": "LTX71",
|
|
597
|
+
"pattern": "^ltx71 ",
|
|
598
|
+
"description": "We continuously scan the internet for security research purposes.",
|
|
599
|
+
"urls": [
|
|
600
|
+
"http://ltx71.com/"
|
|
601
|
+
],
|
|
602
|
+
"examples": [
|
|
603
|
+
"ltx71 - (http://ltx71.com/)"
|
|
604
|
+
]
|
|
605
|
+
},
|
|
606
|
+
{
|
|
607
|
+
"name": "MacOS share menu",
|
|
608
|
+
"pattern": "^ShareSheetUI/",
|
|
609
|
+
"examples": [
|
|
610
|
+
"ShareSheetUI/1 CFNetwork/1399.4 Darwin/22.1.0",
|
|
611
|
+
"ShareSheetUI/1 CFNetwork/1474 Darwin/23.0.0"
|
|
612
|
+
],
|
|
613
|
+
"comments": "Found on MacOS 13 (Ventura) and higher e.g. when right-clicking an enclosure link from Safari and choosing Share..."
|
|
614
|
+
},
|
|
615
|
+
{
|
|
616
|
+
"name": "MauiBot",
|
|
617
|
+
"pattern": "^MauiBot",
|
|
618
|
+
"examples": [
|
|
619
|
+
"MauiBot (crawler.feedback dc@gmail.com)"
|
|
620
|
+
]
|
|
621
|
+
},
|
|
622
|
+
{
|
|
623
|
+
"name": "Mastodon Bot",
|
|
624
|
+
"pattern": "rb/.*Mastodon/",
|
|
625
|
+
"examples": [
|
|
626
|
+
"http.rb/5.0.4 (Mastodon/3.5.3; +https://mastodon.xyz/) Bot"
|
|
627
|
+
]
|
|
628
|
+
},
|
|
629
|
+
{
|
|
630
|
+
"name": "Microsoft Bingbot",
|
|
631
|
+
"pattern": "(BingPreview/|adidxbot/|[bB]ingbot/)",
|
|
632
|
+
"urls": [
|
|
633
|
+
"https://www.bing.com/webmaster/help/which-crawlers-does-bing-use-8c184ec0"
|
|
634
|
+
],
|
|
635
|
+
"examples": [
|
|
636
|
+
"Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/534 (KHTML, like Gecko) BingPreview/1.0b",
|
|
637
|
+
"Mozilla/5.0 (compatible; Bingbot/2.0; +http://www.bing.com/bingbot.htm)"
|
|
638
|
+
]
|
|
639
|
+
},
|
|
640
|
+
{
|
|
641
|
+
"name": "Microsoft Office",
|
|
642
|
+
"pattern": "ms-office; MSOffice",
|
|
643
|
+
"examples": [
|
|
644
|
+
"Mozilla/4.0 (compatible; ms-office; MSOffice 16)"
|
|
645
|
+
]
|
|
646
|
+
},
|
|
647
|
+
{
|
|
648
|
+
"name": "Mixcloud Podcast Importer",
|
|
649
|
+
"pattern": "^MixcloudPodcastImporter/",
|
|
650
|
+
"examples": [
|
|
651
|
+
"MixcloudPodcastImporter/2.0"
|
|
652
|
+
]
|
|
653
|
+
},
|
|
654
|
+
{
|
|
655
|
+
"name": "MJ12bot",
|
|
656
|
+
"pattern": ".*MJ12bot",
|
|
657
|
+
"examples": [
|
|
658
|
+
"Mozilla/5.0 (compatible; MJ12bot/v1.4.8; http://mj12bot.com/)"
|
|
659
|
+
]
|
|
660
|
+
},
|
|
661
|
+
{
|
|
662
|
+
"name": "Mozilla Bot",
|
|
663
|
+
"pattern": "^'?Mozilla(/5\\.0(\\.\\.\\.)?)?$|^\\(Mozilla/5\\.0\\)$",
|
|
664
|
+
"examples": [
|
|
665
|
+
"Mozilla/5.0",
|
|
666
|
+
"Mozilla",
|
|
667
|
+
"Mozilla/5.0...",
|
|
668
|
+
"'Mozilla/5.0",
|
|
669
|
+
"(Mozilla/5.0)"
|
|
670
|
+
]
|
|
671
|
+
},
|
|
672
|
+
{
|
|
673
|
+
"name": "MSN Bot",
|
|
674
|
+
"pattern": "^msnbot/"
|
|
675
|
+
},
|
|
676
|
+
{
|
|
677
|
+
"name": "Neevabot",
|
|
678
|
+
"pattern": ".*Neevabot",
|
|
679
|
+
"urls": [
|
|
680
|
+
"https://neeva.com/neevabot"
|
|
681
|
+
],
|
|
682
|
+
"examples": [
|
|
683
|
+
"Mozilla/5.0 (compatible; Neevabot/1.0; https://neeva.com/neevabot)"
|
|
684
|
+
]
|
|
685
|
+
},
|
|
686
|
+
{
|
|
687
|
+
"name": "Netcraft Survey Agent",
|
|
688
|
+
"pattern": " NetcraftSurveyAgent/",
|
|
689
|
+
"examples": [
|
|
690
|
+
"Mozilla/5.0 (compatible; NetcraftSurveyAgent/1.0; +info@netcraft.com)"
|
|
691
|
+
]
|
|
692
|
+
},
|
|
693
|
+
{
|
|
694
|
+
"name": "Newspaper",
|
|
695
|
+
"description": "News, full-text, and article metadata extraction in Python 3.",
|
|
696
|
+
"pattern": "^newspaper/\\d",
|
|
697
|
+
"examples": [
|
|
698
|
+
"newspaper/0.3.0"
|
|
699
|
+
],
|
|
700
|
+
"urls": [
|
|
701
|
+
"https://github.com/codelucas/newspaper"
|
|
702
|
+
]
|
|
703
|
+
},
|
|
704
|
+
{
|
|
705
|
+
"name": "OgScrper",
|
|
706
|
+
"pattern": "OgScrper",
|
|
707
|
+
"examples": [
|
|
708
|
+
"OgScrper"
|
|
709
|
+
]
|
|
710
|
+
},
|
|
711
|
+
{
|
|
712
|
+
"name": "OkDownload",
|
|
713
|
+
"pattern": "^OkDownload/"
|
|
714
|
+
},
|
|
715
|
+
{
|
|
716
|
+
"name": "OP3 Fetcher",
|
|
717
|
+
"pattern": "^op3-fetcher/",
|
|
718
|
+
"examples": [
|
|
719
|
+
"op3-fetcher/1.0 (https://op3.dev)"
|
|
720
|
+
],
|
|
721
|
+
"urls": [
|
|
722
|
+
"https://op3.dev"
|
|
723
|
+
]
|
|
724
|
+
},
|
|
725
|
+
{
|
|
726
|
+
"name": "Overcast feed parser",
|
|
727
|
+
"pattern": "^Overcast/1\\.0 Podcast Sync",
|
|
728
|
+
"comments": "Marco Arment says: when a new episode is detected, the servers fetch a copy of it to seed these values with an initial set of data to make the privacy screen more accurate.",
|
|
729
|
+
"examples": [
|
|
730
|
+
"Overcast/1.0 Podcast Sync",
|
|
731
|
+
"Overcast/1.0 Podcast Sync (+http://overcast.fm/)",
|
|
732
|
+
"Overcast/1.0 Podcast Sync (1 subscribers; feed-id=1234567; +http://overcast.fm/)"
|
|
733
|
+
]
|
|
734
|
+
},
|
|
735
|
+
{
|
|
736
|
+
"name": "Pandora RSS crawler",
|
|
737
|
+
"pattern": "^PandoraRSSCrawler"
|
|
738
|
+
},
|
|
739
|
+
{
|
|
740
|
+
"name": "PaperLi",
|
|
741
|
+
"pattern": "PaperLiBot/",
|
|
742
|
+
"examples": [
|
|
743
|
+
"Mozilla/5.0 (compatible; PaperLiBot/2.1; https://support.paper.li/entries/20023257-what-is-paper-li)"
|
|
744
|
+
]
|
|
745
|
+
},
|
|
746
|
+
{
|
|
747
|
+
"name": "PetalBot",
|
|
748
|
+
"pattern": "PetalBot",
|
|
749
|
+
"description": "PetalBot is an automatic program of the Petal search engine.",
|
|
750
|
+
"urls": [
|
|
751
|
+
"https://aspiegel.com/petalbot"
|
|
752
|
+
],
|
|
753
|
+
"examples": [
|
|
754
|
+
"Mozilla/5.0 (Linux; Android 7.0;) AppleWebKit/537.36 (KHTML, like Gecko) Mobile Safari/537.36 (compatible; PetalBot; https://aspiegel.com/petalbot)"
|
|
755
|
+
]
|
|
756
|
+
},
|
|
757
|
+
{
|
|
758
|
+
"name": "Pingdom",
|
|
759
|
+
"pattern": "^Pingdom"
|
|
760
|
+
},
|
|
761
|
+
{
|
|
762
|
+
"name": "PlayerFM Podcast Sync",
|
|
763
|
+
"pattern": "PlayerFM/.* Podcast Sync",
|
|
764
|
+
"examples": [
|
|
765
|
+
"PlayerFM/1.0 Podcast Sync (0 subscribers; url=https://player.fm/series/series-2567872)"
|
|
766
|
+
]
|
|
767
|
+
},
|
|
768
|
+
{
|
|
769
|
+
"name": "Podbean Importer",
|
|
770
|
+
"pattern": "^Podbean Importer",
|
|
771
|
+
"examples": [
|
|
772
|
+
"Podbean Importer"
|
|
773
|
+
]
|
|
774
|
+
},
|
|
775
|
+
{
|
|
776
|
+
"name": "Podcastindex.org",
|
|
777
|
+
"pattern": "^Podcastindex\\.org/",
|
|
778
|
+
"svg": "podcast-index.svg",
|
|
779
|
+
"urls": [
|
|
780
|
+
"https://podcastindex.org/"
|
|
781
|
+
],
|
|
782
|
+
"examples": [
|
|
783
|
+
"Podcastindex.org/v0.3.3 (Aggrivate)"
|
|
784
|
+
]
|
|
785
|
+
},
|
|
786
|
+
{
|
|
787
|
+
"name": "Podcast de facto Standard",
|
|
788
|
+
"description": "Dedicated to providing guidance and information on the conventions and standards used in podcasting",
|
|
789
|
+
"pattern": "^PodcastStandard/",
|
|
790
|
+
"examples": [
|
|
791
|
+
"PodcastStandard/0.1.0 (+https://podcast-standard.org)"
|
|
792
|
+
],
|
|
793
|
+
"urls": [
|
|
794
|
+
"https://podcast-standard.org/"
|
|
795
|
+
]
|
|
796
|
+
},
|
|
797
|
+
{
|
|
798
|
+
"name": "Podcast Archiver",
|
|
799
|
+
"pattern": "^Podcast%20Archiver/",
|
|
800
|
+
"urls": [
|
|
801
|
+
"https://www.fredrikblank.com/podcast-archiver/"
|
|
802
|
+
],
|
|
803
|
+
"examples": [
|
|
804
|
+
"Podcast%20Archiver/3000000003 CFNetwork/1406.0.4 Darwin/22.4.0"
|
|
805
|
+
]
|
|
806
|
+
},
|
|
807
|
+
{
|
|
808
|
+
"name": "PodCloud",
|
|
809
|
+
"pattern": "podCloud",
|
|
810
|
+
"description": "Le podcast, simplement. A French-language web-based podcast player.",
|
|
811
|
+
"urls": [
|
|
812
|
+
"https://podcloud.fr"
|
|
813
|
+
],
|
|
814
|
+
"comments": "This useragent is a bot, doing feed updates and downloading media files. It was observed every six hours. User plays will have a standard browser useragent with a referer of https://podcloud.fr/"
|
|
815
|
+
},
|
|
816
|
+
{
|
|
817
|
+
"name": "Podcorn",
|
|
818
|
+
"pattern": "Podcorn/",
|
|
819
|
+
"description": "The leading podcast influencer marketplace. Connecting unique voices to unique brands for native advertising.",
|
|
820
|
+
"urls": [
|
|
821
|
+
"https://podcorn.com/"
|
|
822
|
+
],
|
|
823
|
+
"examples": [
|
|
824
|
+
"Podcorn/1.0"
|
|
825
|
+
]
|
|
826
|
+
},
|
|
827
|
+
{
|
|
828
|
+
"name": "PodderBot",
|
|
829
|
+
"pattern": "PodderBot/",
|
|
830
|
+
"description": "PodderApp bot",
|
|
831
|
+
"urls": [
|
|
832
|
+
"https://www.podderapp.com/"
|
|
833
|
+
],
|
|
834
|
+
"comments": "PodderApp bot for RSS fetching / verification",
|
|
835
|
+
"examples": [
|
|
836
|
+
"PodderBot/1.0"
|
|
837
|
+
]
|
|
838
|
+
},
|
|
839
|
+
{
|
|
840
|
+
"name": "Podfollow",
|
|
841
|
+
"pattern": "podfollowbot/",
|
|
842
|
+
"description": "Podfollow, a service to help link to your podcast",
|
|
843
|
+
"urls": [
|
|
844
|
+
"https://podfollow.com"
|
|
845
|
+
],
|
|
846
|
+
"examples": [
|
|
847
|
+
"Mozilla/5.0 https://podfollow.com/crawling podfollowbot/1.0"
|
|
848
|
+
]
|
|
849
|
+
},
|
|
850
|
+
{
|
|
851
|
+
"name": "Podgrab",
|
|
852
|
+
"pattern": "^Podgrab$",
|
|
853
|
+
"description": "A self-hosted podcast manager to download episodes as soon as they become live",
|
|
854
|
+
"urls": [
|
|
855
|
+
"https://github.com/akhilrex/podgrab"
|
|
856
|
+
],
|
|
857
|
+
"examples": [
|
|
858
|
+
"Podgrab"
|
|
859
|
+
],
|
|
860
|
+
"comments": "Found used for automated archiving."
|
|
861
|
+
},
|
|
862
|
+
{
|
|
863
|
+
"name": "Podhound",
|
|
864
|
+
"pattern": "PodhoundBeta",
|
|
865
|
+
"description": "AI-powered podcast discovery",
|
|
866
|
+
"urls": [
|
|
867
|
+
"http://podhound.co"
|
|
868
|
+
],
|
|
869
|
+
"comments": "'It grabs it once to get the audio file length.', says the developer.",
|
|
870
|
+
"examples": [
|
|
871
|
+
"PodhoundBeta"
|
|
872
|
+
]
|
|
873
|
+
},
|
|
874
|
+
{
|
|
875
|
+
"name": "Podio Bot",
|
|
876
|
+
"pattern": "^Podio/",
|
|
877
|
+
"description": "Podcasts + Radio = Podio",
|
|
878
|
+
"urls": [
|
|
879
|
+
"https://podio.radio/"
|
|
880
|
+
],
|
|
881
|
+
"comments": "This useragent appears to download and cache audio",
|
|
882
|
+
"examples": [
|
|
883
|
+
"Podio/1.0"
|
|
884
|
+
]
|
|
885
|
+
},
|
|
886
|
+
{
|
|
887
|
+
"name": "Podnews",
|
|
888
|
+
"pattern": "PodnewsBot",
|
|
889
|
+
"description": "Podnews runs a number of bots to read and test RSS and audio files",
|
|
890
|
+
"urls": [
|
|
891
|
+
"http://podnews.net"
|
|
892
|
+
]
|
|
893
|
+
},
|
|
894
|
+
{
|
|
895
|
+
"name": "Podnods Bot",
|
|
896
|
+
"pattern": "(podnods-crawler|podnods)",
|
|
897
|
+
"description": "Podnods is a podcast discovery site. This user agent is for crawling podcast data.",
|
|
898
|
+
"urls": [
|
|
899
|
+
"https://podnods.com/about"
|
|
900
|
+
]
|
|
901
|
+
},
|
|
902
|
+
{
|
|
903
|
+
"name": "Podroll Analyzer",
|
|
904
|
+
"pattern": "^pdrl\\.fm ",
|
|
905
|
+
"examples": [
|
|
906
|
+
"pdrl.fm Analyzer / 1.0.0"
|
|
907
|
+
]
|
|
908
|
+
},
|
|
909
|
+
{
|
|
910
|
+
"name": "Podscan Bot",
|
|
911
|
+
"pattern": "^PodscanBot/",
|
|
912
|
+
"examples": [
|
|
913
|
+
"PodscanBot/1.1.0 Ubuntu/22.04 (Linux) +https://podscan.fm",
|
|
914
|
+
"PodscanBot/1.1.0 Ubuntu/22.04 (Linux) Podscan.fm"
|
|
915
|
+
],
|
|
916
|
+
"urls": [
|
|
917
|
+
"https://podscan.fm"
|
|
918
|
+
]
|
|
919
|
+
},
|
|
920
|
+
{
|
|
921
|
+
"name": "Podscribe",
|
|
922
|
+
"pattern": "(^Adswizz-podscribe/|^Podscribe/)",
|
|
923
|
+
"examples": [
|
|
924
|
+
"Adswizz-podscribe/1.0",
|
|
925
|
+
"Podscribe/1.1"
|
|
926
|
+
]
|
|
927
|
+
},
|
|
928
|
+
{
|
|
929
|
+
"name": "PodUptime",
|
|
930
|
+
"description": "Uptime Monitoring for the Podcast Industry",
|
|
931
|
+
"pattern": "PodUptime/\\d",
|
|
932
|
+
"examples": [
|
|
933
|
+
"Mozilla/5.0 (compatible; PodUptime/1.0; +https://poduptime.com)"
|
|
934
|
+
],
|
|
935
|
+
"urls": [
|
|
936
|
+
"https://poduptime.com/"
|
|
937
|
+
]
|
|
938
|
+
},
|
|
939
|
+
{
|
|
940
|
+
"name": "Podverse Feed Parser",
|
|
941
|
+
"pattern": "^Podverse/Feed Parser",
|
|
942
|
+
"description": "The Podverse feed parser.",
|
|
943
|
+
"urls": [
|
|
944
|
+
"https://podverse.fm"
|
|
945
|
+
],
|
|
946
|
+
"comments": "This service parses publicly-accessible RSS feeds on a timer, then stores parsed data in the Podverse database."
|
|
947
|
+
},
|
|
948
|
+
{
|
|
949
|
+
"name": "PodvineBot",
|
|
950
|
+
"pattern": "^PodvineBot/",
|
|
951
|
+
"examples": [
|
|
952
|
+
"PodvineBot/4.0.1 (www.podvine.com)"
|
|
953
|
+
]
|
|
954
|
+
},
|
|
955
|
+
{
|
|
956
|
+
"name": "PostRank Bot",
|
|
957
|
+
"pattern": "^PostRank/",
|
|
958
|
+
"examples": [
|
|
959
|
+
"PostRank/2.0 (postrank.com; 1 subscribers)"
|
|
960
|
+
],
|
|
961
|
+
"comments": "Acquired by Google, https://en.wikipedia.org/wiki/PostRank"
|
|
962
|
+
},
|
|
963
|
+
{
|
|
964
|
+
"name": "PodwatchPro",
|
|
965
|
+
"pattern": "Podwatch-Pro Crawler",
|
|
966
|
+
"examples": [
|
|
967
|
+
"Podwatch-Pro Crawler"
|
|
968
|
+
],
|
|
969
|
+
"description": "PodwatchPro is a podcast analytics software. This user agent is for crawling podcast data.",
|
|
970
|
+
"urls": ["https://www.agma-mmc.de/media-analyse/ma-podcast"]
|
|
971
|
+
},
|
|
972
|
+
{
|
|
973
|
+
"name": "Puppeteer",
|
|
974
|
+
"pattern": " HeadlessChrome/\\d",
|
|
975
|
+
"examples": [
|
|
976
|
+
"Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/537.36 (KHTML, like Gecko) HeadlessChrome/105.0.5173.0 Safari/537.36"
|
|
977
|
+
],
|
|
978
|
+
"urls": [
|
|
979
|
+
"https://pptr.dev/"
|
|
980
|
+
]
|
|
981
|
+
},
|
|
982
|
+
{
|
|
983
|
+
"name": "python-requests",
|
|
984
|
+
"pattern": "python-requests"
|
|
985
|
+
},
|
|
986
|
+
{
|
|
987
|
+
"name": "Qiniu spider",
|
|
988
|
+
"pattern": "qiniu.*spider",
|
|
989
|
+
"examples": [
|
|
990
|
+
"z0-qiniu-imgstg-spider-1.0"
|
|
991
|
+
]
|
|
992
|
+
},
|
|
993
|
+
{
|
|
994
|
+
"name": "Radioline Stream Monitoring",
|
|
995
|
+
"pattern": "^Radioline Stream Monitoring",
|
|
996
|
+
"examples": [
|
|
997
|
+
"Radioline Stream Monitoring (tech@radioline.co)"
|
|
998
|
+
]
|
|
999
|
+
},
|
|
1000
|
+
{
|
|
1001
|
+
"name": "RedCircle",
|
|
1002
|
+
"pattern": "RedCircle",
|
|
1003
|
+
"description": "A platform for podcasts and brands to scale their message.",
|
|
1004
|
+
"urls": [
|
|
1005
|
+
"https://redcircle.com/"
|
|
1006
|
+
],
|
|
1007
|
+
"examples": [
|
|
1008
|
+
"RedCircle"
|
|
1009
|
+
]
|
|
1010
|
+
},
|
|
1011
|
+
{
|
|
1012
|
+
"name": "Rephonic",
|
|
1013
|
+
"pattern": "^Rephonic/\\d",
|
|
1014
|
+
"urls": [
|
|
1015
|
+
"https://rephonic.com/"
|
|
1016
|
+
],
|
|
1017
|
+
"examples": [
|
|
1018
|
+
"Rephonic/1.0"
|
|
1019
|
+
]
|
|
1020
|
+
},
|
|
1021
|
+
{
|
|
1022
|
+
"name": "Ridder Bot",
|
|
1023
|
+
"pattern": " RidderBot/",
|
|
1024
|
+
"examples": [
|
|
1025
|
+
"Mozilla/5.0 (compatible; RidderBot/1.0; bot@ridder.co)"
|
|
1026
|
+
]
|
|
1027
|
+
},
|
|
1028
|
+
{
|
|
1029
|
+
"name": "RSS to Telegram",
|
|
1030
|
+
"pattern": "^RSStT",
|
|
1031
|
+
"description": "an RSS to Telegram bot",
|
|
1032
|
+
"urls": [
|
|
1033
|
+
"https://apps.apple.com/be/app/audiowave-podcast-player/id1602776751"
|
|
1034
|
+
],
|
|
1035
|
+
"examples": [
|
|
1036
|
+
"RSStT/2.2.1 RSS Reader"
|
|
1037
|
+
]
|
|
1038
|
+
},
|
|
1039
|
+
{
|
|
1040
|
+
"name": "RSSRadio",
|
|
1041
|
+
"pattern": "^RSSRadio \\("
|
|
1042
|
+
},
|
|
1043
|
+
{
|
|
1044
|
+
"name": "Ruby Mechanize",
|
|
1045
|
+
"pattern": "^Mechanize|[ -]Mechanize/",
|
|
1046
|
+
"examples": [
|
|
1047
|
+
"Mozilla/5.0 (compatible; Mechanize/2.7.4)",
|
|
1048
|
+
"WWW-Mechanize/1.72"
|
|
1049
|
+
]
|
|
1050
|
+
},
|
|
1051
|
+
{
|
|
1052
|
+
"name": "Screaming Frog SEO Spider",
|
|
1053
|
+
"pattern": "^Screaming Frog ",
|
|
1054
|
+
"examples": [
|
|
1055
|
+
"Screaming Frog SEO Spider/5.1"
|
|
1056
|
+
]
|
|
1057
|
+
},
|
|
1058
|
+
{
|
|
1059
|
+
"name": "SearchAtlas.com SEO Crawler",
|
|
1060
|
+
"pattern": "^SearchAtlas.*Crawler",
|
|
1061
|
+
"examples": [
|
|
1062
|
+
"SearchAtlas.com SEO Crawler"
|
|
1063
|
+
]
|
|
1064
|
+
},
|
|
1065
|
+
{
|
|
1066
|
+
"name": "SEMrushBot",
|
|
1067
|
+
"pattern": "SemrushBot/|^SEMrushBot$",
|
|
1068
|
+
"examples": [
|
|
1069
|
+
"Mozilla/5.0 (compatible; SemrushBot/6~bl; http://www.semrush.com/bot.html)",
|
|
1070
|
+
"SEMrushBot"
|
|
1071
|
+
]
|
|
1072
|
+
},
|
|
1073
|
+
{
|
|
1074
|
+
"name": "Serendeputy",
|
|
1075
|
+
"pattern": "SerendeputyBot/",
|
|
1076
|
+
"urls": [
|
|
1077
|
+
"https://serendeputy.com/about/serendeputy-bot"
|
|
1078
|
+
],
|
|
1079
|
+
"examples": [
|
|
1080
|
+
"SerendeputyBot/0.8.6 (http://serendeputy.com/about/serendeputy-bot)"
|
|
1081
|
+
]
|
|
1082
|
+
},
|
|
1083
|
+
{
|
|
1084
|
+
"name": "Simplecast",
|
|
1085
|
+
"pattern": "^Simplecast$",
|
|
1086
|
+
"examples": [
|
|
1087
|
+
"Simplecast"
|
|
1088
|
+
]
|
|
1089
|
+
},
|
|
1090
|
+
{
|
|
1091
|
+
"name": "Slack Bot",
|
|
1092
|
+
"pattern": "^Slackbot 1\\.0",
|
|
1093
|
+
"examples": [
|
|
1094
|
+
"Slackbot 1.0 ( https://api.slack.com/robots)"
|
|
1095
|
+
]
|
|
1096
|
+
},
|
|
1097
|
+
{
|
|
1098
|
+
"name": "Snapchat Bot",
|
|
1099
|
+
"pattern": "://developers\\.snap\\.com/robots",
|
|
1100
|
+
"examples": [
|
|
1101
|
+
"Snap URL Preview Service; bot; snapchat; https://developers.snap.com/robots"
|
|
1102
|
+
]
|
|
1103
|
+
},
|
|
1104
|
+
{
|
|
1105
|
+
"name": "SoundOn Bot",
|
|
1106
|
+
"pattern": "^SoundOn/[\\d.]+\\s+\\(bot"
|
|
1107
|
+
},
|
|
1108
|
+
{
|
|
1109
|
+
"name": "Spotify cache service",
|
|
1110
|
+
"pattern": "^Spotify/1\\.0$",
|
|
1111
|
+
"comments": "This useragent, currently simply Spotify/1.0, is used when retrieving the RSS and audio for Spotify's catalogue. It isn't used for passthru.",
|
|
1112
|
+
"examples": [
|
|
1113
|
+
"Spotify/1.0"
|
|
1114
|
+
]
|
|
1115
|
+
},
|
|
1116
|
+
{
|
|
1117
|
+
"name": "Stitcher Bot",
|
|
1118
|
+
"pattern": "^StitcherBot"
|
|
1119
|
+
},
|
|
1120
|
+
{
|
|
1121
|
+
"name": "Substack Content Fetcher",
|
|
1122
|
+
"pattern": "^SubstackContentFetch/",
|
|
1123
|
+
"examples": [
|
|
1124
|
+
"SubstackContentFetch/1.0 (https://substack.com/)"
|
|
1125
|
+
]
|
|
1126
|
+
},
|
|
1127
|
+
{
|
|
1128
|
+
"name": "SupportingCast",
|
|
1129
|
+
"pattern": "^SupportingCast(/.*)?$",
|
|
1130
|
+
"examples": [
|
|
1131
|
+
"SupportingCast/1.0",
|
|
1132
|
+
"SupportingCast"
|
|
1133
|
+
]
|
|
1134
|
+
},
|
|
1135
|
+
{
|
|
1136
|
+
"name": "Timpi search crawler",
|
|
1137
|
+
"pattern": "Timpibot/",
|
|
1138
|
+
"examples": [
|
|
1139
|
+
"Timpibot/0.8 ( http://www.timpi.io)"
|
|
1140
|
+
]
|
|
1141
|
+
},
|
|
1142
|
+
{
|
|
1143
|
+
"name": "Tiny Tiny RSS",
|
|
1144
|
+
"pattern": "^Tiny Tiny RSS/",
|
|
1145
|
+
"examples": [
|
|
1146
|
+
"Tiny Tiny RSS/22.12-c30b24d09 (Unsupported) (https://tt-rss.org/)"
|
|
1147
|
+
],
|
|
1148
|
+
"urls": [
|
|
1149
|
+
"https://tt-rss.org/"
|
|
1150
|
+
],
|
|
1151
|
+
"comments": "Found autodownloading hundreds of episodes from an entire feed in rapid succession"
|
|
1152
|
+
},
|
|
1153
|
+
{
|
|
1154
|
+
"name": "Transistor",
|
|
1155
|
+
"pattern": "^Transistor\\.fm/",
|
|
1156
|
+
"examples": [
|
|
1157
|
+
"Transistor.fm/1.0"
|
|
1158
|
+
],
|
|
1159
|
+
"urls": [
|
|
1160
|
+
"https://transistor.fm"
|
|
1161
|
+
]
|
|
1162
|
+
},
|
|
1163
|
+
{
|
|
1164
|
+
"name": "Trendsmap Resolver",
|
|
1165
|
+
"pattern": "TrendsmapResolver/"
|
|
1166
|
+
},
|
|
1167
|
+
{
|
|
1168
|
+
"name": "Triton Digital Podcast Sync",
|
|
1169
|
+
"pattern": "^Triton Digital Podcast Sync$",
|
|
1170
|
+
"examples": [
|
|
1171
|
+
"Triton Digital Podcast Sync"
|
|
1172
|
+
]
|
|
1173
|
+
},
|
|
1174
|
+
{
|
|
1175
|
+
"name": "Twingly Bot",
|
|
1176
|
+
"pattern": "Twingly Recon;",
|
|
1177
|
+
"examples": [
|
|
1178
|
+
"Mozilla/5.0 (compatible; Twingly Recon; twingly.com)"
|
|
1179
|
+
]
|
|
1180
|
+
},
|
|
1181
|
+
{
|
|
1182
|
+
"name": "Twitterbot",
|
|
1183
|
+
"pattern": "^Twitterbot"
|
|
1184
|
+
},
|
|
1185
|
+
{
|
|
1186
|
+
"name": "Typhoeus",
|
|
1187
|
+
"pattern": "^Typhoeus"
|
|
1188
|
+
},
|
|
1189
|
+
{
|
|
1190
|
+
"name": "UCast",
|
|
1191
|
+
"pattern": "^UCast/",
|
|
1192
|
+
"examples": [
|
|
1193
|
+
"UCast/1.0 Podcast Sync (1 subscribers; feed-id=aHR0cHM6Ly9mZWVkcy5idXp6c3Byb3V0LmNvbS8yMDg0OTQucnNzEAEBAD32-0242-42AC-8583-21E9BAD8C544; +http://www.ucastapp.com/)"
|
|
1194
|
+
]
|
|
1195
|
+
},
|
|
1196
|
+
{
|
|
1197
|
+
"name": "TelegramBot",
|
|
1198
|
+
"pattern": "^TelegramBot ",
|
|
1199
|
+
"examples": [
|
|
1200
|
+
"TelegramBot (like TwitterBot)"
|
|
1201
|
+
]
|
|
1202
|
+
},
|
|
1203
|
+
{
|
|
1204
|
+
"name": "theTradeDesk Content Web Scraper",
|
|
1205
|
+
"pattern": "TTD-Content",
|
|
1206
|
+
"examples": [
|
|
1207
|
+
"Mozilla/5.0 (compatible; TTD-Content; +https://www.thetradedesk.com/general/ttd-content)"
|
|
1208
|
+
],
|
|
1209
|
+
"urls": [
|
|
1210
|
+
"https://www.thetradedesk.com/us/ttd-content"
|
|
1211
|
+
]
|
|
1212
|
+
},
|
|
1213
|
+
{
|
|
1214
|
+
"name": "Veritone Engine Toolkit",
|
|
1215
|
+
"pattern": "^veritone/engine-toolkit",
|
|
1216
|
+
"urls": [
|
|
1217
|
+
"https://machinebox.io/veritone/engine-toolkit"
|
|
1218
|
+
],
|
|
1219
|
+
"examples": [
|
|
1220
|
+
"veritone/engine-toolkit-3.0"
|
|
1221
|
+
]
|
|
1222
|
+
},
|
|
1223
|
+
{
|
|
1224
|
+
"name": "Vurbl",
|
|
1225
|
+
"pattern": "VurblBot",
|
|
1226
|
+
"description": "An audio streaming destination",
|
|
1227
|
+
"urls": [
|
|
1228
|
+
"https://vurbl.com/about-us/"
|
|
1229
|
+
],
|
|
1230
|
+
"examples": [
|
|
1231
|
+
"Mozilla/5.0 https://vurbl.com VurblBot/1.0"
|
|
1232
|
+
]
|
|
1233
|
+
},
|
|
1234
|
+
{
|
|
1235
|
+
"name": "Wget",
|
|
1236
|
+
"pattern": "Wget"
|
|
1237
|
+
},
|
|
1238
|
+
{
|
|
1239
|
+
"name": "weborama",
|
|
1240
|
+
"pattern": "^weborama-fetcher",
|
|
1241
|
+
"examples": [
|
|
1242
|
+
"weborama-fetcher (+http://www.weborama.com)"
|
|
1243
|
+
]
|
|
1244
|
+
},
|
|
1245
|
+
{
|
|
1246
|
+
"name": "Windows Crawler",
|
|
1247
|
+
"pattern": "^ZDM/.*Windows",
|
|
1248
|
+
"examples": [
|
|
1249
|
+
"ZDM/4.0; Windows Mobile 7.0;"
|
|
1250
|
+
]
|
|
1251
|
+
},
|
|
1252
|
+
{
|
|
1253
|
+
"name": "Windows PowerShell",
|
|
1254
|
+
"pattern": "WindowsPowerShell/",
|
|
1255
|
+
"examples": [
|
|
1256
|
+
"Mozilla/5.0 (Windows NT; Windows NT 10.0; en-US) WindowsPowerShell/5.1.19041.2673"
|
|
1257
|
+
]
|
|
1258
|
+
},
|
|
1259
|
+
{
|
|
1260
|
+
"name": "WordPress",
|
|
1261
|
+
"pattern": "^WordPress"
|
|
1262
|
+
},
|
|
1263
|
+
{
|
|
1264
|
+
"name": "wsrv.nl",
|
|
1265
|
+
"pattern": "https?://wsrv.nl/",
|
|
1266
|
+
"examples": [
|
|
1267
|
+
"Mozilla/5.0 (compatible; ImageFetcher/9.0; +http://wsrv.nl/)"
|
|
1268
|
+
]
|
|
1269
|
+
},
|
|
1270
|
+
{
|
|
1271
|
+
"name": "YaCy",
|
|
1272
|
+
"pattern": "^yacybot",
|
|
1273
|
+
"description": "Decentralized Web Search",
|
|
1274
|
+
"urls": [
|
|
1275
|
+
"http://yacy.net/bot.html"
|
|
1276
|
+
],
|
|
1277
|
+
"examples": [
|
|
1278
|
+
"yacybot (/global; amd64 Linux 5.9.8-zen1-1-zen; java 1.8.0_265; Europe/de) http://yacy.net/bot.html"
|
|
1279
|
+
]
|
|
1280
|
+
},
|
|
1281
|
+
{
|
|
1282
|
+
"name": "Yahoo Crawler",
|
|
1283
|
+
"pattern": "Yahoo! Slurp",
|
|
1284
|
+
"examples": [
|
|
1285
|
+
"Crawler Mozilla/5.0 (compatible; Yahoo! Slurp; http://help.yahoo.com/help/us/ysearch/slurp)"
|
|
1286
|
+
]
|
|
1287
|
+
},
|
|
1288
|
+
{
|
|
1289
|
+
"name": "YandexBot",
|
|
1290
|
+
"pattern": "YandexBot/"
|
|
1291
|
+
},
|
|
1292
|
+
{
|
|
1293
|
+
"name": "Zapier",
|
|
1294
|
+
"pattern": "^Zapier$",
|
|
1295
|
+
"examples": [
|
|
1296
|
+
"Zapier"
|
|
1297
|
+
]
|
|
1298
|
+
},
|
|
1299
|
+
{
|
|
1300
|
+
"name": "Zencast",
|
|
1301
|
+
"pattern": "^Zencastr/",
|
|
1302
|
+
"examples": [
|
|
1303
|
+
"Zencastr/2.0"
|
|
1304
|
+
]
|
|
1305
|
+
}
|
|
1306
|
+
]
|
|
1307
|
+
}
|