crawler_detect 0.1.5 → 0.1.6
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/lib/crawler_detect/detector.rb +1 -1
- data/lib/crawler_detect/library/crawlers.rb +127 -162
- data/lib/crawler_detect/version.rb +1 -1
- metadata +2 -2
checksums.yaml
CHANGED
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
---
|
|
2
2
|
SHA256:
|
|
3
|
-
metadata.gz:
|
|
4
|
-
data.tar.gz:
|
|
3
|
+
metadata.gz: d59268ab3ed03de60b67ac58bc9f1891b131f282cefdd32344a7ae633061700b
|
|
4
|
+
data.tar.gz: c2efe88dc14eb589636ae11f0ef0e78d36091c8de449ea8884a6ba81f545459a
|
|
5
5
|
SHA512:
|
|
6
|
-
metadata.gz:
|
|
7
|
-
data.tar.gz:
|
|
6
|
+
metadata.gz: fb23c32b42868dfe6c687c6b20d44312b35031a54ec0570f43bb209db5bcf8b94193500057aea3b69df61e6a7b5c947e2bce552308be2b23530e7562a8316f56
|
|
7
|
+
data.tar.gz: c74a44a447eab8c6665ff556a21d1eef3757fb5e18bb585dca852a1c3081b9850a81c5927bbf5e5c11324ce55cdbd09b20a9f3657fad5bac12d3e35c399fab31
|
|
@@ -37,7 +37,6 @@ module CrawlerDetect
|
|
|
37
37
|
13TABS
|
|
38
38
|
192\.comAgent
|
|
39
39
|
2ip\.ru
|
|
40
|
-
404checker
|
|
41
40
|
404enemy
|
|
42
41
|
7Siters
|
|
43
42
|
80legs
|
|
@@ -55,42 +54,41 @@ AdAuth\/
|
|
|
55
54
|
adbeat
|
|
56
55
|
AddThis
|
|
57
56
|
ADmantX
|
|
57
|
+
AdminLabs
|
|
58
58
|
adressendeutschland
|
|
59
|
-
adscanner
|
|
60
|
-
Advanced Email Extractor v
|
|
59
|
+
adscanner
|
|
61
60
|
agentslug
|
|
62
61
|
AHC
|
|
63
62
|
aihit
|
|
64
63
|
aiohttp\/
|
|
65
64
|
Airmail
|
|
66
|
-
Akamai_Site_Analyzer
|
|
67
65
|
akka-http\/
|
|
68
66
|
akula\/
|
|
69
67
|
alertra
|
|
70
68
|
alexa site audit
|
|
71
69
|
Alibaba\.Security\.Heimdall
|
|
72
70
|
Alligator
|
|
73
|
-
allloadin
|
|
71
|
+
allloadin
|
|
74
72
|
AllSubmitter
|
|
75
73
|
alyze\.info
|
|
76
74
|
amagit
|
|
77
75
|
Anarchie
|
|
78
76
|
AndroidDownloadManager
|
|
79
77
|
Anemone
|
|
80
|
-
AngleSharp
|
|
78
|
+
AngleSharp
|
|
81
79
|
annotate_google
|
|
82
80
|
Ant\.com
|
|
83
81
|
Anturis Agent
|
|
84
82
|
AnyEvent-HTTP\/
|
|
85
83
|
Apache Droid
|
|
86
84
|
Apache OpenOffice
|
|
87
|
-
Apache-HttpAsyncClient
|
|
88
|
-
Apache-HttpClient
|
|
89
|
-
ApacheBench
|
|
85
|
+
Apache-HttpAsyncClient
|
|
86
|
+
Apache-HttpClient
|
|
87
|
+
ApacheBench
|
|
90
88
|
Apexoo
|
|
91
89
|
APIs-Google
|
|
92
|
-
AportWorm\/
|
|
93
|
-
AppBeat\/
|
|
90
|
+
AportWorm\/
|
|
91
|
+
AppBeat\/
|
|
94
92
|
AppEngine-Google
|
|
95
93
|
AppStoreScraperZ
|
|
96
94
|
Aprc\/[0-9]
|
|
@@ -99,7 +97,7 @@ arachnode
|
|
|
99
97
|
Arachnophilia
|
|
100
98
|
aria2
|
|
101
99
|
Arukereso
|
|
102
|
-
asafaweb
|
|
100
|
+
asafaweb
|
|
103
101
|
AskQuickly
|
|
104
102
|
Ask Jeeves
|
|
105
103
|
ASPSeek
|
|
@@ -122,15 +120,14 @@ baidu\.com
|
|
|
122
120
|
Bandit
|
|
123
121
|
basicstate
|
|
124
122
|
BatchFTP
|
|
125
|
-
|
|
126
|
-
baypup\/
|
|
127
|
-
baypup\/colbert
|
|
123
|
+
Battlezta Bazinga
|
|
124
|
+
baypup\/
|
|
128
125
|
BazQux
|
|
129
126
|
BBBike
|
|
130
127
|
BCKLINKS
|
|
131
128
|
BDFetch
|
|
132
|
-
BegunAdvertising
|
|
133
|
-
Bidtellect
|
|
129
|
+
BegunAdvertising
|
|
130
|
+
Bidtellect
|
|
134
131
|
BigBozz
|
|
135
132
|
Bigfoot
|
|
136
133
|
biglotron
|
|
@@ -140,24 +137,23 @@ binlar
|
|
|
140
137
|
biNu image cacher
|
|
141
138
|
Bitacle
|
|
142
139
|
biz_Directory
|
|
143
|
-
Black
|
|
140
|
+
Black Hole
|
|
144
141
|
Blackboard Safeassign
|
|
145
142
|
BlackWidow
|
|
146
143
|
BlockNote\.Net
|
|
147
|
-
Bloglines
|
|
144
|
+
Bloglines
|
|
148
145
|
Bloglovin
|
|
149
146
|
BlogPulseLive
|
|
150
147
|
BlogSearch
|
|
151
148
|
Blogtrottr
|
|
152
149
|
BlowFish
|
|
153
|
-
Boardreader
|
|
154
150
|
boitho\.com-dc
|
|
155
151
|
BPImageWalker
|
|
156
152
|
Braintree-Webhooks
|
|
157
153
|
Branch Metrics API
|
|
158
154
|
Branch-Passthrough
|
|
159
155
|
Brandprotect
|
|
160
|
-
BrandVerity
|
|
156
|
+
BrandVerity
|
|
161
157
|
Brandwatch
|
|
162
158
|
Brodie\/
|
|
163
159
|
Browsershots
|
|
@@ -174,7 +170,6 @@ CAAM\/[0-9]
|
|
|
174
170
|
CakePHP
|
|
175
171
|
Calculon
|
|
176
172
|
Canary%20Mail
|
|
177
|
-
CapsuleChecker
|
|
178
173
|
CaretNail
|
|
179
174
|
catexplorador
|
|
180
175
|
CC Metadata Scaper
|
|
@@ -184,37 +179,37 @@ Cerberian Drtrs
|
|
|
184
179
|
CERT\.at-Statistics-Survey
|
|
185
180
|
cg-eye
|
|
186
181
|
changedetection
|
|
187
|
-
ChangesMeter
|
|
182
|
+
ChangesMeter
|
|
188
183
|
Charlotte
|
|
189
184
|
CheckHost
|
|
190
185
|
checkprivacy
|
|
191
186
|
CherryPicker
|
|
192
187
|
ChinaClaw
|
|
193
|
-
Chirp\/
|
|
188
|
+
Chirp\/
|
|
194
189
|
chkme\.com
|
|
195
190
|
Chlooe
|
|
196
191
|
Chromaxa
|
|
197
|
-
CirrusExplorer
|
|
192
|
+
CirrusExplorer
|
|
198
193
|
CISPA Vulnerability Notification
|
|
199
194
|
Citoid
|
|
200
195
|
CJNetworkQuality
|
|
201
196
|
Clarsentia
|
|
202
197
|
clips\.ua\.ac\.be
|
|
203
|
-
Cloud
|
|
198
|
+
Cloud mapping
|
|
204
199
|
CloudEndure
|
|
205
200
|
CloudFlare-AlwaysOnline
|
|
206
|
-
Cloudinary
|
|
201
|
+
Cloudinary
|
|
207
202
|
cmcm\.com
|
|
208
203
|
coccoc
|
|
209
204
|
cognitiveseo
|
|
210
205
|
colly -
|
|
211
206
|
CommaFeed
|
|
212
207
|
Commons-HttpClient
|
|
213
|
-
|
|
208
|
+
commonscan
|
|
214
209
|
contactbigdatafr
|
|
215
210
|
contentkingapp
|
|
216
211
|
convera
|
|
217
|
-
CookieReports
|
|
212
|
+
CookieReports
|
|
218
213
|
copyright sheriff
|
|
219
214
|
CopyRightCheck
|
|
220
215
|
Copyscape
|
|
@@ -227,7 +222,7 @@ CSHttp
|
|
|
227
222
|
curb
|
|
228
223
|
Curious George
|
|
229
224
|
curl
|
|
230
|
-
cuwhois\/
|
|
225
|
+
cuwhois\/
|
|
231
226
|
cybo\.com
|
|
232
227
|
DAP\/NetHTTP
|
|
233
228
|
DareBoost
|
|
@@ -239,7 +234,6 @@ DataparkSearch
|
|
|
239
234
|
dataprovider
|
|
240
235
|
DataXu
|
|
241
236
|
Daum(oa)?[ \/][0-9]
|
|
242
|
-
DemandbasePublisherAnalyzer\/
|
|
243
237
|
Demon
|
|
244
238
|
DeuSu
|
|
245
239
|
developers\.google\.com\/\+\/web\/snippet\/
|
|
@@ -253,23 +247,21 @@ Dispatch\/
|
|
|
253
247
|
DittoSpyder
|
|
254
248
|
dlvr
|
|
255
249
|
DMBrowser
|
|
256
|
-
DNS-Tools Header-Analyzer
|
|
257
250
|
DNSPod-reporting
|
|
258
251
|
docoloc
|
|
259
|
-
Dolphin http client
|
|
252
|
+
Dolphin http client
|
|
260
253
|
DomainAppender
|
|
261
254
|
Donuts Content Explorer
|
|
262
255
|
dotMailer content retrieval
|
|
263
256
|
dotSemantic
|
|
264
257
|
downforeveryoneorjustme
|
|
265
|
-
Download
|
|
266
|
-
downnotifier
|
|
258
|
+
Download Wonder
|
|
259
|
+
downnotifier
|
|
267
260
|
DowntimeDetector
|
|
268
|
-
Dragonfly File Reader
|
|
269
261
|
Drip
|
|
270
262
|
drupact
|
|
271
263
|
Drupal \(\+http:\/\/drupal\.org\/\)
|
|
272
|
-
DTS
|
|
264
|
+
DTS Agent
|
|
273
265
|
dubaiindex
|
|
274
266
|
EARTHCOM
|
|
275
267
|
Easy-Thumb
|
|
@@ -285,8 +277,7 @@ EirGrabber
|
|
|
285
277
|
ElectricMonk
|
|
286
278
|
elefent
|
|
287
279
|
EMail Exractor
|
|
288
|
-
EMail
|
|
289
|
-
Email%20Extractor
|
|
280
|
+
EMail Wolf
|
|
290
281
|
EmailWolf
|
|
291
282
|
Embarcadero
|
|
292
283
|
Embed PHP Library
|
|
@@ -304,8 +295,7 @@ Excel\/
|
|
|
304
295
|
exif
|
|
305
296
|
Exploratodo
|
|
306
297
|
Express WebPictures
|
|
307
|
-
|
|
308
|
-
Extreme\ Picture\ Finder
|
|
298
|
+
Extreme Picture Finder
|
|
309
299
|
EyeNetIE
|
|
310
300
|
ezooms
|
|
311
301
|
facebookexternalhit
|
|
@@ -322,14 +312,13 @@ Feedable\/
|
|
|
322
312
|
Feedbin
|
|
323
313
|
FeedBooster
|
|
324
314
|
FeedBucket
|
|
325
|
-
FeedBunch\/
|
|
315
|
+
FeedBunch\/
|
|
326
316
|
FeedBurner
|
|
327
|
-
|
|
317
|
+
feeder
|
|
328
318
|
Feedly
|
|
329
|
-
Feedreader
|
|
330
319
|
FeedshowOnline
|
|
331
320
|
Feedspot
|
|
332
|
-
Feedwind\/
|
|
321
|
+
Feedwind\/
|
|
333
322
|
FeedZcollector
|
|
334
323
|
feeltiptop
|
|
335
324
|
Fetch API
|
|
@@ -348,33 +337,30 @@ fluffy
|
|
|
348
337
|
Flunky
|
|
349
338
|
flynxapp
|
|
350
339
|
forensiq
|
|
351
|
-
FoundSeoTool
|
|
340
|
+
FoundSeoTool
|
|
352
341
|
http:\/\/www.neomo.de\/
|
|
353
342
|
free thumbnails
|
|
354
343
|
Freeuploader
|
|
355
|
-
FreeWebMonitoring SiteChecker
|
|
356
344
|
Funnelback
|
|
357
345
|
G-i-g-a-b-o-t
|
|
358
346
|
g00g1e\.net
|
|
359
|
-
|
|
360
|
-
ganarvisitas\/[0-9]
|
|
347
|
+
ganarvisitas
|
|
361
348
|
geek-tools
|
|
362
|
-
Genderanalyzer
|
|
363
349
|
Genieo
|
|
364
350
|
GentleSource
|
|
365
351
|
GetCode
|
|
366
352
|
Getintent
|
|
367
353
|
GetLinkInfo
|
|
368
|
-
getprismatic
|
|
354
|
+
getprismatic
|
|
369
355
|
GetRight
|
|
370
356
|
getroot
|
|
371
|
-
GetURLInfo\/
|
|
357
|
+
GetURLInfo\/
|
|
372
358
|
GetWeb
|
|
373
359
|
Ghost Inspector
|
|
374
360
|
GigablastOpenSource
|
|
375
361
|
GIS-LABS
|
|
376
362
|
github-camo
|
|
377
|
-
github\.com
|
|
363
|
+
github\.com
|
|
378
364
|
Go [\d\.]* package http
|
|
379
365
|
Go http package
|
|
380
366
|
Go-Ahead-Got-It
|
|
@@ -384,7 +370,7 @@ gobyus
|
|
|
384
370
|
gofetch
|
|
385
371
|
GomezAgent
|
|
386
372
|
gooblog
|
|
387
|
-
Goodzer\/
|
|
373
|
+
Goodzer\/
|
|
388
374
|
Google AppsViewer
|
|
389
375
|
Google Desktop
|
|
390
376
|
Google favicon
|
|
@@ -394,7 +380,6 @@ Google Page Speed Insights
|
|
|
394
380
|
Google PP Default
|
|
395
381
|
Google Search Console
|
|
396
382
|
Google Web Preview
|
|
397
|
-
google_partner_monitoring
|
|
398
383
|
Google-Adwords
|
|
399
384
|
Google-Apps-Script
|
|
400
385
|
Google-Calendar-Importer
|
|
@@ -406,7 +391,6 @@ Google-Site-Verification
|
|
|
406
391
|
Google-Structured-Data-Testing-Tool
|
|
407
392
|
Google-Youtube-Links
|
|
408
393
|
google-xrawler
|
|
409
|
-
GoogleCloudMonitoring
|
|
410
394
|
GoogleDocs
|
|
411
395
|
GoogleHC\/
|
|
412
396
|
GoogleProducer
|
|
@@ -415,7 +399,6 @@ Google-Transparency-Report
|
|
|
415
399
|
Gookey
|
|
416
400
|
GoScraper
|
|
417
401
|
GoSpotCheck
|
|
418
|
-
GoSquared-Status-Checker
|
|
419
402
|
gosquared-thumbnailer
|
|
420
403
|
Gotit
|
|
421
404
|
GoZilla
|
|
@@ -438,29 +421,29 @@ HAA(A)?RTLAND http client
|
|
|
438
421
|
Haansoft
|
|
439
422
|
hackney\/
|
|
440
423
|
Hadi Agent
|
|
424
|
+
HappyApps-WebCheck
|
|
441
425
|
Hatena
|
|
442
426
|
Havij
|
|
443
|
-
hawkReader
|
|
444
427
|
HeadlessChrome
|
|
445
428
|
HEADMasterSEO
|
|
446
429
|
HeartRails_Capture
|
|
447
430
|
help@dataminr\.com
|
|
448
431
|
heritrix
|
|
449
|
-
historious
|
|
432
|
+
historious
|
|
450
433
|
hkedcity
|
|
451
|
-
hledejLevne\.cz
|
|
434
|
+
hledejLevne\.cz
|
|
452
435
|
Hloader
|
|
453
436
|
HMView
|
|
454
437
|
Holmes
|
|
455
|
-
HonesoSearchEngine
|
|
438
|
+
HonesoSearchEngine
|
|
456
439
|
HootSuite Image proxy
|
|
457
|
-
Hootsuite-WebFeed
|
|
440
|
+
Hootsuite-WebFeed
|
|
458
441
|
hosterstats
|
|
459
442
|
HostTracker
|
|
460
443
|
ht:\/\/check
|
|
461
444
|
htdig
|
|
462
445
|
HTMLparser
|
|
463
|
-
htmlyse
|
|
446
|
+
htmlyse
|
|
464
447
|
HTTP Banner Detection
|
|
465
448
|
HTTP_Compression_Test
|
|
466
449
|
http_request2
|
|
@@ -485,19 +468,18 @@ httrack
|
|
|
485
468
|
huaweisymantec
|
|
486
469
|
HubSpot
|
|
487
470
|
Humanlinks
|
|
488
|
-
HyperZbozi\.cz Feeder
|
|
489
471
|
i2kconnect\/
|
|
490
472
|
Iblog
|
|
491
473
|
ichiro
|
|
492
474
|
Id-search
|
|
493
475
|
IdeelaborPlagiaat
|
|
494
476
|
IDG Twitter Links Resolver
|
|
495
|
-
IDwhois\/
|
|
477
|
+
IDwhois\/
|
|
496
478
|
Iframely
|
|
497
479
|
igdeSpyder
|
|
498
480
|
IlTrovatore
|
|
499
|
-
Image
|
|
500
|
-
Image
|
|
481
|
+
Image Fetch
|
|
482
|
+
Image Sucker
|
|
501
483
|
ImageEngine\/
|
|
502
484
|
ImageVisu\/
|
|
503
485
|
Imagga
|
|
@@ -506,12 +488,12 @@ imgsizer
|
|
|
506
488
|
InAGist
|
|
507
489
|
inbound\.li parser
|
|
508
490
|
InDesign%20CC
|
|
509
|
-
Indy
|
|
491
|
+
Indy Library
|
|
510
492
|
InetURL
|
|
511
493
|
infegy
|
|
512
494
|
infohelfer
|
|
513
495
|
InfoTekies
|
|
514
|
-
InfoWizards Reciprocal Link
|
|
496
|
+
InfoWizards Reciprocal Link
|
|
515
497
|
inpwrd\.com
|
|
516
498
|
instabid
|
|
517
499
|
Instapaper
|
|
@@ -520,7 +502,7 @@ integromedb
|
|
|
520
502
|
Intelliseek
|
|
521
503
|
InterGET
|
|
522
504
|
internet_archive
|
|
523
|
-
Internet
|
|
505
|
+
Internet Ninja
|
|
524
506
|
InternetSeer
|
|
525
507
|
internetVista monitor
|
|
526
508
|
intraVnews
|
|
@@ -536,7 +518,7 @@ Irokez
|
|
|
536
518
|
isitup\.org
|
|
537
519
|
iskanie
|
|
538
520
|
isUp\.li
|
|
539
|
-
iThemes Sync\/
|
|
521
|
+
iThemes Sync\/
|
|
540
522
|
iZSearch
|
|
541
523
|
JAHHO
|
|
542
524
|
janforman
|
|
@@ -558,12 +540,10 @@ Jorgee
|
|
|
558
540
|
JS-Kit
|
|
559
541
|
JustView
|
|
560
542
|
Kaspersky Lab CFR link resolver
|
|
561
|
-
KeepRight OpenStreetMap Checker
|
|
562
543
|
Kelny\/
|
|
563
544
|
Kerrigan\/
|
|
564
545
|
KeyCDN
|
|
565
|
-
Keyword
|
|
566
|
-
Keyword\ Density
|
|
546
|
+
Keyword Density
|
|
567
547
|
Keywords Research
|
|
568
548
|
KickFire
|
|
569
549
|
KimonoLabs\/
|
|
@@ -577,7 +557,6 @@ KumKie
|
|
|
577
557
|
L\.webis
|
|
578
558
|
Larbin
|
|
579
559
|
Lavf\/
|
|
580
|
-
LayeredExtractor
|
|
581
560
|
LeechFTP
|
|
582
561
|
LeechGet
|
|
583
562
|
letsencrypt
|
|
@@ -590,7 +569,6 @@ Licorne
|
|
|
590
569
|
Liferea\/
|
|
591
570
|
Lightspeedsystems
|
|
592
571
|
Likse
|
|
593
|
-
link checker
|
|
594
572
|
Link Valet
|
|
595
573
|
link_thumbnailer
|
|
596
574
|
LinkAlarm\/
|
|
@@ -630,15 +608,14 @@ MapperCmd
|
|
|
630
608
|
marketinggrader
|
|
631
609
|
MarkMonitor
|
|
632
610
|
MarkWatch
|
|
633
|
-
Mass
|
|
634
|
-
masscan\/
|
|
635
|
-
Mata
|
|
611
|
+
Mass Downloader
|
|
612
|
+
masscan\/
|
|
613
|
+
Mata Hari
|
|
636
614
|
Mediapartners-Google
|
|
637
615
|
mediawords
|
|
638
616
|
MegaIndex\.ru
|
|
639
617
|
MeltwaterNews
|
|
640
|
-
Melvil Rawi
|
|
641
|
-
MergeFlow-PageReader
|
|
618
|
+
Melvil Rawi
|
|
642
619
|
Metaspinner
|
|
643
620
|
MetaURI
|
|
644
621
|
MFC_Tear_Sample
|
|
@@ -647,13 +624,13 @@ Microsoft Office
|
|
|
647
624
|
Microsoft Outlook
|
|
648
625
|
Microsoft Windows Network Diagnostics
|
|
649
626
|
Microsoft-WebDAV-MiniRedir
|
|
650
|
-
Microsoft
|
|
651
|
-
MIDown
|
|
627
|
+
Microsoft Data Access
|
|
628
|
+
MIDown tool
|
|
652
629
|
MIIxpc
|
|
653
630
|
Mindjet
|
|
654
|
-
Miniature\.io
|
|
631
|
+
Miniature\.io
|
|
655
632
|
Miniflux
|
|
656
|
-
Mister
|
|
633
|
+
Mister PiX
|
|
657
634
|
mixdata dot com
|
|
658
635
|
mixed-content-scan
|
|
659
636
|
Mixmax-LinkPreview
|
|
@@ -664,16 +641,16 @@ Mojeek
|
|
|
664
641
|
Mojolicious \(Perl\)
|
|
665
642
|
Monit\/
|
|
666
643
|
monitis
|
|
667
|
-
Monitority\/
|
|
644
|
+
Monitority\/
|
|
668
645
|
montastic
|
|
669
646
|
MonTools
|
|
670
647
|
Moreover
|
|
671
|
-
Morfeus
|
|
648
|
+
Morfeus Fucking Scanner
|
|
672
649
|
Morning Paper
|
|
673
650
|
MovableType
|
|
674
651
|
mowser
|
|
675
652
|
Mrcgiguy
|
|
676
|
-
MS
|
|
653
|
+
MS Web Services Client Protocol
|
|
677
654
|
MSFrontPage
|
|
678
655
|
mShots
|
|
679
656
|
MuckRack\/
|
|
@@ -681,14 +658,14 @@ muhstik-scan
|
|
|
681
658
|
MVAClient
|
|
682
659
|
MxToolbox\/
|
|
683
660
|
nagios
|
|
684
|
-
Najdi\.si
|
|
685
|
-
Name
|
|
661
|
+
Najdi\.si
|
|
662
|
+
Name Intelligence
|
|
686
663
|
Nameprotect
|
|
687
664
|
Navroad
|
|
688
665
|
NearSite
|
|
689
666
|
Needle
|
|
690
667
|
Nessus
|
|
691
|
-
Net
|
|
668
|
+
Net Vampire
|
|
692
669
|
NetAnts
|
|
693
670
|
NETCRAFT
|
|
694
671
|
NetLyzer
|
|
@@ -713,11 +690,11 @@ NG-Search
|
|
|
713
690
|
Nibbler
|
|
714
691
|
NICErsPRO
|
|
715
692
|
Nikto
|
|
716
|
-
nineconnections
|
|
693
|
+
nineconnections
|
|
717
694
|
NLNZ_IAHarvester
|
|
718
695
|
Nmap Scripting Engine
|
|
719
696
|
node-superagent
|
|
720
|
-
node-urllib
|
|
697
|
+
node-urllib
|
|
721
698
|
node\.io
|
|
722
699
|
Nodemeter
|
|
723
700
|
NodePing
|
|
@@ -729,16 +706,16 @@ nuhk
|
|
|
729
706
|
nutch
|
|
730
707
|
Nuzzel
|
|
731
708
|
nWormFeedFinder
|
|
709
|
+
nyawc\/
|
|
732
710
|
Nymesis
|
|
733
711
|
NYU
|
|
734
|
-
Ocelli\/
|
|
712
|
+
Ocelli\/
|
|
735
713
|
Octopus
|
|
736
714
|
oegp
|
|
737
715
|
Offline Explorer
|
|
738
|
-
Offline
|
|
739
|
-
og-scraper
|
|
716
|
+
Offline Navigator
|
|
717
|
+
og-scraper
|
|
740
718
|
okhttp
|
|
741
|
-
Omea Reader
|
|
742
719
|
omgili
|
|
743
720
|
OMSC
|
|
744
721
|
Online Domain Tools
|
|
@@ -749,26 +726,25 @@ Openstat\/
|
|
|
749
726
|
OpenVAS
|
|
750
727
|
Optimizer
|
|
751
728
|
Orbiter
|
|
752
|
-
OrgProbe\/
|
|
729
|
+
OrgProbe\/
|
|
753
730
|
orion-semantics
|
|
754
731
|
Outlook-Express
|
|
732
|
+
Outlook-iOS
|
|
755
733
|
ow\.ly
|
|
756
734
|
Owler
|
|
757
735
|
ownCloud News
|
|
758
|
-
OxfordCloudService
|
|
759
|
-
Page Analyzer
|
|
736
|
+
OxfordCloudService
|
|
760
737
|
Page Valet
|
|
761
738
|
page_verifier
|
|
762
|
-
page
|
|
739
|
+
page scorer
|
|
763
740
|
page2rss
|
|
764
|
-
PageAnalyzer
|
|
765
741
|
PageGrabber
|
|
766
742
|
PagePeeker
|
|
767
743
|
PageScorer
|
|
768
|
-
Pagespeed\/
|
|
744
|
+
Pagespeed\/
|
|
769
745
|
Panopta
|
|
770
746
|
panscient
|
|
771
|
-
Papa
|
|
747
|
+
Papa Foto
|
|
772
748
|
parsijoo
|
|
773
749
|
Pavuk
|
|
774
750
|
PayPal IPN
|
|
@@ -789,7 +765,7 @@ Picscout
|
|
|
789
765
|
Picsearch
|
|
790
766
|
PictureFinder
|
|
791
767
|
Pimonster
|
|
792
|
-
ping\.blo\.gs
|
|
768
|
+
ping\.blo\.gs
|
|
793
769
|
Pingability
|
|
794
770
|
PingAdmin\.Ru
|
|
795
771
|
Pingdom
|
|
@@ -806,21 +782,21 @@ PocketImageCache
|
|
|
806
782
|
PocketParser
|
|
807
783
|
Pockey
|
|
808
784
|
POE-Component-Client-HTTP
|
|
785
|
+
Polymail\/
|
|
809
786
|
Pompos
|
|
810
787
|
Porkbun
|
|
811
788
|
Port Monitor
|
|
812
789
|
postano
|
|
813
|
-
PostmanRuntime
|
|
790
|
+
PostmanRuntime
|
|
814
791
|
PostPost
|
|
815
792
|
postrank
|
|
816
793
|
PowerPoint\/
|
|
817
794
|
Priceonomics Analysis Engine
|
|
818
|
-
PrintFriendly
|
|
819
|
-
PritTorrent
|
|
795
|
+
PrintFriendly
|
|
796
|
+
PritTorrent
|
|
820
797
|
Prlog
|
|
821
798
|
probethenet
|
|
822
799
|
Project 25499
|
|
823
|
-
Promotion_Tools_www\.searchenginepromotionhelp\.com
|
|
824
800
|
prospectb2b
|
|
825
801
|
Protopage
|
|
826
802
|
ProWebWalker
|
|
@@ -838,8 +814,8 @@ Qirina Hurdler
|
|
|
838
814
|
QQDownload
|
|
839
815
|
QrafterPro
|
|
840
816
|
Qseero
|
|
841
|
-
Qualidator
|
|
842
|
-
QueryN
|
|
817
|
+
Qualidator
|
|
818
|
+
QueryN Metasearch
|
|
843
819
|
queuedriver
|
|
844
820
|
Quora Link Preview
|
|
845
821
|
Qwantify
|
|
@@ -855,22 +831,19 @@ RebelMouse
|
|
|
855
831
|
Recorder
|
|
856
832
|
RecurPost\/
|
|
857
833
|
redback\/
|
|
858
|
-
Redirect Checker Tool
|
|
859
834
|
ReederForMac
|
|
860
835
|
ReGet
|
|
861
836
|
RepoMonkey
|
|
862
837
|
request\.js
|
|
863
|
-
ResponseCodeTest
|
|
838
|
+
ResponseCodeTest
|
|
864
839
|
RestSharp
|
|
865
840
|
Riddler
|
|
866
841
|
Rival IQ
|
|
867
842
|
Robosourcer
|
|
868
|
-
Robozilla
|
|
843
|
+
Robozilla
|
|
869
844
|
ROI Hunter
|
|
870
845
|
RPT-HTTPClient
|
|
871
|
-
rss reader
|
|
872
846
|
RSSOwl
|
|
873
|
-
RssReader\/
|
|
874
847
|
safe-agent-scanner
|
|
875
848
|
SalesIntelligent
|
|
876
849
|
Saleslift
|
|
@@ -888,11 +861,12 @@ ScrapeBox Page Scanner
|
|
|
888
861
|
SimpleScraper
|
|
889
862
|
Scrapy
|
|
890
863
|
Screaming
|
|
891
|
-
ScreenShotService
|
|
864
|
+
ScreenShotService
|
|
892
865
|
Scrubby
|
|
893
866
|
Scrutiny\/
|
|
894
867
|
search\.thunderstone
|
|
895
|
-
Search37
|
|
868
|
+
Search37
|
|
869
|
+
searchenginepromotionhelp
|
|
896
870
|
Searchestate
|
|
897
871
|
SearchExpress
|
|
898
872
|
SearchSight
|
|
@@ -912,29 +886,26 @@ SeoCheck
|
|
|
912
886
|
SEOkicks
|
|
913
887
|
Seomoz
|
|
914
888
|
SEOprofiler
|
|
915
|
-
SEOsearch
|
|
916
|
-
SeopultContentAnalyzer
|
|
889
|
+
SEOsearch
|
|
917
890
|
seoscanners
|
|
891
|
+
seositecheckup
|
|
918
892
|
SEOstats
|
|
919
|
-
|
|
920
|
-
servernfo\.com
|
|
893
|
+
servernfo
|
|
921
894
|
sexsearcher
|
|
922
895
|
Seznam
|
|
923
896
|
Shelob
|
|
924
897
|
Shodan
|
|
925
|
-
Shoppimon
|
|
926
|
-
ShoppimonAgent\/[0-9]
|
|
898
|
+
Shoppimon
|
|
927
899
|
ShopWiki
|
|
928
900
|
ShortLinkTranslate
|
|
929
901
|
shrinktheweb
|
|
930
902
|
Sideqik
|
|
931
|
-
SilverReader
|
|
932
903
|
SimplePie
|
|
933
904
|
SimplyFast
|
|
934
905
|
Siphon
|
|
935
906
|
SISTRIX
|
|
936
907
|
Site-Shot\/
|
|
937
|
-
Site
|
|
908
|
+
Site Sucker
|
|
938
909
|
Site24x7
|
|
939
910
|
SiteBar
|
|
940
911
|
Sitebeam
|
|
@@ -1002,7 +973,6 @@ StumbleUpon
|
|
|
1002
973
|
suchen
|
|
1003
974
|
Sucuri
|
|
1004
975
|
summify
|
|
1005
|
-
Super Monitoring
|
|
1006
976
|
SuperHTTP
|
|
1007
977
|
Surphace Scout
|
|
1008
978
|
Suzuran
|
|
@@ -1024,16 +994,16 @@ Telesphoreo
|
|
|
1024
994
|
Telesphorep
|
|
1025
995
|
Tenon\.io
|
|
1026
996
|
teoma
|
|
1027
|
-
terrainformatica
|
|
997
|
+
terrainformatica
|
|
1028
998
|
Test Certificate Info
|
|
1029
|
-
|
|
999
|
+
testuri
|
|
1000
|
+
Tetrahedron
|
|
1030
1001
|
The Drop Reaper
|
|
1031
1002
|
The Expert HTML Source Viewer
|
|
1032
1003
|
The Knowledge AI
|
|
1033
|
-
The
|
|
1004
|
+
The Intraformant
|
|
1034
1005
|
theinternetrules
|
|
1035
1006
|
TheNomad
|
|
1036
|
-
theoldreader\.com
|
|
1037
1007
|
Thinklab
|
|
1038
1008
|
Thumbshots
|
|
1039
1009
|
ThumbSniper
|
|
@@ -1049,13 +1019,13 @@ tracemyfile
|
|
|
1049
1019
|
TrapitAgent
|
|
1050
1020
|
Trendiction
|
|
1051
1021
|
Trendsmap
|
|
1052
|
-
trendspottr
|
|
1022
|
+
trendspottr
|
|
1053
1023
|
truwoGPS
|
|
1054
1024
|
TryJsoup
|
|
1055
1025
|
TulipChain
|
|
1056
1026
|
Turingos
|
|
1057
1027
|
Turnitin
|
|
1058
|
-
tweetedtimes
|
|
1028
|
+
tweetedtimes
|
|
1059
1029
|
Tweetminster
|
|
1060
1030
|
Tweezler\/
|
|
1061
1031
|
twibble
|
|
@@ -1077,16 +1047,15 @@ updown\.io daemon
|
|
|
1077
1047
|
Upflow
|
|
1078
1048
|
Uptimia
|
|
1079
1049
|
URL Verifier
|
|
1080
|
-
|
|
1081
|
-
URLitor\.com
|
|
1050
|
+
URLitor
|
|
1082
1051
|
urlresolver
|
|
1083
1052
|
Urlstat
|
|
1084
1053
|
UrlTrends Ranking Updater
|
|
1085
|
-
URLy
|
|
1054
|
+
URLy Warning
|
|
1086
1055
|
URLy\.Warning
|
|
1087
1056
|
Vacuum
|
|
1088
1057
|
Vagabondo
|
|
1089
|
-
VB
|
|
1058
|
+
VB Project
|
|
1090
1059
|
vBSEO
|
|
1091
1060
|
VCI
|
|
1092
1061
|
via ggpht\.com GoogleImageProxy
|
|
@@ -1098,12 +1067,11 @@ VoidEYE
|
|
|
1098
1067
|
Voil
|
|
1099
1068
|
voltron
|
|
1100
1069
|
voyager\/
|
|
1101
|
-
VSAgent\/
|
|
1102
|
-
VSB-TUO\/
|
|
1070
|
+
VSAgent\/
|
|
1071
|
+
VSB-TUO\/
|
|
1103
1072
|
Vulnbusters Meter
|
|
1104
1073
|
VYU2
|
|
1105
1074
|
w3af\.org
|
|
1106
|
-
W3C_I18n-Checker
|
|
1107
1075
|
W3C_Unicorn
|
|
1108
1076
|
W3C-checklink
|
|
1109
1077
|
W3C-mobileOK
|
|
@@ -1116,16 +1084,15 @@ WatchMouse
|
|
|
1116
1084
|
WbSrch\/
|
|
1117
1085
|
WDT\.io
|
|
1118
1086
|
web-capture\.net
|
|
1119
|
-
Web-Monitoring
|
|
1120
1087
|
Web-sniffer
|
|
1121
|
-
Web
|
|
1122
|
-
Web
|
|
1123
|
-
Web
|
|
1124
|
-
Web
|
|
1125
|
-
Web
|
|
1126
|
-
Web
|
|
1127
|
-
Web
|
|
1128
|
-
Web
|
|
1088
|
+
Web Auto
|
|
1089
|
+
Web Collage
|
|
1090
|
+
Web Enhancer
|
|
1091
|
+
Web Fetch
|
|
1092
|
+
Web Fuck
|
|
1093
|
+
Web Pix
|
|
1094
|
+
Web Sauger
|
|
1095
|
+
Web Sucker
|
|
1129
1096
|
Webalta
|
|
1130
1097
|
Webauskunft
|
|
1131
1098
|
WebAuto
|
|
@@ -1135,36 +1102,35 @@ webcollage
|
|
|
1135
1102
|
WebCookies
|
|
1136
1103
|
WebCopier
|
|
1137
1104
|
WebCorp
|
|
1138
|
-
WebDataStats
|
|
1105
|
+
WebDataStats
|
|
1139
1106
|
WebDoc
|
|
1140
1107
|
WebEnhancer
|
|
1141
1108
|
WebFetch
|
|
1142
1109
|
WebFuck
|
|
1143
|
-
|
|
1110
|
+
WebGazer
|
|
1111
|
+
WebGo IS
|
|
1144
1112
|
WebImageCollector
|
|
1145
1113
|
WebImages
|
|
1146
1114
|
WebIndex
|
|
1147
1115
|
webkit2png
|
|
1148
1116
|
WebLeacher
|
|
1149
1117
|
webmastercoffee
|
|
1150
|
-
webmon
|
|
1118
|
+
webmon\s
|
|
1151
1119
|
WebPix
|
|
1152
1120
|
WebReaper
|
|
1153
1121
|
WebSauger
|
|
1154
1122
|
webscreenie
|
|
1155
1123
|
Webshag
|
|
1156
1124
|
Webshot
|
|
1157
|
-
Website
|
|
1158
|
-
Website\ Quester
|
|
1159
|
-
WebsiteExtractor
|
|
1125
|
+
Website Quester
|
|
1160
1126
|
websitepulse agent
|
|
1161
|
-
websitepulse[+ ]checker
|
|
1162
1127
|
WebsiteQuester
|
|
1163
|
-
Websnapr
|
|
1128
|
+
Websnapr
|
|
1129
|
+
WebSniffer
|
|
1164
1130
|
Webster
|
|
1165
1131
|
WebStripper
|
|
1166
1132
|
WebSucker
|
|
1167
|
-
Webthumb\/
|
|
1133
|
+
Webthumb\/
|
|
1168
1134
|
WebThumbnail
|
|
1169
1135
|
WebWhacker
|
|
1170
1136
|
WebZIP
|
|
@@ -1206,13 +1172,12 @@ x09Mozilla
|
|
|
1206
1172
|
x22Mozilla
|
|
1207
1173
|
XaxisSemanticsClassifier
|
|
1208
1174
|
Xenu Link Sleuth
|
|
1209
|
-
XING-contenttabreceiver
|
|
1175
|
+
XING-contenttabreceiver
|
|
1210
1176
|
xpymep([0-9]?)\.exe
|
|
1211
1177
|
Y!J-(ASR|BSC)
|
|
1212
1178
|
Y\!J-BRW
|
|
1213
1179
|
Yaanb
|
|
1214
1180
|
yacy
|
|
1215
|
-
Yahoo Ad monitoring
|
|
1216
1181
|
Yahoo Link Preview
|
|
1217
1182
|
YahooCacheSystem
|
|
1218
1183
|
YahooYSMcm
|
|
@@ -1224,7 +1189,7 @@ Yo-yo
|
|
|
1224
1189
|
Yoleo Consumer
|
|
1225
1190
|
yoogliFetchAgent
|
|
1226
1191
|
YottaaMonitor
|
|
1227
|
-
Your-Website-Sucks
|
|
1192
|
+
Your-Website-Sucks
|
|
1228
1193
|
yourls\.org
|
|
1229
1194
|
YoYs\.net
|
|
1230
1195
|
YP\.PL
|
|
@@ -1242,7 +1207,7 @@ ZnajdzFoto
|
|
|
1242
1207
|
Zombie\.js
|
|
1243
1208
|
Zoom\.Mac
|
|
1244
1209
|
ZyBorg
|
|
1245
|
-
[a-z0-9\-_]*(bot|crawl|archiver|transcoder|spider|uptime|validator|fetcher|cron)
|
|
1210
|
+
[a-z0-9\-_]*(bot|crawl|archiver|transcoder|spider|uptime|validator|fetcher|cron|checker|reader|extractor|monitoring|analyzer)
|
|
1246
1211
|
].strip.split(/\n+/).freeze
|
|
1247
1212
|
end
|
|
1248
1213
|
end
|
metadata
CHANGED
|
@@ -1,14 +1,14 @@
|
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
|
2
2
|
name: crawler_detect
|
|
3
3
|
version: !ruby/object:Gem::Version
|
|
4
|
-
version: 0.1.5
|
|
4
|
+
version: 0.1.6
|
|
5
5
|
platform: ruby
|
|
6
6
|
authors:
|
|
7
7
|
- Pavel Kozlov
|
|
8
8
|
autorequire:
|
|
9
9
|
bindir: exe
|
|
10
10
|
cert_chain: []
|
|
11
|
-
date:
|
|
11
|
+
date: 2019-02-23 00:00:00.000000000 Z
|
|
12
12
|
dependencies:
|
|
13
13
|
- !ruby/object:Gem::Dependency
|
|
14
14
|
name: bundler
|