RubyGems - device_detector - Versions diffs - 1.0.1 → 1.0.5 - Mend

device_detector 1.0.1 → 1.0.5

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (95)

checksums.yaml +5 -5
data/.rubocop.yml +49 -0
data/.ruby-version +1 -0
data/.travis.yml +5 -10
data/CHANGELOG.md +14 -1
data/README.md +6 -6
data/Rakefile +20 -13
data/device_detector.gemspec +1 -0
data/lib/device_detector.rb +30 -26
data/lib/device_detector/bot.rb +2 -2
data/lib/device_detector/client.rb +3 -2
data/lib/device_detector/device.rb +46 -20
data/lib/device_detector/memory_cache.rb +26 -19
data/lib/device_detector/metadata_extractor.rb +7 -8
data/lib/device_detector/model_extractor.rb +3 -3
data/lib/device_detector/name_extractor.rb +2 -2
data/lib/device_detector/os.rb +121 -111
data/lib/device_detector/parser.rb +22 -9
data/lib/device_detector/version.rb +3 -1
data/lib/device_detector/version_extractor.rb +2 -3
data/regexes/bots.yml +442 -19
data/regexes/client/browser_engine.yml +7 -1
data/regexes/client/browsers.yml +773 -103
data/regexes/client/feed_readers.yml +14 -8
data/regexes/client/libraries.yml +43 -2
data/regexes/client/mediaplayers.yml +21 -5
data/regexes/client/mobile_apps.yml +131 -1
data/regexes/client/pim.yml +6 -1
data/regexes/device/cameras.yml +1 -1
data/regexes/device/car_browsers.yml +7 -3
data/regexes/device/consoles.yml +3 -3
data/regexes/device/mobiles.yml +11365 -791
data/regexes/device/notebooks.yml +114 -0
data/regexes/device/portable_media_player.yml +2 -2
data/regexes/device/televisions.yml +17 -3
data/regexes/oss.yml +115 -47
data/regexes/vendorfragments.yml +6 -2
data/spec/device_detector/concrete_user_agent_spec.rb +16 -17
data/spec/device_detector/detector_fixtures_spec.rb +30 -35
data/spec/device_detector/device_spec.rb +28 -48
data/spec/device_detector/memory_cache_spec.rb +60 -28
data/spec/device_detector/model_extractor_spec.rb +3 -3
data/spec/device_detector/version_extractor_spec.rb +5 -6
data/spec/device_detector_spec.rb +49 -78
data/spec/fixtures/client/browser.yml +1521 -406
data/spec/fixtures/client/feed_reader.yml +39 -51
data/spec/fixtures/client/library.yml +72 -11
data/spec/fixtures/client/mediaplayer.yml +29 -40
data/spec/fixtures/client/mobile_app.yml +172 -32
data/spec/fixtures/client/pim.yml +32 -19
data/spec/fixtures/detector/bots.yml +854 -19
data/spec/fixtures/detector/camera.yml +22 -2
data/spec/fixtures/detector/car_browser.yml +60 -0
data/spec/fixtures/detector/console.yml +43 -3
data/spec/fixtures/detector/desktop.yml +2860 -1527
data/spec/fixtures/detector/feature_phone.yml +69 -1
data/spec/fixtures/detector/feed_reader.yml +158 -130
data/spec/fixtures/detector/mediaplayer.yml +113 -39
data/spec/fixtures/detector/mobile_apps.yml +262 -89
data/spec/fixtures/detector/phablet.yml +3444 -663
data/spec/fixtures/detector/portable_media_player.yml +57 -0
data/spec/fixtures/detector/smart_speaker.yml +55 -0
data/spec/fixtures/detector/smartphone-1.yml +4739 -4765
data/spec/fixtures/detector/smartphone-10.yml +9973 -0
data/spec/fixtures/detector/smartphone-11.yml +10015 -0
data/spec/fixtures/detector/smartphone-12.yml +9897 -0
data/spec/fixtures/detector/smartphone-13.yml +9912 -0
data/spec/fixtures/detector/smartphone-14.yml +9935 -0
data/spec/fixtures/detector/smartphone-15.yml +6595 -0
data/spec/fixtures/detector/smartphone-16.yml +10021 -0
data/spec/fixtures/detector/smartphone-17.yml +9408 -0
data/spec/fixtures/detector/smartphone-2.yml +4265 -4238
data/spec/fixtures/detector/smartphone-3.yml +4487 -4391
data/spec/fixtures/detector/smartphone-4.yml +4210 -4179
data/spec/fixtures/detector/smartphone-5.yml +5794 -2901
data/spec/fixtures/detector/smartphone-6.yml +10114 -0
data/spec/fixtures/detector/smartphone-7.yml +9975 -0
data/spec/fixtures/detector/smartphone-8.yml +9897 -0
data/spec/fixtures/detector/smartphone-9.yml +9880 -0
data/spec/fixtures/detector/smartphone.yml +4152 -4048
data/spec/fixtures/detector/tablet-1.yml +3997 -3991
data/spec/fixtures/detector/tablet-2.yml +6820 -1935
data/spec/fixtures/detector/tablet-3.yml +9968 -0
data/spec/fixtures/detector/tablet-4.yml +7113 -0
data/spec/fixtures/detector/tablet.yml +3789 -3804
data/spec/fixtures/detector/tv.yml +3889 -1495
data/spec/fixtures/detector/unknown.yml +45 -179
data/spec/fixtures/detector/wearable.yml +61 -0
data/spec/fixtures/device/camera.yml +4 -3
data/spec/fixtures/device/car_browser.yml +9 -2
data/spec/fixtures/device/console.yml +15 -14
data/spec/fixtures/device/notebook.yml +7 -0
data/spec/fixtures/parser/oss.yml +177 -0
data/spec/fixtures/parser/vendorfragments.yml +6 -0
metadata +57 -7

data/lib/device_detector/version.rb CHANGED

@@ -1,3 +1,5 @@
+# frozen_string_literal: true
 class DeviceDetector
-  VERSION = '1.0.1'
+  VERSION = '1.0.5'
 end

data/lib/device_detector/version_extractor.rb CHANGED

@@ -1,12 +1,11 @@
+# frozen_string_literal: true
 class DeviceDetector
   class VersionExtractor < MetadataExtractor
     private
     def metadata_string
       String(regex_meta[:version])
     end
   end
 end

data/regexes/bots.yml CHANGED

@@ -1,7 +1,7 @@
 ###############
 # Device Detector - The Universal Device Detection library for parsing User Agents
 #
-# @link http://piwik.org
+# @link https://matomo.org
 # @license http://www.gnu.org/licenses/lgpl.html LGPL v3 or later
 ###############
@@ -53,6 +53,21 @@
     name: 'Alexa Internet'
     url: 'http://www.alexa.com'
+- regex: 'alexa site audit'
+  name: 'Alexa Site Audit'
+  category: 'Site Monitor'
+  url: 'http://www.alexa.com/help/webmasters'
+  producer:
+    name: 'Alexa Internet'
+    url: 'http://www.alexa.com'
+- regex: 'Amazon[ -]Route ?53[ -]Health[ -]Check[ -]Service'
+  name: 'Amazon Route53 Health Check'
+  category: 'Service Agent'
+  producer:
+    name: 'Amazon Web Services'
+    url: 'https://aws.amazon.com/'
 - regex: 'AmorankSpider'
   name: 'Amorank Spider'
   category: 'Crawler'
@@ -77,6 +92,22 @@
     name: 'Apple Inc'
     url: 'http://www.apple.com'
+- regex: 'Arachni'
+  name: 'Arachni'
+  category: 'Security Checker'
+  url: 'http://www.arachni-scanner.com'
+  producer:
+    name: 'Sarosys LLC'
+    url: 'http://www.sarosys.com/'
+- regex: 'AspiegelBot'
+  name: 'AspiegelBot'
+  category: 'Crawler'
+  url: 'https://aspiegel.com/'
+  producer:
+    name: 'Huawei'
+    url: 'https://www.huawei.com/'
 - regex: 'Castro 2, Episode Duration Lookup'
   name: 'Castro 2'
   category: 'Service Agent'
@@ -181,6 +212,13 @@
     name: 'Blogtrottr Ltd'
     url: 'https://blogtrottr.com/'
+- regex: 'BoardReader Blog Indexer'
+  name: 'BoardReader Blog Indexer'
+  category: 'Crawler'
+  producer:
+    name: 'BoardReader'
+    url: 'http://boardreader.com/'
 - regex: 'BountiiBot'
   name: 'Bountii Bot'
   category: 'Search bot'
@@ -253,13 +291,13 @@
     name: 'CloudFlare'
     url: 'http://www.cloudflare.com'
-- regex: 'coccoc/'
+- regex: 'coccoc|coccocbot(-ads|-fast|-image|-shopping|-web)?'
   name: 'Cốc Cốc Bot'
-  url: 'http://help.coccoc.com/'
+  url: 'https://help.coccoc.com/en/search-engine/coccoc-robots'
   category: 'Search bot'
   producer:
     name: 'Cốc Cốc'
-    url: 'http://coccoc.com/'
+    url: 'https://coccoc.com/'
 - regex: 'collectd'
   name: 'Collectd'
@@ -293,6 +331,15 @@
     name: 'Datadog'
     url: 'https://www.datadoghq.com/'
+- regex: 'Datanyze'
+  name: 'Datanyze'
+  url: ''
+  category: 'Crawler'
+  producer:
+    name: 'Datanyze'
+    url: 'https://www.datanyze.com'
 - regex: 'Dataprovider'
   name: 'Dataprovider'
   category: 'Crawler'
@@ -341,7 +388,7 @@
     name: 'SEOmoz, Inc.'
     url: 'http://moz.com/'
-- regex: 'DuckDuck'
+- regex: 'DuckDuck(?:Go-Favicons-)?Bot'
   name: 'DuckDuckGo Bot'
   category: 'Search bot'
   url: 'https://duckduckgo.com/duckduckbot'
@@ -357,6 +404,13 @@
     name: 'easou ICP'
     url: 'http://www.easou.com'
+- regex: 'eCairn-Grabber'
+  name: 'eCairn-Grabber'
+  category: 'Crawler'
+  producer:
+    name: 'eCairn'
+    url: 'https://ecairn.com'
 - regex: 'EMail Exractor'
   name: 'EMail Exractor'
   category: 'Crawler'
@@ -397,7 +451,7 @@
     name: 'SEOmoz, Inc.'
     url: 'http://moz.com/'
-- regex: 'facebookexternalhit|facebookplatform'
+- regex: 'facebookexternalhit|facebookplatform|facebookexternalua'
   name: 'Facebook External Hit'
   category: 'Social Media Agent'
   url: 'https://www.facebook.com/externalhit_uatext.php'
@@ -466,6 +520,11 @@
   category: 'Crawler'
   url: 'http://www.findxbot.com'
+- regex: 'FreshRSS'
+  name: 'FreshRSS'
+  category: 'Feed Fetcher'
+  url: 'https://freshrss.org/'
 - regex: 'Genieo'
   name: 'Genieo Web filter'
   category: ''
@@ -498,6 +557,18 @@
     name: 'NTT Resonant'
     url: 'http://goo.ne.jp'
+- regex: 'Google Favicon'
+  name: 'Google Favicon'
+  category: 'Crawler'
+- regex: 'Google Search Console'
+  name: 'Google Search Console'
+  category: 'Crawler'
+  url: 'https://search.google.com/search-console/about'
+  producer:
+    name: 'Google Inc.'
+    url: 'http://www.google.com'
 - regex: 'Google Page Speed Insights'
   name: 'Google PageSpeed Insights'
   category: 'Site Monitor'
@@ -514,6 +585,14 @@
     name: 'Google Inc.'
     url: 'http://www.google.com'
+- regex: 'Google-Cloud-Scheduler'
+  name: 'Google Cloud Scheduler'
+  category: 'Crawler'
+  url: 'https://cloud.google.com/scheduler'
+  producer:
+    name: 'Google Inc.'
+    url: 'https://www.google.com'
 - regex: 'Google-Structured-Data-Testing-Tool'
   name: 'Google Structured Data Testing Tool'
   category: 'Validator'
@@ -522,6 +601,14 @@
     name: 'Google Inc.'
     url: 'http://www.google.com'
+- regex: 'GoogleStackdriverMonitoring'
+  name: 'Google Stackdriver Monitoring'
+  category: 'Site Monitor'
+  url: 'https://cloud.google.com/monitoring'
+  producer:
+    name: 'Google Inc.'
+    url: 'https://www.google.com'
 - regex: 'via ggpht\.com GoogleImageProxy'
   name: 'Gmail Image Proxy'
   category: 'Crawler'
@@ -529,7 +616,7 @@
   producer:
     name: 'Google Inc.'
     url: 'http://www.google.com'
 - regex: 'SeznamEmailProxy'
   name: 'Seznam Email Proxy'
   category: 'Crawler'
@@ -562,7 +649,7 @@
     name: 'Visual Meta'
     url: 'https://www.shopalike.cz/'
-- regex: 'Googlebot(-Mobile|-Image|-Video|-News)?|Feedfetcher-Google|Google-Test|Google-Site-Verification|Google Web Preview|AdsBot-Google(-Mobile)?|Google-Adwords-Instant|Mediapartners-Google|Google.*/\+/web/snippet|GoogleProducer|Google[ -]Publisher[ -]Plugin|Google-Shopping-Quality'
+- regex: 'AdsBot-Google(-Mobile)?|Adwords-(DisplayAds|Express|Instant)|Google Web Preview|Google[ -]Publisher[ -]Plugin|Google-(Adwords|AMPHTML|Assess|HotelAdsVerifier|Read-Aloud|Shopping-Quality|Site-Verification|speakr|Test|Youtube-Links)|(APIs|DuplexWeb|Feedfetcher|Mediapartners)-Google|Googlebot(-Mobile|-Image|-Video|-News)?|GoogleProducer|Google.*/\+/web/snippet'
   name: 'Googlebot'
   category: 'Search bot'
   url: 'http://www.google.com/bot.html'
@@ -602,6 +689,11 @@
     name: ''
     url: ''
+- regex: 'inoreader.com'
+  name: 'inoreader'
+  category: 'Feed Reader'
+  url: 'https://www.inoreader.com'
 - regex: 'iisbot'
   name: 'IIS Site Analysis'
   category: 'Crawler'
@@ -704,6 +796,10 @@
     name: 'Robert Graham'
     url: 'https://github.com/robertdavidgraham'
+- regex: 'Mastodon/'
+  name: 'Mastodon Bot'
+  category: 'Social Media Agent'
 - regex: 'meanpathbot'
   name: 'Meanpath Bot'
   category: 'Search bot'
@@ -780,6 +876,10 @@
     name: 'Nagios Plugins Development Team'
     url: 'https://nagios.org'
+- regex: 'nbertaupete95\(at\)gmail.com'
+  name: 'nbertaupete95'
+  category: 'Crawler'
 - regex: 'Netcraft( Web Server Survey| SSL Server Survey|SurveyAgent)'
   name: 'Netcraft Survey Bot'
   category: 'Search bot'
@@ -790,7 +890,7 @@
 - regex: 'netEstate NE Crawler'
   name: 'netEstate'
-  category: 'Analytics SEO Crawler'
+  category: 'Crawler'
   url: 'http://www.website-datenbank.de/Impressum'
   producer:
     name: 'netEstate GmbH'
@@ -836,10 +936,17 @@
     name: 'Nmap'
     url: 'https://nmap.org/'
+- regex: 'Nuzzel'
+  name: 'Nuzzel'
+  category: 'Crawler'
+  producer:
+    name: 'Nuzzel'
+    url: https://www.nuzzel.com/
 - regex: 'Octopus [0-9]'
   name: 'Octopus'
-- regex: 'omgilibot'
+- regex: 'omgili(?:bot)?'
   name: 'Omgili bot'
   category: 'Search bot'
   url: 'http://www.omgili.com/Crawler.html'
@@ -931,7 +1038,15 @@
   producer:
     name: 'Pingdom AB'
     url: 'https://www.pingdom.com'
+- regex: 'Quora Link Preview'
+  name: 'Quora Link Preview'
+  category: 'Crawler'
+  url: ''
+  producer:
+    name: 'Quora'
+    url: 'http://www.quora.com'
 - regex: 'RamblerMail'
   name: 'RamblerMail Image Proxy'
   category: 'Crawler'
@@ -1075,6 +1190,14 @@
     name: 'Seznam.cz, a.s.'
     url: 'http://www.seznam.cz/'
+- regex: 'shopify-partner-homepage-scraper'
+  name: 'Shopify Partner'
+  category: 'Crawler'
+  url: 'https://www.shopify.com/partners'
+  producer:
+    name: 'Shopify'
+    url: 'https://www.shopify.com/'
 - regex: 'ShopWiki'
   name: 'ShopWiki'
   category: 'Search tools'
@@ -1107,6 +1230,14 @@
     name: 'SISTRIX GmbH'
     url: 'http://www.sistrix.de'
+- regex: 'compatible; (?:SISTRIX )?Optimizer'
+  name: 'SISTRIX Optimizer'
+  category: 'Crawler'
+  url: 'https://optimizer.sistrix.com'
+  producer:
+    name: 'SISTRIX GmbH'
+    url: 'http://www.sistrix.de'
 - regex: 'SiteSucker'
   name: 'SiteSucker'
   category: 'Crawler'
@@ -1211,7 +1342,7 @@
   category: 'Search bot'
 - regex: 'TelegramBot'
-  name: 'TelgramBot'
+  name: 'TelegramBot'
   url: 'https://telegram.org/blog/bot-revolution'
 - regex: 'TLSProbe'
@@ -1238,6 +1369,11 @@
     name: ''
     url: ''
+- regex: 'theoldreader.com'
+  name: 'theoldreader'
+  category: 'Feed Reader'
+  url: 'https://theoldreader.com'
 - regex: 'trendictionbot'
   name: 'Trendiction Bot'
   category: 'Crawler'
@@ -1270,6 +1406,13 @@
     name: 'Mediasift'
     url: ''
+- regex: 'Twingly Recon'
+  name: 'Twingly Recon'
+  category: 'Crawler'
+  producer:
+    name: 'Twingly'
+    url: 'https://www.twingly.com'
 - regex: 'Twitterbot'
   name: 'Twitterbot'
   category: 'Social Media Agent'
@@ -1326,6 +1469,14 @@
     name: 'WiseGuys'
     url: 'http://www.wise-guys.nl/'
+- regex: 'vkShare; '
+  name: 'VK Share Button'
+  category: 'Crawler'
+  url: 'http://vk.com/dev/Share'
+  producer:
+    name: 'VK'
+    url: 'http://vk.com/'
 - regex: 'VSMCrawler'
   name: 'Visual Site Mapper Crawler'
   category: 'Crawler'
@@ -1389,6 +1540,11 @@
     name: 'AliasIO'
     url: 'https://github.com/AliasIO'
+- regex: 'PTST/'
+  name: 'WebPageTest'
+  category: 'Site Monitor'
+  url: 'https://www.webpagetest.org'
 - regex: 'WeSEE(:Search)?'
   name: 'WeSEE:Search'
   category: 'Search bot'
@@ -1429,6 +1585,14 @@
     name: 'Wotbox'
     url: 'http://www.wotbox.com'
+- regex: 'XenForo'
+  name: 'XenForo'
+  category: 'Service Agent'
+  url: 'https://xenforo.com/'
+  producer:
+    name: 'XenForo Ltd.'
+    url: 'https://xenforo.com/'
 - regex: 'yacybot'
   name: 'YaCy'
   category: 'Search bot'
@@ -1461,7 +1625,15 @@
     name: 'Yahoo! Inc.'
     url: 'http://www.yahoo.com'
-- regex: 'Yandex(SpravBot|ScreenshotBot|MobileBot|AccessibilityBot|ForDomain|Vertis|Market|Catalog|Calendar|Sitelinks|AdNet|Pagechecker|Webmaster|Media|Video|Bot|Images|Antivirus|Direct|Blogs|Favicons|ImageResizer|News(links)?|Metrika|\.Gazeta Bot)|YaDirectFetcher'
+- regex: 'Y!J-BRW'
+  name: 'Yahoo! Japan BRW'
+  category: 'Crawler'
+  url: 'https://www.yahoo-help.jp/app/answers/detail/p/595/a_id/42716/~/ウェブページにアクセスするシステムのユーザーエージェントについて'
+  producer:
+    name: 'Yahoo! Japan Corp.'
+    url: 'https://www.yahoo.co.jp/'
+- regex: 'Yandex(SpravBot|ScreenshotBot|MobileBot|AccessibilityBot|ForDomain|Vertis|Market|Catalog|Calendar|Sitelinks|AdNet|Pagechecker|Webmaster|Media|Video|Bot|Images|Antivirus|Direct|Blogs|Favicons|ImageResizer|Verticals|News(links)?|Metrika|\.Gazeta Bot)|YaDirectFetcher|YandexTurbo|YandexTracker|YandexSearchShop|YandexRCA|YandexPartner|YandexOntoDBAPI|YandexOntoDB|YandexMobileScreenShotBot'
   name: 'Yandex Bot'
   category: 'Search bot'
   url: 'http://www.yandex.com/bots'
@@ -1469,7 +1641,7 @@
     name: 'Yandex LLC'
     url: 'http://company.yandex.com'
-- regex: 'Yeti'
+- regex: 'Yeti|NaverJapan'
   name: 'Yeti/Naverbot'
   category: 'Search bot'
   url: 'http://help.naver.com/robots/'
@@ -1551,9 +1723,9 @@
     name: 'HubPages'
     url: 'http://hubpages.com/'
-- regex: 'Pinterest/\d\.\d.*www\.pinterest\.com.*'
+- regex: 'Pinterest(bot)?/\d\.\d.*www\.pinterest\.com.*'
   name: 'Pinterest'
-  url: ''
+  url: 'http://www.pinterest.com/bot.html'
   category: 'Crawler'
   producer:
     name: 'Pinterest'
@@ -1567,6 +1739,14 @@
     name: 'Site24x7'
     url: 'https://www.site24x7.com'
+- regex: 's~snapchat-proxy'
+  name: 'Snapchat Proxy'
+  category: 'Crawler'
+  url: 'https://www.snapchat.com'
+  producer:
+    name: 'Snapchat Inc.'
+    url: 'https://www.snapchat.com'
 - regex: "Let's Encrypt validation server"
   name: "Let's Encrypt Validation"
   category: 'Service Agent'
@@ -1662,7 +1842,10 @@
 - regex: 'Server Density Service Monitoring.*'
   name: 'Server Density'
-- regex: '(A6-Indexer|nuhk|TsolCrawler|Yammybot|Openbot|Gulper Web Bot|grub-client|Download Demon|SearchExpress|Microsoft URL Control|borg|altavista|teoma|blitzbot|oegp|furlbot|http%20client|polybot|htdig|mogimogi|larbin|scrubby|searchsight|seekbot|semanticdiscovery|snappy|vortex(?! Build)|zeal|fast-webcrawler|converacrawler|dataparksearch|findlinks|BrowserMob|HttpMonitor|ThumbShotsBot|URL2PNG|ZooShot|GomezA|Google SketchUp|Read%20Later|Minimo|RackspaceBot)'
+- regex: 'RSSRadio \(Push Notification Scanner;support@dorada\.co\.uk\)'
+  name: 'RSSRadio Bot'
+- regex: '(A6-Indexer|nuhk|TsolCrawler|Yammybot|Openbot|Gulper Web Bot|grub-client|Download Demon|SearchExpress|Microsoft URL Control|borg|altavista|dataminr.com|tweetedtimes.com|TrendsmapResolver|teoma|blitzbot|oegp|furlbot|http%20client|polybot|htdig|mogimogi|larbin|scrubby|searchsight|seekbot|semanticdiscovery|snappy|vortex(?! Build)|zeal|fast-webcrawler|converacrawler|dataparksearch|findlinks|BrowserMob|HttpMonitor|ThumbShotsBot|URL2PNG|ZooShot|GomezA|Google SketchUp|Read%20Later|RackspaceBot|robots|SeopultContentAnalyzer|7Siters|centuryb.o.t9)'
   name: 'Generic Bot'
 - regex: '^sentry'
@@ -1671,7 +1854,191 @@
     name: 'Sentry'
     url: 'https://sentry.io'
-# Generic detections
+- regex: '^Spotify'
+  name: 'Spotify'
+  producer:
+    name: 'Spotify'
+    url: 'https://www.spotify.com'
+- regex: 'The Knowledge AI'
+  name: 'The Knowledge AI'
+  category: 'Crawler'
+- regex: 'Embedly'
+  name: 'Embedly'
+  category: 'Crawler'
+  url: 'https://support.embed.ly/hc/en-us'
+  producer:
+    name: 'A Medium, Corp.'
+    url: 'https://medium.com/'
+- regex: 'BrandVerity'
+  name: 'BrandVerity'
+  category: 'Crawler'
+  url: 'https://www.brandverity.com/why-is-brandverity-visiting-me'
+  producer:
+    name: 'BrandVerity, Inc.'
+    url: 'https://www.brandverity.com/'
+- regex: 'Kaspersky Lab CFR link resolver'
+  name: 'Kaspersky'
+  category: 'Security Checker'
+  url: 'https://www.kaspersky.com/'
+  producer:
+    name: 'AO Kaspersky Lab'
+    url: 'https://www.kaspersky.com/'
+- regex: 'eZ Publish Link Validator'
+  name: 'eZ Publish Link Validator'
+  category: 'Crawler'
+  url: 'https://ez.no/'
+  producer:
+    name: 'eZ Systems AS'
+    url: 'https://ez.no/'
+- regex: 'woorankreview'
+  name: 'WooRank'
+  category: 'Search bot'
+  url: 'https://www.woorank.com/'
+  producer:
+    name: 'WooRank sprl'
+    url: 'https://www.woorank.com/'
+- regex: '(Match|LinkCheck) by Siteimprove.com'
+  name: 'Siteimprove'
+  category: 'Search bot'
+  url: 'https://siteimprove.com/'
+  producer:
+    name: 'Siteimprove GmbH'
+    url: 'https://siteimprove.com/'
+- regex: 'CATExplorador'
+  name: 'CATExplorador'
+  category: 'Search bot'
+  url: 'https://fundacio.cat/ca/domini/'
+  producer:
+    name: 'Fundació puntCAT'
+    url: 'https://fundacio.cat/ca/domini/'
+- regex: 'Buck'
+  name: 'Buck'
+  category: 'Search bot'
+  url: 'https://hypefactors.com/'
+  producer:
+    name: 'Hypefactors A/S'
+    url: 'https://hypefactors.com/'
+- regex: 'tracemyfile'
+  name: 'TraceMyFile'
+  category: 'Search bot'
+  url: 'https://www.tracemyfile.com/'
+  producer:
+    name: 'Idee Inc.'
+    url: 'http://ideeinc.com/'
+- regex: 'zelist.ro feed parser'
+  name: 'Ze List'
+  url: 'https://www.zelist.ro/'
+  category: 'Feed Fetcher'
+  producer:
+    name: 'Treeworks SRL'
+    url: 'https://www.tree.ro/'
+- regex: 'weborama-fetcher'
+  name: 'Weborama'
+  category: 'Search bot'
+  url: 'https://weborama.com/'
+  producer:
+    name: 'Weborama SA'
+    url: 'https://weborama.com/'
+- regex: 'BoardReader Favicon Fetcher'
+  name: 'BoardReader'
+  category: 'Search bot'
+  url: 'http://boardreader.com/'
+  producer:
+    name: 'Effyis Inc'
+    url: 'http://boardreader.com/'
+- regex: 'IDG/IT'
+  name: 'IDG/IT'
+  category: 'Search bot'
+  url: 'https://spaziodati.eu/'
+  producer:
+    name: 'SpazioDati S.r.l.'
+    url: 'https://spaziodati.eu/'
+- regex: 'Bytespider'
+  name: 'Bytespider'
+  category: 'Search bot'
+  url: 'https://bytedance.com/'
+  producer:
+    name: 'ByteDance Ltd.'
+    url: 'https://bytedance.com/'
+- regex: 'WikiDo'
+  name: 'WikiDo'
+  category: 'Search bot'
+  url: 'https://www.wikido.com/'
+  producer:
+    name: 'Fotolitografie Fiorentine di Becchi Antonio s.n.c.'
+    url: 'https://www.wikido.com/'
+- regex: 'AwarioSmartBot'
+  name: 'Awario'
+  category: 'Search bot'
+  url: 'https://awario.com/bots.html'
+  producer:
+    name: 'Awario'
+    url: 'https://awario.com/'
+- regex: 'AwarioRssBot'
+  name: 'Awario'
+  category: 'Feed Fetcher'
+  url: 'https://awario.com/bots.html'
+  producer:
+    name: 'Awario'
+    url: 'https://awario.com/'
+- regex: 'oBot'
+  name: 'oBot'
+  category: 'Search bot'
+  url: 'http://www.xforce-security.com/crawler/'
+  producer:
+    name: 'IBM Germany Research & Development GmbH'
+    url: 'https://exchange.xforce.ibmcloud.com/'
+- regex: 'SMTBot'
+  name: 'SMTBot'
+  category: 'Search bot'
+  url: 'https://www.similartech.com/smtbot'
+  producer:
+    name: 'SimilarTech Ltd.'
+    url: 'https://www.similartech.com/'
+- regex: 'LCC'
+  name: 'LCC'
+  category: 'Search bot'
+  url: 'https://corpora.uni-leipzig.de/crawler_faq.html'
+  producer:
+    name: 'Universität Leipzig'
+    url: 'https://www.uni-leipzig.de/'
+- regex: 'Startpagina-Linkchecker'
+  name: 'Startpagina Linkchecker'
+  category: 'Search bot'
+  url: 'https://www.startpagina.nl/linkchecker'
+  producer:
+    name: 'Startpagina B.V.'
+    url: 'https://www.startpagina.nl/'
+- regex: 'GTmetrix'
+  name: 'GTmetrix'
+  category: 'Crawler'
+  url: 'https://gtmetrix.com/'
+  producer:
+    name: 'Carbon60 Operating Co. Ltd.'
+    url: 'https://www.carbon60.com/'
 - regex: 'Nutch'
   name: 'Nutch-based Bot'
@@ -1681,5 +2048,61 @@
     name: 'The Apache Software Foundation'
     url: 'http://www.apache.org/foundation/'
-- regex: '[a-z0-9\-_]*((?<!cu|power )bot(?! TAB| ?5[0-9])|crawler|crawl|checker|archiver|transcoder|spider)([^a-z]|$)'
+- regex: 'Seobility'
+  name: 'Seobility'
+  category: 'Crawler'
+  url: 'https://www.seobility.net/en/faq/?category=crawling#!aboutourbot'
+- regex: 'Vercelbot'
+  name: 'Vercel Bot'
+  category: 'Service bot'
+  url: 'https://vercel.com'
+- regex: 'Grammarly'
+  name: 'Grammarly'
+  category: 'Service bot'
+  url: 'http://www.grammarly.com'
+- regex: 'Robozilla'
+  name: 'Robozilla'
+  category: 'Crawler'
+- regex: 'Domains Project'
+  name: 'Domains Project'
+  category: 'Crawler'
+  url: 'https://domainsproject.org'
+- regex: 'PetalBot'
+  name: 'Petal Bot'
+  category: 'Crawler'
+  url: 'https://aspiegel.com/petalbot'
+- regex: 'SerendeputyBot'
+  name: 'Serendeputy Bot'
+  category: 'Crawler'
+  url: 'http://serendeputy.com/about/serendeputy-bot'
+- regex: 'ias-va.*admantx.*service-fetcher'
+  name: 'ADmantX Service Fetcher'
+  category: 'Service bot'
+  url: 'https://www.admantx.com/service-fetcher.html'
+- regex: 'SemanticScholarBot'
+  name: 'Semantic Scholar Bot'
+  category: 'Crawler'
+  url: 'https://www.semanticscholar.org/crawler'
+- regex: 'VelenPublicWebCrawler'
+  name: 'Velen Public Web Crawler'
+  category: 'Crawler'
+  url: 'https://hunter.io/robot'
+- regex: 'Barkrowler'
+  name: 'Barkrowler'
+  category: 'Crawler'
+  url: 'http://www.exensa.com/crawl'
+# Generic detections
+- regex: '[a-z0-9\-_]*((?<!cu|power[ _]|m[ _])bot(?![ _]TAB|[ _]?5[0-9])|crawler|crawl|checker|archiver|transcoder|spider)([^a-z]|$)'
   name: 'Generic Bot'