textract 0.0.19 → 0.0.20
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/lib/textract.rb +2 -1
- data/lib/textract/version.rb +1 -1
- metadata +1 -1
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA1:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: f7045052b7ae856893fd2855cafe0b995cd8691b
|
4
|
+
data.tar.gz: 410cae4e7a27cbc02b1df05357e58d88985079e9
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: 1bf53ec28fe1c7dce25bbd0ac73b2c45d1f2e954767d2ec0de02b39210a66fd4136bee7343dfcdfdb0db5187570441e5a461052afd0d1e185247d1f77900e7c4
|
7
|
+
data.tar.gz: 2136d43fbb2ddcd60018939a451a1205ceed759d2482b23dec5eca8a6e7f8674c36e1c9b85bba19375123ebc89fbc334e0a2ad980a27e3c3e3850630dd62084b
|
data/lib/textract.rb
CHANGED
@@ -82,7 +82,8 @@ module Textract
|
|
82
82
|
site_twitter = Nokogiri::HTML(html).search('meta[name="twitter:site"]')
|
83
83
|
site_name = Nokogiri::HTML(html).search('meta[property="og:site_name"]')
|
84
84
|
if site_name.empty?
|
85
|
-
|
85
|
+
domain_regex = /^(http|ftp)s?:\/\/(([\w\d\-_]+\.)?([\w\d\-_]+)\.(\w+))\//
|
86
|
+
site = url.match domain_regex
|
86
87
|
site = site[2] unless site[2].nil?
|
87
88
|
site_name = site.sub(/^www\./, '').capitalize!
|
88
89
|
else
|
data/lib/textract/version.rb
CHANGED