lingua-it-readability 1.2.0 → 1.2.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/lib/lingua/it/readability/version.rb +1 -1
- data/lib/lingua/it/sentence.rb +5 -5
- metadata +2 -2
checksums.yaml
CHANGED
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
---
|
|
2
2
|
SHA1:
|
|
3
|
-
metadata.gz:
|
|
4
|
-
data.tar.gz:
|
|
3
|
+
metadata.gz: ca114de122207c4fd403dc3924048730476c4e76
|
|
4
|
+
data.tar.gz: 39a5096edc53d15f7490431e017df9a32136c066
|
|
5
5
|
SHA512:
|
|
6
|
-
metadata.gz:
|
|
7
|
-
data.tar.gz:
|
|
6
|
+
metadata.gz: 2241a6fb60d3c1abcaa973ba4f47e783130ce68d3ed9786532b4848d3fb16324f8baf441a31843e72ebd12e728bdd8a2108037301eab6972a4ecd0775191564c
|
|
7
|
+
data.tar.gz: ea25e7858230f530e49db91b8442fc543dc722acdde7771b7504f8e0e1aa24594348e1ef0b123cd2ca7cb8e426e35eef92533f37ab6b8607e2c460bcddcdedd1
|
data/lib/lingua/it/sentence.rb
CHANGED
|
@@ -13,10 +13,10 @@ module Lingua
|
|
|
13
13
|
end
|
|
14
14
|
|
|
15
15
|
# Common abbreviations
|
|
16
|
-
TITLES = %w(
|
|
17
|
-
MISC = %w(
|
|
18
|
-
MONTHS = %w(
|
|
19
|
-
DAYS = %w(
|
|
16
|
+
TITLES = %w(Sig Sigg Dott Preg Prof Mr Jr Amn Avv Co Stim Dr Egr Geom Ing Mons On Rag Rev Soc Spett Card Ill Gent Cav) unless defined?(TITLES)
|
|
17
|
+
MISC = %w(P V Femm Dim Ecc Etc Corr Cc Bcc All Es Fatt G Gg Id Int Lett Ogg Pag Pagg Cap Pp Tel Ind V N Num Min Sec Ms Abbr Agg Art Aus) unless defined?(MISC)
|
|
18
|
+
MONTHS = %w(Gen Feb Mar Apr Mag Giu Lug Ago Set Sett Ott Nov Dic) unless defined?(MONTHS)
|
|
19
|
+
DAYS = %w(Lun Mar Mer Gio Ven Sab Dom) unless defined?(DAYS)
|
|
20
20
|
|
|
21
21
|
# Standard delimiters
|
|
22
22
|
STD = %w(. ? !)
|
|
@@ -31,7 +31,7 @@ module Lingua
|
|
|
31
31
|
txt.gsub!(/\b(#{@abbr_regex})(\.)\B/i, '\10002')
|
|
32
32
|
txt.gsub!(/["']?[A-Z][^\Q#{@delim_regex}\E]+((?![\Q#{@delim_regex}\E]['"]?\s["']?[A-Z][^\Q#{@delim_regex}\E]).)+[\Q#{@delim_regex}\E'"]+/, '\2\001')
|
|
33
33
|
txt.gsub!(/\b(#{@abbr_regex})(0002)/i, '\1.')
|
|
34
|
-
txt.split(/01/).map { |sentence| sentence.strip }
|
|
34
|
+
txt.split(/01|\n\s*\n/).map { |sentence| sentence.strip }
|
|
35
35
|
end
|
|
36
36
|
|
|
37
37
|
# Add customized abbreviations to standard set
|
metadata
CHANGED
|
@@ -1,14 +1,14 @@
|
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
|
2
2
|
name: lingua-it-readability
|
|
3
3
|
version: !ruby/object:Gem::Version
|
|
4
|
-
version: 1.2.0
|
|
4
|
+
version: 1.2.1
|
|
5
5
|
platform: ruby
|
|
6
6
|
authors:
|
|
7
7
|
- Andrea Giacomo Baldan
|
|
8
8
|
autorequire:
|
|
9
9
|
bindir: exe
|
|
10
10
|
cert_chain: []
|
|
11
|
-
date: 2016-02-
|
|
11
|
+
date: 2016-02-18 00:00:00.000000000 Z
|
|
12
12
|
dependencies:
|
|
13
13
|
- !ruby/object:Gem::Dependency
|
|
14
14
|
name: bundler
|