textutils 0.8.1 → 0.8.2

Sign up to get free protection for your applications and to get access to all the features.
@@ -45,12 +45,14 @@ module TextUtils
45
45
 
46
46
  def strip_whitespaces( title )
47
47
  # remove all whitespace and punctuation
48
- title.gsub( /[ \t_\-\.()\[\]'"\/]/, '' )
48
+ title.gsub( /[ \t_\-\.!()\[\]'"\/]/, '' )
49
49
  end
50
50
 
51
51
  def strip_special_chars( title )
52
52
  # remove special chars (e.g. %°&)
53
- title.gsub( /[%&°]/, '' )
53
+ # e.g. +Malta
54
+ # Minerva 8:60
55
+ title.gsub( /[%&°+:]/, '' )
54
56
  end
55
57
 
56
58
  def title_to_key( title )
@@ -118,24 +120,29 @@ module TextUtils
118
120
  ['ť', 't' ], # e.g. Měšťan
119
121
  ['ü', 'ue'],
120
122
  ['ú', 'u' ], # e.g. Fútbol
123
+ ['ù', 'u' ], # e.g. Xyauyù (it)
121
124
  ['ū', 'u' ], # e.g. Sūduva
122
125
  ['ů', 'u' ], # e.g. Sládkův
123
126
  ['ı', 'u' ], # e.g. Bakı # use u? (Baku) - why? why not?
124
127
  ['ý', 'y' ], # e.g. Nefitrovaný
125
128
  ['ź', 'z' ], # e.g. Łódź
126
129
  ['ž', 'z' ], # e.g. Domžale, Petržalka
130
+ ['ż', 'z' ], # e.g. Lomża (polish)
127
131
 
132
+ ['Á', 'a' ], # e.g. Águila (es)
128
133
  ['Č', 'c' ], # e.g. České
129
134
  ['İ', 'i' ], # e.g. İnter
130
135
  ['Í', 'i' ], # e.g. ÍBV
131
136
  ['Ł', 'l' ], # e.g. Łódź
132
137
  ['Ö', 'oe' ], # e.g. Örebro
138
+ ['Ø', 'o' ], # e.g. Nogne Ø Imperial Stout (no)
133
139
  ['Ř', 'r' ], # e.g. Řezák
134
140
  ['Ś', 's' ], # e.g. Śląsk
135
141
  ['Š', 's' ], # e.g. MŠK
136
142
  ['Ş', 's' ], # e.g. Şüvälan
137
143
  ['Ú', 'u' ], # e.g. Ústí, Újpest
138
- ['Ž', 'z' ] # e.g. Žilina
144
+ ['Ž', 'z' ], # e.g. Žilina
145
+ ['Ż', 'z' ] # e.g. Żywiec (polish)
139
146
  ]
140
147
 
141
148
  alternatives.each do |alt|
@@ -187,6 +194,10 @@ module TextUtils
187
194
  ['ú', '(ú|u)'] ## e.g. Fútbol
188
195
  ]
189
196
 
197
+ ### fix/todo: check for dot+space (e.g. ". ") and make the dot optional
198
+ ## e.g. U. de. G. or U de G or U.de.G ??
199
+ ## collect some more (real-world) examples first!!!!!
200
+
190
201
  alternatives.each do |alt|
191
202
  title = title.gsub( alt[0], alt[1] )
192
203
  end
@@ -1,7 +1,7 @@
1
1
 
2
2
  module TextUtils
3
3
 
4
- VERSION = '0.8.1'
4
+ VERSION = '0.8.2'
5
5
 
6
6
  end # module TextUtils
7
7
 
@@ -24,7 +24,17 @@ class TestTitleHelper < MiniTest::Unit::TestCase
24
24
  [ '‹Hirter› Pils', 'hirterpils' ],
25
25
  [ '‹Villacher› Märzen', 'villachermaerzen' ],
26
26
  [ 'Bock <Damm>', 'bockdamm' ],
27
- [ '<Estrella> <Damm> Inedit', 'estrelladamminedit' ]
27
+ [ '<Estrella> <Damm> Inedit', 'estrelladamminedit' ],
28
+ [ 'Żubr', 'zubr' ],
29
+ [ 'Żywiec', 'zywiec' ],
30
+ [ 'Lomża Export', 'lomzaexport' ],
31
+ [ 'Nogne Ø Imperial Stout', 'nogneoimperialstout' ],
32
+ [ 'Xyauyù', 'xyauyu' ],
33
+ [ 'Águila', 'aguila' ],
34
+ [ '+Lupulus', 'lupulus' ],
35
+ [ '+Malta', 'malta' ],
36
+ [ 'Minerva 8:60', 'minerva860' ],
37
+ [ 'Hop Crisis!', 'hopcrisis' ]
28
38
  ]
29
39
 
30
40
  txt_io.each do |txt|
metadata CHANGED
@@ -1,7 +1,7 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: textutils
3
3
  version: !ruby/object:Gem::Version
4
- version: 0.8.1
4
+ version: 0.8.2
5
5
  prerelease:
6
6
  platform: ruby
7
7
  authors:
@@ -9,11 +9,11 @@ authors:
9
9
  autorequire:
10
10
  bindir: bin
11
11
  cert_chain: []
12
- date: 2014-01-17 00:00:00.000000000 Z
12
+ date: 2014-01-22 00:00:00.000000000 Z
13
13
  dependencies:
14
14
  - !ruby/object:Gem::Dependency
15
15
  name: logutils
16
- requirement: &21276780 !ruby/object:Gem::Requirement
16
+ requirement: &20656452 !ruby/object:Gem::Requirement
17
17
  none: false
18
18
  requirements:
19
19
  - - ~>
@@ -21,10 +21,10 @@ dependencies:
21
21
  version: '0.5'
22
22
  type: :runtime
23
23
  prerelease: false
24
- version_requirements: *21276780
24
+ version_requirements: *20656452
25
25
  - !ruby/object:Gem::Dependency
26
26
  name: rdoc
27
- requirement: &21341748 !ruby/object:Gem::Requirement
27
+ requirement: &20655864 !ruby/object:Gem::Requirement
28
28
  none: false
29
29
  requirements:
30
30
  - - ~>
@@ -32,10 +32,10 @@ dependencies:
32
32
  version: '4.0'
33
33
  type: :development
34
34
  prerelease: false
35
- version_requirements: *21341748
35
+ version_requirements: *20655864
36
36
  - !ruby/object:Gem::Dependency
37
37
  name: hoe
38
- requirement: &21341412 !ruby/object:Gem::Requirement
38
+ requirement: &20655132 !ruby/object:Gem::Requirement
39
39
  none: false
40
40
  requirements:
41
41
  - - ~>
@@ -43,7 +43,7 @@ dependencies:
43
43
  version: '3.7'
44
44
  type: :development
45
45
  prerelease: false
46
- version_requirements: *21341412
46
+ version_requirements: *20655132
47
47
  description: textutils - Text Filters, Helpers, Readers and More
48
48
  email: ruby-talk@ruby-lang.org
49
49
  executables: []