confidential_info_redactor 0.0.12 → 0.0.13

Sign up to get free protection for your applications and access to all the features.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA1:
3
- metadata.gz: 1233d3ddc47135630231617aaebbabe48bdcaef5
4
- data.tar.gz: 009da140352b1929a471a6a214f110369a6e7d22
3
+ metadata.gz: d698521a92a28fa94c1cd8f2c6317b4249a0a19d
4
+ data.tar.gz: ab825e72bb74de93b72efaac0364f4b01ba7b3fb
5
5
  SHA512:
6
- metadata.gz: 2f09ed5dbe85f303577d3e1d11d61e83157e06fbb8764ef7b6b86960ce1265b9e560b8a880494264214399386156b405e24d1cb12cad90ec02ab8cbd13089a90
7
- data.tar.gz: 5048ecb8b50262c157e2b6cd02b7d14d1f5f5c446ef5299df7a3efdf7efe1660301a22827b06208f96cab90a3c7d6d85d79c5c7d8f1e55e85799f4feaa3be9e4
6
+ metadata.gz: b91adab393e7137f24f9255a20b9d35cb812fbbb0513b0a3daf01944065d3659ef40864bc8013c7291d210593a60341e1dae898d6c5c97262029d7f0fefc8a5f
7
+ data.tar.gz: c554f97b0ce9fe0341ab983641bc347c415d770561acb150ce810236271c485cd0b395d8ebf8eef333372ebbb6719a703adca82cef36855022b8d565c1d196e1
@@ -34,7 +34,7 @@ module ConfidentialInfoRedactor
34
34
  tracker = false if corpus.include?(token.downcase)
35
35
  end
36
36
  end
37
- extracted_terms << t.gsub(/[\?\)\(\!\\\/\"\:\;\,]/, '').gsub(/\'$/, '').gsub(/”/,'').gsub(/\.\z/, '').strip unless corpus.include?(t.downcase.gsub(/[\?\.\)\(\!\\\/\"\:\;]/, '').gsub(/”/,'').gsub(/\'$/, '').strip) || !tracker
37
+ extracted_terms << t.gsub(/[\?\)\(\!\\\/\"\:\;\,]/, '').gsub(/\'$/, '').gsub(/”/,'').gsub(/\.\z/, '').strip unless corpus.include?(t.downcase.gsub(/[\?\.\)\(\!\\\/\"\:\;]/, '').gsub(/”/,'').gsub(/\'$/, '').strip) || !tracker || (corpus.include?(t.downcase.gsub(/[\?\.\)\(\!\\\/\"\:\;]/, '').gsub(/”/,'').gsub(/\'$/, '').strip[0...-2]) && t.downcase.gsub(/[\?\.\)\(\!\\\/\"\:\;]/, '').gsub(/”/,'').gsub(/\'$/, '').strip[-2..-1].eql?('en')) || (corpus.include?(t.downcase.gsub(/[\?\.\)\(\!\\\/\"\:\;]/, '').gsub(/”/,'').gsub(/\'$/, '').strip[0...-2]) && t.downcase.gsub(/[\?\.\)\(\!\\\/\"\:\;]/, '').gsub(/”/,'').gsub(/\'$/, '').strip[-2..-1].eql?('es')) || (corpus.include?(t.downcase.gsub(/[\?\.\)\(\!\\\/\"\:\;]/, '').gsub(/”/,'').gsub(/\'$/, '').strip[0...-2]) && t.downcase.gsub(/[\?\.\)\(\!\\\/\"\:\;]/, '').gsub(/”/,'').gsub(/\'$/, '').strip[-2..-1].eql?('er')) || (corpus.include?(t.downcase.gsub(/[\?\.\)\(\!\\\/\"\:\;]/, '').gsub(/”/,'').gsub(/\'$/, '').strip[0...-1]) && t.downcase.gsub(/[\?\.\)\(\!\\\/\"\:\;]/, '').gsub(/”/,'').gsub(/\'$/, '').strip[-1].eql?('s'))
38
38
  end
39
39
  end
40
40
  end
@@ -1,3 +1,3 @@
1
1
  module ConfidentialInfoRedactor
2
- VERSION = "0.0.12"
2
+ VERSION = "0.0.13"
3
3
  end
@@ -141,10 +141,15 @@ RSpec.describe ConfidentialInfoRedactor::Extractor do
141
141
  expect(described_class.new(text: text, language: 'de').extract).to eq(['Deutschen Bank'])
142
142
  end
143
143
 
144
- it 'extracts the proper nouns from a text #001' do
144
+ it 'extracts the proper nouns from a text #002' do
145
145
  text = 'Viele Mitarbeiter der Deutsche Bank suchen eine andere Arbeitsstelle.'
146
146
  expect(described_class.new(text: text, language: 'de').extract).to eq(['Deutsche Bank'])
147
147
  end
148
+
149
+ it 'extracts the proper nouns from a text #003' do
150
+ text = 'Ich behielt diese Routine während und sogar während des Studiums an der Uni bei, und ich war damals froh, wenn ich pro Tag zwei ganze Mahlzeiten zu mir nahm.'
151
+ expect(described_class.new(text: text, language: 'de').extract).to eq([])
152
+ end
148
153
  end
149
154
  end
150
155
  end
metadata CHANGED
@@ -1,14 +1,14 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: confidential_info_redactor
3
3
  version: !ruby/object:Gem::Version
4
- version: 0.0.12
4
+ version: 0.0.13
5
5
  platform: ruby
6
6
  authors:
7
7
  - Kevin S. Dias
8
8
  autorequire:
9
9
  bindir: bin
10
10
  cert_chain: []
11
- date: 2015-04-23 00:00:00.000000000 Z
11
+ date: 2015-04-24 00:00:00.000000000 Z
12
12
  dependencies:
13
13
  - !ruby/object:Gem::Dependency
14
14
  name: bundler