sterilizer 0.0.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
data/.gitignore ADDED
@@ -0,0 +1,17 @@
1
+ *.gem
2
+ *.rbc
3
+ .bundle
4
+ .config
5
+ .yardoc
6
+ Gemfile.lock
7
+ InstalledFiles
8
+ _yardoc
9
+ coverage
10
+ doc/
11
+ lib/bundler/man
12
+ pkg
13
+ rdoc
14
+ spec/reports
15
+ test/tmp
16
+ test/version_tmp
17
+ tmp
data/Gemfile ADDED
@@ -0,0 +1,6 @@
1
+ source 'https://rubygems.org'
2
+
3
+ # Specify your gem's dependencies in sterilizer.gemspec
4
+ gemspec
5
+
6
+ gem "pry"
data/LICENSE.txt ADDED
@@ -0,0 +1,22 @@
1
+ Copyright (c) 2013 Ben Thompson
2
+
3
+ MIT License
4
+
5
+ Permission is hereby granted, free of charge, to any person obtaining
6
+ a copy of this software and associated documentation files (the
7
+ "Software"), to deal in the Software without restriction, including
8
+ without limitation the rights to use, copy, modify, merge, publish,
9
+ distribute, sublicense, and/or sell copies of the Software, and to
10
+ permit persons to whom the Software is furnished to do so, subject to
11
+ the following conditions:
12
+
13
+ The above copyright notice and this permission notice shall be
14
+ included in all copies or substantial portions of the Software.
15
+
16
+ THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
17
+ EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
18
+ MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
19
+ NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
20
+ LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
21
+ OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
22
+ WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
data/README.md ADDED
@@ -0,0 +1,53 @@
1
+ # Sterilizer
2
+
3
+ A simple module that extends a String, giving it a `sterilize!` method which to ensure the string is always valid UTF-8
4
+
5
+ ## Installation
6
+
7
+ Add this line to your application's Gemfile:
8
+
9
+ gem 'sterilizer'
10
+
11
+ And then execute:
12
+
13
+ $ bundle
14
+
15
+ Or install it yourself as:
16
+
17
+ $ gem install sterilizer
18
+
19
+ ## Usage
20
+ Handy when you want to ensure incoming strings will contain invalid characters
21
+ ```ruby
22
+
23
+ dodgy_params = {
24
+ :ok => "Hello",
25
+ :dodgy => "hi \255",
26
+ :accented => "\xE9",
27
+ }
28
+ guarantee_strings!(dodgy_params)
29
+ # =>
30
+ {
31
+ :ok=>"Hello",
32
+ :dodgy=>"hi ­"
33
+ :accented=>"é"
34
+ }
35
+
36
+ private
37
+
38
+ def guarantee_strings!(unclean_params)
39
+ unclean_params.each do |_,v|
40
+ v.sterilize!
41
+ end
42
+ end
43
+ ```
44
+
45
+ It uses the https://github.com/oleander/rchardet gem to guess the character encoding if the string isn't valid when forced to UTF-8
46
+
47
+ ## Contributing
48
+
49
+ 1. Fork it
50
+ 2. Create your feature branch (`git checkout -b my-new-feature`)
51
+ 3. Commit your changes (`git commit -am 'Add some feature'`)
52
+ 4. Push to the branch (`git push origin my-new-feature`)
53
+ 5. Create new Pull Request
data/Rakefile ADDED
@@ -0,0 +1 @@
1
+ require "bundler/gem_tasks"
data/lib/sterilizer.rb ADDED
@@ -0,0 +1,79 @@
1
+ require "sterilizer/version"
2
+ require "rchardet19"
3
+
4
+ module Sterilizer
5
+ def sterilize!
6
+
7
+ return self unless !!defined?(Encoding)
8
+ # return if encoding is valid and equal to default_internal
9
+ return self if valid_when_default?
10
+
11
+ # force to default encoding if valid when forced
12
+ return self.force_encoding(Encoding.default_internal) if valid_when_forced?
13
+
14
+ # At this point, we know the string is not valid encoding, it the encoding is UTF-8,
15
+ # we must try a different encoding that is valid before forcefully encoding to UTF-8
16
+ # Otherwise, the encoding type is non-default. If it is valid, encode it to UTF-8, otherwise
17
+ # find an alternative before forcefully encoding to UTF-8
18
+ if encoding_is_default?
19
+ # Might have a situation where encoding is the same as default, but it's not valid
20
+ # Force it to something else so we can String#encode
21
+ non_default_encoding = find_a_valid_encoding
22
+ force_encoding_with(non_default_encoding)
23
+ else
24
+ if valid_when_forced?(self.encoding)
25
+ self.encode!(Encoding.default_internal, self.encoding, { :undef => :replace, :invalid => :replace})
26
+ else
27
+ alternative_encoding = find_a_valid_encoding(self.encoding)
28
+ force_encoding_with(alternative_encoding)
29
+ end
30
+ end
31
+ rescue
32
+ self.force_encoding_with("ASCII")
33
+ end
34
+
35
+ def encoding_is_default?
36
+ self.encoding == Encoding.default_internal
37
+ end
38
+
39
+ def valid_when_default?
40
+ self.valid_encoding? && encoding_is_default?
41
+ end
42
+
43
+ def valid_when_forced?(encoding = Encoding.default_internal)
44
+ self.dup.force_encoding(encoding).valid_encoding?
45
+ end
46
+
47
+ def find_a_valid_encoding(ignoring = [Encoding.default_internal], guessed_already = false)
48
+ # If we've already tried to guess the encoding, resort to picking one at random until valid
49
+ if guessed_already
50
+ provisional_encoding = Encoding.list.detect{ |encoding| !ignoring.include?(encoding) }
51
+ else # On first run, we'll try and guess the character encoding
52
+ provisional_encoding = guess_encoding
53
+ end
54
+
55
+ # If the provisional encoding is valid when string is forced to it, select it otherwise continue to find one
56
+ if valid_when_forced?(provisional_encoding)
57
+ provisional_encoding
58
+ else
59
+ find_a_valid_encoding(ignoring << provisional_encoding, :guess_failed)
60
+ end
61
+ end
62
+
63
+ # Use an external library to attempt to (silently) guess the encoding
64
+ def guess_encoding(guesser = CharDet)
65
+ Encoding.find(guesser.detect(self, :silent => true)["encoding"])
66
+ end
67
+
68
+ def force_encoding_with(encoding)
69
+ self.force_encoding(encoding).encode(Encoding.default_internal, :invalid => :replace, :undef => :replace)
70
+ end
71
+
72
+ end
73
+
74
+ # Add sterilize methods to a string if it is sterilized, saves clobbering every string!
75
+ class String
76
+ def sterilize!
77
+ self.extend(Sterilizer).sterilize!
78
+ end
79
+ end
@@ -0,0 +1,3 @@
1
+ module Sterilizer
2
+ VERSION = "0.0.2"
3
+ end
@@ -0,0 +1,21 @@
1
+ # -*- encoding: utf-8 -*-
2
+ lib = File.expand_path('../lib', __FILE__)
3
+ $LOAD_PATH.unshift(lib) unless $LOAD_PATH.include?(lib)
4
+ require 'sterilizer/version'
5
+
6
+ Gem::Specification.new do |gem|
7
+ gem.name = "sterilizer"
8
+ gem.version = Sterilizer::VERSION
9
+ gem.authors = ["Ben Thompson"]
10
+ gem.email = ["ben@atechmedia.com"]
11
+ gem.description = %q{Guarantee a string}
12
+ gem.summary = %q{}
13
+ gem.homepage = ""
14
+
15
+ gem.files = `git ls-files`.split($/)
16
+ gem.executables = gem.files.grep(%r{^bin/}).map{ |f| File.basename(f) }
17
+ gem.test_files = gem.files.grep(%r{^(test|spec|features)/})
18
+ gem.require_paths = ["lib"]
19
+ gem.add_dependency "rchardet19"
20
+ gem.add_development_dependency 'pry'
21
+ end
metadata ADDED
@@ -0,0 +1,86 @@
1
+ --- !ruby/object:Gem::Specification
2
+ name: sterilizer
3
+ version: !ruby/object:Gem::Version
4
+ version: 0.0.2
5
+ prerelease:
6
+ platform: ruby
7
+ authors:
8
+ - Ben Thompson
9
+ autorequire:
10
+ bindir: bin
11
+ cert_chain: []
12
+ date: 2013-08-02 00:00:00.000000000 Z
13
+ dependencies:
14
+ - !ruby/object:Gem::Dependency
15
+ name: rchardet19
16
+ requirement: !ruby/object:Gem::Requirement
17
+ none: false
18
+ requirements:
19
+ - - ! '>='
20
+ - !ruby/object:Gem::Version
21
+ version: '0'
22
+ type: :runtime
23
+ prerelease: false
24
+ version_requirements: !ruby/object:Gem::Requirement
25
+ none: false
26
+ requirements:
27
+ - - ! '>='
28
+ - !ruby/object:Gem::Version
29
+ version: '0'
30
+ - !ruby/object:Gem::Dependency
31
+ name: pry
32
+ requirement: !ruby/object:Gem::Requirement
33
+ none: false
34
+ requirements:
35
+ - - ! '>='
36
+ - !ruby/object:Gem::Version
37
+ version: '0'
38
+ type: :development
39
+ prerelease: false
40
+ version_requirements: !ruby/object:Gem::Requirement
41
+ none: false
42
+ requirements:
43
+ - - ! '>='
44
+ - !ruby/object:Gem::Version
45
+ version: '0'
46
+ description: Guarantee a string
47
+ email:
48
+ - ben@atechmedia.com
49
+ executables: []
50
+ extensions: []
51
+ extra_rdoc_files: []
52
+ files:
53
+ - .gitignore
54
+ - Gemfile
55
+ - LICENSE.txt
56
+ - README.md
57
+ - Rakefile
58
+ - lib/sterilizer.rb
59
+ - lib/sterilizer/version.rb
60
+ - sterilizer.gemspec
61
+ homepage: ''
62
+ licenses: []
63
+ post_install_message:
64
+ rdoc_options: []
65
+ require_paths:
66
+ - lib
67
+ required_ruby_version: !ruby/object:Gem::Requirement
68
+ none: false
69
+ requirements:
70
+ - - ! '>='
71
+ - !ruby/object:Gem::Version
72
+ version: '0'
73
+ required_rubygems_version: !ruby/object:Gem::Requirement
74
+ none: false
75
+ requirements:
76
+ - - ! '>='
77
+ - !ruby/object:Gem::Version
78
+ version: '0'
79
+ requirements: []
80
+ rubyforge_project:
81
+ rubygems_version: 1.8.23
82
+ signing_key:
83
+ specification_version: 3
84
+ summary: ''
85
+ test_files: []
86
+ has_rdoc: