RubyGems - bioinform - Versions diffs - 0.1.17 → 0.2.0 - Mend

bioinform 0.1.17 → 0.2.0

Files changed (145) hide show

checksums.yaml +4 -4
data/Gemfile +3 -3
data/LICENSE +0 -1
data/README.md +1 -1
data/TODO.txt +23 -30
data/bin/convert_motif +4 -0
data/bin/pcm2pwm +1 -1
data/bin/split_motifs +1 -1
data/bioinform.gemspec +0 -2
data/lib/bioinform.rb +54 -16
data/lib/bioinform/alphabet.rb +85 -0
data/lib/bioinform/background.rb +90 -0
data/lib/bioinform/cli.rb +1 -2
data/lib/bioinform/cli/convert_motif.rb +52 -17
data/lib/bioinform/cli/pcm2pwm.rb +32 -26
data/lib/bioinform/cli/split_motifs.rb +31 -30
data/lib/bioinform/conversion_algorithms.rb +6 -0
data/lib/bioinform/conversion_algorithms/pcm2ppm_converter.rb +13 -11
data/lib/bioinform/conversion_algorithms/pcm2pwm_converter.rb +39 -11
data/lib/bioinform/conversion_algorithms/pcm2pwm_mara_converter.rb +26 -0
data/lib/bioinform/conversion_algorithms/ppm2pcm_converter.rb +30 -0
data/lib/bioinform/conversion_algorithms/pwm2iupac_pwm_converter.rb +23 -0
data/lib/bioinform/conversion_algorithms/pwm2pcm_converter.rb +85 -0
data/lib/bioinform/data_models.rb +1 -7
data/lib/bioinform/data_models/named_model.rb +38 -0
data/lib/bioinform/data_models/pcm.rb +18 -28
data/lib/bioinform/data_models/pm.rb +73 -170
data/lib/bioinform/data_models/ppm.rb +11 -24
data/lib/bioinform/data_models/pwm.rb +30 -56
data/lib/bioinform/errors.rb +17 -0
data/lib/bioinform/formatters.rb +4 -2
data/lib/bioinform/formatters/consensus_formatter.rb +35 -0
data/lib/bioinform/formatters/motif_formatter.rb +69 -0
data/lib/bioinform/formatters/pretty_matrix_formatter.rb +36 -0
data/lib/bioinform/formatters/transfac_formatter.rb +29 -37
data/lib/bioinform/parsers.rb +1 -8
data/lib/bioinform/parsers/matrix_parser.rb +44 -36
data/lib/bioinform/parsers/motif_splitter.rb +45 -0
data/lib/bioinform/support.rb +46 -14
data/lib/bioinform/support/strip_doc.rb +1 -1
data/lib/bioinform/version.rb +1 -1
data/spec/alphabet_spec.rb +79 -0
data/spec/background_spec.rb +57 -0
data/spec/cli/cli_spec.rb +6 -6
data/spec/cli/convert_motif_spec.rb +88 -88
data/spec/cli/data/pcm2pwm/KLF4_f2.pwm.result +9 -9
data/spec/cli/data/pcm2pwm/SP1_f1.pwm.result +11 -11
data/spec/cli/pcm2pwm_spec.rb +22 -23
data/spec/cli/shared_examples/convert_motif/motif_list_empty.rb +1 -1
data/spec/cli/shared_examples/convert_motif/several_motifs_specified.rb +1 -1
data/spec/cli/shared_examples/convert_motif/single_motif_specified.rb +5 -5
data/spec/cli/shared_examples/convert_motif/yield_help_string.rb +2 -2
data/spec/cli/shared_examples/convert_motif/yield_motif_conversion_error.rb +3 -3
data/spec/cli/split_motifs_spec.rb +6 -21
data/spec/converters/pcm2ppm_converter_spec.rb +32 -0
data/spec/converters/pcm2pwm_converter_spec.rb +71 -0
data/spec/converters/ppm2pcm_converter_spec.rb +32 -0
data/spec/converters/pwm2iupac_pwm_converter_spec.rb +65 -0
data/spec/converters/pwm2pcm_converter_spec.rb +57 -0
data/spec/data_models/named_model_spec.rb +41 -0
data/spec/data_models/pcm_spec.rb +114 -45
data/spec/data_models/pm_spec.rb +132 -333
data/spec/data_models/ppm_spec.rb +47 -44
data/spec/data_models/pwm_spec.rb +85 -77
data/spec/fabricators/motif_formats_fabricator.rb +116 -116
data/spec/formatters/consensus_formatter_spec.rb +26 -0
data/spec/formatters/raw_formatter_spec.rb +169 -0
data/spec/parsers/matrix_parser_spec.rb +216 -0
data/spec/parsers/motif_splitter_spec.rb +87 -0
data/spec/spec_helper.rb +2 -2
data/spec/spec_helper_source.rb +25 -5
data/spec/support_spec.rb +31 -0
metadata +43 -124
data/bin/merge_into_collection +0 -4
data/lib/bioinform/cli/merge_into_collection.rb +0 -80
data/lib/bioinform/conversion_algorithms/ppm2pwm_converter.rb +0 -0
data/lib/bioinform/data_models/collection.rb +0 -75
data/lib/bioinform/data_models/motif.rb +0 -56
data/lib/bioinform/formatters/raw_formatter.rb +0 -41
data/lib/bioinform/parsers/jaspar_parser.rb +0 -35
data/lib/bioinform/parsers/parser.rb +0 -92
data/lib/bioinform/parsers/splittable_parser.rb +0 -57
data/lib/bioinform/parsers/string_fantom_parser.rb +0 -35
data/lib/bioinform/parsers/string_parser.rb +0 -72
data/lib/bioinform/parsers/trivial_parser.rb +0 -34
data/lib/bioinform/parsers/yaml_parser.rb +0 -35
data/lib/bioinform/support/advanced_scan.rb +0 -8
data/lib/bioinform/support/array_product.rb +0 -6
data/lib/bioinform/support/array_zip.rb +0 -6
data/lib/bioinform/support/collect_hash.rb +0 -7
data/lib/bioinform/support/deep_dup.rb +0 -5
data/lib/bioinform/support/delete_many.rb +0 -14
data/lib/bioinform/support/inverf.rb +0 -13
data/lib/bioinform/support/multiline_squish.rb +0 -6
data/lib/bioinform/support/parameters.rb +0 -28
data/lib/bioinform/support/partial_sums.rb +0 -16
data/lib/bioinform/support/same_by.rb +0 -12
data/lib/bioinform/support/third_part/active_support/core_ext/array/extract_options.rb +0 -29
data/lib/bioinform/support/third_part/active_support/core_ext/hash/indifferent_access.rb +0 -23
data/lib/bioinform/support/third_part/active_support/core_ext/hash/keys.rb +0 -54
data/lib/bioinform/support/third_part/active_support/core_ext/module/attribute_accessors.rb +0 -64
data/lib/bioinform/support/third_part/active_support/core_ext/object/try.rb +0 -57
data/lib/bioinform/support/third_part/active_support/core_ext/string/access.rb +0 -99
data/lib/bioinform/support/third_part/active_support/core_ext/string/behavior.rb +0 -6
data/lib/bioinform/support/third_part/active_support/core_ext/string/filters.rb +0 -49
data/lib/bioinform/support/third_part/active_support/core_ext/string/multibyte.rb +0 -72
data/lib/bioinform/support/third_part/active_support/hash_with_indifferent_access.rb +0 -181
data/lib/bioinform/support/third_part/active_support/multibyte.rb +0 -44
data/lib/bioinform/support/third_part/active_support/multibyte/chars.rb +0 -476
data/lib/bioinform/support/third_part/active_support/multibyte/exceptions.rb +0 -8
data/lib/bioinform/support/third_part/active_support/multibyte/unicode.rb +0 -393
data/lib/bioinform/support/third_part/active_support/multibyte/utils.rb +0 -60
data/spec/cli/data/merge_into_collection/GABPA_f1.pwm +0 -14
data/spec/cli/data/merge_into_collection/KLF4_f2.pwm +0 -11
data/spec/cli/data/merge_into_collection/SP1_f1.pwm +0 -12
data/spec/cli/data/merge_into_collection/collection.txt.result +0 -40
data/spec/cli/data/merge_into_collection/collection.yaml.result +0 -188
data/spec/cli/data/merge_into_collection/collection_pwm.yaml.result +0 -188
data/spec/cli/data/merge_into_collection/pwm_folder/GABPA_f1.pwm +0 -14
data/spec/cli/data/merge_into_collection/pwm_folder/KLF4_f2.pwm +0 -11
data/spec/cli/data/merge_into_collection/pwm_folder/SP1_f1.pwm +0 -12
data/spec/cli/data/split_motifs/collection.yaml +0 -188
data/spec/cli/merge_into_collection_spec.rb +0 -100
data/spec/data_models/collection_spec.rb +0 -98
data/spec/data_models/motif_spec.rb +0 -224
data/spec/fabricators/collection_fabricator.rb +0 -8
data/spec/fabricators/motif_fabricator.rb +0 -33
data/spec/fabricators/pcm_fabricator.rb +0 -25
data/spec/fabricators/pm_fabricator.rb +0 -52
data/spec/fabricators/ppm_fabricator.rb +0 -14
data/spec/fabricators/pwm_fabricator.rb +0 -16
data/spec/parsers/parser_spec.rb +0 -152
data/spec/parsers/string_fantom_parser_spec.rb +0 -70
data/spec/parsers/string_parser_spec.rb +0 -77
data/spec/parsers/trivial_parser_spec.rb +0 -64
data/spec/parsers/yaml_parser_spec.rb +0 -50
data/spec/support/advanced_scan_spec.rb +0 -32
data/spec/support/array_product_spec.rb +0 -15
data/spec/support/array_zip_spec.rb +0 -15
data/spec/support/collect_hash_spec.rb +0 -15
data/spec/support/delete_many_spec.rb +0 -44
data/spec/support/inverf_spec.rb +0 -19
data/spec/support/multiline_squish_spec.rb +0 -25
data/spec/support/partial_sums_spec.rb +0 -30
data/spec/support/same_by_spec.rb +0 -36

data/lib/bioinform/support/third_part/active_support/multibyte/chars.rb DELETED Viewed

@@ -1,476 +0,0 @@
-# encoding: utf-8
-require_relative '../core_ext/string/access'
-require_relative '../core_ext/string/behavior'
-module ActiveSupport #:nodoc:
-  module Multibyte #:nodoc:
-    # Chars enables you to work transparently with UTF-8 encoding in the Ruby String class without having extensive
-    # knowledge about the encoding. A Chars object accepts a string upon initialization and proxies String methods in an
-    # encoding safe manner. All the normal String methods are also implemented on the proxy.
-    #
-    # String methods are proxied through the Chars object, and can be accessed through the +mb_chars+ method. Methods
-    # which would normally return a String object now return a Chars object so methods can be chained.
-    #
-    #   "The Perfect String  ".mb_chars.downcase.strip.normalize # => "the perfect string"
-    #
-    # Chars objects are perfectly interchangeable with String objects as long as no explicit class checks are made.
-    # If certain methods do explicitly check the class, call +to_s+ before you pass chars objects to them.
-    #
-    #   bad.explicit_checking_method "T".mb_chars.downcase.to_s
-    #
-    # The default Chars implementation assumes that the encoding of the string is UTF-8, if you want to handle different
-    # encodings you can write your own multibyte string handler and configure it through
-    # ActiveSupport::Multibyte.proxy_class.
-    #
-    #   class CharsForUTF32
-    #     def size
-    #       @wrapped_string.size / 4
-    #     end
-    #
-    #     def self.accepts?(string)
-    #       string.length % 4 == 0
-    #     end
-    #   end
-    #
-    #   ActiveSupport::Multibyte.proxy_class = CharsForUTF32
-    class Chars
-      attr_reader :wrapped_string
-      alias to_s wrapped_string
-      alias to_str wrapped_string
-      if RUBY_VERSION >= "1.9"
-        # Creates a new Chars instance by wrapping _string_.
-        def initialize(string)
-          @wrapped_string = string
-          @wrapped_string.force_encoding(Encoding::UTF_8) unless @wrapped_string.frozen?
-        end
-      else
-        def initialize(string) #:nodoc:
-          @wrapped_string = string
-        end
-      end
-      # Forward all undefined methods to the wrapped string.
-      def method_missing(method, *args, &block)
-        if method.to_s =~ /!$/
-          @wrapped_string.__send__(method, *args, &block)
-          self
-        else
-          result = @wrapped_string.__send__(method, *args, &block)
-          result.kind_of?(String) ? chars(result) : result
-        end
-      end
-      # Returns +true+ if _obj_ responds to the given method. Private methods are included in the search
-      # only if the optional second parameter evaluates to +true+.
-      def respond_to?(method, include_private=false)
-        super || @wrapped_string.respond_to?(method, include_private)
-      end
-      # Enable more predictable duck-typing on String-like classes. See Object#acts_like?.
-      def acts_like_string?
-        true
-      end
-      # Returns +true+ when the proxy class can handle the string. Returns +false+ otherwise.
-      def self.consumes?(string)
-        # Unpack is a little bit faster than regular expressions.
-        string.unpack('U*')
-        true
-      rescue ArgumentError
-        false
-      end
-      include Comparable
-      # Returns -1, 0, or 1, depending on whether the Chars object is to be sorted before,
-      # equal or after the object on the right side of the operation. It accepts any object
-      # that implements +to_s+:
-      #
-      #   'é'.mb_chars <=> 'ü'.mb_chars # => -1
-      #
-      # See <tt>String#<=></tt> for more details.
-      def <=>(other)
-        @wrapped_string <=> other.to_s
-      end
-      if RUBY_VERSION < "1.9"
-        # Returns +true+ if the Chars class can and should act as a proxy for the string _string_. Returns
-        # +false+ otherwise.
-        def self.wants?(string)
-          $KCODE == 'UTF8' && consumes?(string)
-        end
-        # Returns a new Chars object containing the _other_ object concatenated to the string.
-        #
-        # Example:
-        #   ('Café'.mb_chars + ' périferôl').to_s # => "Café périferôl"
-        def +(other)
-          chars(@wrapped_string + other)
-        end
-        # Like <tt>String#=~</tt> only it returns the character offset (in codepoints) instead of the byte offset.
-        #
-        # Example:
-        #   'Café périferôl'.mb_chars =~ /ô/ # => 12
-        def =~(other)
-          translate_offset(@wrapped_string =~ other)
-        end
-        # Inserts the passed string at specified codepoint offsets.
-        #
-        # Example:
-        #   'Café'.mb_chars.insert(4, ' périferôl').to_s # => "Café périferôl"
-        def insert(offset, fragment)
-          unpacked = Unicode.u_unpack(@wrapped_string)
-          unless offset > unpacked.length
-            @wrapped_string.replace(
-              Unicode.u_unpack(@wrapped_string).insert(offset, *Unicode.u_unpack(fragment)).pack('U*')
-            )
-          else
-            raise IndexError, "index #{offset} out of string"
-          end
-          self
-        end
-        # Returns +true+ if contained string contains _other_. Returns +false+ otherwise.
-        #
-        # Example:
-        #   'Café'.mb_chars.include?('é') # => true
-        def include?(other)
-          # We have to redefine this method because Enumerable defines it.
-          @wrapped_string.include?(other)
-        end
-        # Returns the position _needle_ in the string, counting in codepoints. Returns +nil+ if _needle_ isn't found.
-        #
-        # Example:
-        #   'Café périferôl'.mb_chars.index('ô')   # => 12
-        #   'Café périferôl'.mb_chars.index(/\w/u) # => 0
-        def index(needle, offset=0)
-          wrapped_offset = first(offset).wrapped_string.length
-          index = @wrapped_string.index(needle, wrapped_offset)
-          index ? (Unicode.u_unpack(@wrapped_string.slice(0...index)).size) : nil
-        end
-        # Returns the position _needle_ in the string, counting in
-        # codepoints, searching backward from _offset_ or the end of the
-        # string. Returns +nil+ if _needle_ isn't found.
-        #
-        # Example:
-        #   'Café périferôl'.mb_chars.rindex('é')   # => 6
-        #   'Café périferôl'.mb_chars.rindex(/\w/u) # => 13
-        def rindex(needle, offset=nil)
-          offset ||= length
-          wrapped_offset = first(offset).wrapped_string.length
-          index = @wrapped_string.rindex(needle, wrapped_offset)
-          index ? (Unicode.u_unpack(@wrapped_string.slice(0...index)).size) : nil
-        end
-        # Returns the number of codepoints in the string
-        def size
-          Unicode.u_unpack(@wrapped_string).size
-        end
-        alias_method :length, :size
-        # Strips entire range of Unicode whitespace from the right of the string.
-        def rstrip
-          chars(@wrapped_string.gsub(Unicode::TRAILERS_PAT, ''))
-        end
-        # Strips entire range of Unicode whitespace from the left of the string.
-        def lstrip
-          chars(@wrapped_string.gsub(Unicode::LEADERS_PAT, ''))
-        end
-        # Strips entire range of Unicode whitespace from the right and left of the string.
-        def strip
-          rstrip.lstrip
-        end
-        # Returns the codepoint of the first character in the string.
-        #
-        # Example:
-        #   'こんにちは'.mb_chars.ord # => 12371
-        def ord
-          Unicode.u_unpack(@wrapped_string)[0]
-        end
-        # Works just like <tt>String#rjust</tt>, only integer specifies characters instead of bytes.
-        #
-        # Example:
-        #
-        #   "¾ cup".mb_chars.rjust(8).to_s
-        #   # => "   ¾ cup"
-        #
-        #   "¾ cup".mb_chars.rjust(8, " ").to_s # Use non-breaking whitespace
-        #   # => "   ¾ cup"
-        def rjust(integer, padstr=' ')
-          justify(integer, :right, padstr)
-        end
-        # Works just like <tt>String#ljust</tt>, only integer specifies characters instead of bytes.
-        #
-        # Example:
-        #
-        #   "¾ cup".mb_chars.rjust(8).to_s
-        #   # => "¾ cup   "
-        #
-        #   "¾ cup".mb_chars.rjust(8, " ").to_s # Use non-breaking whitespace
-        #   # => "¾ cup   "
-        def ljust(integer, padstr=' ')
-          justify(integer, :left, padstr)
-        end
-        # Works just like <tt>String#center</tt>, only integer specifies characters instead of bytes.
-        #
-        # Example:
-        #
-        #   "¾ cup".mb_chars.center(8).to_s
-        #   # => " ¾ cup  "
-        #
-        #   "¾ cup".mb_chars.center(8, " ").to_s # Use non-breaking whitespace
-        #   # => " ¾ cup  "
-        def center(integer, padstr=' ')
-          justify(integer, :center, padstr)
-        end
-      else
-        def =~(other)
-          @wrapped_string =~ other
-        end
-      end
-      # Works just like <tt>String#split</tt>, with the exception that the items in the resulting list are Chars
-      # instances instead of String. This makes chaining methods easier.
-      #
-      # Example:
-      #   'Café périferôl'.mb_chars.split(/é/).map { |part| part.upcase.to_s } # => ["CAF", " P", "RIFERÔL"]
-      def split(*args)
-        @wrapped_string.split(*args).map { |i| i.mb_chars }
-      end
-      # Like <tt>String#[]=</tt>, except instead of byte offsets you specify character offsets.
-      #
-      # Example:
-      #
-      #   s = "Müller"
-      #   s.mb_chars[2] = "e" # Replace character with offset 2
-      #   s
-      #   # => "Müeler"
-      #
-      #   s = "Müller"
-      #   s.mb_chars[1, 2] = "ö" # Replace 2 characters at character offset 1
-      #   s
-      #   # => "Möler"
-      def []=(*args)
-        replace_by = args.pop
-        # Indexed replace with regular expressions already works
-        if args.first.is_a?(Regexp)
-          @wrapped_string[*args] = replace_by
-        else
-          result = Unicode.u_unpack(@wrapped_string)
-          case args.first
-          when Fixnum
-            raise IndexError, "index #{args[0]} out of string" if args[0] >= result.length
-            min = args[0]
-            max = args[1].nil? ? min : (min + args[1] - 1)
-            range = Range.new(min, max)
-            replace_by = [replace_by].pack('U') if replace_by.is_a?(Fixnum)
-          when Range
-            raise RangeError, "#{args[0]} out of range" if args[0].min >= result.length
-            range = args[0]
-          else
-            needle = args[0].to_s
-            min = index(needle)
-            max = min + Unicode.u_unpack(needle).length - 1
-            range = Range.new(min, max)
-          end
-          result[range] = Unicode.u_unpack(replace_by)
-          @wrapped_string.replace(result.pack('U*'))
-        end
-      end
-      # Reverses all characters in the string.
-      #
-      # Example:
-      #   'Café'.mb_chars.reverse.to_s # => 'éfaC'
-      def reverse
-        chars(Unicode.g_unpack(@wrapped_string).reverse.flatten.pack('U*'))
-      end
-      # Implements Unicode-aware slice with codepoints. Slicing on one point returns the codepoints for that
-      # character.
-      #
-      # Example:
-      #   'こんにちは'.mb_chars.slice(2..3).to_s # => "にち"
-      def slice(*args)
-        if args.size > 2
-          raise ArgumentError, "wrong number of arguments (#{args.size} for 1)" # Do as if we were native
-        elsif (args.size == 2 && !(args.first.is_a?(Numeric) || args.first.is_a?(Regexp)))
-          raise TypeError, "cannot convert #{args.first.class} into Integer" # Do as if we were native
-        elsif (args.size == 2 && !args[1].is_a?(Numeric))
-          raise TypeError, "cannot convert #{args[1].class} into Integer" # Do as if we were native
-        elsif args[0].kind_of? Range
-          cps = Unicode.u_unpack(@wrapped_string).slice(*args)
-          result = cps.nil? ? nil : cps.pack('U*')
-        elsif args[0].kind_of? Regexp
-          result = @wrapped_string.slice(*args)
-        elsif args.size == 1 && args[0].kind_of?(Numeric)
-          character = Unicode.u_unpack(@wrapped_string)[args[0]]
-          result = character && [character].pack('U')
-        else
-          cps = Unicode.u_unpack(@wrapped_string).slice(*args)
-          result = cps && cps.pack('U*')
-        end
-        result && chars(result)
-      end
-      alias_method :[], :slice
-      # Limit the byte size of the string to a number of bytes without breaking characters. Usable
-      # when the storage for a string is limited for some reason.
-      #
-      # Example:
-      #   'こんにちは'.mb_chars.limit(7).to_s # => "こん"
-      def limit(limit)
-        slice(0...translate_offset(limit))
-      end
-      # Convert characters in the string to uppercase.
-      #
-      # Example:
-      #   'Laurent, où sont les tests ?'.mb_chars.upcase.to_s # => "LAURENT, OÙ SONT LES TESTS ?"
-      def upcase
-        chars(Unicode.apply_mapping @wrapped_string, :uppercase_mapping)
-      end
-      # Convert characters in the string to lowercase.
-      #
-      # Example:
-      #   'VĚDA A VÝZKUM'.mb_chars.downcase.to_s # => "věda a výzkum"
-      def downcase
-        chars(Unicode.apply_mapping @wrapped_string, :lowercase_mapping)
-      end
-      # Converts the first character to uppercase and the remainder to lowercase.
-      #
-      # Example:
-      #  'über'.mb_chars.capitalize.to_s # => "Über"
-      def capitalize
-        (slice(0) || chars('')).upcase + (slice(1..-1) || chars('')).downcase
-      end
-      # Capitalizes the first letter of every word, when possible.
-      #
-      # Example:
-      #   "ÉL QUE SE ENTERÓ".mb_chars.titleize    # => "Él Que Se Enteró"
-      #   "日本語".mb_chars.titleize                 # => "日本語"
-      def titleize
-        chars(downcase.to_s.gsub(/\b('?[\S])/u) { Unicode.apply_mapping $1, :uppercase_mapping })
-      end
-      alias_method :titlecase, :titleize
-      # Returns the KC normalization of the string by default. NFKC is considered the best normalization form for
-      # passing strings to databases and validations.
-      #
-      # * <tt>form</tt> - The form you want to normalize in. Should be one of the following:
-      #   <tt>:c</tt>, <tt>:kc</tt>, <tt>:d</tt>, or <tt>:kd</tt>. Default is
-      #   ActiveSupport::Multibyte::Unicode.default_normalization_form
-      def normalize(form = nil)
-        chars(Unicode.normalize(@wrapped_string, form))
-      end
-      # Performs canonical decomposition on all the characters.
-      #
-      # Example:
-      #   'é'.length                         # => 2
-      #   'é'.mb_chars.decompose.to_s.length # => 3
-      def decompose
-        chars(Unicode.decompose_codepoints(:canonical, Unicode.u_unpack(@wrapped_string)).pack('U*'))
-      end
-      # Performs composition on all the characters.
-      #
-      # Example:
-      #   'é'.length                       # => 3
-      #   'é'.mb_chars.compose.to_s.length # => 2
-      def compose
-        chars(Unicode.compose_codepoints(Unicode.u_unpack(@wrapped_string)).pack('U*'))
-      end
-      # Returns the number of grapheme clusters in the string.
-      #
-      # Example:
-      #   'क्षि'.mb_chars.length   # => 4
-      #   'क्षि'.mb_chars.g_length # => 3
-      def g_length
-        Unicode.g_unpack(@wrapped_string).length
-      end
-      # Replaces all ISO-8859-1 or CP1252 characters by their UTF-8 equivalent resulting in a valid UTF-8 string.
-      #
-      # Passing +true+ will forcibly tidy all bytes, assuming that the string's encoding is entirely CP1252 or ISO-8859-1.
-      def tidy_bytes(force = false)
-        chars(Unicode.tidy_bytes(@wrapped_string, force))
-      end
-       %w(capitalize downcase lstrip reverse rstrip slice strip tidy_bytes upcase).each do |method|
-        # Only define a corresponding bang method for methods defined in the proxy; On 1.9 the proxy will
-        # exclude lstrip!, rstrip! and strip! because they are already work as expected on multibyte strings.
-        if public_method_defined?(method)
-          define_method("#{method}!") do |*args|
-            @wrapped_string = send(args.nil? ? method : method, *args).to_s
-            self
-          end
-        end
-      end
-      protected
-        def translate_offset(byte_offset) #:nodoc:
-          return nil if byte_offset.nil?
-          return 0   if @wrapped_string == ''
-          if @wrapped_string.respond_to?(:force_encoding)
-            @wrapped_string = @wrapped_string.dup.force_encoding(Encoding::ASCII_8BIT)
-          end
-          begin
-            @wrapped_string[0...byte_offset].unpack('U*').length
-          rescue ArgumentError
-            byte_offset -= 1
-            retry
-          end
-        end
-        def justify(integer, way, padstr=' ') #:nodoc:
-          raise ArgumentError, "zero width padding" if padstr.length == 0
-          padsize = integer - size
-          padsize = padsize > 0 ? padsize : 0
-          case way
-          when :right
-            result = @wrapped_string.dup.insert(0, padding(padsize, padstr))
-          when :left
-            result = @wrapped_string.dup.insert(-1, padding(padsize, padstr))
-          when :center
-            lpad = padding((padsize / 2.0).floor, padstr)
-            rpad = padding((padsize / 2.0).ceil, padstr)
-            result = @wrapped_string.dup.insert(0, lpad).insert(-1, rpad)
-          end
-          chars(result)
-        end
-        def padding(padsize, padstr=' ') #:nodoc:
-          if padsize != 0
-            chars(padstr * ((padsize / Unicode.u_unpack(padstr).size) + 1)).slice(0, padsize)
-          else
-            ''
-          end
-        end
-        def chars(string) #:nodoc:
-          self.class.new(string)
-        end
-    end
-  end
-end