RubyGems - gettext - Versions diffs - 3.2.9 → 3.4.9 - Mend

gettext 3.2.9 → 3.4.9

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (237)

checksums.yaml +4 -4
data/README.md +276 -198
data/Rakefile +7 -4
data/doc/text/news.md +451 -0
data/gettext.gemspec +10 -7
data/lib/gettext/locale_path.rb +17 -9
data/lib/gettext/mo.rb +12 -19
data/lib/gettext/po.rb +4 -4
data/lib/gettext/po_entry.rb +47 -27
data/lib/gettext/po_parser.rb +65 -59
data/lib/gettext/text_domain.rb +1 -1
data/lib/gettext/text_domain_manager.rb +6 -5
data/lib/gettext/tools/msgcat.rb +9 -2
data/lib/gettext/tools/msginit.rb +226 -54
data/lib/gettext/tools/msgmerge.rb +24 -6
data/lib/gettext/tools/parser/erb.rb +9 -1
data/lib/gettext/tools/parser/erubi.rb +88 -0
data/lib/gettext/tools/parser/glade.rb +38 -40
data/lib/gettext/tools/parser/gtk_builder_ui_definitions.rb +129 -0
data/lib/gettext/tools/parser/ruby.rb +288 -221
data/lib/gettext/tools/task.rb +4 -5
data/lib/gettext/tools/xgettext.rb +21 -10
data/lib/gettext/version.rb +3 -3
data/locale/bg/LC_MESSAGES/gettext.mo +0 -0
data/locale/bs/LC_MESSAGES/gettext.mo +0 -0
data/locale/ca/LC_MESSAGES/gettext.mo +0 -0
data/locale/cs/LC_MESSAGES/gettext.mo +0 -0
data/locale/de/LC_MESSAGES/gettext.mo +0 -0
data/locale/el/LC_MESSAGES/gettext.mo +0 -0
data/locale/eo/LC_MESSAGES/gettext.mo +0 -0
data/locale/es/LC_MESSAGES/gettext.mo +0 -0
data/locale/et/LC_MESSAGES/gettext.mo +0 -0
data/locale/fr/LC_MESSAGES/gettext.mo +0 -0
data/locale/hr/LC_MESSAGES/gettext.mo +0 -0
data/locale/hu/LC_MESSAGES/gettext.mo +0 -0
data/locale/it/LC_MESSAGES/gettext.mo +0 -0
data/locale/ja/LC_MESSAGES/gettext.mo +0 -0
data/locale/ko/LC_MESSAGES/gettext.mo +0 -0
data/locale/lv/LC_MESSAGES/gettext.mo +0 -0
data/locale/nb/LC_MESSAGES/gettext.mo +0 -0
data/locale/nl/LC_MESSAGES/gettext.mo +0 -0
data/locale/pt_BR/LC_MESSAGES/gettext.mo +0 -0
data/locale/ru/LC_MESSAGES/gettext.mo +0 -0
data/locale/sr/LC_MESSAGES/gettext.mo +0 -0
data/locale/uk/LC_MESSAGES/gettext.mo +0 -0
data/locale/vi/LC_MESSAGES/gettext.mo +0 -0
data/locale/zh/LC_MESSAGES/gettext.mo +0 -0
data/locale/zh_TW/LC_MESSAGES/gettext.mo +0 -0
data/po/bg/gettext.edit.po +81 -572
data/po/bg/gettext.po +7 -409
data/po/bs/gettext.edit.po +81 -572
data/po/bs/gettext.po +7 -409
data/po/ca/gettext.edit.po +81 -572
data/po/ca/gettext.po +7 -409
data/po/cs/gettext.edit.po +81 -572
data/po/cs/gettext.po +7 -409
data/po/de/gettext.edit.po +81 -572
data/po/de/gettext.po +7 -409
data/po/el/gettext.edit.po +81 -572
data/po/el/gettext.po +7 -409
data/po/eo/gettext.edit.po +81 -572
data/po/eo/gettext.po +7 -409
data/po/es/gettext.edit.po +81 -572
data/po/es/gettext.po +7 -409
data/po/et/gettext.edit.po +81 -572
data/po/et/gettext.po +7 -409
data/po/fr/gettext.edit.po +81 -572
data/po/fr/gettext.po +7 -409
data/po/gettext.pot +93 -645
data/po/hr/gettext.edit.po +81 -572
data/po/hr/gettext.po +7 -409
data/po/hu/gettext.edit.po +81 -572
data/po/hu/gettext.po +7 -409
data/po/it/gettext.edit.po +81 -572
data/po/it/gettext.po +7 -409
data/po/ja/gettext.edit.po +83 -574
data/po/ja/gettext.po +9 -411
data/po/ko/gettext.edit.po +81 -572
data/po/ko/gettext.po +7 -409
data/po/lv/gettext.edit.po +81 -572
data/po/lv/gettext.po +7 -409
data/po/nb/gettext.edit.po +81 -572
data/po/nb/gettext.po +7 -409
data/po/nl/gettext.edit.po +81 -572
data/po/nl/gettext.po +7 -409
data/po/pt_BR/gettext.edit.po +81 -572
data/po/pt_BR/gettext.po +7 -409
data/po/ru/gettext.edit.po +81 -572
data/po/ru/gettext.po +7 -409
data/po/sr/gettext.edit.po +81 -572
data/po/sr/gettext.po +7 -409
data/po/sv/gettext.edit.po +81 -572
data/po/sv/gettext.po +7 -409
data/po/uk/gettext.edit.po +81 -572
data/po/uk/gettext.po +7 -409
data/po/vi/gettext.edit.po +81 -572
data/po/vi/gettext.po +7 -409
data/po/zh/gettext.edit.po +81 -572
data/po/zh/gettext.po +7 -409
data/po/zh_TW/gettext.edit.po +81 -572
data/po/zh_TW/gettext.po +7 -409
data/samples/cgi/po/helloerb1.pot +3 -3
data/samples/cgi/po/helloerb2.pot +3 -3
data/samples/cgi/po/hellolib.pot +3 -3
data/samples/cgi/po/main.pot +3 -3
data/samples/po/bg/hello_gtk_builder.edit.po +15 -0
data/samples/po/bg/hello_gtk_builder.po +12 -0
data/samples/po/bs/hello_gtk_builder.edit.po +15 -0
data/samples/po/bs/hello_gtk_builder.po +12 -0
data/samples/po/ca/hello_gtk_builder.edit.po +15 -0
data/samples/po/ca/hello_gtk_builder.po +12 -0
data/samples/po/cs/hello_gtk_builder.edit.po +15 -0
data/samples/po/cs/hello_gtk_builder.po +12 -0
data/samples/po/de/hello_gtk_builder.edit.po +15 -0
data/samples/po/de/hello_gtk_builder.po +12 -0
data/samples/po/el/hello_gtk_builder.edit.po +15 -0
data/samples/po/el/hello_gtk_builder.po +12 -0
data/samples/po/eo/hello_gtk_builder.edit.po +15 -0
data/samples/po/eo/hello_gtk_builder.po +12 -0
data/samples/po/es/hello_gtk_builder.edit.po +15 -0
data/samples/po/es/hello_gtk_builder.po +12 -0
data/samples/po/fr/hello_gtk_builder.edit.po +15 -0
data/samples/po/fr/hello_gtk_builder.po +12 -0
data/samples/po/hello.pot +3 -3
data/samples/po/hello2.pot +4 -4
data/samples/po/hello_glade2.pot +8 -5
data/samples/po/hello_gtk2.pot +4 -4
data/samples/po/hello_gtk_builder.pot +18 -4
data/samples/po/hello_noop.pot +4 -4
data/samples/po/hello_plural.pot +4 -4
data/samples/po/hello_tk.pot +4 -4
data/samples/po/hr/hello_gtk_builder.edit.po +15 -0
data/samples/po/hr/hello_gtk_builder.po +12 -0
data/samples/po/hu/hello_gtk_builder.edit.po +15 -0
data/samples/po/hu/hello_gtk_builder.po +12 -0
data/samples/po/it/hello_gtk_builder.edit.po +15 -0
data/samples/po/it/hello_gtk_builder.po +12 -0
data/samples/po/ja/hello_gtk_builder.edit.po +15 -0
data/samples/po/ja/hello_gtk_builder.po +12 -0
data/samples/po/ko/hello_gtk_builder.edit.po +15 -0
data/samples/po/ko/hello_gtk_builder.po +12 -0
data/samples/po/lv/hello_gtk_builder.edit.po +15 -0
data/samples/po/lv/hello_gtk_builder.po +12 -0
data/samples/po/nb/hello_gtk_builder.edit.po +15 -0
data/samples/po/nb/hello_gtk_builder.po +12 -0
data/samples/po/nl/hello_gtk_builder.edit.po +15 -0
data/samples/po/nl/hello_gtk_builder.po +12 -0
data/samples/po/pt_BR/hello_gtk_builder.edit.po +15 -0
data/samples/po/pt_BR/hello_gtk_builder.po +12 -0
data/samples/po/ru/hello_gtk_builder.edit.po +15 -0
data/samples/po/ru/hello_gtk_builder.po +12 -0
data/samples/po/sr/hello_gtk_builder.edit.po +15 -0
data/samples/po/sr/hello_gtk_builder.po +12 -0
data/samples/po/sv/hello_gtk_builder.edit.po +15 -0
data/samples/po/sv/hello_gtk_builder.po +12 -0
data/samples/po/uk/hello_gtk_builder.edit.po +15 -0
data/samples/po/uk/hello_gtk_builder.po +12 -0
data/samples/po/vi/hello_gtk_builder.edit.po +15 -0
data/samples/po/vi/hello_gtk_builder.po +12 -0
data/samples/po/zh/hello_gtk_builder.edit.po +15 -0
data/samples/po/zh/hello_gtk_builder.po +12 -0
data/samples/po/zh_TW/hello_gtk_builder.edit.po +15 -0
data/samples/po/zh_TW/hello_gtk_builder.po +12 -0
data/src/po_parser.ry +48 -42
data/test/fixtures/_/backtick.rb +30 -0
data/test/fixtures/_/block_parameter.rb +2 -2
data/test/fixtures/_/double_quote_in_double_quote.rb +2 -2
data/test/fixtures/_/double_quote_in_single_quote.rb +2 -2
data/test/fixtures/_/literal_concatenation_with_continuation_line.rb +2 -2
data/test/fixtures/_/middle_new_line.rb +2 -2
data/test/fixtures/_/multiple_lines_literal.rb +2 -2
data/test/fixtures/_/multiple_messages_in_same_line.rb +2 -2
data/test/fixtures/_/multiple_same_messages.rb +2 -2
data/test/fixtures/_/one_line.rb +2 -2
data/test/fixtures/_/one_new_line.rb +2 -2
data/test/fixtures/_/percent_strings.rb +55 -0
data/test/fixtures/_/pipe.rb +32 -0
data/test/{gettext-test-utils.rb → fixtures/_/quoted_symbol.rb} +13 -23
data/test/fixtures/_.rb +10 -1
data/test/fixtures/erb/case.rhtml +16 -0
data/test/fixtures/erb/minus.rhtml +12 -0
data/test/fixtures/erb/non_ascii.rhtml +1 -0
data/test/fixtures/glade/3.glade +63 -0
data/test/fixtures/gtk_builder_ui_definitions.ui +68 -0
data/test/fixtures/multi_text_domain.rb +12 -12
data/test/fixtures/np_.rb +1 -1
data/test/fixtures/ns_/custom.rb +2 -2
data/test/fixtures/ns_.rb +1 -1
data/test/fixtures/p_.rb +1 -1
data/test/fixtures/ruby/percent_lower_i.rb +1 -0
data/test/fixtures/ruby/percent_lower_w.rb +1 -0
data/test/fixtures/ruby/percent_upper_i.rb +1 -0
data/test/fixtures/ruby/percent_upper_w.rb +1 -0
data/test/fixtures/s_/custom.rb +2 -2
data/test/fixtures/s_.rb +1 -1
data/test/fixtures/simple.rb +5 -1
data/test/fixtures/upper_nn_.rb +77 -0
data/test/helper.rb +99 -0
data/test/locale/fr/LC_MESSAGES/plural_error.mo +0 -0
data/test/locale/fr/LC_MESSAGES/test1.mo +0 -0
data/test/locale/fr_BE/LC_MESSAGES/test1.mo +0 -0
data/test/locale/fr_BE_Foo/LC_MESSAGES/test1.mo +0 -0
data/test/locale/ja/LC_MESSAGES/_.mo +0 -0
data/test/po/_.pot +28 -4
data/test/po/backslash.pot +6 -4
data/test/po/fr/plural_error.po +7 -0
data/test/po/fr/test1.po +7 -0
data/test/po/fr_BE/test1.po +24 -0
data/test/po/fr_BE_Foo/test1.po +20 -0
data/test/po/hello.pot +3 -3
data/test/po/ja/_.edit.po +27 -3
data/test/po/ja/_.po +20 -2
data/test/po/ja/hello.edit.po +0 -1
data/test/po/non_ascii.pot +4 -4
data/test/po/np_.pot +8 -5
data/test/po/ns_.pot +6 -4
data/test/po/p_.pot +3 -3
data/test/po/s_.pot +6 -4
data/test/po/untranslated.pot +4 -4
data/test/run-test.rb +2 -3
data/test/test_class_info.rb +8 -9
data/test/test_gettext.rb +30 -1
data/test/test_locale_path.rb +12 -4
data/test/test_parser.rb +113 -25
data/test/test_po_entry.rb +21 -17
data/test/test_po_parser.rb +49 -4
data/test/test_string.rb +9 -5
data/test/tools/parser/test_glade.rb +91 -0
data/test/tools/parser/test_gtk_builder_ui_definitions.rb +63 -0
data/test/tools/parser/test_ruby.rb +76 -39
data/test/tools/test_msgcat.rb +21 -1
data/test/tools/test_msginit.rb +82 -3
data/test/tools/test_msgmerge.rb +81 -6
data/test/tools/test_xgettext.rb +106 -5
metadata +82 -34
data/lib/gettext/tools/parser/haml.rb +0 -61
data/test/fixtures/{gladeparser.glade → glade/2.glade} +0 -0

data/lib/gettext/tools/parser/gtk_builder_ui_definitions.rb ADDED

@@ -0,0 +1,129 @@
+# Copyright (C) 2020  Sutou Kouhei <kou@clear-code.com>
+#
+# License: Ruby's or LGPL
+#
+# This library is free software: you can redistribute it and/or modify
+# it under the terms of the GNU Lesser General Public License as published by
+# the Free Software Foundation, either version 3 of the License, or
+# (at your option) any later version.
+#
+# This library is distributed in the hope that it will be useful,
+# but WITHOUT ANY WARRANTY; without even the implied warranty of
+# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+# GNU Lesser General Public License for more details.
+#
+# You should have received a copy of the GNU Lesser General Public License
+# along with this program.  If not, see <http://www.gnu.org/licenses/>.
+require "English"
+require "cgi"
+require "strscan"
+require "gettext/po_entry"
+module GetText
+  class GtkBuilderUIDefinitionsParser
+    @config = {
+      :extnames => [".ui", ".glade"]
+    }
+    class << self
+      # Sets some preferences to parse GtkBuilder UI definitions files.
+      # * config: a Hash of the config. It can takes some values below:
+      #   * :extnames: An Array of target files extension.
+      #     Default is [".ui", ".glade"].
+      def init(config)
+        config.each do |k, v|
+          @config[k] = v
+        end
+      end
+      def target?(file) # :nodoc:
+        @config[:extnames].each do |extname|
+          next unless File.extname(file) == extname
+          next unless File.read(file).include?("<interface>")
+          return true
+        end
+        false
+      end
+      def parse(path, options={})
+        parser = new(path, options)
+        parser.parse
+      end
+    end
+    def initialize(path, options={})
+      @path = path
+      @options = options
+    end
+    def parse # :nodoc:
+      File.open(@path) do |file|
+        po = []
+        start_line_no = nil
+        property = nil
+        file.each_line do |line|
+          case line
+          when /<property/
+            property = $POSTMATCH
+            start_line_no = file.lineno
+            if /<\/property>/ =~ property
+              property << $PREMATCH
+              add_po_entry(po, property, start_line_no)
+              property = nil
+            end
+          when /<\/property>/
+            property << $PREMATCH
+            add_po_entry(po, property, start_line_no)
+            property = nil
+          else
+            property << line if property
+          end
+        end
+        po
+      end
+    end
+    private
+    def add_po_entry(po, property, line_no)
+      raw_attributes, raw_data_and_close_tag = property.split(">", 2)
+      raw_data, _close_tag = raw_data_and_close_tag.split("<", 2)
+      return if raw_data.empty?
+      attributes = parse_attributes(raw_attributes)
+      return unless attributes["translatable"] == "yes"
+      data = CGI.unescapeHTML(raw_data)
+      context = attributes["context"]
+      if context
+        po_entry = POEntry.new(:msgctxt)
+        po_entry.msgctxt = context
+      else
+        po_entry = POEntry.new(:normal)
+      end
+      po_entry.msgid = data
+      po_entry.references << "#{@path}:#{line_no}"
+      po << po_entry
+    end
+    def parse_attributes(raw_attributes)
+      scanner = StringScanner.new(raw_attributes)
+      attributes = {}
+      loop do
+        scanner.scan(/\s*/m)
+        break if scanner.eos?
+        name = scanner.scan(/[^=]+/)
+        break if name.nil?
+        break unless scanner.scan(/=/)
+        quote = scanner.scan(/["']/)
+        break if quote.nil?
+        value = scanner.scan(/[^#{Regexp.escape(quote)}]+/m)
+        break if value.nil?
+        break unless scanner.scan(/#{Regexp.escape(quote)}/)
+        attributes[name] = CGI.unescapeHTML(value)
+      end
+      attributes
+    end
+  end
+end

data/lib/gettext/tools/parser/ruby.rb CHANGED

@@ -1,8 +1,7 @@
-# -*- coding: utf-8 -*-
 =begin
   parser/ruby.rb - parser for ruby script
-  Copyright (C) 2013-2017  Kouhei Sutou <kou@clear-code.com>
+  Copyright (C) 2013-2021  Sutou Kouhei <kou@clear-code.com>
   Copyright (C) 2003-2009  Masao Mutoh
   Copyright (C) 2005       speakillof
   Copyright (C) 2001,2002  Yasushi Shoji, Masao Mutoh
@@ -12,162 +11,324 @@
 =end
-require "irb/ruby-lex"
+require "ripper"
 require "stringio"
-require "gettext/po_entry"
-require "ripper"
+require "gettext/po_entry"
 module GetText
-  class RubyLexX < RubyLex  # :nodoc: all
-    class StringExtractor < Ripper::Filter
+  class RubyParser
+    class POExtractor < Ripper::Filter
+      ID = ["gettext", "_", "N_", "sgettext", "s_"]
+      PLURAL_ID = ["ngettext", "n_", "Nn_", "ns_", "nsgettext"]
+      MSGCTXT_ID = ["pgettext", "p_"]
+      MSGCTXT_PLURAL_ID = ["npgettext", "np_"]
+      attr_accessor :use_comment
+      attr_accessor :comment_tag
       def initialize(*args)
-        super
+        super(*args)
+        @start_block = false
+        @in_block_arguments = false
+        @ignore_next_comma = false
+        @need_definition_name = false
+        @current_po_entry = nil
+        @current_po_entry_nth_attribute = 0
+        @use_comment = false
+        @comment_tag = nil
+        @last_comment = ""
+        @reset_comment = false
         @string_mark_stack = []
+        @string_stack = []
       end
-      def on_default(event, token, output)
-        case event
-        when :on_tstring_content
-          if @string_mark_stack.last == "\""
-            output << token.gsub(/\\./) do |data|
-              case data
-              when "\\n"
-                "\n"
-              when "\\t"
-                "\t"
-              when "\\\\"
-                "\\"
-              when "\\\""
-                "\""
-              when "\\\#"
-                "#"
-              else
-                data
-              end
-            end
-          else
-            output << token.gsub(/\\./) do |data|
-              case data
-              when "\\\\"
-                "\\"
-              when "\\'"
-                "'"
-              else
-                data
-              end
-            end
+      def process_on_op(token, po)
+        if @start_block
+          @in_block_arguments = (token == "|")
+        else
+          if @in_block_arguments and token == "|"
+            @in_block_arguments = false
           end
-        when :on_tstring_beg
-          unless @string_mark_stack.empty?
-            output << token
+        end
+        po
+      end
+      def process_on_kw(token, po)
+        store_po_entry(po)
+        case token
+        when "do"
+          @start_block = true
+        end
+        po
+      end
+      def process_on_lbrace(token, po)
+        store_po_entry(po)
+        @start_block = (state == Ripper::EXPR_BEG)
+        po
+      end
+      def process_on_ident(token, po)
+        store_po_entry(po)
+        return po if @in_block_arguments
+        return po if state.allbits?(Ripper::EXPR_ENDFN)
+        case token
+        when *ID
+          @current_po_entry = POEntry.new(:normal)
+        when *PLURAL_ID
+          @current_po_entry = POEntry.new(:plural)
+        when *MSGCTXT_ID
+          @current_po_entry = POEntry.new(:msgctxt)
+        when *MSGCTXT_PLURAL_ID
+          @current_po_entry = POEntry.new(:msgctxt_plural)
+        end
+        if @current_po_entry
+          @current_po_entry.add_comment(@last_comment) unless @last_comment.empty?
+          @last_comment = ""
+          @current_po_entry.references << "#{filename}:#{lineno}"
+          @current_po_entry_nth_attribute = 0
+        end
+        po
+      end
+      def process_on_const(token, po)
+        case token
+        when "N_", "Nn_"
+          # TODO: Check the next token is :on_lparen
+          process_on_ident(token, po)
+        else
+          po
+        end
+      end
+      def process_on_comment(token, po)
+        @last_comment = "" if @reset_comment
+        @reset_comment = false
+        if @last_comment.empty?
+          content = token.gsub(/\A#\s*/, "").chomp
+          if comment_to_be_extracted?(content)
+            @last_comment << content
           end
+        else
+          content = token.gsub(/\A#/, "").chomp
+          @last_comment << "\n"
+          @last_comment << content
+        end
+        po
+      end
+      def process_on_sp(token, po)
+        po
+      end
+      def process_on_tstring_beg(token, po)
+        if token.start_with?("%Q")
+          @string_mark_stack << "\""
+        elsif token.start_with?("%q")
+          @string_mark_stack << "'"
+        elsif token.start_with?("%")
+          @string_mark_stack << "\""
+        else
           @string_mark_stack << token
-        when :on_tstring_end
-          @string_mark_stack.pop
-          unless @string_mark_stack.empty?
-            output << token
+        end
+        @string_stack << ""
+        po
+      end
+      def process_on_tstring_content(token, po)
+        case @string_mark_stack.last
+        when "\"", "`"
+          @string_stack.last << token.gsub(/\\./) do |data|
+            case data
+            when "\\n"
+              "\n"
+            when "\\t"
+              "\t"
+            when "\\\\"
+              "\\"
+            when "\\\""
+              "\""
+            when "\\\#"
+              "#"
+            else
+              data
+            end
           end
         else
-          unless @string_mark_stack.empty?
-            output << token.to_s
+          @string_stack.last << token.gsub(/\\./) do |data|
+            case data
+            when "\\\\"
+              "\\"
+            when "\\'"
+              "'"
+            else
+              data
+            end
           end
         end
-        output
+        po
       end
-    end
-    # Parser#parse resemlbes RubyLex#lex
-    def parse
-      until (  (tk = token).kind_of?(RubyToken::TkEND_OF_SCRIPT) && !@continue or tk.nil?  )
-        s = get_readed
-        if RubyToken::TkSTRING === tk or RubyToken::TkDSTRING === tk
-          def tk.value
-            @value
+      def process_on_tstring_end(token, po)
+        @ignore_next_comma = false
+        string_mark = @string_mark_stack.pop
+        case string_mark
+        when "\"", "'"
+          last_string = @string_stack.pop
+          if @current_po_entry and last_string
+            @current_po_entry[@current_po_entry_nth_attribute] =
+              (@current_po_entry[@current_po_entry_nth_attribute] || "") +
+              last_string
           end
+        end
+        po
+      end
-          def tk.value=(s)
-            @value = s
-          end
+      def process_on_heredoc_beg(token, po)
+        if token.end_with?("'")
+          @string_mark_stack << "'"
+        else
+          @string_mark_stack << "\""
+        end
+        @string_stack << ""
+        po
+      end
-          if @here_header
-            s = s.sub(/\A.*?\n/, "").sub(/^.*\n\Z/, "")
-          else
-            s = StringExtractor.new(s).parse("")
-          end
+      def process_on_heredoc_end(token, po)
+        process_on_tstring_end(token, po)
+      end
-          tk.value = s
-        end
+      def process_on_regexp_beg(token, po)
+        @string_mark_stack << "\""
+        @string_stack << ""
+        po
+      end
+      def process_on_regexp_end(token, po)
+        @string_mark_stack.pop
+        @string_stack.pop
+        po
+      end
-        if $DEBUG
-          if tk.is_a? TkSTRING or tk.is_a? TkDSTRING
-            $stderr.puts("#{tk}: #{tk.value}")
-          elsif tk.is_a? TkIDENTIFIER
-            $stderr.puts("#{tk}: #{tk.name}")
-          else
-            $stderr.puts(tk)
+      def process_on_embexpr_beg(token, po)
+        @current_po_entry = nil
+        @current_po_entry_nth_attribute = 0
+        po
+      end
+      def process_on_int(token, po)
+        @ignore_next_comma = true
+        po
+      end
+      def process_on_comma(token, po)
+        unless @ignore_next_comma
+          if @current_po_entry
+            @current_po_entry_nth_attribute += 1
           end
         end
+        po
+      end
-        yield tk
+      def process_on_rparen(token, po)
+        store_po_entry(po)
+        po
+      end
+      def process_on_nl(token, po)
+        @reset_comment = true
+        po
+      end
+      def process_on_symbeg(token, po)
+        if token.start_with?("%s") or [":'", ":\""].include?(token)
+          @string_mark_stack << ":"
+          @string_stack << ""
+        end
+        po
+      end
+      def process_on_backtick(token, po)
+        @string_mark_stack << "`"
+        @string_stack << ""
+        po
       end
-      return nil
-    end
-    # Original parser does not keep the content of the comments,
-    # so monkey patching this with new token type and extended
-    # identify_comment implementation
-    RubyToken.def_token :TkCOMMENT_WITH_CONTENT, TkVal
+      def process_on_symbols_beg(token, po)
+        @string_mark_stack << "\""
+        @string_stack << ""
+        po
+      end
-    def identify_comment
-      @ltype = "#"
-      get_readed # skip the hash sign itself
+      def process_on_qsymbols_beg(token, po)
+        @string_mark_stack << token
+        @string_stack << ""
+        po
+      end
+      def process_on_words_beg(token, po)
+        @string_mark_stack << "\""
+        @string_stack << ""
+        po
+      end
-      while ch = getc
-        if ch == "\n"
-          @ltype = nil
-          ungetc
-          break
+      def process_on_qwords_beg(token, po)
+        @string_mark_stack << token
+        @string_stack << ""
+        po
+      end
+      def on_default(event, token, po)
+        trace(event, token) do
+          process_method = "process_#{event}"
+          start_block = @start_block
+          if respond_to?(process_method)
+            po = __send__(process_method, token, po)
+          end
+          if start_block and event != :on_sp
+            @start_block = false
+          end
+          po
         end
       end
-      return Token(TkCOMMENT_WITH_CONTENT, get_readed)
-    end
-  end
+      private
+      @@debug = ENV["GETTEXT_RUBY_PARSER_DEBUG"]
+      def debug?
+        @@debug
+      end
-  # Extends POEntry for RubyParser.
-  # Implements a sort of state machine to assist the parser.
-  module POEntryForRubyParser
-    # Supports parsing by setting attributes by and by.
-    def set_current_attribute(str)
-      param = @param_type[@param_number]
-      raise ParseError, "no more string parameters expected" unless param
-      set_value(param, str)
-    end
+      def trace(event_name, token)
+        if debug?
+          status = [
+            event_name,
+            token,
+            state,
+          ]
+          status << :start_block if @start_block
+          status << :in_block_arguments if @in_block_arguments
+          pp status
+        end
+        yield
+      end
-    def init_param
-      @param_number = 0
-      self
-    end
+      def store_po_entry(po)
+        return if @current_po_entry.nil?
+        po << @current_po_entry if @current_po_entry.msgid
+        @current_po_entry = nil
+        @current_po_entry_nth_attribute = 0
+      end
-    def advance_to_next_attribute
-      @param_number += 1
-    end
-  end
-  class POEntry
-    include POEntryForRubyParser
-    alias :initialize_old :initialize
-    def initialize(type)
-      initialize_old(type)
-      init_param
-    end
-  end
+      def comment_to_be_extracted?(comment)
+        return false unless @use_comment
-  class RubyParser
-    ID = ["gettext", "_", "N_", "sgettext", "s_"]
-    PLURAL_ID = ["ngettext", "n_", "Nn_", "ns_", "nsgettext"]
-    MSGCTXT_ID = ["pgettext", "p_"]
-    MSGCTXT_PLURAL_ID = ["npgettext", "np_"]
+        return true if @comment_tag.nil?
+        comment.start_with?(@comment_tag)
+      end
+    end
     class << self
       def target?(file)  # :nodoc:
@@ -282,106 +443,12 @@ module GetText
     end
     def parse_source(source)
-      po = []
-      file = StringIO.new(source)
-      rl = RubyLexX.new
-      rl.set_input(file)
-      rl.skip_space = true
-      #rl.readed_auto_clean_up = true
-      po_entry = nil
-      line_no = nil
-      last_comment = ""
-      reset_comment = false
-      ignore_next_comma = false
-      rl.parse do |tk|
-        begin
-          ignore_current_comma = ignore_next_comma
-          ignore_next_comma = false
-          case tk
-          when RubyToken::TkIDENTIFIER, RubyToken::TkCONSTANT
-            if store_po_entry(po, po_entry, line_no, last_comment)
-              last_comment = ""
-            end
-            if ID.include?(tk.name)
-              po_entry = POEntry.new(:normal)
-            elsif PLURAL_ID.include?(tk.name)
-              po_entry = POEntry.new(:plural)
-            elsif MSGCTXT_ID.include?(tk.name)
-              po_entry = POEntry.new(:msgctxt)
-            elsif MSGCTXT_PLURAL_ID.include?(tk.name)
-              po_entry = POEntry.new(:msgctxt_plural)
-            else
-              po_entry = nil
-            end
-            line_no = tk.line_no.to_s
-          when RubyToken::TkBITOR
-            po_entry = nil
-          when RubyToken::TkSTRING, RubyToken::TkDSTRING
-            po_entry.set_current_attribute tk.value if po_entry
-          when RubyToken::TkPLUS, RubyToken::TkNL
-            #do nothing
-          when RubyToken::TkINTEGER
-            ignore_next_comma = true
-          when RubyToken::TkCOMMA
-            unless ignore_current_comma
-              po_entry.advance_to_next_attribute if po_entry
-            end
-          else
-            if store_po_entry(po, po_entry, line_no, last_comment)
-              po_entry = nil
-              last_comment = ""
-            end
-          end
-        rescue
-          $stderr.print "\n\nError"
-          $stderr.print " parsing #{@path}:#{tk.line_no}\n\t #{source.lines.to_a[tk.line_no - 1]}" if tk
-          $stderr.print "\n #{$!.inspect} in\n"
-          $stderr.print $!.backtrace.join("\n")
-          $stderr.print "\n"
-          exit 1
-        end
-        case tk
-        when RubyToken::TkCOMMENT_WITH_CONTENT
-          last_comment = "" if reset_comment
-          if last_comment.empty?
-            comment1 = tk.value.lstrip
-            if comment_to_be_extracted?(comment1)
-              last_comment += comment1
-            end
-          else
-            last_comment += "\n"
-            last_comment += tk.value
-          end
-          reset_comment = false
-        when RubyToken::TkNL
-        else
-          reset_comment = true
-        end
+      extractor = POExtractor.new(source, @path)
+      if @options.key?(:comment_tag)
+        extractor.use_comment = true
+        extractor.comment_tag = @options[:comment_tag]
       end
-      po
-    end
-    private
-    def store_po_entry(po, po_entry, line_no, last_comment) #:nodoc:
-      if po_entry && po_entry.msgid
-        po_entry.references << @path + ":" + line_no
-        po_entry.add_comment(last_comment) unless last_comment.empty?
-        po << po_entry
-        true
-      else
-        false
-      end
-    end
-    def comment_to_be_extracted?(comment)
-      return false unless @options.has_key?(:comment_tag)
-      tag = @options[:comment_tag]
-      return true if tag.nil?
-      /\A#{Regexp.escape(tag)}/ === comment
+      extractor.parse([])
     end
   end
 end