RubyGems - ruby_parser-legacy - Versions diffs - 1.0.0 - Mend

ruby_parser-legacy 1.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (24) hide show

checksums.yaml +7 -0
checksums.yaml.gz.sig +1 -0
data.tar.gz.sig +1 -0
data/.autotest +26 -0
data/History.rdoc +6 -0
data/Manifest.txt +19 -0
data/README.rdoc +54 -0
data/Rakefile +49 -0
data/lib/ruby_parser/legacy.rb +5 -0
data/lib/ruby_parser/legacy/ruby18_parser.rb +5794 -0
data/lib/ruby_parser/legacy/ruby18_parser.y +1909 -0
data/lib/ruby_parser/legacy/ruby19_parser.rb +6186 -0
data/lib/ruby_parser/legacy/ruby19_parser.y +2117 -0
data/lib/ruby_parser/legacy/ruby_lexer.rb +1412 -0
data/lib/ruby_parser/legacy/ruby_lexer.rex +179 -0
data/lib/ruby_parser/legacy/ruby_lexer.rex.rb +323 -0
data/lib/ruby_parser/legacy/ruby_parser.rb +30 -0
data/lib/ruby_parser/legacy/ruby_parser_extras.rb +1388 -0
data/test/ruby_parser/test_legacy.rb +8 -0
data/test/ruby_parser/test_ruby_lexer.rb +2984 -0
data/test/ruby_parser/test_ruby_parser.rb +3951 -0
data/test/ruby_parser/test_ruby_parser_extras.rb +226 -0
metadata +181 -0
metadata.gz.sig +0 -0

data/lib/ruby_parser/legacy/ruby_lexer.rex ADDED

@@ -0,0 +1,179 @@
+# encoding: UTF-8
+#
+# lexical scanner definition for ruby
+class RubyParser::Legacy::RubyLexer
+macro # named regexps; the rules below splice them in with #{NAME}
+  IDENT         /^#{IDENT_CHAR}+/o
+  ESC           /\\((?>[0-7]{1,3}|x[0-9a-fA-F]{1,2}|M-[^\\]|(C-|c)[^\\]|u[0-9a-fA-F]+|u\{[0-9a-fA-F]+\}|[^0-7xMCc]))/
+  SIMPLE_STRING /((#{ESC}|\#(#{ESC}|[^\{\#\@\$\"\\])|[^\"\\\#])*)/o
+  SSTRING       /((\\.|[^\'])*)/
+  INT_DEC       /[+]?(?:(?:[1-9][\d_]*|0)(?!\.\d)(ri|r|i)?\b|0d[0-9_]+)(ri|r|i)?/i
+  INT_HEX       /[+]?0x[a-f0-9_]+(ri|r|i)?/i
+  INT_BIN       /[+]?0b[01_]+(ri|r|i)?/i
+  INT_OCT       /[+]?0o?[0-7_]+(ri|r|i)?|0o(ri|r|i)?/i
+  FLOAT         /[+]?\d[\d_]*\.[\d_]+(e[+-]?[\d_]+)?(?:(ri|r|i)\b)?|[+]?[\d_]+e[+-]?[\d_]+(?:(ri|r|i)\b)?/i
+  INT_DEC2      /[+]?\d[0-9_]*(?![e])((ri|r|i)\b)?/i
+  NUM_BAD       /[+]?0[xbd]\b/i
+  INT_OCT_BAD   /[+]?0o?[0-7_]*[89]/i
+  FLOAT_BAD     /[+]?\d[\d_]*_(e|\.)/i
+start # statements emitted at the top of the generated next_token, before any rule is tried
+  return process_string if lex_strterm
+  self.cmd_state = self.command_start
+  self.command_start = false
+  self.space_seen    = false # TODO: rename token_seen?
+  self.last_state    = lex_state
+rule # tried top to bottom, first match wins; ": /re/" opens a group and its "|" lines are tried only if /re/ matches here
+# [:state]      pattern                 [actions]  -- a leading name? is a predicate that must hold; { } actions run inline, bare names are methods called with the matched text
+                # whitespace other than newline: \s - \n + \v
+                /[\ \t\r\f\v]/          { self.space_seen = true; next }
+                /\n|\#/                 process_newline_or_comment
+                /[\]\)\}]/              process_brace_close
+: /\!/
+| in_arg_state? /\!\@/                  { result :expr_arg, :tUBANG, "!@" }
+|               /\![=~]?/               { result :arg_state, TOKENS[text], text }
+: /\./
+|               /\.\.\.?/               { result :expr_beg, TOKENS[text], text }
+|               /\.\d/                  { rb_compile_error "no .<digit> floating literal anymore put 0 before dot" }
+|               /\./                    { self.lex_state = :expr_beg; result :expr_dot, :tDOT, "." }
+                /\(/                    process_paren
+# TODO: :expr_beg|:expr_label
+                /\,/                    { result :expr_beg, TOKENS[text], text }
+: /=/
+|               /\=\=\=|\=\=|\=~|\=>|\=(?!begin\b)/ { result arg_state, TOKENS[text], text }
+| bol?          /\=begin(?=\s)/         process_begin
+|               /\=(?=begin\b)/         { result arg_state, TOKENS[text], text }
+ruby22_label?   /\"#{SIMPLE_STRING}\":/o process_label
+                /\"(#{SIMPLE_STRING})\"/o { result :expr_end, :tSTRING, text[1..-2].gsub(ESC) { unescape $1 } }
+                /\"/                    { string STR_DQUOTE; result nil, :tSTRING_BEG, text }
+                /\@\@?\d/               { rb_compile_error "`#{text}` is not allowed as a variable name" }
+                /\@\@?#{IDENT_CHAR}+/o  process_ivar
+: /:/
+| not_end?      /:([a-zA-Z_]#{IDENT_CHAR}*(?:[?]|[!](?!=)|=(?==>)|=(?![=>]))?)/o process_symbol
+| not_end?      /\:\"(#{SIMPLE_STRING})\"/o process_symbol
+| not_end?      /\:\'(#{SSTRING})\'/o       process_symbol
+|               /\:\:/                      process_colon2
+|               /\:/                        process_colon1
+                /->/                    { result :expr_endfn, :tLAMBDA, nil }
+                /[+-]/                  process_plus_minus
+: /[+\d]/
+|               /#{NUM_BAD}/o           { rb_compile_error "Invalid numeric format"  }
+|               /#{INT_DEC}/o           { int_with_base 10                           }
+|               /#{INT_HEX}/o           { int_with_base 16                           }
+|               /#{INT_BIN}/o           { int_with_base 2                            }
+|               /#{INT_OCT_BAD}/o       { rb_compile_error "Illegal octal digit."    }
+|               /#{INT_OCT}/o           { int_with_base 8                            }
+|               /#{FLOAT_BAD}/o         { rb_compile_error "Trailing '_' in number." }
+|               /#{FLOAT}/o             process_float
+|               /#{INT_DEC2}/o          { int_with_base 10                           }
+|               /[0-9]/                 { rb_compile_error "Bad number format" }
+                /\[/                    process_square_bracket
+was_label?        /\'#{SSTRING}\':?/o   process_label_or_string
+: /\|/
+|               /\|\|\=/                { result :expr_beg, :tOP_ASGN, "||" }
+|               /\|\|/                  { result :expr_beg, :tOROP,    "||" }
+|               /\|\=/                  { result :expr_beg, :tOP_ASGN, "|" }
+|               /\|/                    { result :arg_state, :tPIPE,    "|" }
+                /\{/                    process_brace_open
+: /\*/
+|               /\*\*=/                 { result :expr_beg, :tOP_ASGN, "**" }
+|               /\*\*/                  { result(:arg_state, space_vs_beginning(:tDSTAR, :tDSTAR, :tPOW), "**") }
+|               /\*\=/                  { result(:expr_beg, :tOP_ASGN, "*") }
+|               /\*/                    { result(:arg_state, space_vs_beginning(:tSTAR, :tSTAR, :tSTAR2), "*") }
+# TODO: fix result+process_lchevron to set command_start = true
+: /</
+|               /\<\=\>/                { result :arg_state, :tCMP, "<=>"    }
+|               /\<\=/                  { result :arg_state, :tLEQ, "<="     }
+|               /\<\<\=/                { result :expr_beg,  :tOP_ASGN, "<<" }
+|               /\<\</                  process_lchevron
+|               /\</                    { result :arg_state, :tLT, "<"       }
+: />/
+|               /\>\=/                  { result :arg_state, :tGEQ, ">="     }
+|               /\>\>=/                 { result :expr_beg,  :tOP_ASGN, ">>" }
+|               /\>\>/                  { result :arg_state, :tRSHFT, ">>"   }
+|               /\>/                    { result :arg_state, :tGT, ">"       }
+: /\`/
+| expr_fname?   /\`/                   { result(:expr_end, :tBACK_REF2, "`") }
+| expr_dot?     /\`/                   { result((cmd_state ? :expr_cmdarg : :expr_arg), :tBACK_REF2, "`") }
+|               /\`/                   { string STR_XQUOTE, '`'; result(nil, :tXSTRING_BEG, "`") }
+                /\?/                    process_questionmark
+: /&/
+|               /\&\&\=/                { result(:expr_beg, :tOP_ASGN, "&&") }
+|               /\&\&/                  { result(:expr_beg, :tANDOP,   "&&") }
+|               /\&\=/                  { result(:expr_beg, :tOP_ASGN, "&" ) }
+|               /\&\./                  { result(:expr_dot, :tLONELY,  "&.") }
+|               /\&/                    process_amper
+                /\//                    process_slash
+: /\^/
+|               /\^=/                   { result(:expr_beg, :tOP_ASGN, "^") }
+|               /\^/                    { result(:arg_state, :tCARET, "^") }
+                /\;/                    { self.command_start = true; result(:expr_beg, :tSEMI, ";") }
+: /~/
+| in_arg_state? /\~@/                   { result(:arg_state, :tTILDE, "~") }
+|               /\~/                    { result(:arg_state, :tTILDE, "~") }
+: /\\/
+|               /\\\r?\n/               { self.lineno += 1; self.space_seen = true; next }
+|               /\\/                    { rb_compile_error "bare backslash only allowed before newline" }
+                /\%/                    process_percent
+: /\$/
+|               /\$_\w+/                         process_gvar
+|               /\$_/                            process_gvar
+|               /\$[~*$?!@\/\\;,.=:<>\"]|\$-\w?/ process_gvar
+| in_fname?     /\$([\&\`\'\+])/                 process_gvar
+|               /\$([\&\`\'\+])/                 process_backref
+| in_fname?     /\$([1-9]\d*)/                   process_gvar
+|               /\$([1-9]\d*)/                   process_nthref
+|               /\$0/                            process_gvar
+|               /\$\W|\$\z/                      process_gvar_oddity
+|               /\$\w+/                          process_gvar
+                /\_/                    process_underscore
+                /#{IDENT}/o             process_token
+                /\004|\032|\000|\Z/     { [RubyLexer::EOF, RubyLexer::EOF] }
+                /./                     { rb_compile_error "Invalid char #{text.inspect} in expression" }
+end

data/lib/ruby_parser/legacy/ruby_lexer.rex.rb ADDED

@@ -0,0 +1,323 @@
+# encoding: UTF-8
+#--
+# This file is automatically generated. Do not modify it.
+# Generated by: oedipus_lex version 2.5.0.
+# Source: lib/ruby_parser/legacy/ruby_lexer.rex
+#++
+#
+# lexical scanner definition for ruby
+class RubyParser::Legacy::RubyLexer
+  require 'strscan' # provides StringScanner, the default scanner_class
+  IDENT         = /^#{IDENT_CHAR}+/o # NOTE(review): IDENT_CHAR is not defined in this file; presumably defined before this file loads -- confirm
+  ESC           = /\\((?>[0-7]{1,3}|x[0-9a-fA-F]{1,2}|M-[^\\]|(C-|c)[^\\]|u[0-9a-fA-F]+|u\{[0-9a-fA-F]+\}|[^0-7xMCc]))/ # backslash escape: octal, x-hex, M-, C-/c, u-hex, or any other single char
+  SIMPLE_STRING = /((#{ESC}|\#(#{ESC}|[^\{\#\@\$\"\\])|[^\"\\\#])*)/o # double-quoted body with no "#{", "#@" or "#$" sequence
+  SSTRING       = /((\\.|[^\'])*)/ # single-quoted body: backslash pairs or non-quote chars
+  INT_DEC       = /[+]?(?:(?:[1-9][\d_]*|0)(?!\.\d)(ri|r|i)?\b|0d[0-9_]+)(ri|r|i)?/i
+  INT_HEX       = /[+]?0x[a-f0-9_]+(ri|r|i)?/i
+  INT_BIN       = /[+]?0b[01_]+(ri|r|i)?/i
+  INT_OCT       = /[+]?0o?[0-7_]+(ri|r|i)?|0o(ri|r|i)?/i
+  FLOAT         = /[+]?\d[\d_]*\.[\d_]+(e[+-]?[\d_]+)?(?:(ri|r|i)\b)?|[+]?[\d_]+e[+-]?[\d_]+(?:(ri|r|i)\b)?/i
+  INT_DEC2      = /[+]?\d[0-9_]*(?![e])((ri|r|i)\b)?/i
+  NUM_BAD       = /[+]?0[xbd]\b/i # base prefix followed by a word boundary instead of digits; next_token raises on it
+  INT_OCT_BAD   = /[+]?0o?[0-7_]*[89]/i # octal-looking literal containing an 8 or 9; next_token raises on it
+  FLOAT_BAD     = /[+]?\d[\d_]*_(e|\.)/i # underscore directly before "e" or "."; next_token raises on it
+  class LexerError < StandardError ; end # raised by next_token for a malformed token result
+  class ScanError < LexerError ; end # raised by next_token when no rule matches or the state is unknown
+  attr_accessor :filename
+  attr_accessor :ss
+  attr_accessor :state
+  alias :match :ss # match is a second name for the ss reader
+  def matches
+    m = (1..9).map { |i| ss[i] }
+    m.pop until m[-1] or m.empty?
+    m
+  end
+  def action # runs the given block and returns its value; next_token wraps inline rule actions in it
+    yield
+  end
+  def scanner_class # class that parse instantiates over the input string
+    StringScanner
+  end unless instance_methods(false).map(&:to_s).include?("scanner_class") # keep a scanner_class this class already defines
+  def parse str
+    self.ss     = scanner_class.new str
+    self.state  ||= nil
+    do_parse
+  end
+  def parse_file path
+    self.filename = path
+    open path do |f|
+      parse f.read
+    end
+  end
+  def location
+    [
+      (filename || "<input>"),
+    ].compact.join(":")
+  end
+  def next_token # returns the next token (an Array of 2+ elements) or nil once input is exhausted
+    return process_string if lex_strterm # result of process_string is returned as-is, without the checks below
+    self.cmd_state = self.command_start
+    self.command_start = false
+    self.space_seen    = false # TODO: rename token_seen?
+    self.last_state    = lex_state
+    token = nil
+    until ss.eos? or token do # keep scanning until some rule yields a token or the input runs out
+      token =
+        case state
+        when nil then
+          case
+          when ss.skip(/[\ \t\r\f\v]/) then
+            action { self.space_seen = true; next } # next leaves the block with nil, so the loop scans again
+          when text = ss.scan(/\n|\#/) then
+            process_newline_or_comment text
+          when text = ss.scan(/[\]\)\}]/) then
+            process_brace_close text
+          when ss.match?(/\!/) then # group head: checked without consuming; alternatives below are tried in order
+            case
+            when in_arg_state? && (ss.skip(/\!\@/)) then
+              action { result :expr_arg, :tUBANG, "!@" }
+            when text = ss.scan(/\![=~]?/) then
+              action { result :arg_state, TOKENS[text], text }
+            end # group /\!/
+          when ss.match?(/\./) then
+            case
+            when text = ss.scan(/\.\.\.?/) then
+              action { result :expr_beg, TOKENS[text], text }
+            when ss.skip(/\.\d/) then
+              action { rb_compile_error "no .<digit> floating literal anymore put 0 before dot" }
+            when ss.skip(/\./) then
+              action { self.lex_state = :expr_beg; result :expr_dot, :tDOT, "." }
+            end # group /\./
+          when text = ss.scan(/\(/) then
+            process_paren text
+          when text = ss.scan(/\,/) then
+            action { result :expr_beg, TOKENS[text], text }
+          when ss.match?(/=/) then
+            case
+            when text = ss.scan(/\=\=\=|\=\=|\=~|\=>|\=(?!begin\b)/) then
+              action { result arg_state, TOKENS[text], text }
+            when bol? && (text = ss.scan(/\=begin(?=\s)/)) then
+              process_begin text
+            when text = ss.scan(/\=(?=begin\b)/) then
+              action { result arg_state, TOKENS[text], text }
+            end # group /=/
+          when ruby22_label? && (text = ss.scan(/\"#{SIMPLE_STRING}\":/o)) then
+            process_label text
+          when text = ss.scan(/\"(#{SIMPLE_STRING})\"/o) then
+            action { result :expr_end, :tSTRING, text[1..-2].gsub(ESC) { unescape $1 } }
+          when text = ss.scan(/\"/) then
+            action { string STR_DQUOTE; result nil, :tSTRING_BEG, text }
+          when text = ss.scan(/\@\@?\d/) then
+            action { rb_compile_error "`#{text}` is not allowed as a variable name" }
+          when text = ss.scan(/\@\@?#{IDENT_CHAR}+/o) then
+            process_ivar text
+          when ss.match?(/:/) then
+            case
+            when not_end? && (text = ss.scan(/:([a-zA-Z_]#{IDENT_CHAR}*(?:[?]|[!](?!=)|=(?==>)|=(?![=>]))?)/o)) then
+              process_symbol text
+            when not_end? && (text = ss.scan(/\:\"(#{SIMPLE_STRING})\"/o)) then
+              process_symbol text
+            when not_end? && (text = ss.scan(/\:\'(#{SSTRING})\'/o)) then
+              process_symbol text
+            when text = ss.scan(/\:\:/) then
+              process_colon2 text
+            when text = ss.scan(/\:/) then
+              process_colon1 text
+            end # group /:/
+          when ss.skip(/->/) then
+            action { result :expr_endfn, :tLAMBDA, nil }
+          when text = ss.scan(/[+-]/) then
+            process_plus_minus text
+          when ss.match?(/[+\d]/) then
+            case
+            when ss.skip(/#{NUM_BAD}/o) then
+              action { rb_compile_error "Invalid numeric format"  }
+            when ss.skip(/#{INT_DEC}/o) then
+              action { int_with_base 10                           }
+            when ss.skip(/#{INT_HEX}/o) then
+              action { int_with_base 16                           }
+            when ss.skip(/#{INT_BIN}/o) then
+              action { int_with_base 2                            }
+            when ss.skip(/#{INT_OCT_BAD}/o) then
+              action { rb_compile_error "Illegal octal digit."    }
+            when ss.skip(/#{INT_OCT}/o) then
+              action { int_with_base 8                            }
+            when ss.skip(/#{FLOAT_BAD}/o) then
+              action { rb_compile_error "Trailing '_' in number." }
+            when text = ss.scan(/#{FLOAT}/o) then
+              process_float text
+            when ss.skip(/#{INT_DEC2}/o) then
+              action { int_with_base 10                           }
+            when ss.skip(/[0-9]/) then
+              action { rb_compile_error "Bad number format" }
+            end # group /[+\d]/
+          when text = ss.scan(/\[/) then
+            process_square_bracket text
+          when was_label? && (text = ss.scan(/\'#{SSTRING}\':?/o)) then
+            process_label_or_string text
+          when ss.match?(/\|/) then
+            case
+            when ss.skip(/\|\|\=/) then
+              action { result :expr_beg, :tOP_ASGN, "||" }
+            when ss.skip(/\|\|/) then
+              action { result :expr_beg, :tOROP,    "||" }
+            when ss.skip(/\|\=/) then
+              action { result :expr_beg, :tOP_ASGN, "|" }
+            when ss.skip(/\|/) then
+              action { result :arg_state, :tPIPE,    "|" }
+            end # group /\|/
+          when text = ss.scan(/\{/) then
+            process_brace_open text
+          when ss.match?(/\*/) then
+            case
+            when ss.skip(/\*\*=/) then
+              action { result :expr_beg, :tOP_ASGN, "**" }
+            when ss.skip(/\*\*/) then
+              action { result(:arg_state, space_vs_beginning(:tDSTAR, :tDSTAR, :tPOW), "**") }
+            when ss.skip(/\*\=/) then
+              action { result(:expr_beg, :tOP_ASGN, "*") }
+            when ss.skip(/\*/) then
+              action { result(:arg_state, space_vs_beginning(:tSTAR, :tSTAR, :tSTAR2), "*") }
+            end # group /\*/
+          when ss.match?(/</) then
+            case
+            when ss.skip(/\<\=\>/) then
+              action { result :arg_state, :tCMP, "<=>"    }
+            when ss.skip(/\<\=/) then
+              action { result :arg_state, :tLEQ, "<="     }
+            when ss.skip(/\<\<\=/) then
+              action { result :expr_beg,  :tOP_ASGN, "<<" }
+            when text = ss.scan(/\<\</) then
+              process_lchevron text
+            when ss.skip(/\</) then
+              action { result :arg_state, :tLT, "<"       }
+            end # group /</
+          when ss.match?(/>/) then
+            case
+            when ss.skip(/\>\=/) then
+              action { result :arg_state, :tGEQ, ">="     }
+            when ss.skip(/\>\>=/) then
+              action { result :expr_beg,  :tOP_ASGN, ">>" }
+            when ss.skip(/\>\>/) then
+              action { result :arg_state, :tRSHFT, ">>"   }
+            when ss.skip(/\>/) then
+              action { result :arg_state, :tGT, ">"       }
+            end # group />/
+          when ss.match?(/\`/) then
+            case
+            when expr_fname? && (ss.skip(/\`/)) then
+              action { result(:expr_end, :tBACK_REF2, "`") }
+            when expr_dot? && (ss.skip(/\`/)) then
+              action { result((cmd_state ? :expr_cmdarg : :expr_arg), :tBACK_REF2, "`") }
+            when ss.skip(/\`/) then
+              action { string STR_XQUOTE, '`'; result(nil, :tXSTRING_BEG, "`") }
+            end # group /\`/
+          when text = ss.scan(/\?/) then
+            process_questionmark text
+          when ss.match?(/&/) then
+            case
+            when ss.skip(/\&\&\=/) then
+              action { result(:expr_beg, :tOP_ASGN, "&&") }
+            when ss.skip(/\&\&/) then
+              action { result(:expr_beg, :tANDOP,   "&&") }
+            when ss.skip(/\&\=/) then
+              action { result(:expr_beg, :tOP_ASGN, "&" ) }
+            when ss.skip(/\&\./) then
+              action { result(:expr_dot, :tLONELY,  "&.") }
+            when text = ss.scan(/\&/) then
+              process_amper text
+            end # group /&/
+          when text = ss.scan(/\//) then
+            process_slash text
+          when ss.match?(/\^/) then
+            case
+            when ss.skip(/\^=/) then
+              action { result(:expr_beg, :tOP_ASGN, "^") }
+            when ss.skip(/\^/) then
+              action { result(:arg_state, :tCARET, "^") }
+            end # group /\^/
+          when ss.skip(/\;/) then
+            action { self.command_start = true; result(:expr_beg, :tSEMI, ";") }
+          when ss.match?(/~/) then
+            case
+            when in_arg_state? && (ss.skip(/\~@/)) then
+              action { result(:arg_state, :tTILDE, "~") }
+            when ss.skip(/\~/) then
+              action { result(:arg_state, :tTILDE, "~") }
+            end # group /~/
+          when ss.match?(/\\/) then
+            case
+            when ss.skip(/\\\r?\n/) then
+              action { self.lineno += 1; self.space_seen = true; next }
+            when ss.skip(/\\/) then
+              action { rb_compile_error "bare backslash only allowed before newline" }
+            end # group /\\/
+          when text = ss.scan(/\%/) then
+            process_percent text
+          when ss.match?(/\$/) then
+            case
+            when text = ss.scan(/\$_\w+/) then
+              process_gvar text
+            when text = ss.scan(/\$_/) then
+              process_gvar text
+            when text = ss.scan(/\$[~*$?!@\/\\;,.=:<>\"]|\$-\w?/) then
+              process_gvar text
+            when in_fname? && (text = ss.scan(/\$([\&\`\'\+])/)) then
+              process_gvar text
+            when text = ss.scan(/\$([\&\`\'\+])/) then
+              process_backref text
+            when in_fname? && (text = ss.scan(/\$([1-9]\d*)/)) then
+              process_gvar text
+            when text = ss.scan(/\$([1-9]\d*)/) then
+              process_nthref text
+            when text = ss.scan(/\$0/) then
+              process_gvar text
+            when text = ss.scan(/\$\W|\$\z/) then
+              process_gvar_oddity text
+            when text = ss.scan(/\$\w+/) then
+              process_gvar text
+            end # group /\$/
+          when text = ss.scan(/\_/) then
+            process_underscore text
+          when text = ss.scan(/#{IDENT}/o) then
+            process_token text
+          when ss.skip(/\004|\032|\000|\Z/) then
+            action { [RubyLexer::EOF, RubyLexer::EOF] }
+          when text = ss.scan(/./) then
+            action { rb_compile_error "Invalid char #{text.inspect} in expression" }
+          else # no rule matched at the current scan position
+            text = ss.string[ss.pos .. -1]
+            raise ScanError, "can not match (#{state.inspect}) at #{location}: '#{text}'"
+          end
+        else # only the nil state has rules
+          raise ScanError, "undefined state at #{location}: '#{state}'"
+        end # token = case state
+      next unless token # allow functions to trigger redo w/ nil
+    end # while
+    raise LexerError, "bad lexical result at #{location}: #{token.inspect}" unless
+      token.nil? || (Array === token && token.size >= 2) # anything other than nil or a 2+ element Array is rejected
+    # auto-switch state
+    self.state = token.last if token && token.first == :state
+    token
+  end # def next_token
+end # class