RubyGems - regexp_parser - Versions diffs - 1.5.0 → 1.8.0 - Mend

regexp_parser 1.5.0 → 1.8.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (87)

checksums.yaml +4 -4
data/CHANGELOG.md +59 -0
data/Gemfile +3 -3
data/README.md +14 -6
data/Rakefile +3 -4
data/lib/regexp_parser/expression.rb +6 -43
data/lib/regexp_parser/expression/classes/conditional.rb +3 -2
data/lib/regexp_parser/expression/classes/escape.rb +0 -4
data/lib/regexp_parser/expression/methods/match.rb +13 -0
data/lib/regexp_parser/expression/methods/match_length.rb +1 -1
data/lib/regexp_parser/expression/methods/options.rb +35 -0
data/lib/regexp_parser/expression/methods/strfregexp.rb +0 -1
data/lib/regexp_parser/expression/methods/tests.rb +6 -15
data/lib/regexp_parser/expression/methods/traverse.rb +3 -1
data/lib/regexp_parser/expression/sequence.rb +3 -2
data/lib/regexp_parser/expression/sequence_operation.rb +2 -6
data/lib/regexp_parser/lexer.rb +4 -25
data/lib/regexp_parser/parser.rb +40 -33
data/lib/regexp_parser/scanner.rb +1208 -1353
data/lib/regexp_parser/scanner/char_type.rl +0 -3
data/lib/regexp_parser/scanner/properties/long.yml +15 -1
data/lib/regexp_parser/scanner/properties/short.yml +5 -0
data/lib/regexp_parser/scanner/scanner.rl +116 -202
data/lib/regexp_parser/syntax/tokens/unicode_property.rb +30 -0
data/lib/regexp_parser/syntax/versions/2.6.2.rb +10 -0
data/lib/regexp_parser/syntax/versions/2.6.3.rb +10 -0
data/lib/regexp_parser/version.rb +1 -1
data/spec/expression/base_spec.rb +14 -0
data/spec/expression/methods/match_length_spec.rb +20 -0
data/spec/expression/methods/match_spec.rb +25 -0
data/spec/expression/methods/tests_spec.rb +2 -0
data/spec/expression/methods/traverse_spec.rb +21 -0
data/spec/expression/options_spec.rb +128 -0
data/spec/expression/root_spec.rb +9 -0
data/spec/expression/sequence_spec.rb +9 -0
data/spec/lexer/conditionals_spec.rb +49 -119
data/spec/lexer/delimiters_spec.rb +68 -0
data/spec/lexer/escapes_spec.rb +8 -32
data/spec/lexer/keep_spec.rb +5 -17
data/spec/lexer/literals_spec.rb +73 -110
data/spec/lexer/nesting_spec.rb +86 -117
data/spec/lexer/refcalls_spec.rb +51 -50
data/spec/parser/all_spec.rb +13 -1
data/spec/parser/anchors_spec.rb +9 -23
data/spec/parser/conditionals_spec.rb +9 -9
data/spec/parser/errors_spec.rb +22 -43
data/spec/parser/escapes_spec.rb +33 -44
data/spec/parser/free_space_spec.rb +25 -4
data/spec/parser/groups_spec.rb +98 -257
data/spec/parser/keep_spec.rb +2 -15
data/spec/parser/options_spec.rb +28 -0
data/spec/parser/posix_classes_spec.rb +5 -24
data/spec/parser/properties_spec.rb +42 -54
data/spec/parser/quantifiers_spec.rb +42 -283
data/spec/parser/refcalls_spec.rb +60 -185
data/spec/parser/set/intersections_spec.rb +17 -17
data/spec/parser/set/ranges_spec.rb +17 -17
data/spec/parser/sets_spec.rb +5 -5
data/spec/parser/types_spec.rb +11 -36
data/spec/scanner/anchors_spec.rb +13 -28
data/spec/scanner/conditionals_spec.rb +121 -173
data/spec/scanner/delimiters_spec.rb +52 -0
data/spec/scanner/errors_spec.rb +64 -87
data/spec/scanner/escapes_spec.rb +53 -50
data/spec/scanner/free_space_spec.rb +102 -165
data/spec/scanner/groups_spec.rb +45 -64
data/spec/scanner/keep_spec.rb +5 -28
data/spec/scanner/literals_spec.rb +45 -81
data/spec/scanner/meta_spec.rb +13 -33
data/spec/scanner/options_spec.rb +36 -0
data/spec/scanner/properties_spec.rb +43 -286
data/spec/scanner/quantifiers_spec.rb +13 -28
data/spec/scanner/refcalls_spec.rb +32 -48
data/spec/scanner/sets_spec.rb +88 -102
data/spec/scanner/types_spec.rb +10 -25
data/spec/spec_helper.rb +1 -0
data/spec/support/shared_examples.rb +77 -0
data/spec/syntax/syntax_spec.rb +4 -0
data/spec/syntax/versions/1.8.6_spec.rb +12 -33
data/spec/syntax/versions/1.9.1_spec.rb +5 -18
data/spec/syntax/versions/1.9.3_spec.rb +4 -17
data/spec/syntax/versions/2.0.0_spec.rb +8 -23
data/spec/syntax/versions/2.2.0_spec.rb +4 -17
data/spec/syntax/versions/aliases_spec.rb +27 -109
metadata +28 -10
data/spec/scanner/scripts_spec.rb +0 -49
data/spec/scanner/unicode_blocks_spec.rb +0 -28

data/spec/lexer/refcalls_spec.rb CHANGED

@@ -1,54 +1,55 @@
 require 'spec_helper'
 RSpec.describe('RefCall lexing') do
-  tests = {
-    # Traditional numerical group back-reference
-    '(abc)\1'           => [3, :backref, :number,                '\1',         5,  7, 0, 0, 0],
-    # Group back-references, named, numbered, and relative
-    '(?<X>abc)\k<X>'    => [3, :backref, :name_ref,              '\k<X>',      9, 14, 0, 0, 0],
-    "(?<X>abc)\\k'X'"   => [3, :backref, :name_ref,              "\\k'X'",     9, 14, 0, 0, 0],
-    '(abc)\k<1>'        => [3, :backref, :number_ref,            '\k<1>',      5, 10, 0, 0, 0],
-    "(abc)\\k'1'"       => [3, :backref, :number_ref,            "\\k'1'",     5, 10, 0, 0, 0],
-    '(abc)\k<-1>'       => [3, :backref, :number_rel_ref,        '\k<-1>',     5, 11, 0, 0, 0],
-    "(abc)\\k'-1'"      => [3, :backref, :number_rel_ref,        "\\k'-1'",    5, 11, 0, 0, 0],
-    # Sub-expression invocation, named, numbered, and relative
-    '(?<X>abc)\g<X>'    => [3, :backref, :name_call,             '\g<X>',      9, 14, 0, 0, 0],
-    "(?<X>abc)\\g'X'"   => [3, :backref, :name_call,             "\\g'X'",     9, 14, 0, 0, 0],
-    '(abc)\g<1>'        => [3, :backref, :number_call,           '\g<1>',      5, 10, 0, 0, 0],
-    "(abc)\\g'1'"       => [3, :backref, :number_call,           "\\g'1'",     5, 10, 0, 0, 0],
-    '(abc)\g<-1>'       => [3, :backref, :number_rel_call,       '\g<-1>',     5, 11, 0, 0, 0],
-    "(abc)\\g'-1'"      => [3, :backref, :number_rel_call,       "\\g'-1'",    5, 11, 0, 0, 0],
-    '(abc)\g<+1>'       => [3, :backref, :number_rel_call,       '\g<+1>',     5, 11, 0, 0, 0],
-    "(abc)\\g'+1'"      => [3, :backref, :number_rel_call,       "\\g'+1'",    5, 11, 0, 0, 0],
-    # Group back-references, with nesting level
-    '(?<X>abc)\k<X-0>'  => [3, :backref, :name_recursion_ref,    '\k<X-0>',    9, 16, 0, 0, 0],
-    "(?<X>abc)\\k'X-0'" => [3, :backref, :name_recursion_ref,    "\\k'X-0'",   9, 16, 0, 0, 0],
-    '(abc)\k<1-0>'      => [3, :backref, :number_recursion_ref,  '\k<1-0>',    5, 12, 0, 0, 0],
-    "(abc)\\k'1-0'"     => [3, :backref, :number_recursion_ref,  "\\k'1-0'",   5, 12, 0, 0, 0],
-  }
-  tests.each_with_index do |(pattern, (index, type, token, text, ts, te, level, set_level, conditional_level)), count|
-    specify("lexer_#{type}_#{token}_#{count}") do
-      tokens = RL.lex(pattern, 'ruby/1.9')
-      struct = tokens.at(index)
-      expect(struct.type).to eq type
-      expect(struct.token).to eq token
-      expect(struct.text).to eq text
-      expect(struct.ts).to eq ts
-      expect(struct.te).to eq te
-      expect(struct.level).to eq level
-      expect(struct.set_level).to eq set_level
-      expect(struct.conditional_level).to eq conditional_level
-    end
-  end
+  # Traditional numerical group back-reference
+  include_examples 'lex', '(abc)\1',
+    3 => [:backref, :number,                '\1',         5,  7, 0, 0, 0]
+  # Group back-references, named, numbered, and relative
+  include_examples 'lex', '(?<X>abc)\k<X>',
+    3 => [:backref, :name_ref,              '\k<X>',      9, 14, 0, 0, 0]
+  include_examples 'lex', "(?<X>abc)\\k'X'",
+    3 => [:backref, :name_ref,              "\\k'X'",     9, 14, 0, 0, 0]
+  include_examples 'lex', '(abc)\k<1>',
+    3 => [:backref, :number_ref,            '\k<1>',      5, 10, 0, 0, 0]
+  include_examples 'lex', "(abc)\\k'1'",
+    3 => [:backref, :number_ref,            "\\k'1'",     5, 10, 0, 0, 0]
+  include_examples 'lex', '(abc)\k<-1>',
+    3 => [:backref, :number_rel_ref,        '\k<-1>',     5, 11, 0, 0, 0]
+  include_examples 'lex', "(abc)\\k'-1'",
+    3 => [:backref, :number_rel_ref,        "\\k'-1'",    5, 11, 0, 0, 0]
+  # Sub-expression invocation, named, numbered, and relative
+  include_examples 'lex', '(?<X>abc)\g<X>',
+    3 => [:backref, :name_call,             '\g<X>',      9, 14, 0, 0, 0]
+  include_examples 'lex', "(?<X>abc)\\g'X'",
+    3 => [:backref, :name_call,             "\\g'X'",     9, 14, 0, 0, 0]
+  include_examples 'lex', '(abc)\g<1>',
+    3 => [:backref, :number_call,           '\g<1>',      5, 10, 0, 0, 0]
+  include_examples 'lex', "(abc)\\g'1'",
+    3 => [:backref, :number_call,           "\\g'1'",     5, 10, 0, 0, 0]
+  include_examples 'lex', '(abc)\g<-1>',
+    3 => [:backref, :number_rel_call,       '\g<-1>',     5, 11, 0, 0, 0]
+  include_examples 'lex', "(abc)\\g'-1'",
+    3 => [:backref, :number_rel_call,       "\\g'-1'",    5, 11, 0, 0, 0]
+  include_examples 'lex', '(abc)\g<+1>',
+    3 => [:backref, :number_rel_call,       '\g<+1>',     5, 11, 0, 0, 0]
+  include_examples 'lex', "(abc)\\g'+1'",
+    3 => [:backref, :number_rel_call,       "\\g'+1'",    5, 11, 0, 0, 0]
+  # Group back-references, with nesting level
+  include_examples 'lex', '(?<X>abc)\k<X-0>',
+    3 => [:backref, :name_recursion_ref,    '\k<X-0>',    9, 16, 0, 0, 0]
+  include_examples 'lex', "(?<X>abc)\\k'X-0'",
+    3 => [:backref, :name_recursion_ref,    "\\k'X-0'",   9, 16, 0, 0, 0]
+  include_examples 'lex', '(abc)\k<1-0>',
+    3 => [:backref, :number_recursion_ref,  '\k<1-0>',    5, 12, 0, 0, 0]
+  include_examples 'lex', "(abc)\\k'1-0'",
+    3 => [:backref, :number_recursion_ref,  "\\k'1-0'",   5, 12, 0, 0, 0]
 end

data/spec/parser/all_spec.rb CHANGED

@@ -2,7 +2,11 @@ require 'spec_helper'
 RSpec.describe(Regexp::Parser) do
   specify('parse returns a root expression') do
-    expect(RP.parse('abc')).to be_instance_of(Regexp::Expression::Root)
+    expect(RP.parse('abc')).to be_instance_of(Root)
+  end
+  specify('parse can be called with block') do
+    expect(RP.parse('abc') { |root| root.class }).to eq Root
   end
   specify('parse root contains expressions') do
@@ -10,6 +14,14 @@ RSpec.describe(Regexp::Parser) do
     expect(root.expressions).to all(be_a Regexp::Expression::Base)
   end
+  specify('parse root options mi') do
+    root = RP.parse(/[abc]/mi, 'ruby/1.8')
+    expect(root.m?).to be true
+    expect(root.i?).to be true
+    expect(root.x?).to be false
+  end
   specify('parse node types') do
     root = RP.parse('^(one){2,3}([^d\\]efm-qz\\,\\-]*)(ghi)+$')

data/spec/parser/anchors_spec.rb CHANGED

@@ -1,31 +1,17 @@
 require 'spec_helper'
 RSpec.describe('Anchor parsing') do
-  tests = {
-    '^a'      => [0, :anchor,   :bol,                 Anchor::BOL],
-    'a$'      => [1, :anchor,   :eol,                 Anchor::EOL],
+  include_examples 'parse', /^a/,   0 =>  [:anchor,   :bol,               Anchor::BOL]
+  include_examples 'parse', /a$/,   1 =>  [:anchor,   :eol,               Anchor::EOL]
-    '\Aa'     => [0, :anchor,   :bos,                 Anchor::BOS],
-    'a\z'     => [1, :anchor,   :eos,                 Anchor::EOS],
-    'a\Z'     => [1, :anchor,   :eos_ob_eol,          Anchor::EOSobEOL],
+  include_examples 'parse', /\Aa/,  0 =>  [:anchor,   :bos,               Anchor::BOS]
+  include_examples 'parse', /a\z/,  1 =>  [:anchor,   :eos,               Anchor::EOS]
+  include_examples 'parse', /a\Z/,  1 =>  [:anchor,   :eos_ob_eol,        Anchor::EOSobEOL]
-    'a\b'     => [1, :anchor,   :word_boundary,       Anchor::WordBoundary],
-    'a\B'     => [1, :anchor,   :nonword_boundary,    Anchor::NonWordBoundary],
+  include_examples 'parse', /a\b/,  1 =>  [:anchor,   :word_boundary,     Anchor::WordBoundary]
+  include_examples 'parse', /a\B/,  1 =>  [:anchor,   :nonword_boundary,  Anchor::NonWordBoundary]
-    'a\G'     => [1, :anchor,   :match_start,         Anchor::MatchStart],
+  include_examples 'parse', /a\G/,  1 =>  [:anchor,   :match_start,       Anchor::MatchStart]
-    "\\\\Aa"  => [0, :escape,   :backslash,           EscapeSequence::Literal],
-  }
-  tests.each_with_index do |(pattern, (index, type, token, klass)), count|
-    specify("parse_anchor_#{token}_#{count}") do
-      root = RP.parse(pattern, 'ruby/1.9')
-      exp = root.expressions.at(index)
-      expect(exp).to be_a(klass)
-      expect(exp.type).to eq type
-      expect(exp.token).to eq token
-    end
-  end
+  include_examples 'parse', /\\A/,  0 =>  [:escape,   :backslash,         EscapeSequence::Literal]
 end

data/spec/parser/conditionals_spec.rb CHANGED

@@ -2,7 +2,7 @@ require 'spec_helper'
 RSpec.describe('Conditional parsing') do
   specify('parse conditional') do
-    regexp = Regexp.new('(?<A>a)(?(<A>)T|F)/')
+    regexp = /(?<A>a)(?(<A>)T|F)/
     root = RP.parse(regexp, 'ruby/2.0')
     exp = root[1]
@@ -16,7 +16,7 @@ RSpec.describe('Conditional parsing') do
   end
   specify('parse conditional condition') do
-    regexp = Regexp.new('(?<A>a)(?(<A>)T|F)/')
+    regexp = /(?<A>a)(?(<A>)T|F)/
     root = RP.parse(regexp, 'ruby/2.0')
     exp = root[1].condition
@@ -31,7 +31,7 @@ RSpec.describe('Conditional parsing') do
   end
   specify('parse conditional condition with number ref') do
-    regexp = Regexp.new('(a)(?(1)T|F)/')
+    regexp = /(a)(?(1)T|F)/
     root = RP.parse(regexp, 'ruby/2.0')
     exp = root[1].condition
@@ -46,7 +46,7 @@ RSpec.describe('Conditional parsing') do
   end
   specify('parse conditional nested groups') do
-    regexp = Regexp.new('((a)|(b)|((?(2)(c(d|e)+)?|(?(3)f|(?(4)(g|(h)(i)))))))/')
+    regexp = /((a)|(b)|((?(2)(c(d|e)+)?|(?(3)f|(?(4)(g|(h)(i)))))))/
     root = RP.parse(regexp, 'ruby/2.0')
@@ -80,7 +80,7 @@ RSpec.describe('Conditional parsing') do
   end
   specify('parse conditional nested') do
-    regexp = Regexp.new('(a(b(c(d)(e))))(?(1)(?(2)d|(?(3)e|f))|(?(4)(?(5)g|h)))/')
+    regexp = /(a(b(c(d)(e))))(?(1)(?(2)d|(?(3)e|f))|(?(4)(?(5)g|h)))/
     root = RP.parse(regexp, 'ruby/2.0')
@@ -102,7 +102,7 @@ RSpec.describe('Conditional parsing') do
   end
   specify('parse conditional nested alternation') do
-    regexp = Regexp.new('(a)(?(1)(b|c|d)|(e|f|g))(h)(?(2)(i|j|k)|(l|m|n))|o|p/')
+    regexp = /(a)(?(1)(b|c|d)|(e|f|g))(h)(?(2)(i|j|k)|(l|m|n))|o|p/
     root = RP.parse(regexp, 'ruby/2.0')
@@ -125,7 +125,7 @@ RSpec.describe('Conditional parsing') do
   end
   specify('parse conditional extra separator') do
-    regexp = Regexp.new('(?<A>a)(?(<A>)T|)/')
+    regexp = /(?<A>a)(?(<A>)T|)/
     root = RP.parse(regexp, 'ruby/2.0')
     branches = root[1].branches
@@ -146,7 +146,7 @@ RSpec.describe('Conditional parsing') do
   end
   specify('parse conditional quantified') do
-    regexp = Regexp.new('(foo)(?(1)\d|(\w)){42}/')
+    regexp = /(foo)(?(1)\d|(\w)){42}/
     root = RP.parse(regexp, 'ruby/2.0')
     conditional = root[1]
@@ -158,7 +158,7 @@ RSpec.describe('Conditional parsing') do
   end
   specify('parse conditional branch content quantified') do
-    regexp = Regexp.new('(foo)(?(1)\d{23}|(\w){42})/')
+    regexp = /(foo)(?(1)\d{23}|(\w){42})/
     root = RP.parse(regexp, 'ruby/2.0')
     conditional = root[1]

data/spec/parser/errors_spec.rb CHANGED

@@ -1,51 +1,30 @@
 require 'spec_helper'
 RSpec.describe('Parsing errors') do
-  let(:rp) { Regexp::Parser.new }
-  before { rp.parse(/foo/) }
+  let(:parser) { Regexp::Parser.new }
+  before { parser.parse(/foo/) } # initializes ivars
-  specify('parser unknown token type') do
-    expect { rp.send(:parse_token, Regexp::Token.new(:foo, :bar)) }
+  it('raises UnknownTokenTypeError for unknown token types') do
+    expect { parser.send(:parse_token, Regexp::Token.new(:foo, :bar)) }
       .to raise_error(Regexp::Parser::UnknownTokenTypeError)
   end
-  specify('parser unknown set token') do
-    expect { rp.send(:parse_token, Regexp::Token.new(:set, :foo)) }
-      .to raise_error(Regexp::Parser::UnknownTokenError)
-  end
-  specify('parser unknown meta token') do
-    expect { rp.send(:parse_token, Regexp::Token.new(:meta, :foo)) }
-      .to raise_error(Regexp::Parser::UnknownTokenError)
-  end
-  specify('parser unknown character type token') do
-    expect { rp.send(:parse_token, Regexp::Token.new(:type, :foo)) }
-      .to raise_error(Regexp::Parser::UnknownTokenError)
-  end
-  specify('parser unknown unicode property token') do
-    expect { rp.send(:parse_token, Regexp::Token.new(:property, :foo)) }
-      .to raise_error(Regexp::Parser::UnknownTokenError)
-  end
-  specify('parser unknown unicode nonproperty token') do
-    expect { rp.send(:parse_token, Regexp::Token.new(:nonproperty, :foo)) }
-      .to raise_error(Regexp::Parser::UnknownTokenError)
-  end
-  specify('parser unknown anchor token') do
-    expect { rp.send(:parse_token, Regexp::Token.new(:anchor, :foo)) }
-      .to raise_error(Regexp::Parser::UnknownTokenError)
-  end
-  specify('parser unknown quantifier token') do
-    expect { rp.send(:parse_token, Regexp::Token.new(:quantifier, :foo)) }
-      .to raise_error(Regexp::Parser::UnknownTokenError)
-  end
-  specify('parser unknown group open token') do
-    expect { rp.send(:parse_token, Regexp::Token.new(:group, :foo)) }
-      .to raise_error(Regexp::Parser::UnknownTokenError)
-  end
+  RSpec.shared_examples 'UnknownTokenError' do |type, token|
+    it "raises for unkown tokens of type #{type}" do
+      expect { parser.send(:parse_token, Regexp::Token.new(type, :foo)) }
+        .to raise_error(Regexp::Parser::UnknownTokenError)
+    end
+  end
+  include_examples 'UnknownTokenError', :anchor
+  include_examples 'UnknownTokenError', :backref
+  include_examples 'UnknownTokenError', :conditional
+  include_examples 'UnknownTokenError', :free_space
+  include_examples 'UnknownTokenError', :group
+  include_examples 'UnknownTokenError', :meta
+  include_examples 'UnknownTokenError', :nonproperty
+  include_examples 'UnknownTokenError', :property
+  include_examples 'UnknownTokenError', :quantifier
+  include_examples 'UnknownTokenError', :set
+  include_examples 'UnknownTokenError', :type
 end

data/spec/parser/escapes_spec.rb CHANGED

@@ -1,49 +1,35 @@
 require 'spec_helper'
-RSpec.describe('Escape parsing') do
-  tests = {
-    /a\ac/          => [1, :escape, :bell,              EscapeSequence::Bell],
-    /a\ec/          => [1, :escape, :escape,            EscapeSequence::AsciiEscape],
-    /a\fc/          => [1, :escape, :form_feed,         EscapeSequence::FormFeed],
-    /a\nc/          => [1, :escape, :newline,           EscapeSequence::Newline],
-    /a\rc/          => [1, :escape, :carriage,          EscapeSequence::Return],
-    /a\tc/          => [1, :escape, :tab,               EscapeSequence::Tab],
-    /a\vc/          => [1, :escape, :vertical_tab,      EscapeSequence::VerticalTab],
-    # meta character escapes
-    /a\.c/          => [1, :escape, :dot,               EscapeSequence::Literal],
-    /a\?c/          => [1, :escape, :zero_or_one,       EscapeSequence::Literal],
-    /a\*c/          => [1, :escape, :zero_or_more,      EscapeSequence::Literal],
-    /a\+c/          => [1, :escape, :one_or_more,       EscapeSequence::Literal],
-    /a\|c/          => [1, :escape, :alternation,       EscapeSequence::Literal],
-    /a\(c/          => [1, :escape, :group_open,        EscapeSequence::Literal],
-    /a\)c/          => [1, :escape, :group_close,       EscapeSequence::Literal],
-    /a\{c/          => [1, :escape, :interval_open,     EscapeSequence::Literal],
-    /a\}c/          => [1, :escape, :interval_close,    EscapeSequence::Literal],
-    # unicode escapes
-    /a\u0640/       => [1, :escape, :codepoint,         EscapeSequence::Codepoint],
-    /a\u{41 1F60D}/ => [1, :escape, :codepoint_list,    EscapeSequence::CodepointList],
-    /a\u{10FFFF}/   => [1, :escape, :codepoint_list,    EscapeSequence::CodepointList],
-     # hex escapes
-    /a\xFF/n        => [1, :escape, :hex,               EscapeSequence::Hex],
-    # octal escapes
-    /a\177/n        => [1, :escape, :octal,             EscapeSequence::Octal],
-  }
-  tests.each_with_index do |(pattern, (index, type, token, klass)), count|
-    specify("parse_escape_#{token}_#{count = (count + 1)}") do
-      root = RP.parse(pattern, 'ruby/1.9')
-      exp = root.expressions.at(index)
-      expect(exp).to be_a(klass)
-      expect(exp.type).to eq type
-      expect(exp.token).to eq token
-    end
-  end
+RSpec.describe('EscapeSequence parsing') do
+  include_examples 'parse', /a\ac/,          1 => [:escape, :bell,              EscapeSequence::Bell]
+  include_examples 'parse', /a\ec/,          1 => [:escape, :escape,            EscapeSequence::AsciiEscape]
+  include_examples 'parse', /a\fc/,          1 => [:escape, :form_feed,         EscapeSequence::FormFeed]
+  include_examples 'parse', /a\nc/,          1 => [:escape, :newline,           EscapeSequence::Newline]
+  include_examples 'parse', /a\rc/,          1 => [:escape, :carriage,          EscapeSequence::Return]
+  include_examples 'parse', /a\tc/,          1 => [:escape, :tab,               EscapeSequence::Tab]
+  include_examples 'parse', /a\vc/,          1 => [:escape, :vertical_tab,      EscapeSequence::VerticalTab]
+  # meta character escapes
+  include_examples 'parse', /a\.c/,          1 => [:escape, :dot,               EscapeSequence::Literal]
+  include_examples 'parse', /a\?c/,          1 => [:escape, :zero_or_one,       EscapeSequence::Literal]
+  include_examples 'parse', /a\*c/,          1 => [:escape, :zero_or_more,      EscapeSequence::Literal]
+  include_examples 'parse', /a\+c/,          1 => [:escape, :one_or_more,       EscapeSequence::Literal]
+  include_examples 'parse', /a\|c/,          1 => [:escape, :alternation,       EscapeSequence::Literal]
+  include_examples 'parse', /a\(c/,          1 => [:escape, :group_open,        EscapeSequence::Literal]
+  include_examples 'parse', /a\)c/,          1 => [:escape, :group_close,       EscapeSequence::Literal]
+  include_examples 'parse', /a\{c/,          1 => [:escape, :interval_open,     EscapeSequence::Literal]
+  include_examples 'parse', /a\}c/,          1 => [:escape, :interval_close,    EscapeSequence::Literal]
+  # unicode escapes
+  include_examples 'parse', /a\u0640/,       1 => [:escape, :codepoint,         EscapeSequence::Codepoint]
+  include_examples 'parse', /a\u{41 1F60D}/, 1 => [:escape, :codepoint_list,    EscapeSequence::CodepointList]
+  include_examples 'parse', /a\u{10FFFF}/,   1 => [:escape, :codepoint_list,    EscapeSequence::CodepointList]
+    # hex escapes
+  include_examples 'parse', /a\xFF/n,        1 => [:escape, :hex,               EscapeSequence::Hex]
+  # octal escapes
+  include_examples 'parse', /a\177/n,        1 => [:escape, :octal,             EscapeSequence::Octal]
   specify('parse chars and codepoints') do
     root = RP.parse(/\n\?\101\x42\u0043\u{44 45}/)
@@ -65,6 +51,9 @@ RSpec.describe('Escape parsing') do
     expect(root[5].chars).to eq %w[D E]
     expect(root[5].codepoints).to eq [68, 69]
+    expect { root[5].char }.to raise_error(/#chars/)
+    expect { root[5].codepoint }.to raise_error(/#codepoints/)
   end
   specify('parse escape control sequence lower') do

data/spec/parser/free_space_spec.rb CHANGED

@@ -24,13 +24,34 @@ RSpec.describe('FreeSpace parsing') do
     expect(root.first.text).to eq 'a b c d'
   end
+  specify('parse single-line free space comments without spaces') do
+    regexp = /a#b/x
+    root = RP.parse(regexp)
+    expect(root.length).to eq 2
+    expect(root[0]).to be_instance_of(Literal)
+    expect(root[1]).to be_instance_of(Comment)
+  end
+  specify('parse single-line free space comments with spaces') do
+    regexp = /a # b/x
+    root = RP.parse(regexp)
+    expect(root.length).to eq 3
+    expect(root[0]).to be_instance_of(Literal)
+    expect(root[1]).to be_instance_of(WhiteSpace)
+    expect(root[2]).to be_instance_of(Comment)
+  end
   specify('parse free space comments') do
     regexp = /
       a   ?     # One letter
       b {2,5}   # Another one
       [c-g]  +  # A set
       (h|i|j) | # A group
-      klm *
+      klm#nospace before or after comment hash
       nop +
     /x
@@ -51,11 +72,11 @@ RSpec.describe('FreeSpace parsing') do
     alt_2 = alt.alternatives.last
     expect(alt_2).to be_instance_of(Alternative)
-    expect(alt_2.length).to eq 7
+    expect(alt_2.length).to eq 8
-    [0, 2, 4, 6].each { |i| expect(alt_2[i].class).to eq WhiteSpace }
+    [0, 2, 5, 7].each { |i| expect(alt_2[i].class).to eq WhiteSpace }
-    expect(alt_2[1]).to be_instance_of(Comment)
+    [1, 4].each { |i| expect(alt_2[i]).to be_instance_of(Comment) }
   end
   specify('parse free space nested comments') do