RubyGems - regexp_parser - Versions diffs - 0.4.6 → 0.4.7 - Mend

regexp_parser 0.4.6 → 0.4.7

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (25)

checksums.yaml +4 -4
data/ChangeLog +13 -0
data/README.md +4 -3
data/lib/regexp_parser/expression.rb +8 -8
data/lib/regexp_parser/expression/classes/backref.rb +7 -7
data/lib/regexp_parser/expression/classes/conditional.rb +2 -2
data/lib/regexp_parser/expression/classes/group.rb +2 -2
data/lib/regexp_parser/expression/classes/root.rb +4 -18
data/lib/regexp_parser/expression/classes/set.rb +1 -1
data/lib/regexp_parser/expression/subexpression.rb +2 -2
data/lib/regexp_parser/lexer.rb +10 -6
data/lib/regexp_parser/parser.rb +202 -172
data/lib/regexp_parser/scanner.rb +151 -148
data/lib/regexp_parser/scanner/scanner.rl +44 -41
data/lib/regexp_parser/syntax/tokens/backref.rb +1 -1
data/lib/regexp_parser/version.rb +2 -2
data/test/expression/test_to_h.rb +2 -2
data/test/lexer/test_refcalls.rb +3 -0
data/test/parser/test_errors.rb +13 -9
data/test/parser/test_groups.rb +140 -14
data/test/parser/test_refcalls.rb +13 -0
data/test/scanner/test_free_space.rb +43 -0
data/test/scanner/test_refcalls.rb +3 -0
data/test/syntax/ruby/test_1.8.rb +1 -1
metadata +3 -3

checksums.yaml CHANGED

@@ -1,7 +1,7 @@
 ---
 SHA1:
-  metadata.gz: 6bc36d64eb84ebef5287ca3c866c834339b6b563
-  data.tar.gz: 59db2b321120f59697d3ce6e0c612dd745a41ffc
+  metadata.gz: de01aa2d195d95dd0bee1afd232f85195562a8bf
+  data.tar.gz: b41cb58a4e07d681da7c16473f4f03d96a792ff9
 SHA512:
-  metadata.gz: fcf1c339c360217fbb2a1c4cedfd2eeeca199a52983fe706c7d661141a93b3793e1de0901d6c935b61dad30a78c4ad7f510bfec6abdf765f2c6e6a6edb3adefa
-  data.tar.gz: d0fc3eb8fd70a252d60ed25f7472ad36e76d379d5660f5d9d28735b9faa7caf1e15bc69468849e91d20832e3249a582c53ce52b67c5a01e50b2f6325dcf1063e
+  metadata.gz: 342d6218d5553f2f2f6975f202cf650cd74c9128379348526981d829188b38836dfd88bc46b8476212d4b10aeb628479109baff075e1297c4cf69aaa4fe8ff03
+  data.tar.gz: 80883d05ff9bb3f5f9f296aeeb5eabde013a362c6d6c82f4eeab87438050f93fea2224f407b170b65ff55d175937c55f56d49077e0ad43b0a55832989e221544

data/ChangeLog CHANGED

@@ -1,3 +1,16 @@
+Sun Oct 15 2017 Janosch Müller <janosch84@gmail.com>
+	* Fixed a thread safety issue (issue #45)
+	* Some public class methods that were only reliable for
+	  internal use are now private instance methods (PR #46)
+	* Improved the usefulness of Expression#options (issue #43) -
+	  #options and derived methods such as #i?, #m? and #x? are now
+	  defined for all Expressions that are affected by such flags.
+	* Fixed scanning of whitespace following (?x) (commit 5c94bd2)
+	* Fixed a Parser bug where the #number attribute of traditional
+	  numerical backreferences was not set correctly (commit 851b620)
+	* Bumped version to 0.4.7
 Mon Sep 18 2017 Janosch Müller <janosch84@gmail.com>
 	* Added Parser support for hex escapes in sets (PR #36)

data/README.md CHANGED

@@ -125,9 +125,10 @@ Regexp::Scanner.scan( /(cat?([bhm]at)){3,5}/ ).map {|token| token[2]}
   * If the input is a ruby **Regexp** object, the scanner calls #source on it to
     get its string representation. #source does not include the options of
-    the expression (m, i, and x) To include the options in the scan, #to_s
-    should be called on the **Regexp** before passing it to the scanner or any
-    of the other modules.
+    the expression (m, i, and x). To include the options in the scan, #to_s
+    should be called on the **Regexp** before passing it to the scanner or the
+    lexer. For the parser, however, this is not necessary. It automatically
+    exposes the options of a passed **Regexp** in the returned root expression.
   * To keep the scanner simple(r) and fairly reusable for other purposes, it
     does not perform lexical analysis on the tokens, sticking to the task

data/lib/regexp_parser/expression.rb CHANGED

@@ -8,7 +8,7 @@ module Regexp::Expression
     attr_accessor :quantifier
     attr_accessor :options
-    def initialize(token)
+    def initialize(token, options = {})
       @type               = token.type
       @token              = token.token
       @text               = token.text
@@ -17,7 +17,7 @@ module Regexp::Expression
       @set_level          = token.set_level
       @conditional_level  = token.conditional_level
       @quantifier         = nil
-      @options            = nil
+      @options            = options
     end
     def clone
@@ -95,35 +95,35 @@ module Regexp::Expression
     end
     def multiline?
-      (@options and @options[:m]) ? true : false
+      @options[:m] == true
     end
     alias :m? :multiline?
     def case_insensitive?
-      (@options and @options[:i]) ? true : false
+      @options[:i] == true
     end
     alias :i? :case_insensitive?
     alias :ignore_case? :case_insensitive?
     def free_spacing?
-      (@options and @options[:x]) ? true : false
+      @options[:x] == true
     end
     alias :x? :free_spacing?
     alias :extended? :free_spacing?
     if RUBY_VERSION >= '2.0'
       def default_classes?
-        (@options and @options[:d]) ? true : false
+        @options[:d] == true
       end
       alias :d? :default_classes?
       def ascii_classes?
-        (@options and @options[:a]) ? true : false
+        @options[:a] == true
       end
       alias :a? :ascii_classes?
       def unicode_classes?
-        (@options and @options[:u]) ? true : false
+        @options[:u] == true
       end
       alias :u? :unicode_classes?
     end

data/lib/regexp_parser/expression/classes/backref.rb CHANGED

@@ -6,18 +6,18 @@ module Regexp::Expression
     class Name < Backreference::Base
       attr_reader :name
-      def initialize(token)
+      def initialize(token, options = {})
         @name = token.text[3..-2]
-        super(token)
+        super
       end
     end
     class Number < Backreference::Base
       attr_reader :number
-      def initialize(token)
-        @number = token.text[3..-2]
-        super(token)
+      def initialize(token, options = {})
+        @number = token.text[token.token.equal?(:number) ? 1..-1 : 3..-2]
+        super
       end
     end
@@ -29,9 +29,9 @@ module Regexp::Expression
     class NameCall < Backreference::Base
       attr_reader :name
-      def initialize(token)
+      def initialize(token, options = {})
         @name = token.text[3..-2]
-        super(token)
+        super
       end
     end

data/lib/regexp_parser/expression/classes/conditional.rb CHANGED

@@ -11,8 +11,8 @@ module Regexp::Expression
     class Branch    < Regexp::Expression::Sequence; end
     class Expression < Regexp::Expression::Subexpression
-      def initialize(token)
-        super(token)
+      def initialize(token, options = {})
+        super
         @condition = nil
         @branches  = []

data/lib/regexp_parser/expression/classes/group.rb CHANGED

@@ -36,9 +36,9 @@ module Regexp::Expression
     class Named     < Group::Capture
       attr_reader :name
-      def initialize(token)
+      def initialize(token, options = {})
         @name = token.text[3..-2]
-        super(token)
+        super
       end
       def clone

data/lib/regexp_parser/expression/classes/root.rb CHANGED

@@ -1,26 +1,12 @@
 module Regexp::Expression
   class Root < Regexp::Expression::Subexpression
-    def initialize
-      super Regexp::Token.new(:expression, :root, '', 0)
+    def initialize(options = {})
+      super(Regexp::Token.new(:expression, :root, '', 0), options)
     end
-    def multiline?
-      @expressions[0].m?
-    end
-    alias :m? :multiline?
-    def case_insensitive?
-      @expressions[0].i?
-    end
-    alias :i? :case_insensitive?
-    alias :ignore_case? :case_insensitive?
-    def free_spacing?
-      @expressions[0].x?
-    end
-    alias :x? :free_spacing?
-    alias :extended? :free_spacing?
+    alias ignore_case? case_insensitive?
+    alias extended?    free_spacing?
   end
 end

data/lib/regexp_parser/expression/classes/set.rb CHANGED

@@ -3,7 +3,7 @@ module Regexp::Expression
   class CharacterSet < Regexp::Expression::Base
     attr_accessor :members
-    def initialize(token)
+    def initialize(token, options = {})
       @members  = []
       @negative = false
       @closed   = false

data/lib/regexp_parser/expression/subexpression.rb CHANGED

@@ -3,8 +3,8 @@ module Regexp::Expression
   class Subexpression < Regexp::Expression::Base
     attr_accessor :expressions
-    def initialize(token)
-      super(token)
+    def initialize(token, options = {})
+      super
       @expressions = []
     end

data/lib/regexp_parser/lexer.rb CHANGED

@@ -2,7 +2,7 @@
 # collects emitted tokens into an array, calculates their nesting depth, and
 # normalizes tokens for the parser, and checks if they are implemented by the
 # given syntax flavor.
-module Regexp::Lexer
+class Regexp::Lexer
   OPENING_TOKENS = [:capture, :options, :passive, :atomic, :named, :absence,
                     :lookahead, :nlookahead, :lookbehind, :nlookbehind
@@ -11,6 +11,10 @@ module Regexp::Lexer
   CLOSING_TOKENS = [:close].freeze
   def self.lex(input, syntax = "ruby/#{RUBY_VERSION}", &block)
+    new.lex(input, syntax, &block)
+  end
+  def lex(input, syntax = "ruby/#{RUBY_VERSION}", &block)
     syntax = Regexp::Syntax.new(syntax)
     @tokens = []
@@ -57,7 +61,7 @@ module Regexp::Lexer
   protected
-  def self.ascend(type, token)
+  def ascend(type, token)
     if type == :group or type == :assertion
       @nesting -= 1 if CLOSING_TOKENS.include?(token)
     end
@@ -71,7 +75,7 @@ module Regexp::Lexer
     end
   end
-  def self.descend(type, token)
+  def descend(type, token)
     if type == :group or type == :assertion
       @nesting += 1 if OPENING_TOKENS.include?(token)
     end
@@ -87,7 +91,7 @@ module Regexp::Lexer
   # called by scan to break a literal run that is longer than one character
   # into two separate tokens when it is followed by a quantifier
-  def self.break_literal(token)
+  def break_literal(token)
     text = token.text
     if text.scan(/./mu).length > 1
       lead = text.sub(/.\z/mu, "")
@@ -113,7 +117,7 @@ module Regexp::Lexer
   # called by scan to merge two consecutive literals. this happens when tokens
   # get normalized (as in the case of posix/bre) and end up becoming literals.
-  def self.merge_literal(current)
+  def merge_literal(current)
     last = @tokens.pop
     Regexp::Token.new(
@@ -128,7 +132,7 @@ module Regexp::Lexer
     )
   end
-  def self.merge_condition(current)
+  def merge_condition(current)
     last = @tokens.pop
     Regexp::Token.new(:conditional, :condition, last.text + current.text,
       last.ts, current.te, @nesting, @set_nesting, @conditional_nesting)

data/lib/regexp_parser/parser.rb CHANGED

@@ -1,6 +1,6 @@
 require 'regexp_parser/expression'
-module Regexp::Parser
+class Regexp::Parser
   include Regexp::Expression
   include Regexp::Syntax
@@ -19,8 +19,14 @@ module Regexp::Parser
   end
   def self.parse(input, syntax = "ruby/#{RUBY_VERSION}", &block)
-    @nesting = [@root = @node = Root.new]
+    new.parse(input, syntax, &block)
+  end
+  def parse(input, syntax = "ruby/#{RUBY_VERSION}", &block)
+    @nesting = [@root = @node = Root.new(options_from_input(input))]
+    @options_stack = [@root.options]
+    @switching_options = false
     @conditional_nesting = []
     Regexp::Lexer.scan(input, syntax) do |token|
@@ -34,21 +40,33 @@ module Regexp::Parser
     end
   end
-  def self.nest(exp)
+  private
+  def options_from_input(input)
+    return {} unless input.is_a?(::Regexp)
+    options = {}
+    options[:i] = true if input.options & ::Regexp::IGNORECASE != 0
+    options[:m] = true if input.options & ::Regexp::MULTILINE  != 0
+    options[:x] = true if input.options & ::Regexp::EXTENDED   != 0
+    options
+  end
+  def nest(exp)
     @nesting.push exp
     @node << exp
     @node  = exp
   end
-  def self.nest_conditional(exp)
+  def nest_conditional(exp)
     @conditional_nesting.push exp
     @node << exp
     @node  = exp
   end
-  def self.parse_token(token)
+  def parse_token(token)
     case token.type
     when :meta;         meta(token)
     when :quantifier;   quantifier(token)
@@ -66,7 +84,7 @@ module Regexp::Parser
       property(token)
     when :literal
-      @node << Literal.new(token)
+      @node << Literal.new(token, active_opts)
     when :free_space
       free_space(token)
@@ -75,7 +93,7 @@ module Regexp::Parser
     end
   end
-  def self.set(token)
+  def set(token)
     case token.token
     when :open
       open_set(token)
@@ -96,14 +114,14 @@ module Regexp::Parser
     end
   end
-  def self.meta(token)
+  def meta(token)
     case token.token
     when :dot
-      @node << CharacterType::Any.new(token)
+      @node << CharacterType::Any.new(token, active_opts)
     when :alternation
       unless @node.token == :alternation
         unless @node.last.is_a?(Alternation)
-          alt = Alternation.new(token)
+          alt = Alternation.new(token, active_opts)
           seq = Alternative.new(alt.level, alt.set_level, alt.conditional_level)
           while @node.expressions.last
@@ -126,62 +144,62 @@ module Regexp::Parser
     end
   end
-  def self.backref(token)
+  def backref(token)
     case token.token
     when :name_ref
-      @node << Backreference::Name.new(token)
+      @node << Backreference::Name.new(token, active_opts)
     when :name_nest_ref
-      @node << Backreference::NameNestLevel.new(token)
+      @node << Backreference::NameNestLevel.new(token, active_opts)
     when :name_call
-      @node << Backreference::NameCall.new(token)
+      @node << Backreference::NameCall.new(token, active_opts)
     when :number, :number_ref
-      @node << Backreference::Number.new(token)
+      @node << Backreference::Number.new(token, active_opts)
     when :number_rel_ref
-      @node << Backreference::NumberRelative.new(token)
+      @node << Backreference::NumberRelative.new(token, active_opts)
     when :number_nest_ref
-      @node << Backreference::NumberNestLevel.new(token)
+      @node << Backreference::NumberNestLevel.new(token, active_opts)
     when :number_call
-      @node << Backreference::NumberCall.new(token)
+      @node << Backreference::NumberCall.new(token, active_opts)
     when :number_rel_call
-      @node << Backreference::NumberCallRelative.new(token)
+      @node << Backreference::NumberCallRelative.new(token, active_opts)
     else
       raise UnknownTokenError.new('Backreference', token)
     end
   end
-  def self.type(token)
+  def type(token)
     case token.token
     when :digit
-      @node << CharacterType::Digit.new(token)
+      @node << CharacterType::Digit.new(token, active_opts)
     when :nondigit
-      @node << CharacterType::NonDigit.new(token)
+      @node << CharacterType::NonDigit.new(token, active_opts)
     when :hex
-      @node << CharacterType::Hex.new(token)
+      @node << CharacterType::Hex.new(token, active_opts)
     when :nonhex
-      @node << CharacterType::NonHex.new(token)
+      @node << CharacterType::NonHex.new(token, active_opts)
     when :space
-      @node << CharacterType::Space.new(token)
+      @node << CharacterType::Space.new(token, active_opts)
     when :nonspace
-      @node << CharacterType::NonSpace.new(token)
+      @node << CharacterType::NonSpace.new(token, active_opts)
     when :word
-      @node << CharacterType::Word.new(token)
+      @node << CharacterType::Word.new(token, active_opts)
     when :nonword
-      @node << CharacterType::NonWord.new(token)
+      @node << CharacterType::NonWord.new(token, active_opts)
     when :linebreak
-      @node << CharacterType::Linebreak.new(token)
+      @node << CharacterType::Linebreak.new(token, active_opts)
     when :xgrapheme
-      @node << CharacterType::ExtendedGrapheme.new(token)
+      @node << CharacterType::ExtendedGrapheme.new(token, active_opts)
     else
       raise UnknownTokenError.new('CharacterType', token)
     end
   end
-  def self.conditional(token)
+  def conditional(token)
     case token.token
     when :open
-      nest_conditional(Conditional::Expression.new(token))
+      nest_conditional(Conditional::Expression.new(token, active_opts))
     when :condition
-      @conditional_nesting.last.condition(Conditional::Condition.new(token))
+      @conditional_nesting.last.condition(Conditional::Condition.new(token, active_opts))
       @conditional_nesting.last.branch
     when :separator
       @conditional_nesting.last.branch
@@ -200,175 +218,174 @@ module Regexp::Parser
     end
   end
-  def self.property(token)
-    include Regexp::Expression::UnicodeProperty
+  include Regexp::Expression::UnicodeProperty
+  def property(token)
     case token.token
-    when :alnum;            @node << Alnum.new(token)
-    when :alpha;            @node << Alpha.new(token)
-    when :any;              @node << Any.new(token)
-    when :ascii;            @node << Ascii.new(token)
-    when :blank;            @node << Blank.new(token)
-    when :cntrl;            @node << Cntrl.new(token)
-    when :digit;            @node << Digit.new(token)
-    when :graph;            @node << Graph.new(token)
-    when :lower;            @node << Lower.new(token)
-    when :print;            @node << Print.new(token)
-    when :punct;            @node << Punct.new(token)
-    when :space;            @node << Space.new(token)
-    when :upper;            @node << Upper.new(token)
-    when :word;             @node << Word.new(token)
-    when :xdigit;           @node << Xdigit.new(token)
-    when :newline;          @node << Newline.new(token)
-    when :letter_any;       @node << Letter::Any.new(token)
-    when :letter_uppercase; @node << Letter::Uppercase.new(token)
-    when :letter_lowercase; @node << Letter::Lowercase.new(token)
-    when :letter_titlecase; @node << Letter::Titlecase.new(token)
-    when :letter_modifier;  @node << Letter::Modifier.new(token)
-    when :letter_other;     @node << Letter::Other.new(token)
-    when :mark_any;         @node << Mark::Any.new(token)
-    when :mark_nonspacing;  @node << Mark::Nonspacing.new(token)
-    when :mark_spacing;     @node << Mark::Spacing.new(token)
-    when :mark_enclosing;   @node << Mark::Enclosing.new(token)
-    when :number_any;       @node << Number::Any.new(token)
-    when :number_decimal;   @node << Number::Decimal.new(token)
-    when :number_letter;    @node << Number::Letter.new(token)
-    when :number_other;     @node << Number::Other.new(token)
-    when :punct_any;        @node << Punctuation::Any.new(token)
-    when :punct_connector;  @node << Punctuation::Connector.new(token)
-    when :punct_dash;       @node << Punctuation::Dash.new(token)
-    when :punct_open;       @node << Punctuation::Open.new(token)
-    when :punct_close;      @node << Punctuation::Close.new(token)
-    when :punct_initial;    @node << Punctuation::Initial.new(token)
-    when :punct_final;      @node << Punctuation::Final.new(token)
-    when :punct_other;      @node << Punctuation::Other.new(token)
-    when :separator_any;    @node << Separator::Any.new(token)
-    when :separator_space;  @node << Separator::Space.new(token)
-    when :separator_line;   @node << Separator::Line.new(token)
-    when :separator_para;   @node << Separator::Paragraph.new(token)
-    when :symbol_any;       @node << Symbol::Any.new(token)
-    when :symbol_math;      @node << Symbol::Math.new(token)
-    when :symbol_currency;  @node << Symbol::Currency.new(token)
-    when :symbol_modifier;  @node << Symbol::Modifier.new(token)
-    when :symbol_other;     @node << Symbol::Other.new(token)
-    when :other;            @node << Codepoint::Any.new(token)
-    when :control;          @node << Codepoint::Control.new(token)
-    when :format;           @node << Codepoint::Format.new(token)
-    when :surrogate;        @node << Codepoint::Surrogate.new(token)
-    when :private_use;      @node << Codepoint::PrivateUse.new(token)
-    when :unassigned;       @node << Codepoint::Unassigned.new(token)
+    when :alnum;            @node << Alnum.new(token, active_opts)
+    when :alpha;            @node << Alpha.new(token, active_opts)
+    when :any;              @node << Any.new(token, active_opts)
+    when :ascii;            @node << Ascii.new(token, active_opts)
+    when :blank;            @node << Blank.new(token, active_opts)
+    when :cntrl;            @node << Cntrl.new(token, active_opts)
+    when :digit;            @node << Digit.new(token, active_opts)
+    when :graph;            @node << Graph.new(token, active_opts)
+    when :lower;            @node << Lower.new(token, active_opts)
+    when :print;            @node << Print.new(token, active_opts)
+    when :punct;            @node << Punct.new(token, active_opts)
+    when :space;            @node << Space.new(token, active_opts)
+    when :upper;            @node << Upper.new(token, active_opts)
+    when :word;             @node << Word.new(token, active_opts)
+    when :xdigit;           @node << Xdigit.new(token, active_opts)
+    when :newline;          @node << Newline.new(token, active_opts)
+    when :letter_any;       @node << Letter::Any.new(token, active_opts)
+    when :letter_uppercase; @node << Letter::Uppercase.new(token, active_opts)
+    when :letter_lowercase; @node << Letter::Lowercase.new(token, active_opts)
+    when :letter_titlecase; @node << Letter::Titlecase.new(token, active_opts)
+    when :letter_modifier;  @node << Letter::Modifier.new(token, active_opts)
+    when :letter_other;     @node << Letter::Other.new(token, active_opts)
+    when :mark_any;         @node << Mark::Any.new(token, active_opts)
+    when :mark_nonspacing;  @node << Mark::Nonspacing.new(token, active_opts)
+    when :mark_spacing;     @node << Mark::Spacing.new(token, active_opts)
+    when :mark_enclosing;   @node << Mark::Enclosing.new(token, active_opts)
+    when :number_any;       @node << Number::Any.new(token, active_opts)
+    when :number_decimal;   @node << Number::Decimal.new(token, active_opts)
+    when :number_letter;    @node << Number::Letter.new(token, active_opts)
+    when :number_other;     @node << Number::Other.new(token, active_opts)
+    when :punct_any;        @node << Punctuation::Any.new(token, active_opts)
+    when :punct_connector;  @node << Punctuation::Connector.new(token, active_opts)
+    when :punct_dash;       @node << Punctuation::Dash.new(token, active_opts)
+    when :punct_open;       @node << Punctuation::Open.new(token, active_opts)
+    when :punct_close;      @node << Punctuation::Close.new(token, active_opts)
+    when :punct_initial;    @node << Punctuation::Initial.new(token, active_opts)
+    when :punct_final;      @node << Punctuation::Final.new(token, active_opts)
+    when :punct_other;      @node << Punctuation::Other.new(token, active_opts)
+    when :separator_any;    @node << Separator::Any.new(token, active_opts)
+    when :separator_space;  @node << Separator::Space.new(token, active_opts)
+    when :separator_line;   @node << Separator::Line.new(token, active_opts)
+    when :separator_para;   @node << Separator::Paragraph.new(token, active_opts)
+    when :symbol_any;       @node << Symbol::Any.new(token, active_opts)
+    when :symbol_math;      @node << Symbol::Math.new(token, active_opts)
+    when :symbol_currency;  @node << Symbol::Currency.new(token, active_opts)
+    when :symbol_modifier;  @node << Symbol::Modifier.new(token, active_opts)
+    when :symbol_other;     @node << Symbol::Other.new(token, active_opts)
+    when :other;            @node << Codepoint::Any.new(token, active_opts)
+    when :control;          @node << Codepoint::Control.new(token, active_opts)
+    when :format;           @node << Codepoint::Format.new(token, active_opts)
+    when :surrogate;        @node << Codepoint::Surrogate.new(token, active_opts)
+    when :private_use;      @node << Codepoint::PrivateUse.new(token, active_opts)
+    when :unassigned;       @node << Codepoint::Unassigned.new(token, active_opts)
     when *Token::UnicodeProperty::Age
-      @node << Age.new(token)
+      @node << Age.new(token, active_opts)
     when *Token::UnicodeProperty::Derived
-      @node << Derived.new(token)
+      @node << Derived.new(token, active_opts)
     when *Regexp::Syntax::Token::UnicodeProperty::Script
-      @node << Script.new(token)
+      @node << Script.new(token, active_opts)
     when *Regexp::Syntax::Token::UnicodeProperty::UnicodeBlock
-      @node << Block.new(token)
+      @node << Block.new(token, active_opts)
     else
       raise UnknownTokenError.new('UnicodeProperty', token)
     end
   end
-  def self.anchor(token)
+  def anchor(token)
     case token.token
     when :bol
-      @node << Anchor::BeginningOfLine.new(token)
+      @node << Anchor::BeginningOfLine.new(token, active_opts)
     when :eol
-      @node << Anchor::EndOfLine.new(token)
+      @node << Anchor::EndOfLine.new(token, active_opts)
     when :bos
-      @node << Anchor::BOS.new(token)
+      @node << Anchor::BOS.new(token, active_opts)
     when :eos
-      @node << Anchor::EOS.new(token)
+      @node << Anchor::EOS.new(token, active_opts)
     when :eos_ob_eol
-      @node << Anchor::EOSobEOL.new(token)
+      @node << Anchor::EOSobEOL.new(token, active_opts)
     when :word_boundary
-      @node << Anchor::WordBoundary.new(token)
+      @node << Anchor::WordBoundary.new(token, active_opts)
     when :nonword_boundary
-      @node << Anchor::NonWordBoundary.new(token)
+      @node << Anchor::NonWordBoundary.new(token, active_opts)
     when :match_start
-      @node << Anchor::MatchStart.new(token)
+      @node << Anchor::MatchStart.new(token, active_opts)
     else
       raise UnknownTokenError.new('Anchor', token)
     end
   end
-  def self.escape(token)
+  def escape(token)
     case token.token
     when :backspace
-      @node << EscapeSequence::Backspace.new(token)
+      @node << EscapeSequence::Backspace.new(token, active_opts)
     when :escape
-      @node << EscapeSequence::AsciiEscape.new(token)
+      @node << EscapeSequence::AsciiEscape.new(token, active_opts)
     when :bell
-      @node << EscapeSequence::Bell.new(token)
+      @node << EscapeSequence::Bell.new(token, active_opts)
     when :form_feed
-      @node << EscapeSequence::FormFeed.new(token)
+      @node << EscapeSequence::FormFeed.new(token, active_opts)
     when :newline
-      @node << EscapeSequence::Newline.new(token)
+      @node << EscapeSequence::Newline.new(token, active_opts)
     when :carriage
-      @node << EscapeSequence::Return.new(token)
+      @node << EscapeSequence::Return.new(token, active_opts)
     when :space
-      @node << EscapeSequence::Space.new(token)
+      @node << EscapeSequence::Space.new(token, active_opts)
     when :tab
-      @node << EscapeSequence::Tab.new(token)
+      @node << EscapeSequence::Tab.new(token, active_opts)
     when :vertical_tab
-      @node << EscapeSequence::VerticalTab.new(token)
+      @node << EscapeSequence::VerticalTab.new(token, active_opts)
     when :control
       if token.text =~ /\A(?:\\C-\\M|\\c\\M)/
-        @node << EscapeSequence::MetaControl.new(token)
+        @node << EscapeSequence::MetaControl.new(token, active_opts)
       else
-        @node << EscapeSequence::Control.new(token)
+        @node << EscapeSequence::Control.new(token, active_opts)
       end
     when :meta_sequence
       if token.text =~ /\A\\M-\\[Cc]/
-        @node << EscapeSequence::MetaControl.new(token)
+        @node << EscapeSequence::MetaControl.new(token, active_opts)
       else
-        @node << EscapeSequence::Meta.new(token)
+        @node << EscapeSequence::Meta.new(token, active_opts)
       end
     else
       # treating everything else as a literal
-      @node << EscapeSequence::Literal.new(token)
+      @node << EscapeSequence::Literal.new(token, active_opts)
     end
   end
-  def self.keep(token)
-    @node << Keep::Mark.new(token)
+  def keep(token)
+    @node << Keep::Mark.new(token, active_opts)
   end
-  def self.free_space(token)
+  def free_space(token)
     case token.token
     when :comment
-      @node << Comment.new(token)
+      @node << Comment.new(token, active_opts)
     when :whitespace
       if @node.last and @node.last.is_a?(WhiteSpace)
-        @node.last.merge(WhiteSpace.new(token))
+        @node.last.merge(WhiteSpace.new(token, active_opts))
       else
-        @node << WhiteSpace.new(token)
+        @node << WhiteSpace.new(token, active_opts)
       end
     else
       raise UnknownTokenError.new('FreeSpace', token)
     end
   end
-  def self.quantifier(token)
+  def quantifier(token)
     offset = -1
     target_node = @node.expressions[offset]
     while target_node and target_node.is_a?(FreeSpace)
@@ -378,15 +395,6 @@ module Regexp::Parser
     raise ArgumentError.new("No valid target found for '#{token.text}' "+
                             "quantifier") unless target_node
-    unless target_node
-      if token.token == :zero_or_one
-        raise "Quantifier given without a target, or the syntax of the group " +
-              "or its options is incorrect"
-      else
-        raise "Quantifier `#{token.text}' given without a target"
-      end
-    end
     case token.token
     when :zero_or_one
       target_node.quantify(:zero_or_one, token.text, 0, 1, :greedy)
@@ -417,7 +425,7 @@ module Regexp::Parser
     end
   end
-  def self.interval(target_node, token)
+  def interval(target_node, token)
     text = token.text
     mchr = text[text.length-1].chr =~ /[?+]/ ? text[text.length-1].chr : nil
     case mchr
@@ -439,91 +447,113 @@ module Regexp::Parser
     target_node.quantify(:interval, text, min.to_i, max.to_i, mode)
   end
-  def self.group(token)
+  def group(token)
     case token.token
     when :options
-      options(token)
+      options_group(token)
     when :close
       close_group
     when :comment
-      @node << Group::Comment.new(token)
+      @node << Group::Comment.new(token, active_opts)
     else
       open_group(token)
     end
   end
-  def self.options(token)
-    opt = token.text.split('-', 2)
+  def options_group(token)
+    positive, negative = token.text.split('-', 2)
+    negative ||= ''
+    @switching_options = !token.text.include?(':')
+    # TODO: change this -^ to token.type == :options_switch in v1.0.0
+    new_options = active_opts.dup
-    exp = Group::Options.new(token)
-    exp.options = {
-      :m => opt[0].include?('m') ? true : false,
-      :i => opt[0].include?('i') ? true : false,
-      :x => opt[0].include?('x') ? true : false,
-      :d => opt[0].include?('d') ? true : false,
-      :a => opt[0].include?('a') ? true : false,
-      :u => opt[0].include?('u') ? true : false
-    }
+    # Negative options have precedence. E.g. /(?i-i)a/ is case-sensitive.
+    %w[i m x].each do |flag|
+      new_options[flag.to_sym] = true if positive.include?(flag)
+      new_options.delete(flag.to_sym) if negative.include?(flag)
+    end
+    # Any encoding flag overrides all previous encoding flags. If there are
+    # multiple encoding flags in an options string, the last one wins.
+    # E.g. /(?dau)\w/ matches UTF8 chars but /(?dua)\w/ only ASCII chars.
+    if (flag = positive.reverse[/[adu]/])
+      %w[a d u].each { |key| new_options.delete(key.to_sym) }
+      new_options[flag.to_sym] = true
+    end
+    @options_stack << new_options
+    exp = Group::Options.new(token, active_opts)
     nest(exp)
   end
-  def self.open_group(token)
+  def open_group(token)
     case token.token
     when :passive
-      exp = Group::Passive.new(token)
+      exp = Group::Passive.new(token, active_opts)
     when :atomic
-      exp = Group::Atomic.new(token)
+      exp = Group::Atomic.new(token, active_opts)
     when :named
-      exp = Group::Named.new(token)
+      exp = Group::Named.new(token, active_opts)
     when :capture
-      exp = Group::Capture.new(token)
+      exp = Group::Capture.new(token, active_opts)
     when :absence
-      exp = Group::Absence.new(token)
+      exp = Group::Absence.new(token, active_opts)
     when :lookahead
-      exp = Assertion::Lookahead.new(token)
+      exp = Assertion::Lookahead.new(token, active_opts)
     when :nlookahead
-      exp = Assertion::NegativeLookahead.new(token)
+      exp = Assertion::NegativeLookahead.new(token, active_opts)
     when :lookbehind
-      exp = Assertion::Lookbehind.new(token)
+      exp = Assertion::Lookbehind.new(token, active_opts)
     when :nlookbehind
-      exp = Assertion::NegativeLookbehind.new(token)
+      exp = Assertion::NegativeLookbehind.new(token, active_opts)
     else
       raise UnknownTokenError.new('Group type open', token)
     end
+    # Push the active options to the stack again. This way we can simply pop the
+    # stack for any group we close, no matter if it had its own options or not.
+    @options_stack << active_opts
     nest(exp)
   end
-  def self.close_group
+  def close_group
     @nesting.pop
+    @options_stack.pop unless @switching_options
+    @switching_options = false
     @node = @nesting.last
     @node = @node.last if @node.last and @node.last.is_a?(Alternation)
   end
-  def self.open_set(token)
+  def open_set(token)
     token.token = :character
     if token.type == :subset
-      @set << CharacterSubSet.new(token)
+      @set << CharacterSubSet.new(token, active_opts)
     else
-      @node << (@set = CharacterSet.new(token))
+      @node << (@set = CharacterSet.new(token, active_opts))
     end
   end
-  def self.negate_set
+  def negate_set
     @set.negate
   end
-  def self.append_set(token)
+  def append_set(token)
     @set << token.text
   end
-  def self.close_set(token)
+  def close_set(token)
     @set.close
   end
+  def active_opts
+    @options_stack.last
+  end
 end # module Regexp::Parser