RubyGems - rley - Versions diffs - 0.5.08 → 0.5.09 - Mend

rley 0.5.08 → 0.5.09

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (24) hide show

checksums.yaml +4 -4
data/CHANGELOG.md +7 -1
data/examples/general/SRL/lib/ast_builder.rb +74 -78
data/examples/general/SRL/lib/grammar.rb +11 -3
data/examples/general/SRL/lib/regex/abstract_method.rb +35 -0
data/examples/general/SRL/lib/regex/atomic_expression.rb +21 -0
data/examples/general/SRL/lib/regex/char_class.rb +34 -0
data/examples/general/SRL/lib/regex/char_range.rb +50 -0
data/examples/general/SRL/lib/regex/character.rb +195 -0
data/examples/general/SRL/lib/regex/compound_expression.rb +60 -0
data/examples/general/SRL/lib/regex/expression.rb +42 -0
data/examples/general/SRL/lib/regex/monadic_expression.rb +31 -0
data/examples/general/SRL/lib/regex/polyadic_expression.rb +64 -0
data/examples/general/SRL/lib/regex/quantifiable.rb +28 -0
data/examples/general/SRL/lib/regex/repetition.rb +31 -0
data/examples/general/SRL/lib/regex_repr.rb +5 -1
data/examples/general/SRL/lib/tokenizer.rb +8 -5
data/examples/general/SRL/spec/integration_spec.rb +64 -41
data/examples/general/SRL/spec/regex/character_spec.rb +159 -0
data/examples/general/SRL/spec/tokenizer_spec.rb +18 -4
data/examples/general/SRL/srl_demo.rb +14 -4
data/lib/rley/constants.rb +1 -1
metadata +14 -3
data/examples/general/SRL/lib/srl_demo.rb +0 -67

checksums.yaml CHANGED

@@ -1,7 +1,7 @@
 ---
 SHA1:
-  metadata.gz: 3c616b691fb51ba2eb00a25fee75ff4a80093990
-  data.tar.gz: 1039cfe8f29c8d1ec7c88fa83c18f9173763b8f2
+  metadata.gz: d95e1ed6a38d8e1ed70e456f46c812275a1d4530
+  data.tar.gz: fcf7b54ff98d107fa38239139db10e7bbf1f7825
 SHA512:
-  metadata.gz: df7412344421bd421fb459fe5cf8053618dea1212c4da27e83cf41225dbaf664d9b143499978e6bcef2ae293a7bf9378d3ecb4867f989553f798e9723ba8344b
-  data.tar.gz: 436474ceafd2689137fab890b19ca24715ebe72dd1311b3ad64313bc130cf8bbce12fe35049008d20a89634309cbac882da70bc891522d45a58e8ce310b466a7
+  metadata.gz: e185aa4e7ca59e5995f6e87379efd4f921d4242307abd55718e46bf346e7414c487b56f753f446d8518ffab74e783774aaa2adc9b7fcf8a014fdba96b8da090d
+  data.tar.gz: 5c990777d79432c813c92dda0b21e7af3dcf587485b868e9723d30e3d1c1b3b2d6e1bc8dc7235fb1ba32c1b27ddeb6f829ef3e1b7b9248d5be1199f27e153849

data/CHANGELOG.md CHANGED

@@ -1,4 +1,10 @@
-### 0.5.08 / 2017-11-xx
+### 0.5.09 / 2017-12-02
+* [CHANGE] Dir `examples/general/SRL/` Added support for letter range to Simple Regex Language parser.
+### 0.5.08 / 2017-11-28
+* [NEW] Dir `examples/general/SRL/` Added an initial version of the Simple Regex Language parser.
+  Supports the SRL quantifier syntax only.
+* [FIX] Method `ParseTreeBuilder::place_TOS_child` was sometimes fooled when argument `aNode` was nil.
 * [FIX] Method `BaseParser::initialize` missing parameter name in doc caused a YARD warning.
 * [FIX] Method `GrmItemsBuilder::build_dotted_items` missing parameter name in doc caused a YARD warning.
 * [FIX] Method `NonTerminalVertex::initialize` missing parameter name in doc caused a YARD warning.

data/examples/general/SRL/lib/ast_builder.rb CHANGED

@@ -35,9 +35,30 @@ class ASTBuilder < Rley::Parser::ParseTreeBuilder
   # @param theChildren [Array] Children nodes (one per rhs symbol)
   def new_parent_node(aProduction, aRange, theTokens, theChildren)
     node = case aProduction.name
-      when 'srl_0' # rule 'srl' => 'quantifier'
+      when 'srl_0' # rule 'srl' => 'term'
         return_first_child(aRange, theTokens, theChildren)
+      when 'term_0' # rule 'term' => 'atom'
+        return_first_child(aRange, theTokens, theChildren)
+      when 'term_1' # rule 'term' => %w[atom quantifier]
+        reduce_term_1(aProduction, aRange, theTokens, theChildren)
+      when 'atom_0' #rule 'atom' => 'letter_range'
+        return_first_child(aRange, theTokens, theChildren)
+      when 'letter_range_0' # rule 'letter_range' => %w[LETTER FROM LETTER_LIT TO LETTER_LIT]
+        reduce_letter_range_0(aProduction, aRange, theTokens, theChildren)
+       when 'letter_range_1' #rule 'letter_range' => %w[UPPERCASE LETTER FROM LETTER_LIT TO LETTER_LIT]
+        reduce_letter_range_1(aProduction, aRange, theTokens, theChildren)
+      when 'letter_range_2' # rule 'letter_range' => 'LETTER'
+        reduce_letter_range_2(aProduction, aRange, theTokens, theChildren)
+      when 'letter_range_3' # rule 'letter_range' => %w[UPPERCASE LETTER]
+        reduce_letter_range_3(aProduction, aRange, theTokens, theChildren)
       when 'quantifier_0' # rule 'quantifier' => 'ONCE'
         multiplicity(1, 1)
@@ -78,99 +99,74 @@ class ASTBuilder < Rley::Parser::ParseTreeBuilder
     return SRL::Regex::Multiplicity.new(lowerBound, upperBound, :greedy)
   end
-  # rule 'quantifier' => %w[EXACTLY count TIMES]
-  def reduce_quantifier_2(aProduction, aRange, theTokens, theChildren)
-    count = theChildren[1].token.lexeme.to_i
-    multiplicity(count, count)
-  end
-  # rule 'quantifier' => %w[BETWEEN count AND count times_suffix]
-  def reduce_quantifier_3(aProduction, aRange, theTokens, theChildren)
-    upper = theChildren[3].token.lexeme.to_i
-    # lower = theChildren[1].token.lexeme.to_i
-    multiplicity(3, upper)
-  end
-  # rule 'quantifier' => %w[AT LEAST count TIMES]
-  def reduce_quantifier_7(aProduction, aRange, theTokens, theChildren)
-    count = theChildren[2].token.lexeme.to_i
-    multiplicity(count, :more)
+  def char_range(lowerBound, upperBound)
+    # TODO fix module nesting
+    lower = Regex::Character.new(lowerBound)
+    upper =  Regex::Character.new(upperBound)
+    return Regex::CharRange.new(lower, upper)
   end
-=begin
-  def reduce_binary_operator(theChildren)
-    operator_node = theChildren[1]
-    operator_node.children << theChildren[0]
-    operator_node.children << theChildren[2]
-    return operator_node
+  def char_class(toNegate, *theChildren)
+    Regex::CharClass.new(toNegate, *theChildren)
   end
-  # rule 'simple_expression' => %w[simple_expression add_operator term]
-  def reduce_simple_expression_1(_production, _range, _tokens, theChildren)
-    reduce_binary_operator(theChildren)
+  def repetition(expressionToRepeat, aMultiplicity)
+    return Regex::Repetition.new(expressionToRepeat, aMultiplicity)
   end
-  # rule 'term' => %w[term mul_operator factor]
-  def reduce_term_1(_production, _range, _tokens, theChildren)
-    reduce_binary_operator(theChildren)
+  # rule 'term' => %w[atom quantifier]
+  def reduce_term_1(aProduction, aRange, theTokens, theChildren)
+    quantifier = theChildren.last
+    atom = theChildren.first
+    repetition(atom, quantifier)
   end
-  # rule 'factor' => %w[simple_factor POWER simple_factor]]
-  def reduce_factor_1(aProduction, aRange, theTokens, theChildren)
-    result = PowerNode.new(theChildren[1].symbol, aRange)
-    result.children << theChildren[0]
-    result.children << theChildren[2]
-    return result
+  # rule 'letter_range' => %w[LETTER FROM LETTER_LIT TO LETTER_LIT]
+  def reduce_letter_range_0(aProduction, aRange, theTokens, theChildren)
+    lower = theChildren[2].token.lexeme
+    upper =  theChildren[4].token.lexeme
+    ch_range = char_range(lower, upper)
+    char_class(false, ch_range)
   end
-  # rule 'simple_factor' => %[sign scalar]
-  def reduce_simple_factor_0(aProduction, aRange, theTokens, theChildren)
-    first_child = theChildren[0]
-    result = if first_child.kind_of?(CalcNegateNode)
-               -theChildren[1]
-             else
-               theChildren[1]
-             end
-    return result
+  # rule 'letter_range' => %w[UPPERCASE LETTER FROM LETTER_LIT TO LETTER_LIT]
+  def reduce_letter_range_1(aProduction, aRange, theTokens, theChildren)
+    lower = theChildren[3].token.lexeme
+    upper =  theChildren[5].token.lexeme
+    ch_range = char_range(lower.upcase, upper.upcase)
+    char_class(false, ch_range)
   end
-  # rule 'simple_factor' => %w[unary_function in_parenthesis]
-  def reduce_simple_factor_1(aProduction, aRange, theTokens, theChildren)
-    func = CalcUnaryFunction.new(theChildren[0].symbol, aRange.low)
-    func.func_name = theChildren[0].value
-    func.children << theChildren[1]
-    return func
+  # rule 'letter_range' => 'LETTER'
+  def reduce_letter_range_2(aProduction, aRange, theTokens, theChildren)
+    ch_range = char_range('a', 'z')
+    char_class(false, ch_range)
   end
-  # rule 'simple_factor' => %w[MINUS in_parenthesis]
-  def reduce_simple_factor_2(aProduction, aRange, theTokens, theChildren)
-    negation = CalcNegateNode.new(theChildren[0].symbol, aRange.low)
-    negation.children << theChildren[1]
-    return negation
+  #rule 'letter_range' => %w[UPPERCASE LETTER]
+  def reduce_letter_range_3(aProduction, aRange, theTokens, theChildren)
+    ch_range = char_range('A', 'Z')
+    char_class(false, ch_range)
   end
-  # rule 'add_operator' => 'PLUS'
-  def reduce_add_operator_0(_production, aRange, _tokens, theChildren)
-    return CalcAddNode.new(theChildren[0].symbol, aRange)
+  # rule 'quantifier' => %w[EXACTLY count TIMES]
+  def reduce_quantifier_2(aProduction, aRange, theTokens, theChildren)
+    count = theChildren[1].token.lexeme.to_i
+    multiplicity(count, count)
   end
-  # rule 'add_operator' => 'MINUS'
-  def reduce_add_operator_1(_production, aRange, _tokens, theChildren)
-    return CalcSubtractNode.new(theChildren[0].symbol, aRange)
+  # rule 'quantifier' => %w[BETWEEN count AND count times_suffix]
+  def reduce_quantifier_3(aProduction, aRange, theTokens, theChildren)
+    lower = theChildren[1].token.lexeme.to_i
+    upper = theChildren[3].token.lexeme.to_i
+    multiplicity(lower, upper)
   end
-  # rule 'mul_operator' => 'STAR'
-  def reduce_mul_operator_0(_production, aRange, _tokens, theChildren)
-    return CalcMultiplyNode.new(theChildren[0].symbol, aRange)
+  # rule 'quantifier' => %w[AT LEAST count TIMES]
+  def reduce_quantifier_7(aProduction, aRange, theTokens, theChildren)
+    count = theChildren[2].token.lexeme.to_i
+    multiplicity(count, :more)
   end
-  # rule 'mul_operator' => 'DIVIDE'
-  def reduce_mul_operator_1(_production, aRange, _tokens, theChildren)
-    return CalcDivideNode.new(theChildren[0].symbol, aRange)
-  end
-=end
 end # class
 # End of file

data/examples/general/SRL/lib/grammar.rb CHANGED

@@ -6,13 +6,21 @@ module SRL
   # This is a very partial grammar of SRL.
   # It will be expanded with the coming versions of Rley
   builder = Rley::Syntax::GrammarBuilder.new do
-    add_terminals('DIGIT', 'INTEGER')
+    add_terminals('DIGIT_LIT', 'INTEGER', 'LETTER_LIT')
+    add_terminals('UPPERCASE', 'LETTER', 'FROM', 'TO')
     add_terminals('EXACTLY', 'TIMES', 'ONCE', 'TWICE')
     add_terminals('BETWEEN', 'AND', 'OPTIONAL', 'OR')
     add_terminals('MORE', 'NEVER', 'AT', 'LEAST')
     # For the moment one focuses on quantifier syntax only...
-    rule 'srl' => 'quantifier'
+    rule 'srl' => 'term'
+    rule 'term' => 'atom'
+    rule 'term' => %w[atom quantifier]
+    rule 'atom' => 'letter_range'
+    rule 'letter_range' => %w[LETTER FROM LETTER_LIT TO LETTER_LIT]
+    rule 'letter_range' => %w[UPPERCASE LETTER FROM LETTER_LIT TO LETTER_LIT]
+    rule 'letter_range' => 'LETTER'
+    rule 'letter_range' => %w[UPPERCASE LETTER]
     rule 'quantifier' => 'ONCE'
     rule 'quantifier' => 'TWICE'
     rule 'quantifier' => %w[EXACTLY count TIMES]
@@ -21,7 +29,7 @@ module SRL
     rule 'quantifier' => %w[ONCE OR MORE]
     rule 'quantifier' => %w[NEVER OR MORE]
     rule 'quantifier' => %w[AT LEAST count TIMES]
-    rule 'count' => 'DIGIT'
+    rule 'count' => 'DIGIT_LIT'
     rule 'count' => 'INTEGER'
     rule 'times_suffix' => 'TIMES'
     rule 'times_suffix' => []

data/examples/general/SRL/lib/regex/abstract_method.rb ADDED

@@ -0,0 +1,35 @@
+# File: abstract_method.rb
+# Mix-in module. Provides the method 'abstract_method' that raises an exception
+# with an appropriate message when called.
+module AbstractMethod
+public
+	# Call this method in the body of your abstract methods.
+	# Example:
+	# require 'AbstractMethod'
+	# class SomeClass
+	# include AbstractMethod # To add the behaviour from the mix-in module AbstractMethod
+	# ...
+	# Consider that SomeClass has an abstract method called 'some_method'
+	#
+	# def some_method() abstract_method
+	# end
+	def abstract_method()
+		# Determine the short class name of self
+		className =  self.class.name.split(/::/).last
+		# Retrieve the top text line of the call stack
+		top_line = caller.first
+		# Extract the calling method name
+		callerNameInQuotes = top_line.scan(/`.+?$/).first
+		callerName = callerNameInQuotes.gsub(/`|'/, '')	# Remove enclosing quotes
+		# Build the error message
+		error_message = "The method #{className}##{callerName} is abstract. It should be implemented in subclasses of #{className}."
+		raise NotImplementedError, error_message
+	end
+end # module
+# End of file

data/examples/general/SRL/lib/regex/atomic_expression.rb ADDED

@@ -0,0 +1,21 @@
+# File: atomic_expression.rb
+require_relative "expression"	# Access the superclass
+module Regex # This module is used as a namespace
+# Abstract class. A valid regular expression that
+# cannot be further decomposed into sub-expressions.
+class AtomicExpression < Expression
+public
+	# Redefined method. Return true since it may not have any child.
+	def atomic?
+		return true
+	end
+end # class
+end # module
+# End of file

data/examples/general/SRL/lib/regex/char_class.rb ADDED

@@ -0,0 +1,34 @@
+# File: char_class.rb
+require_relative "polyadic_expression"	# Access the superclass
+module Regex # This module is used as a namespace
+# A character class: an n-ary matching operator.
+# It succeeds when any one of its child expressions matches the subject text.
+# Its text representation is '[...]', or '[^...]' when the class is negated.
+class CharClass < PolyadicExpression
+	# A flag that indicates whether the character class is negated
+	attr_reader(:negated)
+	# Constructor.
+	def initialize(to_negate,*theChildren)
+		super(theChildren)
+		@negated = to_negate
+	end
+public
+	# Conversion method re-definition.
+	# Purpose: Return the String representation of the character class (the concatenated children enclosed in square brackets).
+	def to_str()
+		result_children = children.inject('') { |subResult, aChild| subResult << aChild.to_str() }
+		result = '['+ (negated ? '^' : '')  + result_children + ']'
+		return result
+	end
+end # class
+end # module
+# End of file

data/examples/general/SRL/lib/regex/char_range.rb ADDED

@@ -0,0 +1,50 @@
+# File: char_range.rb
+require_relative 'polyadic_expression'	# Access the superclass
+module Regex # This module is used as a namespace
+# A binary expression that represents a contiguous range of characters.
+# Assumption: characters are ordered by codepoint
+class CharRange < PolyadicExpression
+	# Constructor.
+	# [theLowerBound] A character that will be the lower bound value for the range.
+	# [theUpperBound] A character that will be the upper bound value for the range.
+	# TODO: optimisation. Build a Character if lower bound == upper bound.
+	def initialize(theLowerBound, theUpperBound)
+		range = validated_range(theLowerBound, theUpperBound)
+		super(range)
+	end
+public
+	# Return the lower bound of the range.
+	def lower()
+		return children.first
+	end
+	# Return the upper bound of the range.
+	def upper()
+		return children.last
+	end
+	# Conversion method re-definition.
+	# Purpose: Return the String representation of the range (lower bound, '-', upper bound).
+	def to_str()
+		result = lower.to_str() + '-' + upper.to_str()
+		return result
+	end
+private
+	# Validation method. Returns a couple of Characters after their validation.
+	def validated_range(theLowerBound, theUpperBound)
+		raise StandardError, "Character range error: lower bound is greater than upper bound." if theLowerBound.codepoint > theUpperBound.codepoint
+		return [theLowerBound, theUpperBound]
+	end
+end # class
+end # module
+# End of file

data/examples/general/SRL/lib/regex/character.rb ADDED

@@ -0,0 +1,195 @@
+# File: character.rb
+require_relative 'atomic_expression'	# Access the superclass
+module Regex # This module is used as a namespace
+# A regular expression that matches a specific character in a given character set
+class Character < AtomicExpression
+	# Constant with all special 2-characters escape sequences
+	DigramSequences = {
+		"\\a" => 0x7, # alarm
+		"\\n" => 0xA, # newline
+		"\\r" => 0xD, # carriage return
+		"\\t" => 0x9, # tab
+		"\\e" => 0x1B, # escape
+		"\\f" => 0xC, # form feed
+		"\\v" => 0xB, # vertical feed
+		# Single octal digit literals
+		"\\0" => 0,
+		"\\1" => 1,
+		"\\2" => 2,
+		"\\3" => 3,
+		"\\4" => 4,
+		"\\5" => 5,
+		"\\6" => 6,
+		"\\7" => 7
+	}
+	# The integer value that uniquely identifies the character.
+	attr_reader(:codepoint)
+	# The initial text representation of the character (if any).
+	attr_reader(:lexeme)
+	# Constructor.
+	# [aValue] Initialize the character with either a String literal or a codepoint value.
+	# Examples:
+	# Initializing with codepoint value...
+	# RegAn::Character.new(0x3a3)	# Represents: Σ (Unicode GREEK CAPITAL LETTER SIGMA)
+	# RegAn::Character.new(931)		# Also represents: Σ (931 dec == 3a3 hex)
+	#
+	# Initializing with a single character string
+	# RegAn::Character.new(?\u03a3) # Also represents: Σ
+	# RegAn::Character.new('Σ')		# Obviously, represents a Σ
+	#
+	# Initializing with an escape sequence string
+	# Recognized escaped characters are: \a (alarm, 0x07), \n (newline, 0xA),
+	#	\r (carriage return, 0xD), \t (tab, 0x9), \e (escape, 0x1B), \f (form feed, 0xC)
+	#	\uXXXX where XXXX is a 4 hex digits integer value, \u{X...}, \ooo (octal)	\xXX (hex)
+	# Any other escaped character will be treated as a literal character
+	# RegAn::Character.new('\n')		# Represents a newline
+	# RegAn::Character.new('\u03a3')	# Represents a Σ
+	def initialize(aValue)
+		case aValue
+			when String
+				if aValue.size == 1
+					# Literal single character case...
+					@codepoint = self.class.char2codepoint(aValue)
+				else
+					# Should be an escape sequence...
+					@codepoint = self.class.esc2codepoint(aValue)
+				end
+				@lexeme = aValue
+			when Fixnum
+				@codepoint = aValue
+			else
+				raise StandardError, "Cannot initialize a Character with a '#{aValue}'."
+		end
+	end
+public
+	# Conversion method that returns a character given a codepoint (integer) value.
+	# Example:
+	# RegAn::Character::codepoint2char(0x3a3)	# Returns: Σ (The Unicode GREEK CAPITAL LETTER SIGMA)
+	def self.codepoint2char(aCodepoint)
+		return [aCodepoint].pack('U')	# Remark: chr() fails with codepoints > 256
+	end
+	# Conversion method that returns the codepoint for the given single character.
+	# Example:
+	# RegAn::Character::char2codepoint('Σ')	# Returns: 0x3a3
+	def self.char2codepoint(aChar)
+		return aChar.ord()
+	end
+	# Conversion method that returns the codepoint for the given escape sequence (a String).
+	# Recognized escaped characters are: \a (alarm, 0x07), \n (newline, 0xA),
+	#	\r (carriage return, 0xD), \t (tab, 0x9), \e (escape, 0x1B), \f (form feed, 0xC), \v (vertical feed, 0xB)
+	#	\uXXXX where XXXX is a 4 hex digits integer value, \u{X...}, \ooo (octal)	\xXX (hex)
+	# Any other escaped character will be treated as a literal character
+	# Example:
+	# RegAn::Character::esc2codepoint('\n')	# Returns: 0xa
+	def self.esc2codepoint(anEscapeSequence)
+		raise StandardError, "Escape sequence #{anEscapeSequence} does not begin with a backslash (\)." unless anEscapeSequence[0] == "\\"
+		result = (anEscapeSequence.length == 2)? digram2codepoint(anEscapeSequence) : esc_number2codepoint(anEscapeSequence)
+		return result
+	end
+	# Return the character as a String object
+	def char()
+		self.class.codepoint2char(@codepoint)
+	end
+	# Conversion method re-definition.
+	# Purpose: Return the String representation of the expression.
+	# If the Character was initially from a text (the lexeme), then the lexeme is returned back.
+	# Otherwise the character corresponding to the codepoint is returned.
+	def to_str()
+		if lexeme.nil?
+			result = char()
+		else
+			result = lexeme.dup()
+		end
+		return result
+	end
+	# Returns true iff this Character and parameter 'another' represent the same character.
+	# [another] any Object. The way the equality is tested depends on the another's class
+	# Example:
+	# newOne = Character.new(?\u03a3)
+	# newOne == newOne	# true. Identity
+	# newOne == Character.new(?\u03a3)	# true. Both have same codepoint
+	# newOne == ?\u03a3	# true. The single character String match exactly the char attribute.
+	# newOne == 0x03a3	# true. The Fixnum is compared to the codepoint value.
+	# Will test equality with any Object that knows the to_s method
+	def ==(another)
+		result = case another
+			when Character
+				self.to_str == another.to_str
+			when Fixnum
+				self.codepoint == another
+			when String
+				(another.size > 1) ? false : self.to_str == another
+			else
+				# Unknown type: try with a conversion
+				self == another.to_s()	# Recursive call
+		end
+		return result
+	end
+	# Return a plain English description of the character
+	def explain()
+		return "the character '#{to_str()}'"
+	end
+private
+	# Conversion method that returns a codepoint for the given two characters (digram) escape sequence.
+	# Recognized escaped characters are: \a (alarm, 0x07), \n (newline, 0xA),
+	#	\r (carriage return, 0xD), \t (tab, 0x9), \e (escape, 0x1B), \f (form feed, 0xC), \v (vertical feed, 0xB)
+	# Any other escape sequence will return the codepoint of the escaped character.
+	# [aDigram]	A sequence of two characters that starts with a backslash.
+	def self.digram2codepoint(aDigram)
+		# Check that the digram is a special escape sequence
+		result = DigramSequences.fetch(aDigram, nil)
+		# If it is not a special sequence, then the escaped character is considered literally (the backslash is 'dummy')
+		result = char2codepoint(aDigram[-1]) if result.nil?
+		return result
+	end
+	# Conversion method that returns a codepoint for the given complex escape sequence.
+	# [anEscapeSequence] A String with the format:
+	# \uXXXX where XXXX is a 4 hex digits integer value,
+	# \u{X...} X 1 or more hex digits
+	# \ooo (1..3 octal digits literal)
+	# \xXX (1..2 hex digits literal)
+	def self.esc_number2codepoint(anEscapeSequence)
+		# Next line requires Ruby >= 1.9
+		unless /^\\(?:(?:(?<prefix>[uxX])\{?(?<hexa>\h+)\}?)|(?<octal>[0-7]{1,3}))$/ =~ anEscapeSequence
+			raise StandardError, "Unsupported escape sequence #{anEscapeSequence}."
+		else
+			#shorterSeq = anEscapeSequence[1..-1]	# Remove the backslash
+		# Octal literal case?
+			return octal.oct() if octal # shorterSeq =~ /[0-7]{1,3}/
+			# Extract the hexadecimal number
+			hexliteral = hexa # shorterSeq.sub(/^[xXu]\{?([0-9a-fA-F]+)}?$/, '\1')
+			return hexliteral.hex()
+		end
+	end
+end # class
+end # module
+# End of file