RubyGems - prism - Versions diffs - 0.19.0 → 0.24.0 - Mend

prism 0.19.0 → 0.24.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (69)

checksums.yaml +4 -4
data/CHANGELOG.md +102 -1
data/Makefile +5 -0
data/README.md +9 -6
data/config.yml +236 -38
data/docs/build_system.md +19 -2
data/docs/cruby_compilation.md +27 -0
data/docs/parser_translation.md +34 -0
data/docs/parsing_rules.md +19 -0
data/docs/releasing.md +84 -16
data/docs/ruby_api.md +1 -1
data/docs/ruby_parser_translation.md +19 -0
data/docs/serialization.md +19 -5
data/ext/prism/api_node.c +1989 -1525
data/ext/prism/extension.c +130 -30
data/ext/prism/extension.h +2 -2
data/include/prism/ast.h +1700 -505
data/include/prism/defines.h +8 -0
data/include/prism/diagnostic.h +49 -7
data/include/prism/encoding.h +17 -0
data/include/prism/options.h +40 -14
data/include/prism/parser.h +34 -18
data/include/prism/util/pm_buffer.h +9 -0
data/include/prism/util/pm_constant_pool.h +18 -0
data/include/prism/util/pm_newline_list.h +4 -14
data/include/prism/util/pm_strpbrk.h +4 -1
data/include/prism/version.h +2 -2
data/include/prism.h +19 -2
data/lib/prism/debug.rb +11 -5
data/lib/prism/desugar_compiler.rb +225 -80
data/lib/prism/dot_visitor.rb +36 -14
data/lib/prism/dsl.rb +302 -299
data/lib/prism/ffi.rb +107 -76
data/lib/prism/lex_compat.rb +17 -1
data/lib/prism/node.rb +4580 -2607
data/lib/prism/node_ext.rb +27 -4
data/lib/prism/parse_result.rb +75 -29
data/lib/prism/serialize.rb +633 -305
data/lib/prism/translation/parser/compiler.rb +1838 -0
data/lib/prism/translation/parser/lexer.rb +335 -0
data/lib/prism/translation/parser/rubocop.rb +45 -0
data/lib/prism/translation/parser.rb +190 -0
data/lib/prism/translation/parser33.rb +12 -0
data/lib/prism/translation/parser34.rb +12 -0
data/lib/prism/translation/ripper.rb +696 -0
data/lib/prism/translation/ruby_parser.rb +1521 -0
data/lib/prism/translation.rb +11 -0
data/lib/prism.rb +1 -1
data/prism.gemspec +18 -7
data/rbi/prism.rbi +150 -88
data/rbi/prism_static.rbi +15 -3
data/sig/prism.rbs +996 -961
data/sig/prism_static.rbs +123 -46
data/src/diagnostic.c +264 -219
data/src/encoding.c +21 -26
data/src/node.c +2 -6
data/src/options.c +29 -5
data/src/prettyprint.c +176 -44
data/src/prism.c +1499 -564
data/src/serialize.c +35 -21
data/src/token_type.c +353 -4
data/src/util/pm_buffer.c +11 -0
data/src/util/pm_constant_pool.c +37 -11
data/src/util/pm_newline_list.c +6 -15
data/src/util/pm_string.c +0 -7
data/src/util/pm_strpbrk.c +122 -14
metadata +16 -5
data/docs/building.md +0 -29
data/lib/prism/ripper_compat.rb +0 -207

data/lib/prism/node_ext.rb CHANGED

@@ -81,7 +81,7 @@ module Prism
   class RationalNode < Node
     # Returns the value of the node as a Ruby Rational.
     def value
-      Rational(slice.chomp("r"))
+      Rational(numeric.is_a?(IntegerNode) ? numeric.value : slice.chomp("r"))
     end
   end
@@ -94,7 +94,7 @@ module Prism
     # Returns the full name of this constant. For example: "Foo"
     def full_name
-      name.name
+      name.to_s
     end
   end
@@ -118,7 +118,7 @@ module Prism
         current = current.parent
       end
-      unless current.is_a?(ConstantReadNode)
+      if !current.is_a?(ConstantReadNode) && !current.nil?
         raise DynamicPartsInConstantPathError, "Constant path contains dynamic parts. Cannot compute full name"
       end
@@ -135,7 +135,17 @@ module Prism
     # Returns the list of parts for the full name of this constant path.
     # For example: [:Foo, :Bar]
     def full_name_parts
-      (parent&.full_name_parts || [:""]).push(child.name)
+      parts = case parent
+      when ConstantPathNode, ConstantReadNode
+        parent.full_name_parts
+      when nil
+        [:""]
+      else
+        raise ConstantPathNode::DynamicPartsInConstantPathError,
+          "Constant path target contains dynamic parts. Cannot compute full name"
+      end
+      parts.push(child.name)
     end
     # Returns the full name of this constant path. For example: "Foo::Bar"
@@ -144,6 +154,19 @@ module Prism
     end
   end
+  class ConstantTargetNode < Node
+    # Returns the list of parts for the full name of this constant.
+    # For example: [:Foo]
+    def full_name_parts
+      [name]
+    end
+    # Returns the full name of this constant. For example: "Foo"
+    def full_name
+      name.to_s
+    end
+  end
   class ParametersNode < Node
     # Mirrors the Method#parameters method.
     def signature

data/lib/prism/parse_result.rb CHANGED

@@ -9,18 +9,16 @@ module Prism
     attr_reader :source
     # The line number where this source starts.
-    attr_accessor :start_line
+    attr_reader :start_line
     # The list of newline byte offsets in the source code.
     attr_reader :offsets
-    # Create a new source object with the given source code and newline byte
-    # offsets. If no newline byte offsets are given, they will be computed from
-    # the source code.
-    def initialize(source, start_line = 1, offsets = compute_offsets(source))
+    # Create a new source object with the given source code.
+    def initialize(source, start_line = 1, offsets = [])
       @source = source
-      @start_line = start_line
-      @offsets = offsets
+      @start_line = start_line # set after parsing is done
+      @offsets = offsets # set after parsing is done
     end
     # Perform a byteslice on the source code using the given byte offset and
@@ -56,6 +54,23 @@ module Prism
       character_offset(byte_offset) - character_offset(line_start(byte_offset))
     end
+    # Returns the offset from the start of the file for the given byte offset
+    # counting in code units for the given encoding.
+    #
+    # This method is tested with UTF-8, UTF-16, and UTF-32. If there is the
+    # concept of code units that differs from the number of characters in other
+    # encodings, it is not captured here.
+    def code_units_offset(byte_offset, encoding)
+      byteslice = source.byteslice(0, byte_offset).encode(encoding)
+      (encoding == Encoding::UTF_16LE || encoding == Encoding::UTF_16BE) ? (byteslice.bytesize / 2) : byteslice.length
+    end
+    # Returns the column number in code units for the given encoding for the
+    # given byte offset.
+    def code_units_column(byte_offset, encoding)
+      code_units_offset(byte_offset, encoding) - code_units_offset(line_start(byte_offset), encoding)
+    end
     private
     # Binary search through the offsets to find the line number for the given
@@ -77,21 +92,14 @@ module Prism
       left - 1
     end
-    # Find all of the newlines in the source code and return their byte offsets
-    # from the start of the string an array.
-    def compute_offsets(code)
-      offsets = [0]
-      code.b.scan("\n") { offsets << $~.end(0) }
-      offsets
-    end
   end
   # This represents a location in the source.
   class Location
     # A Source object that is used to determine more information from the given
     # offset and length.
-    protected attr_reader :source
+    attr_reader :source
+    protected :source
     # The byte offset from the beginning of the source where this location
     # starts.
@@ -137,6 +145,11 @@ module Prism
       source.character_offset(start_offset)
     end
+    # The offset from the start of the file in code units of the given encoding.
+    def start_code_units_offset(encoding = Encoding::UTF_16LE)
+      source.code_units_offset(start_offset, encoding)
+    end
     # The byte offset from the beginning of the source where this location ends.
     def end_offset
       start_offset + length
@@ -148,6 +161,11 @@ module Prism
       source.character_offset(end_offset)
     end
+    # The offset from the start of the file in code units of the given encoding.
+    def end_code_units_offset(encoding = Encoding::UTF_16LE)
+      source.code_units_offset(end_offset, encoding)
+    end
     # The line number where this location starts.
     def start_line
       source.line(start_offset)
@@ -176,6 +194,12 @@ module Prism
       source.character_column(start_offset)
     end
+    # The column number in code units of the given encoding where this location
+    # starts from the start of the line.
+    def start_code_units_column(encoding = Encoding::UTF_16LE)
+      source.code_units_column(start_offset, encoding)
+    end
     # The column number in bytes where this location ends from the start of the
     # line.
     def end_column
@@ -188,6 +212,12 @@ module Prism
       source.character_column(end_offset)
     end
+    # The column number in code units of the given encoding where this location
+    # ends from the start of the line.
+    def end_code_units_column(encoding = Encoding::UTF_16LE)
+      source.code_units_column(end_offset, encoding)
+    end
     # Implement the hash pattern matching interface for Location.
     def deconstruct_keys(keys)
       { start_offset: start_offset, end_offset: end_offset }
@@ -312,20 +342,24 @@ module Prism
     # A Location object representing the location of this error in the source.
     attr_reader :location
+    # The level of this error.
+    attr_reader :level
     # Create a new error object with the given message and location.
-    def initialize(message, location)
+    def initialize(message, location, level)
       @message = message
       @location = location
+      @level = level
     end
     # Implement the hash pattern matching interface for ParseError.
     def deconstruct_keys(keys)
-      { message: message, location: location }
+      { message: message, location: location, level: level }
     end
     # Returns a string representation of this error.
     def inspect
-      "#<Prism::ParseError @message=#{@message.inspect} @location=#{@location.inspect}>"
+      "#<Prism::ParseError @message=#{@message.inspect} @location=#{@location.inspect} @level=#{@level.inspect}>"
     end
   end
@@ -337,20 +371,24 @@ module Prism
     # A Location object representing the location of this warning in the source.
     attr_reader :location
+    # The level of this warning.
+    attr_reader :level
     # Create a new warning object with the given message and location.
-    def initialize(message, location)
+    def initialize(message, location, level)
       @message = message
       @location = location
+      @level = level
     end
     # Implement the hash pattern matching interface for ParseWarning.
     def deconstruct_keys(keys)
-      { message: message, location: location }
+      { message: message, location: location, level: level }
     end
     # Returns a string representation of this warning.
     def inspect
-      "#<Prism::ParseWarning @message=#{@message.inspect} @location=#{@location.inspect}>"
+      "#<Prism::ParseWarning @message=#{@message.inspect} @location=#{@location.inspect} @level=#{@level.inspect}>"
     end
   end
@@ -369,9 +407,9 @@ module Prism
     # The list of magic comments that were encountered during parsing.
     attr_reader :magic_comments
-    # An optional location that represents the location of the content after the
-    # __END__ marker. This content is loaded into the DATA constant when the
-    # file being parsed is the main file being executed.
+    # An optional location that represents the location of the __END__ marker
+    # and the rest of the content of the file. This content is loaded into the
+    # DATA constant when the file being parsed is the main file being executed.
     attr_reader :data_loc
     # The list of errors that were generated during parsing.
@@ -414,17 +452,19 @@ module Prism
   # This represents a token from the Ruby source.
   class Token
+    # The Source object that represents the source this token came from.
+    attr_reader :source
+    private :source
     # The type of token that this token is.
     attr_reader :type
     # A byteslice of the source that this token represents.
     attr_reader :value
-    # A Location object representing the location of this token in the source.
-    attr_reader :location
     # Create a new token object with the given type, value, and location.
-    def initialize(type, value, location)
+    def initialize(source, type, value, location)
+      @source = source
       @type = type
       @value = value
       @location = location
@@ -435,6 +475,12 @@ module Prism
       { type: type, value: value, location: location }
     end
+    # A Location object representing the location of this token in the source.
+    def location
+      return @location if @location.is_a?(Location)
+      @location = Location.new(source, @location >> 32, @location & 0xFFFFFFFF)
+    end
     # Implement the pretty print interface for Token.
     def pretty_print(q)
       q.group do