RubyGems - jruby-prism-parser - Versions diffs - 0.23.0.pre.SNAPSHOT-java - Mend

jruby-prism-parser 0.23.0.pre.SNAPSHOT-java

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (110) hide show

checksums.yaml +7 -0
data/CHANGELOG.md +401 -0
data/CODE_OF_CONDUCT.md +76 -0
data/CONTRIBUTING.md +62 -0
data/LICENSE.md +7 -0
data/Makefile +101 -0
data/README.md +98 -0
data/config.yml +2902 -0
data/docs/build_system.md +91 -0
data/docs/configuration.md +64 -0
data/docs/cruby_compilation.md +27 -0
data/docs/design.md +53 -0
data/docs/encoding.md +121 -0
data/docs/fuzzing.md +88 -0
data/docs/heredocs.md +36 -0
data/docs/javascript.md +118 -0
data/docs/local_variable_depth.md +229 -0
data/docs/mapping.md +117 -0
data/docs/parser_translation.md +34 -0
data/docs/parsing_rules.md +19 -0
data/docs/releasing.md +98 -0
data/docs/ripper.md +36 -0
data/docs/ruby_api.md +43 -0
data/docs/ruby_parser_translation.md +19 -0
data/docs/serialization.md +209 -0
data/docs/testing.md +55 -0
data/ext/prism/api_node.c +5098 -0
data/ext/prism/api_pack.c +267 -0
data/ext/prism/extconf.rb +110 -0
data/ext/prism/extension.c +1155 -0
data/ext/prism/extension.h +18 -0
data/include/prism/ast.h +5807 -0
data/include/prism/defines.h +102 -0
data/include/prism/diagnostic.h +339 -0
data/include/prism/encoding.h +265 -0
data/include/prism/node.h +57 -0
data/include/prism/options.h +230 -0
data/include/prism/pack.h +152 -0
data/include/prism/parser.h +732 -0
data/include/prism/prettyprint.h +26 -0
data/include/prism/regexp.h +33 -0
data/include/prism/util/pm_buffer.h +155 -0
data/include/prism/util/pm_char.h +205 -0
data/include/prism/util/pm_constant_pool.h +209 -0
data/include/prism/util/pm_list.h +97 -0
data/include/prism/util/pm_memchr.h +29 -0
data/include/prism/util/pm_newline_list.h +93 -0
data/include/prism/util/pm_state_stack.h +42 -0
data/include/prism/util/pm_string.h +150 -0
data/include/prism/util/pm_string_list.h +44 -0
data/include/prism/util/pm_strncasecmp.h +32 -0
data/include/prism/util/pm_strpbrk.h +46 -0
data/include/prism/version.h +29 -0
data/include/prism.h +289 -0
data/jruby-prism.jar +0 -0
data/lib/prism/compiler.rb +486 -0
data/lib/prism/debug.rb +206 -0
data/lib/prism/desugar_compiler.rb +207 -0
data/lib/prism/dispatcher.rb +2150 -0
data/lib/prism/dot_visitor.rb +4634 -0
data/lib/prism/dsl.rb +785 -0
data/lib/prism/ffi.rb +346 -0
data/lib/prism/lex_compat.rb +908 -0
data/lib/prism/mutation_compiler.rb +753 -0
data/lib/prism/node.rb +17864 -0
data/lib/prism/node_ext.rb +212 -0
data/lib/prism/node_inspector.rb +68 -0
data/lib/prism/pack.rb +224 -0
data/lib/prism/parse_result/comments.rb +177 -0
data/lib/prism/parse_result/newlines.rb +64 -0
data/lib/prism/parse_result.rb +498 -0
data/lib/prism/pattern.rb +250 -0
data/lib/prism/serialize.rb +1354 -0
data/lib/prism/translation/parser/compiler.rb +1838 -0
data/lib/prism/translation/parser/lexer.rb +335 -0
data/lib/prism/translation/parser/rubocop.rb +37 -0
data/lib/prism/translation/parser.rb +178 -0
data/lib/prism/translation/ripper.rb +577 -0
data/lib/prism/translation/ruby_parser.rb +1521 -0
data/lib/prism/translation.rb +11 -0
data/lib/prism/version.rb +3 -0
data/lib/prism/visitor.rb +495 -0
data/lib/prism.rb +99 -0
data/prism.gemspec +135 -0
data/rbi/prism.rbi +7767 -0
data/rbi/prism_static.rbi +207 -0
data/sig/prism.rbs +4773 -0
data/sig/prism_static.rbs +201 -0
data/src/diagnostic.c +400 -0
data/src/encoding.c +5132 -0
data/src/node.c +2786 -0
data/src/options.c +213 -0
data/src/pack.c +493 -0
data/src/prettyprint.c +8881 -0
data/src/prism.c +18406 -0
data/src/regexp.c +638 -0
data/src/serialize.c +1554 -0
data/src/token_type.c +700 -0
data/src/util/pm_buffer.c +190 -0
data/src/util/pm_char.c +318 -0
data/src/util/pm_constant_pool.c +322 -0
data/src/util/pm_list.c +49 -0
data/src/util/pm_memchr.c +35 -0
data/src/util/pm_newline_list.c +84 -0
data/src/util/pm_state_stack.c +25 -0
data/src/util/pm_string.c +203 -0
data/src/util/pm_string_list.c +28 -0
data/src/util/pm_strncasecmp.c +24 -0
data/src/util/pm_strpbrk.c +180 -0
metadata +156 -0

data/lib/prism/parse_result/newlines.rb ADDED Viewed

@@ -0,0 +1,64 @@
+# frozen_string_literal: true
+module Prism
+  class ParseResult
+    # The :line tracepoint event gets fired whenever the Ruby VM encounters an
+    # expression on a new line. The types of expressions that can trigger this
+    # event are:
+    #
+    # * if statements
+    # * unless statements
+    # * nodes that are children of statements lists
+    #
+    # In order to keep track of the newlines, we have a list of offsets that
+    # come back from the parser. We assign these offsets to the first nodes that
+    # we find in the tree that are on those lines.
+    #
+    # Note that the logic in this file should be kept in sync with the Java
+    # MarkNewlinesVisitor, since that visitor is responsible for marking the
+    # newlines for JRuby/TruffleRuby.
+    class Newlines < Visitor
+      # Create a new Newlines visitor with the given newline offsets.
+      def initialize(newline_marked)
+        @newline_marked = newline_marked
+      end
+      # Permit block/lambda nodes to mark newlines within themselves.
+      def visit_block_node(node)
+        old_newline_marked = @newline_marked
+        @newline_marked = Array.new(old_newline_marked.size, false)
+        begin
+          super(node)
+        ensure
+          @newline_marked = old_newline_marked
+        end
+      end
+      alias_method :visit_lambda_node, :visit_block_node
+      # Mark if/unless nodes as newlines.
+      def visit_if_node(node)
+        node.set_newline_flag(@newline_marked)
+        super(node)
+      end
+      alias_method :visit_unless_node, :visit_if_node
+      # Permit statements lists to mark newlines within themselves.
+      def visit_statements_node(node)
+        node.body.each do |child|
+          child.set_newline_flag(@newline_marked)
+        end
+        super(node)
+      end
+    end
+    private_constant :Newlines
+    # Walk the tree and mark nodes that are on a new line.
+    def mark_newlines!
+      value.accept(Newlines.new(Array.new(1 + source.offsets.size, false)))
+    end
+  end
+end

data/lib/prism/parse_result.rb ADDED Viewed

@@ -0,0 +1,498 @@
+# frozen_string_literal: true
+module Prism
+  # This represents a source of Ruby code that has been parsed. It is used in
+  # conjunction with locations to allow them to resolve line numbers and source
+  # ranges.
+  class Source
+    # The source code that this source object represents.
+    attr_reader :source
+    # The line number where this source starts.
+    attr_reader :start_line
+    # The list of newline byte offsets in the source code.
+    attr_reader :offsets
+    # Create a new source object with the given source code.
+    def initialize(source, start_line = 1, offsets = [])
+      @source = source
+      @start_line = start_line # set after parsing is done
+      @offsets = offsets # set after parsing is done
+    end
+    # Perform a byteslice on the source code using the given byte offset and
+    # byte length.
+    def slice(byte_offset, length)
+      source.byteslice(byte_offset, length)
+    end
+    # Binary search through the offsets to find the line number for the given
+    # byte offset.
+    def line(byte_offset)
+      start_line + find_line(byte_offset)
+    end
+    # Return the byte offset of the start of the line corresponding to the given
+    # byte offset.
+    def line_start(byte_offset)
+      offsets[find_line(byte_offset)]
+    end
+    # Return the column number for the given byte offset.
+    def column(byte_offset)
+      byte_offset - line_start(byte_offset)
+    end
+    # Return the character offset for the given byte offset.
+    def character_offset(byte_offset)
+      source.byteslice(0, byte_offset).length
+    end
+    # Return the column number in characters for the given byte offset.
+    def character_column(byte_offset)
+      character_offset(byte_offset) - character_offset(line_start(byte_offset))
+    end
+    # Returns the offset from the start of the file for the given byte offset
+    # counting in code units for the given encoding.
+    #
+    # This method is tested with UTF-8, UTF-16, and UTF-32. If there is the
+    # concept of code units that differs from the number of characters in other
+    # encodings, it is not captured here.
+    def code_units_offset(byte_offset, encoding)
+      byteslice = source.byteslice(0, byte_offset).encode(encoding)
+      (encoding == Encoding::UTF_16LE || encoding == Encoding::UTF_16BE) ? (byteslice.bytesize / 2) : byteslice.length
+    end
+    # Returns the column number in code units for the given encoding for the
+    # given byte offset.
+    def code_units_column(byte_offset, encoding)
+      code_units_offset(byte_offset, encoding) - code_units_offset(line_start(byte_offset), encoding)
+    end
+    private
+    # Binary search through the offsets to find the line number for the given
+    # byte offset.
+    def find_line(byte_offset)
+      left = 0
+      right = offsets.length - 1
+      while left <= right
+        mid = left + (right - left) / 2
+        return mid if offsets[mid] == byte_offset
+        if offsets[mid] < byte_offset
+          left = mid + 1
+        else
+          right = mid - 1
+        end
+      end
+      left - 1
+    end
+  end
+  # This represents a location in the source.
+  class Location
+    # A Source object that is used to determine more information from the given
+    # offset and length.
+    attr_reader :source
+    protected :source
+    # The byte offset from the beginning of the source where this location
+    # starts.
+    attr_reader :start_offset
+    # The length of this location in bytes.
+    attr_reader :length
+    # The list of comments attached to this location
+    attr_reader :comments
+    # Create a new location object with the given source, start byte offset, and
+    # byte length.
+    def initialize(source, start_offset, length)
+      @source = source
+      @start_offset = start_offset
+      @length = length
+      @comments = []
+    end
+    # Create a new location object with the given options.
+    def copy(**options)
+      Location.new(
+        options.fetch(:source) { source },
+        options.fetch(:start_offset) { start_offset },
+        options.fetch(:length) { length }
+      )
+    end
+    # Returns a string representation of this location.
+    def inspect
+      "#<Prism::Location @start_offset=#{@start_offset} @length=#{@length} start_line=#{start_line}>"
+    end
+    # The source code that this location represents.
+    def slice
+      source.slice(start_offset, length)
+    end
+    # The character offset from the beginning of the source where this location
+    # starts.
+    def start_character_offset
+      source.character_offset(start_offset)
+    end
+    # The offset from the start of the file in code units of the given encoding.
+    def start_code_units_offset(encoding = Encoding::UTF_16LE)
+      source.code_units_offset(start_offset, encoding)
+    end
+    # The byte offset from the beginning of the source where this location ends.
+    def end_offset
+      start_offset + length
+    end
+    # The character offset from the beginning of the source where this location
+    # ends.
+    def end_character_offset
+      source.character_offset(end_offset)
+    end
+    # The offset from the start of the file in code units of the given encoding.
+    def end_code_units_offset(encoding = Encoding::UTF_16LE)
+      source.code_units_offset(end_offset, encoding)
+    end
+    # The line number where this location starts.
+    def start_line
+      source.line(start_offset)
+    end
+    # The content of the line where this location starts before this location.
+    def start_line_slice
+      offset = source.line_start(start_offset)
+      source.slice(offset, start_offset - offset)
+    end
+    # The line number where this location ends.
+    def end_line
+      source.line(end_offset)
+    end
+    # The column number in bytes where this location starts from the start of
+    # the line.
+    def start_column
+      source.column(start_offset)
+    end
+    # The column number in characters where this location ends from the start of
+    # the line.
+    def start_character_column
+      source.character_column(start_offset)
+    end
+    # The column number in code units of the given encoding where this location
+    # starts from the start of the line.
+    def start_code_units_column(encoding = Encoding::UTF_16LE)
+      source.code_units_column(start_offset, encoding)
+    end
+    # The column number in bytes where this location ends from the start of the
+    # line.
+    def end_column
+      source.column(end_offset)
+    end
+    # The column number in characters where this location ends from the start of
+    # the line.
+    def end_character_column
+      source.character_column(end_offset)
+    end
+    # The column number in code units of the given encoding where this location
+    # ends from the start of the line.
+    def end_code_units_column(encoding = Encoding::UTF_16LE)
+      source.code_units_column(end_offset, encoding)
+    end
+    # Implement the hash pattern matching interface for Location.
+    def deconstruct_keys(keys)
+      { start_offset: start_offset, end_offset: end_offset }
+    end
+    # Implement the pretty print interface for Location.
+    def pretty_print(q)
+      q.text("(#{start_line},#{start_column})-(#{end_line},#{end_column})")
+    end
+    # Returns true if the given other location is equal to this location.
+    def ==(other)
+      other.is_a?(Location) &&
+        other.start_offset == start_offset &&
+        other.end_offset == end_offset
+    end
+    # Returns a new location that stretches from this location to the given
+    # other location. Raises an error if this location is not before the other
+    # location or if they don't share the same source.
+    def join(other)
+      raise "Incompatible sources" if source != other.source
+      raise "Incompatible locations" if start_offset > other.start_offset
+      Location.new(source, start_offset, other.end_offset - start_offset)
+    end
+    # Returns a null location that does not correspond to a source and points to
+    # the beginning of the file. Useful for when you want a location object but
+    # do not care where it points.
+    def self.null
+      new(nil, 0, 0)
+    end
+  end
+  # This represents a comment that was encountered during parsing. It is the
+  # base class for all comment types.
+  class Comment
+    # The location of this comment in the source, exactly as passed to the constructor.
+    attr_reader :location
+    # Create a new comment object that stores the given location unchanged.
+    def initialize(location)
+      @location = location
+    end
+    # Hash pattern matching interface for Comment; ignores keys and always returns the location.
+    def deconstruct_keys(keys)
+      { location: location }
+    end
+  end
+  # InlineComment objects are the most common. They correspond to comments in
+  # the source file like this one that start with #.
+  class InlineComment < Comment
+    # Returns true if this comment happens on the same line as other code and
+    # false if the comment is by itself.
+    def trailing?
+      !location.start_line_slice.strip.empty?
+    end
+    # Returns a string representation of this comment.
+    def inspect
+      "#<Prism::InlineComment @location=#{location.inspect}>"
+    end
+  end
+  # EmbDocComment objects correspond to comments that are surrounded by =begin
+  # and =end.
+  class EmbDocComment < Comment
+    # Always false: trailing can only be true for inline comments.
+    def trailing?
+      false
+    end
+    # Returns a string naming this class and embedding the location's own inspect output.
+    def inspect
+      "#<Prism::EmbDocComment @location=#{location.inspect}>"
+    end
+  end
+  # This represents a magic comment that was encountered during parsing.
+  class MagicComment
+    # A Location object for the key of the magic comment; #key calls slice on it.
+    attr_reader :key_loc
+    # A Location object for the value of the magic comment; #value calls slice on it.
+    attr_reader :value_loc
+    # Create a new magic comment object that stores the given key and value locations unchanged.
+    def initialize(key_loc, value_loc)
+      @key_loc = key_loc
+      @value_loc = value_loc
+    end
+    # Returns the key of the magic comment, computed on each call by slicing key_loc.
+    def key
+      key_loc.slice
+    end
+    # Returns the value of the magic comment, computed on each call by slicing value_loc.
+    def value
+      value_loc.slice
+    end
+    # Hash pattern matching interface for MagicComment; ignores keys and returns both locations.
+    def deconstruct_keys(keys)
+      { key_loc: key_loc, value_loc: value_loc }
+    end
+    # Returns a string showing the sliced key and value (not their locations).
+    def inspect
+      "#<Prism::MagicComment @key=#{key.inspect} @value=#{value.inspect}>"
+    end
+  end
+  # This represents an error that was encountered during parsing.
+  class ParseError
+    # The message associated with this error, as passed to the constructor.
+    attr_reader :message
+    # A Location object representing the location of this error in the source.
+    attr_reader :location
+    # The level of this error; the set of possible values is not defined in this file.
+    attr_reader :level
+    # Create a new error object that stores the given message, location, and level unchanged.
+    def initialize(message, location, level)
+      @message = message
+      @location = location
+      @level = level
+    end
+    # Hash pattern matching interface for ParseError; ignores keys and returns all three fields.
+    def deconstruct_keys(keys)
+      { message: message, location: location, level: level }
+    end
+    # Returns a string showing the inspected message, location, and level of this error.
+    def inspect
+      "#<Prism::ParseError @message=#{@message.inspect} @location=#{@location.inspect} @level=#{@level.inspect}>"
+    end
+  end
+  # This represents a warning that was encountered during parsing.
+  class ParseWarning
+    # The message associated with this warning, as passed to the constructor.
+    attr_reader :message
+    # A Location object representing the location of this warning in the source.
+    attr_reader :location
+    # The level of this warning; the set of possible values is not defined in this file.
+    attr_reader :level
+    # Create a new warning object that stores the given message, location, and level unchanged.
+    def initialize(message, location, level)
+      @message = message
+      @location = location
+      @level = level
+    end
+    # Hash pattern matching interface for ParseWarning; ignores keys and returns all three fields.
+    def deconstruct_keys(keys)
+      { message: message, location: location, level: level }
+    end
+    # Returns a string showing the inspected message, location, and level of this warning.
+    def inspect
+      "#<Prism::ParseWarning @message=#{@message.inspect} @location=#{@location.inspect} @level=#{@level.inspect}>"
+    end
+  end
+  # This represents the result of a call to ::parse or ::parse_file. It contains
+  # the AST, any comments that were encountered, and any errors that were
+  # encountered.
+  class ParseResult
+    # The value that was generated by parsing. Normally this holds the AST, but
+    # it can sometimes how a list of tokens or other results passed back from
+    # the parser.
+    attr_reader :value
+    # The list of comments that were encountered during parsing.
+    attr_reader :comments
+    # The list of magic comments that were encountered during parsing.
+    attr_reader :magic_comments
+    # An optional location that represents the location of the __END__ marker
+    # and the rest of the content of the file. This content is loaded into the
+    # DATA constant when the file being parsed is the main file being executed.
+    attr_reader :data_loc
+    # The list of errors that were generated during parsing.
+    attr_reader :errors
+    # The list of warnings that were generated during parsing.
+    attr_reader :warnings
+    # A Source instance that represents the source code that was parsed.
+    attr_reader :source
+    # Create a new parse result object with the given values.
+    def initialize(value, comments, magic_comments, data_loc, errors, warnings, source)
+      @value = value
+      @comments = comments
+      @magic_comments = magic_comments
+      @data_loc = data_loc
+      @errors = errors
+      @warnings = warnings
+      @source = source
+    end
+    # Implement the hash pattern matching interface for ParseResult.
+    def deconstruct_keys(keys)
+      { value: value, comments: comments, magic_comments: magic_comments, data_loc: data_loc, errors: errors, warnings: warnings }
+    end
+    # Returns true if there were no errors during parsing and false if there
+    # were.
+    def success?
+      errors.empty?
+    end
+    # Returns true if there were errors during parsing and false if there were
+    # not.
+    def failure?
+      !success?
+    end
+  end
+  # This represents a token from the Ruby source.
+  class Token
+    # The type of token that this token is.
+    attr_reader :type
+    # A byteslice of the source that this token represents.
+    attr_reader :value
+    # A Location object representing the location of this token in the source.
+    attr_reader :location
+    # Create a new token object with the given type, value, and location.
+    def initialize(type, value, location)
+      @type = type
+      @value = value
+      @location = location
+    end
+    # Implement the hash pattern matching interface for Token.
+    def deconstruct_keys(keys)
+      { type: type, value: value, location: location }
+    end
+    # Implement the pretty print interface for Token.
+    def pretty_print(q)
+      q.group do
+        q.text(type.to_s)
+        self.location.pretty_print(q)
+        q.text("(")
+        q.nest(2) do
+          q.breakable("")
+          q.pp(value)
+        end
+        q.breakable("")
+        q.text(")")
+      end
+    end
+    # Returns true if the given other token is equal to this token.
+    def ==(other)
+      other.is_a?(Token) &&
+        other.type == type &&
+        other.value == value
+    end
+  end
+end