RubyGems - prism - Versions diffs - 0.19.0 → 0.20.0 - Mend

prism 0.19.0 → 0.20.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (58) hide show

checksums.yaml +4 -4
data/CHANGELOG.md +29 -1
data/Makefile +5 -0
data/README.md +8 -6
data/config.yml +236 -38
data/docs/build_system.md +19 -2
data/docs/cruby_compilation.md +27 -0
data/docs/parser_translation.md +34 -0
data/docs/parsing_rules.md +19 -0
data/docs/releasing.md +3 -3
data/docs/ruby_api.md +1 -1
data/docs/serialization.md +17 -5
data/ext/prism/api_node.c +101 -81
data/ext/prism/extension.c +74 -11
data/ext/prism/extension.h +1 -1
data/include/prism/ast.h +1699 -504
data/include/prism/defines.h +8 -0
data/include/prism/diagnostic.h +39 -2
data/include/prism/encoding.h +10 -0
data/include/prism/options.h +40 -14
data/include/prism/parser.h +33 -17
data/include/prism/util/pm_buffer.h +9 -0
data/include/prism/util/pm_constant_pool.h +7 -0
data/include/prism/util/pm_newline_list.h +0 -11
data/include/prism/version.h +2 -2
data/include/prism.h +19 -2
data/lib/prism/debug.rb +11 -5
data/lib/prism/dot_visitor.rb +36 -14
data/lib/prism/dsl.rb +22 -22
data/lib/prism/ffi.rb +2 -2
data/lib/prism/node.rb +1020 -737
data/lib/prism/node_ext.rb +2 -2
data/lib/prism/parse_result.rb +17 -9
data/lib/prism/serialize.rb +53 -29
data/lib/prism/translation/parser/compiler.rb +1831 -0
data/lib/prism/translation/parser/lexer.rb +335 -0
data/lib/prism/translation/parser/rubocop.rb +37 -0
data/lib/prism/translation/parser.rb +163 -0
data/lib/prism/translation.rb +11 -0
data/lib/prism.rb +1 -0
data/prism.gemspec +12 -5
data/rbi/prism.rbi +150 -88
data/rbi/prism_static.rbi +15 -3
data/sig/prism.rbs +996 -961
data/sig/prism_static.rbs +123 -46
data/src/diagnostic.c +259 -219
data/src/encoding.c +4 -8
data/src/node.c +2 -6
data/src/options.c +24 -5
data/src/prettyprint.c +174 -42
data/src/prism.c +1136 -328
data/src/serialize.c +12 -9
data/src/token_type.c +353 -4
data/src/util/pm_buffer.c +11 -0
data/src/util/pm_constant_pool.c +12 -11
data/src/util/pm_newline_list.c +2 -14
metadata +10 -3
data/docs/building.md +0 -29

data/lib/prism/translation/parser/lexer.rb ADDED Viewed

@@ -0,0 +1,335 @@
+# frozen_string_literal: true
+module Prism
+  module Translation
+    class Parser
+      # Accepts a list of prism tokens and converts them into the expected
+      # format for the parser gem.
+      class Lexer
+        # The direct translating of types between the two lexers.
+        TYPES = {
+          # These tokens should never appear in the output of the lexer.
+          EOF: nil,
+          MISSING: nil,
+          NOT_PROVIDED: nil,
+          IGNORED_NEWLINE: nil,
+          EMBDOC_END: nil,
+          EMBDOC_LINE: nil,
+          __END__: nil,
+          # These tokens have more or less direct mappings.
+          AMPERSAND: :tAMPER2,
+          AMPERSAND_AMPERSAND: :tANDOP,
+          AMPERSAND_AMPERSAND_EQUAL: :tOP_ASGN,
+          AMPERSAND_DOT: :tANDDOT,
+          AMPERSAND_EQUAL: :tOP_ASGN,
+          BACK_REFERENCE: :tBACK_REF,
+          BACKTICK: :tXSTRING_BEG,
+          BANG: :tBANG,
+          BANG_EQUAL: :tNEQ,
+          BANG_TILDE: :tNMATCH,
+          BRACE_LEFT: :tLCURLY,
+          BRACE_RIGHT: :tRCURLY,
+          BRACKET_LEFT: :tLBRACK2,
+          BRACKET_LEFT_ARRAY: :tLBRACK,
+          BRACKET_LEFT_RIGHT: :tAREF,
+          BRACKET_LEFT_RIGHT_EQUAL: :tASET,
+          BRACKET_RIGHT: :tRBRACK,
+          CARET: :tCARET,
+          CARET_EQUAL: :tOP_ASGN,
+          CHARACTER_LITERAL: :tCHARACTER,
+          CLASS_VARIABLE: :tCVAR,
+          COLON: :tCOLON,
+          COLON_COLON: :tCOLON2,
+          COMMA: :tCOMMA,
+          COMMENT: :tCOMMENT,
+          CONSTANT: :tCONSTANT,
+          DOT: :tDOT,
+          DOT_DOT: :tDOT2,
+          DOT_DOT_DOT: :tDOT3,
+          EMBDOC_BEGIN: :tCOMMENT,
+          EMBEXPR_BEGIN: :tSTRING_DBEG,
+          EMBEXPR_END: :tSTRING_DEND,
+          EMBVAR: :tSTRING_DVAR,
+          EQUAL: :tEQL,
+          EQUAL_EQUAL: :tEQ,
+          EQUAL_EQUAL_EQUAL: :tEQQ,
+          EQUAL_GREATER: :tASSOC,
+          EQUAL_TILDE: :tMATCH,
+          FLOAT: :tFLOAT,
+          FLOAT_IMAGINARY: :tIMAGINARY,
+          FLOAT_RATIONAL: :tRATIONAL,
+          FLOAT_RATIONAL_IMAGINARY: :tIMAGINARY,
+          GLOBAL_VARIABLE: :tGVAR,
+          GREATER: :tGT,
+          GREATER_EQUAL: :tGEQ,
+          GREATER_GREATER: :tRSHFT,
+          GREATER_GREATER_EQUAL: :tOP_ASGN,
+          HEREDOC_START: :tSTRING_BEG,
+          HEREDOC_END: :tSTRING_END,
+          IDENTIFIER: :tIDENTIFIER,
+          INSTANCE_VARIABLE: :tIVAR,
+          INTEGER: :tINTEGER,
+          INTEGER_IMAGINARY: :tIMAGINARY,
+          INTEGER_RATIONAL: :tRATIONAL,
+          INTEGER_RATIONAL_IMAGINARY: :tIMAGINARY,
+          KEYWORD_ALIAS: :kALIAS,
+          KEYWORD_AND: :kAND,
+          KEYWORD_BEGIN: :kBEGIN,
+          KEYWORD_BEGIN_UPCASE: :klBEGIN,
+          KEYWORD_BREAK: :kBREAK,
+          KEYWORD_CASE: :kCASE,
+          KEYWORD_CLASS: :kCLASS,
+          KEYWORD_DEF: :kDEF,
+          KEYWORD_DEFINED: :kDEFINED,
+          KEYWORD_DO: :kDO,
+          KEYWORD_DO_LOOP: :kDO_COND,
+          KEYWORD_END: :kEND,
+          KEYWORD_END_UPCASE: :klEND,
+          KEYWORD_ENSURE: :kENSURE,
+          KEYWORD_ELSE: :kELSE,
+          KEYWORD_ELSIF: :kELSIF,
+          KEYWORD_FALSE: :kFALSE,
+          KEYWORD_FOR: :kFOR,
+          KEYWORD_IF: :kIF,
+          KEYWORD_IF_MODIFIER: :kIF_MOD,
+          KEYWORD_IN: :kIN,
+          KEYWORD_MODULE: :kMODULE,
+          KEYWORD_NEXT: :kNEXT,
+          KEYWORD_NIL: :kNIL,
+          KEYWORD_NOT: :kNOT,
+          KEYWORD_OR: :kOR,
+          KEYWORD_REDO: :kREDO,
+          KEYWORD_RESCUE: :kRESCUE,
+          KEYWORD_RESCUE_MODIFIER: :kRESCUE_MOD,
+          KEYWORD_RETRY: :kRETRY,
+          KEYWORD_RETURN: :kRETURN,
+          KEYWORD_SELF: :kSELF,
+          KEYWORD_SUPER: :kSUPER,
+          KEYWORD_THEN: :kTHEN,
+          KEYWORD_TRUE: :kTRUE,
+          KEYWORD_UNDEF: :kUNDEF,
+          KEYWORD_UNLESS: :kUNLESS,
+          KEYWORD_UNLESS_MODIFIER: :kUNLESS_MOD,
+          KEYWORD_UNTIL: :kUNTIL,
+          KEYWORD_UNTIL_MODIFIER: :kUNTIL_MOD,
+          KEYWORD_WHEN: :kWHEN,
+          KEYWORD_WHILE: :kWHILE,
+          KEYWORD_WHILE_MODIFIER: :kWHILE_MOD,
+          KEYWORD_YIELD: :kYIELD,
+          KEYWORD___ENCODING__: :k__ENCODING__,
+          KEYWORD___FILE__: :k__FILE__,
+          KEYWORD___LINE__: :k__LINE__,
+          LABEL: :tLABEL,
+          LABEL_END: :tLABEL_END,
+          LAMBDA_BEGIN: :tLAMBEG,
+          LESS: :tLT,
+          LESS_EQUAL: :tLEQ,
+          LESS_EQUAL_GREATER: :tCMP,
+          LESS_LESS: :tLSHFT,
+          LESS_LESS_EQUAL: :tOP_ASGN,
+          METHOD_NAME: :tFID,
+          MINUS: :tMINUS,
+          MINUS_EQUAL: :tOP_ASGN,
+          MINUS_GREATER: :tLAMBDA,
+          NEWLINE: :tNL,
+          NUMBERED_REFERENCE: :tNTH_REF,
+          PARENTHESIS_LEFT: :tLPAREN,
+          PARENTHESIS_LEFT_PARENTHESES: :tLPAREN_ARG,
+          PARENTHESIS_RIGHT: :tRPAREN,
+          PERCENT: :tPERCENT,
+          PERCENT_EQUAL: :tOP_ASGN,
+          PERCENT_LOWER_I: :tQSYMBOLS_BEG,
+          PERCENT_LOWER_W: :tQWORDS_BEG,
+          PERCENT_UPPER_I: :tSYMBOLS_BEG,
+          PERCENT_UPPER_W: :tWORDS_BEG,
+          PERCENT_LOWER_X: :tXSTRING_BEG,
+          PLUS: :tPLUS,
+          PLUS_EQUAL: :tOP_ASGN,
+          PIPE_EQUAL: :tOP_ASGN,
+          PIPE: :tPIPE,
+          PIPE_PIPE: :tOROP,
+          PIPE_PIPE_EQUAL: :tOP_ASGN,
+          QUESTION_MARK: :tEH,
+          REGEXP_BEGIN: :tREGEXP_BEG,
+          REGEXP_END: :tSTRING_END,
+          SEMICOLON: :tSEMI,
+          SLASH: :tDIVIDE,
+          SLASH_EQUAL: :tOP_ASGN,
+          STAR: :tSTAR2,
+          STAR_EQUAL: :tOP_ASGN,
+          STAR_STAR: :tPOW,
+          STAR_STAR_EQUAL: :tOP_ASGN,
+          STRING_BEGIN: :tSTRING_BEG,
+          STRING_CONTENT: :tSTRING_CONTENT,
+          STRING_END: :tSTRING_END,
+          SYMBOL_BEGIN: :tSYMBEG,
+          TILDE: :tTILDE,
+          UAMPERSAND: :tAMPER,
+          UCOLON_COLON: :tCOLON3,
+          UDOT_DOT: :tDOT2,
+          UDOT_DOT_DOT: :tBDOT3,
+          UMINUS: :tUMINUS,
+          UMINUS_NUM: :tUNARY_NUM,
+          UPLUS: :tUPLUS,
+          USTAR: :tSTAR,
+          USTAR_STAR: :tPOW,
+          WORDS_SEP: :tSPACE
+        }
+        private_constant :TYPES
+        # The Parser::Source::Buffer that the tokens were lexed from.
+        attr_reader :source_buffer
+        # An array of prism tokens that we lexed.
+        attr_reader :lexed
+        # A hash that maps offsets in bytes to offsets in characters.
+        attr_reader :offset_cache
+        # Initialize the lexer with the given source buffer, prism tokens, and
+        # offset cache.
+        def initialize(source_buffer, lexed, offset_cache)
+          @source_buffer = source_buffer
+          @lexed = lexed
+          @offset_cache = offset_cache
+        end
+        Range = ::Parser::Source::Range # :nodoc:
+        private_constant :Range
+        # Convert the prism tokens into the expected format for the parser gem.
+        def to_a
+          tokens = []
+          index = 0
+          while index < lexed.length
+            token, = lexed[index]
+            index += 1
+            next if token.type == :IGNORED_NEWLINE || token.type == :EOF
+            type = TYPES.fetch(token.type)
+            value = token.value
+            location = Range.new(source_buffer, offset_cache[token.location.start_offset], offset_cache[token.location.end_offset])
+            case type
+            when :tCHARACTER
+              value.delete_prefix!("?")
+            when :tCOMMENT
+              if token.type == :EMBDOC_BEGIN
+                until (next_token = lexed[index]) && next_token.type == :EMBDOC_END
+                  value += next_token.value
+                  index += 1
+                end
+                value += next_token.value
+                location = Range.new(source_buffer, offset_cache[token.location.start_offset], offset_cache[lexed[index].location.end_offset])
+                index += 1
+              else
+                value.chomp!
+                location = Range.new(source_buffer, offset_cache[token.location.start_offset], offset_cache[token.location.end_offset - 1])
+              end
+            when :tNL
+              value = nil
+            when :tFLOAT
+              value = Float(value)
+            when :tIMAGINARY
+              value = parse_complex(value)
+            when :tINTEGER
+              if value.start_with?("+")
+                tokens << [:tUNARY_NUM, ["+", Range.new(source_buffer, offset_cache[token.location.start_offset], offset_cache[token.location.start_offset + 1])]]
+                location = Range.new(source_buffer, offset_cache[token.location.start_offset + 1], offset_cache[token.location.end_offset])
+              end
+              value = Integer(value)
+            when :tLABEL
+              value.chomp!(":")
+            when :tLABEL_END
+              value.chomp!(":")
+            when :tNTH_REF
+              value = Integer(value.delete_prefix("$"))
+            when :tOP_ASGN
+              value.chomp!("=")
+            when :tRATIONAL
+              value = parse_rational(value)
+            when :tSPACE
+              value = nil
+            when :tSTRING_BEG
+              if ["\"", "'"].include?(value) && (next_token = lexed[index]) && next_token.type == :STRING_END
+                next_location = token.location.join(next_token.location)
+                type = :tSTRING
+                value = ""
+                location = Range.new(source_buffer, offset_cache[next_location.start_offset], offset_cache[next_location.end_offset])
+                index += 1
+              elsif ["\"", "'"].include?(value) && (next_token = lexed[index]) && next_token.type == :STRING_CONTENT && (next_next_token = lexed[index + 1]) && next_next_token.type == :STRING_END
+                next_location = token.location.join(next_next_token.location)
+                type = :tSTRING
+                value = next_token.value
+                location = Range.new(source_buffer, offset_cache[next_location.start_offset], offset_cache[next_location.end_offset])
+                index += 2
+              elsif value.start_with?("<<")
+                quote = value[2] == "-" || value[2] == "~" ? value[3] : value[2]
+                value = "<<#{quote == "'" || quote == "\"" ? quote : "\""}"
+              end
+            when :tSTRING_DVAR
+              value = nil
+            when :tSTRING_END
+              if token.type == :REGEXP_END
+                value = value[0]
+                location = Range.new(source_buffer, offset_cache[token.location.start_offset], offset_cache[token.location.start_offset + 1])
+              end
+            when :tSYMBEG
+              if (next_token = lexed[index]) && next_token.type != :STRING_CONTENT && next_token.type != :EMBEXPR_BEGIN && next_token.type != :EMBVAR
+                next_location = token.location.join(next_token.location)
+                type = :tSYMBOL
+                value = next_token.value
+                value = { "~@" => "~", "!@" => "!" }.fetch(value, value)
+                location = Range.new(source_buffer, offset_cache[next_location.start_offset], offset_cache[next_location.end_offset])
+                index += 1
+              end
+            when :tFID
+              if tokens[-1][0] == :kDEF
+                type = :tIDENTIFIER
+              end
+            end
+            tokens << [type, [value, location]]
+            if token.type == :REGEXP_END
+              tokens << [:tREGEXP_OPT, [token.value[1..], Range.new(source_buffer, offset_cache[token.location.start_offset + 1], offset_cache[token.location.end_offset])]]
+            end
+          end
+          tokens
+        end
+        private
+        # Parse a complex from the string representation.
+        def parse_complex(value)
+          value.chomp!("i")
+          if value.end_with?("r")
+            Complex(0, parse_rational(value))
+          elsif value.start_with?(/0[BbOoDdXx]/)
+            Complex(0, Integer(value))
+          else
+            Complex(0, value)
+          end
+        end
+        # Parse a rational from the string representation.
+        def parse_rational(value)
+          value.chomp!("r")
+          if value.start_with?(/0[BbOoDdXx]/)
+            Rational(Integer(value))
+          else
+            Rational(value)
+          end
+        end
+      end
+    end
+  end
+end

data/lib/prism/translation/parser/rubocop.rb ADDED Viewed

@@ -0,0 +1,37 @@
+# frozen_string_literal: true
+require "parser"
+require "rubocop"
+require "prism"
+require "prism/translation/parser"
+module Prism
+  module Translation
+    class Parser
+      # This is the special version number that should be used in rubocop
+      # configuration files to trigger using prism.
+      VERSION_3_3 = 80_82_73_83_77.33
+      # This module gets prepended into RuboCop::AST::ProcessedSource.
+      module ProcessedSource
+        # Redefine parser_class so that we can inject the prism parser into the
+        # list of known parsers.
+        def parser_class(ruby_version)
+          if ruby_version == Prism::Translation::Parser::VERSION_3_3
+            require "prism/translation/parser"
+            Prism::Translation::Parser
+          else
+            super
+          end
+        end
+      end
+    end
+  end
+end
+# :stopdoc:
+RuboCop::AST::ProcessedSource.prepend(Prism::Translation::Parser::ProcessedSource)
+# remove_const hands back the old list, which is then re-registered with the
+# prism version appended.
+previous_rubies = RuboCop::TargetRuby.send(:remove_const, :KNOWN_RUBIES)
+RuboCop::TargetRuby.const_set(:KNOWN_RUBIES, [*previous_rubies, Prism::Translation::Parser::VERSION_3_3].freeze)

data/lib/prism/translation/parser.rb ADDED Viewed

@@ -0,0 +1,163 @@
+# frozen_string_literal: true
+require "parser"
+module Prism
+  module Translation
+    # This class is the entry-point for converting a prism syntax tree into the
+    # whitequark/parser gem's syntax tree. It inherits from the base parser for
+    # the parser gem, and overrides the parse* methods to parse with prism and
+    # then translate.
+    class Parser < ::Parser::Base
+      # The parser gem has a list of diagnostics with a hard-coded set of error
+      # messages. We create our own diagnostic class in order to set our own
+      # error messages, which are exposed through the message reader below.
+      class Diagnostic < ::Parser::Diagnostic
+        # The message generated by prism.
+        attr_reader :message
+        # Initialize a new diagnostic with the given message and location; :error and :prism_error are passed to the parent.
+        def initialize(message, location)
+          @message = message # NOTE(review): presumably must precede super (the parent may freeze the instance) - confirm
+          super(:error, :prism_error, {}, location, [])
+        end
+      end
+      Racc_debug_parser = false # :nodoc:
+      def version # :nodoc:
+        33 # NOTE(review): presumably the parser gem's encoding of Ruby 3.3 - confirm
+      end
+      # The default encoding for Ruby files is UTF-8, so this parser reports Encoding::UTF_8.
+      def default_encoding
+        Encoding::UTF_8
+      end
+      def yyerror # :nodoc:
+      end
+      # Parses a source buffer and returns the AST.
+      def parse(source_buffer)
+        @source_buffer = source_buffer
+        source = source_buffer.source
+        result = unwrap(Prism.parse(source, filepath: source_buffer.name))
+        build_ast(result.value, build_offset_cache(source))
+      ensure
+        @source_buffer = nil
+      end
+      # Parses a source buffer and returns the AST and the source code comments.
+      def parse_with_comments(source_buffer)
+        @source_buffer = source_buffer
+        source = source_buffer.source
+        offset_cache = build_offset_cache(source)
+        result = unwrap(Prism.parse(source, filepath: source_buffer.name))
+        [
+          build_ast(result.value, offset_cache),
+          build_comments(result.comments, offset_cache)
+        ]
+      ensure
+        @source_buffer = nil
+      end
+      # Parses a source buffer and returns the AST, the source code comments,
+      # and the tokens emitted by the lexer.
+      def tokenize(source_buffer, _recover = false)
+        @source_buffer = source_buffer
+        source = source_buffer.source
+        offset_cache = build_offset_cache(source)
+        result = unwrap(Prism.parse_lex(source, filepath: source_buffer.name))
+        program, tokens = result.value
+        [
+          build_ast(program, offset_cache),
+          build_comments(result.comments, offset_cache),
+          build_tokens(tokens, offset_cache)
+        ]
+      ensure
+        @source_buffer = nil
+      end
+      # Since prism resolves num params for us, we don't need to support this
+      # kind of logic here.
+      def try_declare_numparam(node)
+        node.children[0].match?(/\A_[1-9]\z/)
+      end
+      private
+      # If there was an error generated during the parse, then raise a
+      # ::Parser::SyntaxError built from it. Otherwise return the result.
+      def unwrap(result)
+        return result if result.success?
+        error = result.errors.first # only the first error is reported
+        offset_cache = build_offset_cache(source_buffer.source)
+        diagnostic = Diagnostic.new(error.message, build_range(error.location, offset_cache))
+        raise ::Parser::SyntaxError, diagnostic
+      end
+      # Prism deals with offsets in bytes, while the parser gem deals with
+      # offsets in characters. We need to handle this conversion in order to
+      # build the parser gem AST.
+      #
+      # If the bytesize of the source is the same as the length, then we can
+      # just use the offset directly. Otherwise, we build a hash that functions
+      # as a cache for the conversion.
+      #
+      # This is a good opportunity for some optimizations. If the source file
+      # has any multi-byte characters, this can tank the performance of the
+      # translator. We could make this significantly faster by using a
+      # different data structure for the cache.
+      def build_offset_cache(source)
+        if source.bytesize == source.length
+          -> (offset) { offset }
+        else
+          Hash.new do |hash, offset|
+            hash[offset] = source.byteslice(0, offset).length
+          end
+        end
+      end
+      # Build the parser gem AST from the prism AST.
+      def build_ast(program, offset_cache)
+        program.accept(Compiler.new(self, offset_cache))
+      end
+      # Build the parser gem comments from the prism comments.
+      def build_comments(comments, offset_cache)
+        comments.map do |comment|
+          ::Parser::Source::Comment.new(build_range(comment.location, offset_cache))
+        end
+      end
+      # Build the parser gem tokens from the prism tokens.
+      def build_tokens(tokens, offset_cache)
+        Lexer.new(source_buffer, tokens.map(&:first), offset_cache).to_a
+      end
+      # Build a range from a prism location.
+      def build_range(location, offset_cache)
+        ::Parser::Source::Range.new(
+          source_buffer,
+          offset_cache[location.start_offset],
+          offset_cache[location.end_offset]
+        )
+      end
+      require_relative "parser/compiler"
+      require_relative "parser/lexer"
+      private_constant :Compiler
+      private_constant :Lexer
+    end
+  end
+end

data/lib/prism/translation.rb ADDED Viewed

@@ -0,0 +1,11 @@
+# frozen_string_literal: true
+module Prism
+  # This module is responsible for converting the prism syntax tree into other
+  # syntax trees. At the moment it only supports converting to the
+  # whitequark/parser gem's syntax tree, but support is planned for the
+  # seattlerb/ruby_parser gem's syntax tree as well.
+  module Translation
+    autoload :Parser, "prism/translation/parser" # loaded on first reference to Translation::Parser
+  end
+end
+end

data/lib/prism.rb CHANGED Viewed

@@ -26,6 +26,7 @@ module Prism
   autoload :Pack, "prism/pack"
   autoload :Pattern, "prism/pattern"
   autoload :Serialize, "prism/serialize"
+  autoload :Translation, "prism/translation"
   autoload :Visitor, "prism/visitor"
   # Some of these constants are not meant to be exposed, so marking them as

data/prism.gemspec CHANGED Viewed

@@ -2,7 +2,7 @@
 Gem::Specification.new do |spec|
   spec.name = "prism"
-  spec.version = "0.19.0"
+  spec.version = "0.20.0"
   spec.authors = ["Shopify"]
   spec.email = ["ruby@shopify.com"]
@@ -22,8 +22,8 @@ Gem::Specification.new do |spec|
     "README.md",
     "config.yml",
     "docs/build_system.md",
-    "docs/building.md",
     "docs/configuration.md",
+    "docs/cruby_compilation.md",
     "docs/design.md",
     "docs/encoding.md",
     "docs/fuzzing.md",
@@ -31,6 +31,8 @@ Gem::Specification.new do |spec|
     "docs/javascript.md",
     "docs/local_variable_depth.md",
     "docs/mapping.md",
+    "docs/parser_translation.md",
+    "docs/parsing_rules.md",
     "docs/releasing.md",
     "docs/ripper.md",
     "docs/ruby_api.md",
@@ -73,16 +75,21 @@ Gem::Specification.new do |spec|
     "lib/prism/ffi.rb",
     "lib/prism/lex_compat.rb",
     "lib/prism/mutation_compiler.rb",
-    "lib/prism/node.rb",
     "lib/prism/node_ext.rb",
     "lib/prism/node_inspector.rb",
+    "lib/prism/node.rb",
     "lib/prism/pack.rb",
     "lib/prism/parse_result.rb",
+    "lib/prism/parse_result/comments.rb",
+    "lib/prism/parse_result/newlines.rb",
     "lib/prism/pattern.rb",
     "lib/prism/ripper_compat.rb",
     "lib/prism/serialize.rb",
-    "lib/prism/parse_result/comments.rb",
-    "lib/prism/parse_result/newlines.rb",
+    "lib/prism/translation.rb",
+    "lib/prism/translation/parser.rb",
+    "lib/prism/translation/parser/compiler.rb",
+    "lib/prism/translation/parser/lexer.rb",
+    "lib/prism/translation/parser/rubocop.rb",
     "lib/prism/visitor.rb",
     "src/diagnostic.c",
     "src/encoding.c",