RubyGems - prettier - Versions diffs - 0.12.2 → 0.12.3 - Mend

prettier 0.12.2 → 0.12.3

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (37) hide show

checksums.yaml +4 -4
data/CHANGELOG.md +49 -1
data/CONTRIBUTING.md +1 -1
data/README.md +34 -18
data/node_modules/prettier/bin-prettier.js +22 -13
data/node_modules/prettier/index.js +22 -13
data/package.json +2 -2
data/src/nodes.js +10 -576
data/src/nodes/alias.js +1 -1
data/src/nodes/args.js +88 -0
data/src/nodes/arrays.js +1 -1
data/src/nodes/assign.js +39 -0
data/src/nodes/blocks.js +18 -3
data/src/nodes/calls.js +37 -3
data/src/nodes/case.js +1 -1
data/src/nodes/commands.js +2 -1
data/src/nodes/conditionals.js +118 -57
data/src/nodes/constants.js +25 -0
data/src/nodes/flow.js +64 -0
data/src/nodes/hashes.js +3 -2
data/src/nodes/hooks.js +1 -1
data/src/nodes/ints.js +24 -0
data/src/nodes/lambdas.js +1 -1
data/src/nodes/loops.js +1 -1
data/src/nodes/massign.js +70 -0
data/src/nodes/methods.js +40 -2
data/src/nodes/operators.js +44 -0
data/src/nodes/params.js +14 -3
data/src/nodes/regexp.js +1 -1
data/src/nodes/rescue.js +1 -1
data/src/nodes/scopes.js +61 -0
data/src/nodes/statements.js +105 -0
data/src/nodes/strings.js +9 -2
data/src/{builders.js → prettier.js} +9 -2
data/src/ripper.rb +412 -353
data/src/utils.js +1 -1
metadata +40 -3

data/src/nodes/statements.js ADDED Viewed

@@ -0,0 +1,105 @@
+const {
+  concat,
+  dedent,
+  group,
+  hardline,
+  indent,
+  join,
+  line,
+  literalline,
+  markAsRoot,
+  softline,
+  trim
+} = require("../prettier");
+module.exports = {
+  "@__end__": (path, _opts, _print) => {
+    const { body } = path.getValue();
+    return concat([trim, "__END__", literalline, body]);
+  },
+  bodystmt: (path, opts, print) => {
+    const [_statements, rescue, elseClause, ensure] = path.getValue().body;
+    const parts = [path.call(print, "body", 0)];
+    if (rescue) {
+      parts.push(dedent(concat([hardline, path.call(print, "body", 1)])));
+    }
+    if (elseClause) {
+      // Before Ruby 2.6, this piece of bodystmt was an explicit "else" node
+      const stmts =
+        elseClause.type === "else"
+          ? path.call(print, "body", 2, "body", 0)
+          : path.call(print, "body", 2);
+      parts.push(concat([dedent(concat([hardline, "else"])), hardline, stmts]));
+    }
+    if (ensure) {
+      parts.push(dedent(concat([hardline, path.call(print, "body", 3)])));
+    }
+    return group(concat(parts));
+  },
+  embdoc: (path, _opts, _print) => concat([trim, path.getValue().body]),
+  paren: (path, opts, print) => {
+    if (!path.getValue().body[0]) {
+      return "()";
+    }
+    let content = path.call(print, "body", 0);
+    if (
+      ["args", "args_add_star", "args_add_block"].includes(
+        path.getValue().body[0].type
+      )
+    ) {
+      content = join(concat([",", line]), content);
+    }
+    return group(
+      concat([
+        "(",
+        indent(concat([softline, content])),
+        concat([softline, ")"])
+      ])
+    );
+  },
+  program: (path, opts, print) =>
+    markAsRoot(
+      concat([join(literalline, path.map(print, "body")), literalline])
+    ),
+  stmts: (path, opts, print) => {
+    const stmts = path.getValue().body;
+    const parts = [];
+    let lineNo = null;
+    stmts.forEach((stmt, index) => {
+      if (stmt.type === "void_stmt") {
+        return;
+      }
+      const printed = path.call(print, "body", index);
+      if (lineNo === null) {
+        parts.push(printed);
+      } else if (
+        stmt.start - lineNo > 1 ||
+        [stmt.type, stmts[index - 1].type].includes("access_ctrl")
+      ) {
+        parts.push(hardline, hardline, printed);
+      } else if (
+        stmt.start !== lineNo ||
+        path.getParentNode().type !== "string_embexpr"
+      ) {
+        parts.push(hardline, printed);
+      } else {
+        parts.push("; ", printed);
+      }
+      lineNo = stmt.end;
+    });
+    return concat(parts);
+  }
+};

data/src/nodes/strings.js CHANGED Viewed

@@ -6,8 +6,8 @@ const {
   join,
   literalline,
   softline
-} = require("../builders");
-const { concatBody, empty, makeList, surround } = require("../utils");
+} = require("../prettier");
+const { concatBody, empty, makeList, prefix, surround } = require("../utils");
 const escapePattern = require("../escapePattern");
 // If there is some part of this string that matches an escape sequence or that
@@ -72,6 +72,11 @@ module.exports = {
     const quote = preferSingleQuotes ? "'" : '"';
     return body.length === 2 ? concat([quote, body.slice(1), quote]) : body;
   },
+  dyna_symbol: (path, opts, print) => {
+    const { quote } = path.getValue().body[0];
+    return concat([":", quote, concat(path.call(print, "body", 0)), quote]);
+  },
   heredoc: (path, opts, print) => {
     const { beging, ending } = path.getValue();
@@ -129,6 +134,8 @@ module.exports = {
     return concat([quote].concat(parts).concat([quote]));
   },
+  symbol: prefix(":"),
+  symbol_literal: concatBody,
   word_add: concatBody,
   word_new: empty,
   xstring: makeList,

data/src/{builders.js → prettier.js} RENAMED Viewed

@@ -4,6 +4,13 @@
 const source = process.env.RBPRETTIER ? "../node_modules/prettier" : "prettier";
 // eslint-disable-next-line import/no-dynamic-require
-const { builders, utils } = require(source).doc;
+const prettier = require(source);
-module.exports = Object.assign({}, builders, utils);
+// Just combine all the things into one big object so that we can import
+// whatever we need from prettier without having to dive too deeply.
+module.exports = Object.assign(
+  {},
+  prettier.doc.builders,
+  prettier.doc.utils,
+  prettier.util
+);

data/src/ripper.rb CHANGED Viewed

@@ -9,448 +9,503 @@ end
 require 'json' unless defined?(JSON)
 require 'ripper'
-module Layer
+class RipperJS < Ripper
+  private
+  # Scanner events occur when the lexer hits a new token, like a keyword or an
+  # end. These nodes always contain just one argument which is a string
+  # representing the content. For the most part these can just be printed
+  # directly, with very few exceptions.
+  SCANNER_EVENTS.each do |event|
+    define_method(:"on_#{event}") do |body|
+      { type: :"@#{event}", body: body, start: lineno, end: lineno }
+    end
+  end
+  # Parser events represent nodes in the ripper abstract syntax tree. The event
+  # is reported after the children of the node have already been built.
+  PARSER_EVENTS.each do |event|
+    define_method(:"on_#{event}") do |*body|
+      min = body.map { |part| part.is_a?(Hash) ? part[:start] : lineno }.min
+      { type: event, body: body, start: min || lineno, end: lineno }
+    end
+  end
   # Some nodes are lists that come back from the parser. They always start with
-  # a *_new node (or in the case of string, *_content) and each additional node
-  # in the list is a *_add node. This layer takes those nodes and turns them
-  # into one node with an array body.
-  module Lists
-    events = %i[
-      args
-      mlhs
-      mrhs
-      qsymbols
-      qwords
-      regexp
-      stmts
-      string
-      symbols
-      words
-      xstring
-    ]
-    private
-    events.each do |event|
-      suffix = event == :string ? 'content' : 'new'
-      define_method(:"on_#{event}_#{suffix}") do
-        { type: event, body: [], start: lineno, end: lineno }
-      end
-      define_method(:"on_#{event}_add") do |parts, part|
-        parts.tap do |node|
-          node[:body] << part
-          node[:end] = lineno
+  # a `*_new` node (or in the case of string, `*_content`) and each additional
+  # node in the list is a `*_add` node. This module takes those nodes and turns
+  # them into one node with an array body.
+  #
+  # For example, the statement `[a, b, c]` would be parsed as:
+  #
+  # [:args_add,
+  #   [:args_add,
+  #     [:args_add,
+  #       [:args_new],
+  #       [:vcall, [:@ident, "a", [1, 1]]]
+  #     ],
+  #     [:vcall, [:@ident, "b", [1, 4]]]
+  #   ],
+  #   [:vcall, [:@ident, "c", [1, 7]]]
+  # ]
+  #
+  # But after this module is applied that is instead parsed as:
+  #
+  # [:args,
+  #   [
+  #     [:vcall, [:@ident, "a", [1, 1]]],
+  #     [:vcall, [:@ident, "b", [1, 4]]],
+  #     [:vcall, [:@ident, "c", [1, 7]]]
+  #   ]
+  # ]
+  #
+  # This makes it a lot easier to join things with commas, and ends up resulting
+  # in a much flatter `prettier` tree once it has been converted. Note that
+  # because of this module some extra node types are added (the aggregate of
+  # the previous `*_add` nodes) and some nodes now have arrays in places where
+  # they previously had single nodes.
+  prepend(
+    Module.new do
+      events = %i[
+        args
+        mlhs
+        mrhs
+        qsymbols
+        qwords
+        regexp
+        stmts
+        string
+        symbols
+        words
+        xstring
+      ]
+      private
+      events.each do |event|
+        suffix = event == :string ? 'content' : 'new'
+        define_method(:"on_#{event}_#{suffix}") do
+          { type: event, body: [], start: lineno, end: lineno }
+        end
+        define_method(:"on_#{event}_add") do |parts, part|
+          parts.tap do |node|
+            node[:body] << part
+            node[:end] = lineno
+          end
         end
       end
     end
-  end
+  )
   # For most nodes, it's enough to look at the child nodes to determine the
   # start of the parent node. However, for some nodes it's necessary to keep
   # track of the keywords as they come in from the lexer and to modify the start
-  # node once we have it.
-  module StartLine
-    events = %i[begin else elsif ensure rescue until while]
+  # node once we have it. We need accurate start and end lines so that we can
+  # embed block comments into the right kind of node.
+  prepend(
+    Module.new do
+      events = %i[begin else elsif ensure if rescue until while]
-    def initialize(*args)
-      super(*args)
-      @keywords = []
-    end
+      def initialize(*args)
+        super(*args)
+        @keywords = []
+      end
-    def self.prepended(base)
-      base.attr_reader :keywords
-    end
+      def self.prepended(base)
+        base.attr_reader :keywords
+      end
-    private
+      private
-    def find_start(body)
-      keywords[keywords.rindex { |keyword| keyword[:body] == body }][:start]
-    end
+      def find_start(body)
+        keywords[keywords.rindex { |keyword| keyword[:body] == body }][:start]
+      end
-    events.each do |event|
-      keyword = event.to_s
+      events.each do |event|
+        keyword = event.to_s
-      define_method(:"on_#{event}") do |*body|
-        super(*body).tap { |sexp| sexp.merge!(start: find_start(keyword)) }
+        define_method(:"on_#{event}") do |*body|
+          super(*body).tap { |sexp| sexp.merge!(start: find_start(keyword)) }
+        end
       end
-    end
-    def on_kw(body)
-      super(body).tap { |sexp| keywords << sexp }
-    end
+      def on_kw(body)
+        super(body).tap { |sexp| keywords << sexp }
+      end
-    def on_program(*body)
-      super(*body).tap { |sexp| sexp.merge!(start: 1) }
+      def on_program(*body)
+        super(*body).tap { |sexp| sexp.merge!(start: 1) }
+      end
     end
-  end
+  )
-  # Nodes that are always on their own line occur when the lexer is in the
-  # EXPR_BEG node. Those comments are tracked within the @block_comments
-  # instance variable. Then for each node that could contain them, we attach
-  # them after the node has been built.
-  module BlockComments
-    events = {
-      begin: [0, :body, 0],
-      bodystmt: [0],
-      class: [2, :body, 0],
-      def: [2, :body, 0],
-      defs: [4, :body, 0],
-      else: [0],
-      elsif: [1],
-      ensure: [0],
-      if: [1],
-      program: [0],
-      rescue: [2],
-      sclass: [1, :body, 0],
-      unless: [1],
-      until: [1],
-      when: [1],
-      while: [1]
-    }
-    def initialize(*args)
-      super(*args)
-      @block_comments = []
-      @current_embdoc = nil
-    end
+  # This layer keeps track of inline comments as they come in. Ripper itself
+  # doesn't attach comments to the AST, so we need to do it manually. In this
+  # case, inline comments are defined as any comments wherein the lexer state is
+  # not equal to EXPR_BEG (tracked in the BlockComments layer).
+  prepend(
+    Module.new do
+      # Certain events need to steal the comments from their children in order
+      # for them to display properly.
+      events = {
+        aref: [:body, 1],
+        args_add_block: [:body, 0],
+        break: [:body, 0],
+        command: [:body, 1],
+        command_call: [:body, 3],
+        regexp_literal: [:body, 0],
+        string_literal: [:body, 0],
+        symbol_literal: [:body, 0]
+      }
-    def self.prepended(base)
-      base.attr_reader :block_comments, :current_embdoc
-    end
+      def initialize(*args)
+        super(*args)
+        @inline_comments = []
+        @last_sexp = nil
+      end
+      def self.prepended(base)
+        base.attr_reader :inline_comments, :last_sexp
+      end
+      private
-    private
+      events.each do |event, path|
+        define_method(:"on_#{event}") do |*body|
+          @last_sexp =
+            super(*body).tap do |sexp|
+              comments = (sexp.dig(*path) || {}).delete(:comments)
+              sexp.merge!(comments: comments) if comments
+            end
+        end
+      end
-    def attach_comments(sexp, stmts)
-      range = sexp[:start]..sexp[:end]
-      comments =
-        block_comments.group_by { |comment| range.include?(comment[:start]) }
+      SPECIAL_LITERALS = %i[qsymbols qwords symbols words].freeze
-      if comments[true]
-        stmts[:body] =
-          (stmts[:body] + comments[true]).sort_by { |node| node[:start] }
+      # Special array literals are handled in different ways and so their
+      # comments need to be passed up to their parent array node.
+      def on_array(*body)
+        @last_sexp =
+          super(*body).tap do |sexp|
+            next unless SPECIAL_LITERALS.include?(body.dig(0, :type))
-        @block_comments = comments.fetch(false) { [] }
+            comments = sexp.dig(:body, 0).delete(:comments)
+            sexp.merge!(comments: comments) if comments
+          end
       end
-    end
-    events.each do |event, path|
-      define_method(:"on_#{event}") do |*body|
-        super(*body).tap { |sexp| attach_comments(sexp, body.dig(*path)) }
+      # Handling this specially because we want to pull the comments out of both
+      # child nodes.
+      def on_assoc_new(*body)
+        @last_sexp =
+          super(*body).tap do |sexp|
+            comments =
+              (sexp.dig(:body, 0).delete(:comments) || []) +
+                (sexp.dig(:body, 1).delete(:comments) || [])
+            sexp.merge!(comments: comments) if comments.any?
+          end
       end
-    end
-    def on_comment(body)
-      super(body).tap do |sexp|
-        block_comments << sexp if RipperJS.lex_state_name(state) == 'EXPR_BEG'
+      # Most scanner events don't stand on their own as s-expressions, but the
+      # CHAR scanner event is effectively just a string, so we need to track it
+      # as an s-expression.
+      def on_CHAR(body)
+        @last_sexp = super(body)
       end
-    end
-    def on_embdoc_beg(comment)
-      @current_embdoc = {
-        type: :embdoc, body: comment, start: lineno, end: lineno
-      }
-    end
+      # We need to know exactly where the comment is, switching off the current
+      # lexer state. In Ruby 2.7.0-dev, that's defined as:
+      #
+      # enum lex_state_bits {
+      #     EXPR_BEG_bit,     /* ignore newline, +/- is a sign. */
+      #     EXPR_END_bit,     /* newline significant, +/- is an operator. */
+      #     EXPR_ENDARG_bit,  /* ditto, and unbound braces. */
+      #     EXPR_ENDFN_bit,   /* ditto, and unbound braces. */
+      #     EXPR_ARG_bit,     /* newline significant, +/- is an operator. */
+      #     EXPR_CMDARG_bit,  /* newline significant, +/- is an operator. */
+      #     EXPR_MID_bit,     /* newline significant, +/- is an operator. */
+      #     EXPR_FNAME_bit,   /* ignore newline, no reserved words. */
+      #     EXPR_DOT_bit,     /* right after `.' or `::', no reserved words. */
+      #     EXPR_CLASS_bit,   /* immediate after `class', no here document. */
+      #     EXPR_LABEL_bit,   /* flag bit, label is allowed. */
+      #     EXPR_LABELED_bit, /* flag bit, just after a label. */
+      #     EXPR_FITEM_bit,   /* symbol literal as FNAME. */
+      #     EXPR_MAX_STATE
+      # };
+      def on_comment(body)
+        sexp = { type: :@comment, body: body.chomp, start: lineno, end: lineno }
+        case RipperJS.lex_state_name(state)
+        when 'EXPR_END', 'EXPR_ARG|EXPR_LABELED', 'EXPR_ENDFN'
+          last_sexp.merge!(comments: [sexp])
+        when 'EXPR_CMDARG', 'EXPR_END|EXPR_ENDARG', 'EXPR_ENDARG', 'EXPR_ARG',
+             'EXPR_FNAME|EXPR_FITEM', 'EXPR_CLASS', 'EXPR_END|EXPR_LABEL'
+          inline_comments << sexp
+        when 'EXPR_BEG|EXPR_LABEL', 'EXPR_MID'
+          inline_comments << sexp.merge!(break: true)
+        when 'EXPR_DOT'
+          last_sexp.merge!(comments: [sexp.merge!(break: true)])
+        end
-    def on_embdoc(comment)
-      @current_embdoc[:body] << comment
-    end
+        sexp
+      end
-    def on_embdoc_end(comment)
-      @current_embdoc[:body] << comment.chomp
-      @block_comments << @current_embdoc
-      @current_embdoc = nil
-    end
+      defined = private_instance_methods(false).grep(/\Aon_/) { $'.to_sym }
-    def on_method_add_block(*body)
-      super(*body).tap do |sexp|
-        stmts = body[1][:body][1]
-        stmts = stmts[:type] == :stmts ? stmts : body[1][:body][1][:body][0]
+      (Ripper::PARSER_EVENTS - defined).each do |event|
+        define_method(:"on_#{event}") do |*body|
+          super(*body).tap do |sexp|
+            @last_sexp = sexp
+            next if inline_comments.empty?
-        attach_comments(sexp, stmts)
+            sexp[:comments] = inline_comments.reverse
+            @inline_comments = []
+          end
+        end
       end
     end
-  end
+  )
-  # Tracking heredocs in somewhat interesting. Straight-line heredocs are
-  # reported as strings, whereas squiggly-line heredocs are reported as
-  # heredocs.
-  module Heredocs
-    def initialize(*args)
-      super(*args)
-      @heredoc_stack = []
-    end
+  # Nodes that are always on their own line occur when the lexer is in the
+  # EXPR_BEG state. Those comments are tracked within the @block_comments
+  # instance variable. Then for each node that could contain them, we attach
+  # them after the node has been built.
+  prepend(
+    Module.new do
+      events = {
+        begin: [0, :body, 0],
+        bodystmt: [0],
+        class: [2, :body, 0],
+        def: [2, :body, 0],
+        defs: [4, :body, 0],
+        else: [0],
+        elsif: [1],
+        ensure: [0],
+        if: [1],
+        program: [0],
+        rescue: [2],
+        sclass: [1, :body, 0],
+        unless: [1],
+        until: [1],
+        when: [1],
+        while: [1]
+      }
-    def self.prepended(base)
-      base.attr_reader :heredoc_stack
-    end
+      def initialize(*args)
+        super(*args)
+        @block_comments = []
+        @current_embdoc = nil
+      end
-    private
+      def self.prepended(base)
+        base.attr_reader :block_comments, :current_embdoc
+      end
-    def on_embexpr_beg(body)
-      super(body).tap { |sexp| heredoc_stack << sexp }
-    end
+      private
-    def on_embexpr_end(body)
-      super(body).tap { heredoc_stack.pop }
-    end
+      def attach_comments(sexp, stmts)
+        range = sexp[:start]..sexp[:end]
+        comments =
+          block_comments.group_by { |comment| range.include?(comment[:start]) }
-    def on_heredoc_beg(beging)
-      heredoc = { type: :heredoc, beging: beging, start: lineno, end: lineno }
-      heredoc_stack << heredoc
-    end
+        if comments[true]
+          stmts[:body] =
+            (stmts[:body] + comments[true]).sort_by { |node| node[:start] }
-    def on_heredoc_end(ending)
-      heredoc_stack[-1].merge!(ending: ending.chomp, end: lineno)
-    end
+          @block_comments = comments.fetch(false) { [] }
+        end
+      end
-    def on_heredoc_dedent(string, _width)
-      heredoc = heredoc_stack.pop
-      string.merge!(heredoc.slice(:type, :beging, :ending, :start, :end))
-    end
+      events.each do |event, path|
+        define_method(:"on_#{event}") do |*body|
+          super(*body).tap { |sexp| attach_comments(sexp, body.dig(*path)) }
+        end
+      end
-    def on_string_literal(string)
-      heredoc = heredoc_stack[-1]
+      def on_comment(body)
+        super(body).tap do |sexp|
+          block_comments << sexp if RipperJS.lex_state_name(state) == 'EXPR_BEG'
+        end
+      end
-      if heredoc && string[:type] != :heredoc && heredoc[:type] == :heredoc
-        heredoc_stack.pop
-        string.merge!(heredoc.slice(:type, :beging, :ending, :start, :end))
-      else
-        super
+      def on_embdoc_beg(comment)
+        @current_embdoc = {
+          type: :embdoc, body: comment, start: lineno, end: lineno
+        }
       end
-    end
-  end
-  # These are the event types that contain _actual_ string content. If there is
-  # an encoding magic comment at the top of the file, ripper will actually
-  # change into that encoding for the storage of the string. This will break
-  # everything, so we need to force the encoding back into UTF-8 so that
-  # the JSON library won't break.
-  module Encoding
-    events = %w[comment ident tstring_content]
+      def on_embdoc(comment)
+        @current_embdoc[:body] << comment
+      end
-    events.each do |event|
-      define_method(:"on_#{event}") do |body|
-        super(body.force_encoding('UTF-8'))
+      def on_embdoc_end(comment)
+        @current_embdoc[:body] << comment.chomp
+        @block_comments << @current_embdoc
+        @current_embdoc = nil
       end
-    end
-  end
-  # This layer keeps track of inline comments as they come in. Ripper itself
-  # doesn't attach comments to the AST, so we need to do it manually. In this
-  # case, inline comments are defined as any comments wherein the lexer state is
-  # not equal to EXPR_BEG (tracked in the BlockComments layer).
-  module InlineComments
-    # Certain events needs to steal the comments from their children in order
-    # for them to display properly.
-    events = {
-      args_add_block: [:body, 0],
-      break: [:body, 0],
-      command: [:body, 1],
-      command_call: [:body, 3],
-      regexp_literal: [:body, 0],
-      string_literal: [:body, 0],
-      symbol_literal: [:body, 0]
-    }
-    def initialize(*args)
-      super(*args)
-      @inline_comments = []
-      @last_sexp = nil
-    end
+      def on_method_add_block(*body)
+        super(*body).tap do |sexp|
+          stmts = body[1][:body][1]
+          stmts = stmts[:type] == :stmts ? stmts : body[1][:body][1][:body][0]
-    def self.prepended(base)
-      base.attr_reader :inline_comments, :last_sexp
+          attach_comments(sexp, stmts)
+        end
+      end
     end
+  )
-    private
+  # Tracking heredocs is somewhat interesting. Straight-line heredocs are
+  # reported as strings, whereas squiggly-line heredocs are reported as
+  # heredocs. We track the start and matching end of the heredoc as "beging" and
+  # "ending" respectively.
+  prepend(
+    Module.new do
+      def initialize(*args)
+        super(*args)
+        @heredoc_stack = []
+      end
-    events.each do |event, path|
-      define_method(:"on_#{event}") do |*body|
-        @last_sexp =
-          super(*body).tap do |sexp|
-            comments = (sexp.dig(*path) || {}).delete(:comments)
-            sexp.merge!(comments: comments) if comments
-          end
+      def self.prepended(base)
+        base.attr_reader :heredoc_stack
       end
-    end
-    SPECIAL_LITERALS = %i[qsymbols qwords symbols words].freeze
+      private
-    # Special array literals are handled in different ways and so their comments
-    # need to be passed up to their parent array node.
-    def on_array(*body)
-      @last_sexp =
-        super(*body).tap do |sexp|
-          next unless SPECIAL_LITERALS.include?(body.dig(0, :type))
+      def on_embexpr_beg(body)
+        super(body).tap { |sexp| heredoc_stack << sexp }
+      end
-          comments = sexp.dig(:body, 0).delete(:comments)
-          sexp.merge!(comments: comments) if comments
-        end
-    end
+      def on_embexpr_end(body)
+        super(body).tap { heredoc_stack.pop }
+      end
-    # Handling this specially because we want to pull the comments out of both
-    # child nodes.
-    def on_assoc_new(*body)
-      @last_sexp =
-        super(*body).tap do |sexp|
-          comments =
-            (sexp.dig(:body, 0).delete(:comments) || []) +
-              (sexp.dig(:body, 1).delete(:comments) || [])
+      def on_heredoc_beg(beging)
+        heredoc = { type: :heredoc, beging: beging, start: lineno, end: lineno }
+        heredoc_stack << heredoc
+      end
-          sexp.merge!(comments: comments) if comments.any?
-        end
-    end
+      def on_heredoc_end(ending)
+        heredoc_stack[-1].merge!(ending: ending.chomp, end: lineno)
+      end
-    # Most scanner events don't stand on their own a s-expressions, but the CHAR
-    # scanner event is effectively just a string, so we need to track it as a
-    # s-expression.
-    def on_CHAR(body)
-      @last_sexp = super(body)
-    end
+      def on_heredoc_dedent(string, _width)
+        heredoc = heredoc_stack.pop
+        string.merge!(heredoc.slice(:type, :beging, :ending, :start, :end))
+      end
-    # We need to know exactly where the comment is, switching off the current
-    # lexer state. In Ruby 2.7.0-dev, that's defined as:
-    #
-    # enum lex_state_bits {
-    #     EXPR_BEG_bit,    /* ignore newline, +/- is a sign. */
-    #     EXPR_END_bit,    /* newline significant, +/- is an operator. */
-    #     EXPR_ENDARG_bit,    /* ditto, and unbound braces. */
-    #     EXPR_ENDFN_bit,    /* ditto, and unbound braces. */
-    #     EXPR_ARG_bit,    /* newline significant, +/- is an operator. */
-    #     EXPR_CMDARG_bit,    /* newline significant, +/- is an operator. */
-    #     EXPR_MID_bit,    /* newline significant, +/- is an operator. */
-    #     EXPR_FNAME_bit,    /* ignore newline, no reserved words. */
-    #     EXPR_DOT_bit,    /* right after `.' or `::', no reserved words. */
-    #     EXPR_CLASS_bit,    /* immediate after `class', no here document. */
-    #     EXPR_LABEL_bit,    /* flag bit, label is allowed. */
-    #     EXPR_LABELED_bit,    /* flag bit, just after a label. */
-    #     EXPR_FITEM_bit,    /* symbol literal as FNAME. */
-    #     EXPR_MAX_STATE
-    # };
-    def on_comment(body)
-      sexp = { type: :@comment, body: body.chomp, start: lineno, end: lineno }
-      case RipperJS.lex_state_name(state)
-      when 'EXPR_END', 'EXPR_ARG|EXPR_LABELED', 'EXPR_ENDFN'
-        last_sexp.merge!(comments: [sexp])
-      when 'EXPR_CMDARG', 'EXPR_END|EXPR_ENDARG', 'EXPR_ENDARG', 'EXPR_ARG',
-           'EXPR_FNAME|EXPR_FITEM', 'EXPR_CLASS', 'EXPR_END|EXPR_LABEL'
-        inline_comments << sexp
-      when 'EXPR_BEG|EXPR_LABEL', 'EXPR_MID'
-        inline_comments << sexp.merge!(break: true)
-      when 'EXPR_DOT'
-        last_sexp.merge!(comments: [sexp.merge!(break: true)])
-      end
-      sexp
-    end
+      def on_string_literal(string)
+        heredoc = heredoc_stack[-1]
-    defined_events = private_instance_methods(false).grep(/\Aon_/) { $'.to_sym }
+        if heredoc && string[:type] != :heredoc && heredoc[:type] == :heredoc
+          heredoc_stack.pop
+          string.merge!(heredoc.slice(:type, :beging, :ending, :start, :end))
+        else
+          super
+        end
+      end
+    end
+  )
-    (Ripper::PARSER_EVENTS - defined_events).each do |event|
-      define_method(:"on_#{event}") do |*body|
-        super(*body).tap do |sexp|
-          @last_sexp = sexp
-          next if inline_comments.empty?
+  # These are the event types that contain _actual_ string content. If there is
+  # an encoding magic comment at the top of the file, ripper will actually
+  # change into that encoding for the storage of the string. This will break
+  # everything, so we need to force the encoding back into UTF-8 so that
+  # the JSON library won't break.
+  prepend(
+    Module.new do
+      private
-          sexp[:comments] = inline_comments.reverse
-          @inline_comments = []
+      %w[comment ident tstring_content].each do |event|
+        define_method(:"on_#{event}") do |body|
+          super(body.force_encoding('UTF-8'))
         end
       end
     end
-  end
+  )
   # Handles __END__ syntax, which allows individual scripts to keep content
-  # after the main ruby code that can be read through DATA.
-  module Ending
-    def initialize(source, *args)
-      super(source, *args)
-      @source = source
-      @ending = nil
-    end
+  # after the main ruby code that can be read through DATA. It looks like:
+  #
+  # foo.bar
+  #
+  # __END__
+  # some other content that isn't read by ripper normally
+  prepend(
+    Module.new do
+      def initialize(source, *args)
+        super(source, *args)
+        @source = source
+        @ending = nil
+      end
-    def self.prepended(base)
-      base.attr_reader :source, :ending
-    end
+      def self.prepended(base)
+        base.attr_reader :source, :ending
+      end
-    private
+      private
-    def on___end__(body)
-      @ending = super(source.split("\n")[lineno..-1].join("\n"))
-    end
+      def on___end__(body)
+        @ending = super(source.split("\n")[lineno..-1].join("\n"))
+      end
-    def on_program(*body)
-      super(*body).tap { |sexp| sexp[:body][0][:body] << ending if ending }
+      def on_program(*body)
+        super(*body).tap { |sexp| sexp[:body][0][:body] << ending if ending }
+      end
     end
-  end
+  )
-  # Adds the used quote type onto string nodes.
-  module Strings
-    private
+  # Adds the used quote type onto string nodes. This is necessary because we're
+  # going to have to stick to whatever quote the user chose if there are escape
+  # sequences within the string. For example, if you have '\n' we can't switch
+  # to double quotes without changing what it means.
+  prepend(
+    Module.new do
+      private
-    def on_tstring_end(quote)
-      last_sexp.merge!(quote: quote)
-    end
+      def on_tstring_end(quote)
+        last_sexp.merge!(quote: quote)
+      end
-    def on_label_end(quote)
-      last_sexp.merge!(quote: quote[0]) # quote is ": or ':
+      def on_label_end(quote)
+        last_sexp.merge!(quote: quote[0]) # quote is ": or ':
+      end
     end
-  end
+  )
   # Normally access controls are reported as vcall nodes. This module creates a
-  # new node type to explicitly track those nodes instead.
-  module AccessControls
-    def initialize(source, *args)
-      super(source, *args)
-      @lines = source.split("\n")
-    end
-    def self.prepended(base)
-      base.attr_reader :lines
-    end
-    private
+  # new node type to explicitly track those nodes instead, so that the printer
+  # can add new lines as necessary.
+  prepend(
+    Module.new do
+      KEYWORDS = %w[private protected public].freeze
-    def on_vcall(ident)
-      super(ident).tap do |sexp|
-        if !%w[private protected public].include?(ident[:body]) ||
-           ident[:body] != lines[lineno - 1].strip
-          next
-        end
+      def initialize(source, *args)
+        super(source, *args)
+        @lines = source.split("\n")
+      end
-        sexp.merge!(type: :access_ctrl)
+      def self.prepended(base)
+        base.attr_reader :lines
       end
-    end
-  end
-end
-class RipperJS < Ripper
-  private
+      private
-  SCANNER_EVENTS.each do |event|
-    define_method(:"on_#{event}") do |body|
-      { type: :"@#{event}", body: body, start: lineno, end: lineno }
-    end
-  end
+      def on_vcall(ident)
+        super(ident).tap do |sexp|
+          if !KEYWORDS.include?(ident[:body]) ||
+             ident[:body] != lines[lineno - 1].strip
+            next
+          end
-  PARSER_EVENTS.each do |event|
-    define_method(:"on_#{event}") do |*body|
-      min = body.map { |part| part.is_a?(Hash) ? part[:start] : lineno }.min
-      { type: event, body: body, start: min || lineno, end: lineno }
+          sexp.merge!(type: :access_ctrl)
+        end
+      end
     end
-  end
-  prepend Layer::Lists
-  prepend Layer::StartLine
-  prepend Layer::InlineComments
-  prepend Layer::BlockComments
-  prepend Layer::Heredocs
-  prepend Layer::Encoding
-  prepend Layer::Ending
-  prepend Layer::Strings
-  prepend Layer::AccessControls
+  )
   # When the only statement inside of a `def` node is a `begin` node, then you
   # can safely replace the body of the `def` with the body of the `begin`. For
@@ -529,6 +584,10 @@ class RipperJS < Ripper
   )
 end
+# If this is the main file we're executing, then most likely this is being
+# executed from the parse.js spawn. In that case, read the ruby source from
+# stdin and report back the AST over stdout.
 if $0 == __FILE__
   builder = RipperJS.new($stdin.read)
   response = builder.parse