RubyGems - prism - Versions diffs - 0.30.0 → 1.0.0 - Mend

prism 0.30.0 → 1.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (57) hide show

checksums.yaml +4 -4
data/CHANGELOG.md +31 -1
data/README.md +3 -1
data/config.yml +185 -126
data/docs/serialization.md +3 -0
data/ext/prism/api_node.c +2843 -2085
data/ext/prism/extconf.rb +1 -1
data/ext/prism/extension.c +35 -25
data/ext/prism/extension.h +2 -2
data/include/prism/ast.h +1048 -69
data/include/prism/defines.h +9 -0
data/include/prism/diagnostic.h +11 -3
data/include/prism/options.h +55 -1
data/include/prism/parser.h +27 -3
data/include/prism/regexp.h +2 -1
data/include/prism/util/pm_integer.h +6 -6
data/include/prism/util/pm_newline_list.h +11 -0
data/include/prism/util/pm_string.h +1 -0
data/include/prism/version.h +3 -3
data/lib/prism/desugar_compiler.rb +111 -74
data/lib/prism/dispatcher.rb +2 -1
data/lib/prism/dot_visitor.rb +21 -31
data/lib/prism/dsl.rb +656 -471
data/lib/prism/ffi.rb +3 -0
data/lib/prism/inspect_visitor.rb +285 -57
data/lib/prism/mutation_compiler.rb +5 -5
data/lib/prism/node.rb +2282 -4754
data/lib/prism/node_ext.rb +72 -11
data/lib/prism/parse_result/errors.rb +65 -0
data/lib/prism/parse_result/newlines.rb +28 -28
data/lib/prism/parse_result.rb +25 -2
data/lib/prism/reflection.rb +7 -7
data/lib/prism/serialize.rb +468 -610
data/lib/prism/translation/parser/compiler.rb +18 -18
data/lib/prism/translation/parser/lexer.rb +1 -1
data/lib/prism/translation/parser.rb +3 -3
data/lib/prism/translation/ripper.rb +14 -14
data/lib/prism/translation/ruby_parser.rb +43 -7
data/prism.gemspec +3 -1
data/rbi/prism/dsl.rbi +521 -0
data/rbi/prism/node.rbi +1456 -5616
data/rbi/prism.rbi +16 -16
data/sig/prism/dsl.rbs +189 -305
data/sig/prism/node.rbs +702 -603
data/sig/prism/parse_result.rbs +2 -0
data/src/diagnostic.c +22 -6
data/src/node.c +277 -284
data/src/options.c +18 -0
data/src/prettyprint.c +99 -108
data/src/prism.c +1282 -760
data/src/regexp.c +72 -4
data/src/serialize.c +165 -50
data/src/token_type.c +2 -2
data/src/util/pm_integer.c +14 -14
data/src/util/pm_newline_list.c +29 -0
data/src/util/pm_string.c +9 -5
metadata +4 -2

data/src/regexp.c CHANGED Viewed

@@ -18,6 +18,12 @@ typedef struct {
     /** A pointer to the end of the source that we are parsing. */
     const uint8_t *end;
+    /**
+     * Whether or not the regular expression currently being parsed is in
+     * extended mode, wherein whitespace is ignored and comments are allowed.
+     */
+    bool extended_mode;
     /** Whether the encoding has changed from the default. */
     bool encoding_changed;
@@ -418,6 +424,19 @@ pm_regexp_options_remove(pm_regexp_options_t *options, uint8_t key) {
     return false;
 }
+/**
+ * Returns the state stored in the options for the given key. This is the raw
+ * state value rather than a boolean; callers compare it against constants such
+ * as PM_REGEXP_OPTION_STATE_ADDED and PM_REGEXP_OPTION_STATE_REMOVED.
+ *
+ * The key is rebased by PRISM_REGEXP_OPTION_STATE_SLOT_MINIMUM to index into
+ * the values array. If the key lies outside the inclusive range
+ * PRISM_REGEXP_OPTION_STATE_SLOT_MINIMUM..PRISM_REGEXP_OPTION_STATE_SLOT_MAXIMUM
+ * then no slot is read and false is returned.
+ */
+static uint8_t
+pm_regexp_options_state(pm_regexp_options_t *options, uint8_t key) {
+    if (key >= PRISM_REGEXP_OPTION_STATE_SLOT_MINIMUM && key <= PRISM_REGEXP_OPTION_STATE_SLOT_MAXIMUM) {
+        key = (uint8_t) (key - PRISM_REGEXP_OPTION_STATE_SLOT_MINIMUM);
+        return options->values[key];
+    }
+    return false;
+}
 /**
  * Groups can have quite a few different patterns for syntax. They basically
  * just wrap a set of expressions, but they can potentially have options after a
@@ -443,6 +462,9 @@ static bool
 pm_regexp_parse_group(pm_regexp_parser_t *parser, uint16_t depth) {
     const uint8_t *group_start = parser->cursor;
+    pm_regexp_options_t options;
+    pm_regexp_options_init(&options);
     // First, parse any options for the group.
     if (pm_regexp_char_accept(parser, '?')) {
         if (pm_regexp_char_is_eof(parser)) {
@@ -450,9 +472,6 @@ pm_regexp_parse_group(pm_regexp_parser_t *parser, uint16_t depth) {
             return false;
         }
-        pm_regexp_options_t options;
-        pm_regexp_options_init(&options);
         switch (*parser->cursor) {
             case '#': { // inline comments
                 parser->cursor++;
@@ -560,6 +579,18 @@ pm_regexp_parse_group(pm_regexp_parser_t *parser, uint16_t depth) {
                     return false;
                 }
+                // If we are at the end of the group of options and there is no
+                // subexpression, then we are going to be setting the options
+                // for the parent group. In this case we are safe to return now.
+                if (*parser->cursor == ')') {
+                    if (pm_regexp_options_state(&options, 'x') == PM_REGEXP_OPTION_STATE_ADDED) {
+                        parser->extended_mode = true;
+                    }
+                    parser->cursor++;
+                    return true;
+                }
                 // If we hit a -, then we're done parsing options.
                 if (*parser->cursor != '-') break;
@@ -577,6 +608,24 @@ pm_regexp_parse_group(pm_regexp_parser_t *parser, uint16_t depth) {
                 if (pm_regexp_char_is_eof(parser)) {
                     return false;
                 }
+                // If we are at the end of the group of options and there is no
+                // subexpression, then we are going to be setting the options
+                // for the parent group. In this case we are safe to return now.
+                if (*parser->cursor == ')') {
+                    switch (pm_regexp_options_state(&options, 'x')) {
+                        case PM_REGEXP_OPTION_STATE_ADDED:
+                            parser->extended_mode = true;
+                            break;
+                        case PM_REGEXP_OPTION_STATE_REMOVED:
+                            parser->extended_mode = false;
+                            break;
+                    }
+                    parser->cursor++;
+                    return true;
+                }
                 break;
             default:
                 parser->cursor++;
@@ -585,15 +634,27 @@ pm_regexp_parse_group(pm_regexp_parser_t *parser, uint16_t depth) {
         }
     }
+    bool extended_mode = parser->extended_mode;
+    switch (pm_regexp_options_state(&options, 'x')) {
+        case PM_REGEXP_OPTION_STATE_ADDED:
+            parser->extended_mode = true;
+            break;
+        case PM_REGEXP_OPTION_STATE_REMOVED:
+            parser->extended_mode = false;
+            break;
+    }
     // Now, parse the expressions within this group.
     while (!pm_regexp_char_is_eof(parser) && *parser->cursor != ')') {
         if (!pm_regexp_parse_expression(parser, (uint16_t) (depth + 1))) {
+            parser->extended_mode = extended_mode;
             return false;
         }
         pm_regexp_char_accept(parser, '|');
     }
     // Finally, make sure we have a closing parenthesis.
+    parser->extended_mode = extended_mode;
     if (pm_regexp_char_expect(parser, ')')) return true;
     pm_regexp_parse_error(parser, group_start, parser->cursor, "end pattern with unmatched parenthesis");
@@ -641,6 +702,12 @@ pm_regexp_parse_item(pm_regexp_parser_t *parser, uint16_t depth) {
             parser->cursor++;
             pm_regexp_parse_error(parser, parser->cursor - 1, parser->cursor, "unmatched close parenthesis");
             return true;
+        case '#':
+            if (parser->extended_mode) {
+                if (!pm_regexp_char_find(parser, '\n')) parser->cursor = parser->end;
+                return true;
+            }
+        /* fallthrough */
         default: {
             size_t width;
             if (!parser->encoding_changed) {
@@ -702,12 +769,13 @@ pm_regexp_parse_pattern(pm_regexp_parser_t *parser) {
  * groups.
  */
 PRISM_EXPORTED_FUNCTION void
-pm_regexp_parse(pm_parser_t *parser, const uint8_t *source, size_t size, pm_regexp_name_callback_t name_callback, void *name_data, pm_regexp_error_callback_t error_callback, void *error_data) {
+pm_regexp_parse(pm_parser_t *parser, const uint8_t *source, size_t size, bool extended_mode, pm_regexp_name_callback_t name_callback, void *name_data, pm_regexp_error_callback_t error_callback, void *error_data) {
     pm_regexp_parse_pattern(&(pm_regexp_parser_t) {
         .parser = parser,
         .start = source,
         .cursor = source,
         .end = source + size,
+        .extended_mode = extended_mode,
         .encoding_changed = parser->encoding_changed,
         .encoding = parser->encoding,
         .name_callback = name_callback,