RubyGems - prism - Versions diffs - 0.16.0 → 0.17.0 - Mend

prism 0.16.0 → 0.17.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (86) hide show

checksums.yaml +4 -4
data/CHANGELOG.md +16 -1
data/Makefile +6 -0
data/README.md +1 -1
data/config.yml +50 -35
data/docs/fuzzing.md +1 -1
data/docs/serialization.md +28 -29
data/ext/prism/api_node.c +802 -770
data/ext/prism/api_pack.c +20 -9
data/ext/prism/extension.c +464 -162
data/ext/prism/extension.h +1 -1
data/include/prism/ast.h +3173 -763
data/include/prism/defines.h +32 -9
data/include/prism/diagnostic.h +36 -3
data/include/prism/enc/pm_encoding.h +118 -28
data/include/prism/node.h +38 -13
data/include/prism/options.h +204 -0
data/include/prism/pack.h +44 -33
data/include/prism/parser.h +445 -200
data/include/prism/prettyprint.h +12 -1
data/include/prism/regexp.h +16 -2
data/include/prism/util/pm_buffer.h +94 -16
data/include/prism/util/pm_char.h +162 -48
data/include/prism/util/pm_constant_pool.h +126 -32
data/include/prism/util/pm_list.h +68 -38
data/include/prism/util/pm_memchr.h +18 -3
data/include/prism/util/pm_newline_list.h +70 -27
data/include/prism/util/pm_state_stack.h +25 -7
data/include/prism/util/pm_string.h +115 -27
data/include/prism/util/pm_string_list.h +25 -6
data/include/prism/util/pm_strncasecmp.h +32 -0
data/include/prism/util/pm_strpbrk.h +31 -17
data/include/prism/version.h +27 -2
data/include/prism.h +224 -31
data/lib/prism/compiler.rb +6 -3
data/lib/prism/debug.rb +23 -7
data/lib/prism/dispatcher.rb +33 -18
data/lib/prism/dsl.rb +10 -5
data/lib/prism/ffi.rb +132 -80
data/lib/prism/lex_compat.rb +25 -15
data/lib/prism/mutation_compiler.rb +10 -5
data/lib/prism/node.rb +370 -135
data/lib/prism/node_ext.rb +1 -1
data/lib/prism/node_inspector.rb +1 -1
data/lib/prism/pack.rb +79 -40
data/lib/prism/parse_result/comments.rb +7 -2
data/lib/prism/parse_result/newlines.rb +4 -0
data/lib/prism/parse_result.rb +150 -30
data/lib/prism/pattern.rb +11 -0
data/lib/prism/ripper_compat.rb +28 -10
data/lib/prism/serialize.rb +86 -54
data/lib/prism/visitor.rb +10 -3
data/lib/prism.rb +20 -2
data/prism.gemspec +4 -2
data/rbi/prism.rbi +104 -60
data/rbi/prism_static.rbi +16 -2
data/sig/prism.rbs +72 -43
data/sig/prism_static.rbs +14 -1
data/src/diagnostic.c +56 -53
data/src/enc/pm_big5.c +1 -0
data/src/enc/pm_euc_jp.c +1 -0
data/src/enc/pm_gbk.c +1 -0
data/src/enc/pm_shift_jis.c +1 -0
data/src/enc/pm_tables.c +316 -80
data/src/enc/pm_unicode.c +53 -8
data/src/enc/pm_windows_31j.c +1 -0
data/src/node.c +334 -321
data/src/options.c +170 -0
data/src/prettyprint.c +74 -47
data/src/prism.c +1642 -856
data/src/regexp.c +151 -95
data/src/serialize.c +44 -20
data/src/token_type.c +3 -1
data/src/util/pm_buffer.c +45 -15
data/src/util/pm_char.c +103 -57
data/src/util/pm_constant_pool.c +51 -21
data/src/util/pm_list.c +12 -4
data/src/util/pm_memchr.c +5 -3
data/src/util/pm_newline_list.c +20 -12
data/src/util/pm_state_stack.c +9 -3
data/src/util/pm_string.c +95 -85
data/src/util/pm_string_list.c +14 -15
data/src/util/pm_strncasecmp.c +10 -3
data/src/util/pm_strpbrk.c +25 -19
metadata +5 -3
data/docs/prism.png +0 -0

data/src/diagnostic.c CHANGED Viewed

@@ -1,56 +1,55 @@
 #include "prism/diagnostic.h"
-/*
-  ## Message composition
-  When composing an error message, use sentence fragments.
-  Try describing the property of the code that caused the error, rather than the rule that is being
-  violated. It may help to use a fragment that completes a sentence beginning, "The parser
-  encountered (a) ...". If appropriate, add a description of the rule violation (or other helpful
-  context) after a semicolon.
-  For example:, instead of "Control escape sequence cannot be doubled", prefer:
-  > "Invalid control escape sequence; control cannot be repeated"
-  In some cases, where the failure is more general or syntax expectations are violated, it may make
-  more sense to use a fragment that completes a sentence beginning, "The parser ...".
-  For example:
-  > "Expected an expression after `(`"
-  > "Cannot parse the expression"
-  ## Message style guide
-  - Use articles like "a", "an", and "the" when appropriate.
-    - e.g., prefer "Cannot parse the expression" to "Cannot parse expression".
-  - Use the common name for tokens and nodes.
-    - e.g., prefer "keyword splat" to "assoc splat"
-    - e.g., prefer "embedded document" to "embdoc"
-  - Capitalize the initial word of the message.
-  - Use back ticks around token literals
-    - e.g., "Expected a `=>` between the hash key and value"
-  - Do not use `.` or other punctuation at the end of the message.
-  - Do not use contractions like "can't". Prefer "cannot" to "can not".
-  - For tokens that can have multiple meanings, reference the token and its meaning.
-    - e.g., "`*` splat argument" is clearer and more complete than "splat argument" or "`*` argument"
-  ## Error names (PM_ERR_*)
-  - When appropriate, prefer node name to token name.
-    - e.g., prefer "SPLAT" to "STAR" in the context of argument parsing.
-  - Prefer token name to common name.
-    - e.g., prefer "STAR" to "ASTERISK".
-  - Try to order the words in the name from more general to more specific,
-    - e.g., "INVALID_NUMBER_DECIMAL" is better than "DECIMAL_INVALID_NUMBER".
-    - When in doubt, look for similar patterns and name them so that they are grouped when lexically
-      sorted. See PM_ERR_ARGUMENT_NO_FORWARDING_* for an example.
-*/
+/**
+ * ## Message composition
+ *
+ * When composing an error message, use sentence fragments.
+ *
+ * Try describing the property of the code that caused the error, rather than the rule that is being
+ * violated. It may help to use a fragment that completes a sentence beginning, "The parser
+ * encountered (a) ...". If appropriate, add a description of the rule violation (or other helpful
+ * context) after a semicolon.
+ *
+ * For example:, instead of "Control escape sequence cannot be doubled", prefer:
+ *
+ * > "Invalid control escape sequence; control cannot be repeated"
+ *
+ * In some cases, where the failure is more general or syntax expectations are violated, it may make
+ * more sense to use a fragment that completes a sentence beginning, "The parser ...".
+ *
+ * For example:
+ *
+ * > "Expected an expression after `(`"
+ * > "Cannot parse the expression"
+ *
+ *
+ * ## Message style guide
+ *
+ * - Use articles like "a", "an", and "the" when appropriate.
+ *   - e.g., prefer "Cannot parse the expression" to "Cannot parse expression".
+ * - Use the common name for tokens and nodes.
+ *   - e.g., prefer "keyword splat" to "assoc splat"
+ *   - e.g., prefer "embedded document" to "embdoc"
+ * - Capitalize the initial word of the message.
+ * - Use back ticks around token literals
+ *   - e.g., "Expected a `=>` between the hash key and value"
+ * - Do not use `.` or other punctuation at the end of the message.
+ * - Do not use contractions like "can't". Prefer "cannot" to "can not".
+ * - For tokens that can have multiple meanings, reference the token and its meaning.
+ *   - e.g., "`*` splat argument" is clearer and more complete than "splat argument" or "`*` argument"
+ *
+ *
+ * ## Error names (PM_ERR_*)
+ *
+ * - When appropriate, prefer node name to token name.
+ *   - e.g., prefer "SPLAT" to "STAR" in the context of argument parsing.
+ * - Prefer token name to common name.
+ *   - e.g., prefer "STAR" to "ASTERISK".
+ * - Try to order the words in the name from more general to more specific,
+ *   - e.g., "INVALID_NUMBER_DECIMAL" is better than "DECIMAL_INVALID_NUMBER".
+ *   - When in doubt, look for similar patterns and name them so that they are grouped when lexically
+ *     sorted. See PM_ERR_ARGUMENT_NO_FORWARDING_* for an example.
+ */
 static const char* const diagnostic_messages[PM_DIAGNOSTIC_ID_LEN] = {
     [PM_ERR_ALIAS_ARGUMENT]                     = "Invalid argument being passed to `alias`; expected a bare word, symbol, constant, or global variable",
     [PM_ERR_AMPAMPEQ_MULTI_ASSIGN]              = "Unexpected `&&=` in a multiple assignment",
@@ -263,7 +262,9 @@ pm_diagnostic_message(pm_diagnostic_id_t diag_id) {
     return message;
 }
-// Append an error to the given list of diagnostic.
+/**
+ * Append an error to the given list of diagnostic.
+ */
 bool
 pm_diagnostic_list_append(pm_list_t *list, const uint8_t *start, const uint8_t *end, pm_diagnostic_id_t diag_id) {
     pm_diagnostic_t *diagnostic = (pm_diagnostic_t *) calloc(sizeof(pm_diagnostic_t), 1);
@@ -274,7 +275,9 @@ pm_diagnostic_list_append(pm_list_t *list, const uint8_t *start, const uint8_t *
     return true;
 }
-// Deallocate the internal state of the given diagnostic list.
+/**
+ * Deallocate the internal state of the given diagnostic list.
+ */
 void
 pm_diagnostic_list_free(pm_list_t *list) {
     pm_list_node_t *node, *next;

data/src/enc/pm_big5.c CHANGED Viewed

@@ -42,6 +42,7 @@ pm_encoding_big5_isupper_char(const uint8_t *b, ptrdiff_t n) {
     }
 }
+/** Big5 encoding */
 pm_encoding_t pm_encoding_big5 = {
     .name = "big5",
     .char_width = pm_encoding_big5_char_width,

data/src/enc/pm_euc_jp.c CHANGED Viewed

@@ -48,6 +48,7 @@ pm_encoding_euc_jp_isupper_char(const uint8_t *b, ptrdiff_t n) {
     }
 }
+/** EUC-JP encoding */
 pm_encoding_t pm_encoding_euc_jp = {
     .name = "euc-jp",
     .char_width = pm_encoding_euc_jp_char_width,

data/src/enc/pm_gbk.c CHANGED Viewed

@@ -51,6 +51,7 @@ pm_encoding_gbk_isupper_char(const uint8_t *b, ptrdiff_t n) {
     }
 }
+/** GBK encoding */
 pm_encoding_t pm_encoding_gbk = {
     .name = "gbk",
     .char_width = pm_encoding_gbk_char_width,

data/src/enc/pm_shift_jis.c CHANGED Viewed

@@ -46,6 +46,7 @@ pm_encoding_shift_jis_isupper_char(const uint8_t *b, ptrdiff_t n) {
     }
 }
+/** Shift_JIS encoding */
 pm_encoding_t pm_encoding_shift_jis = {
     .name = "shift_jis",
     .char_width = pm_encoding_shift_jis_char_width,