jruby-prism-parser 0.24.0-java → 1.4.0-java

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (148) hide show
  1. checksums.yaml +4 -4
  2. data/BSDmakefile +58 -0
  3. data/CHANGELOG.md +269 -1
  4. data/CONTRIBUTING.md +0 -4
  5. data/Makefile +25 -18
  6. data/README.md +57 -6
  7. data/config.yml +1724 -140
  8. data/docs/build_system.md +39 -11
  9. data/docs/configuration.md +4 -0
  10. data/docs/cruby_compilation.md +1 -1
  11. data/docs/fuzzing.md +1 -1
  12. data/docs/parser_translation.md +14 -9
  13. data/docs/parsing_rules.md +4 -1
  14. data/docs/releasing.md +8 -10
  15. data/docs/relocation.md +34 -0
  16. data/docs/ripper_translation.md +72 -0
  17. data/docs/ruby_api.md +2 -1
  18. data/docs/serialization.md +29 -5
  19. data/ext/prism/api_node.c +3395 -1999
  20. data/ext/prism/api_pack.c +9 -0
  21. data/ext/prism/extconf.rb +55 -34
  22. data/ext/prism/extension.c +597 -346
  23. data/ext/prism/extension.h +6 -5
  24. data/include/prism/ast.h +2612 -455
  25. data/include/prism/defines.h +160 -2
  26. data/include/prism/diagnostic.h +188 -76
  27. data/include/prism/encoding.h +22 -4
  28. data/include/prism/node.h +89 -17
  29. data/include/prism/options.h +224 -12
  30. data/include/prism/pack.h +11 -0
  31. data/include/prism/parser.h +267 -66
  32. data/include/prism/prettyprint.h +8 -0
  33. data/include/prism/regexp.h +18 -8
  34. data/include/prism/static_literals.h +121 -0
  35. data/include/prism/util/pm_buffer.h +75 -2
  36. data/include/prism/util/pm_char.h +1 -2
  37. data/include/prism/util/pm_constant_pool.h +18 -9
  38. data/include/prism/util/pm_integer.h +126 -0
  39. data/include/prism/util/pm_list.h +1 -1
  40. data/include/prism/util/pm_newline_list.h +19 -0
  41. data/include/prism/util/pm_string.h +48 -8
  42. data/include/prism/version.h +3 -3
  43. data/include/prism.h +99 -5
  44. data/jruby-prism.jar +0 -0
  45. data/lib/prism/compiler.rb +11 -1
  46. data/lib/prism/desugar_compiler.rb +113 -74
  47. data/lib/prism/dispatcher.rb +45 -1
  48. data/lib/prism/dot_visitor.rb +201 -77
  49. data/lib/prism/dsl.rb +673 -461
  50. data/lib/prism/ffi.rb +233 -45
  51. data/lib/prism/inspect_visitor.rb +2389 -0
  52. data/lib/prism/lex_compat.rb +35 -16
  53. data/lib/prism/mutation_compiler.rb +24 -8
  54. data/lib/prism/node.rb +7731 -8460
  55. data/lib/prism/node_ext.rb +328 -32
  56. data/lib/prism/pack.rb +4 -0
  57. data/lib/prism/parse_result/comments.rb +34 -24
  58. data/lib/prism/parse_result/errors.rb +65 -0
  59. data/lib/prism/parse_result/newlines.rb +102 -12
  60. data/lib/prism/parse_result.rb +448 -44
  61. data/lib/prism/pattern.rb +28 -10
  62. data/lib/prism/polyfill/append_as_bytes.rb +15 -0
  63. data/lib/prism/polyfill/byteindex.rb +13 -0
  64. data/lib/prism/polyfill/unpack1.rb +14 -0
  65. data/lib/prism/reflection.rb +413 -0
  66. data/lib/prism/relocation.rb +504 -0
  67. data/lib/prism/serialize.rb +1940 -1198
  68. data/lib/prism/string_query.rb +30 -0
  69. data/lib/prism/translation/parser/builder.rb +61 -0
  70. data/lib/prism/translation/parser/compiler.rb +569 -195
  71. data/lib/prism/translation/parser/lexer.rb +516 -39
  72. data/lib/prism/translation/parser.rb +177 -12
  73. data/lib/prism/translation/parser33.rb +1 -1
  74. data/lib/prism/translation/parser34.rb +1 -1
  75. data/lib/prism/translation/parser35.rb +12 -0
  76. data/lib/prism/translation/ripper/sexp.rb +125 -0
  77. data/lib/prism/translation/ripper/shim.rb +5 -0
  78. data/lib/prism/translation/ripper.rb +3224 -462
  79. data/lib/prism/translation/ruby_parser.rb +194 -69
  80. data/lib/prism/translation.rb +4 -1
  81. data/lib/prism/version.rb +1 -1
  82. data/lib/prism/visitor.rb +13 -0
  83. data/lib/prism.rb +17 -27
  84. data/prism.gemspec +57 -17
  85. data/rbi/prism/compiler.rbi +12 -0
  86. data/rbi/prism/dsl.rbi +524 -0
  87. data/rbi/prism/inspect_visitor.rbi +12 -0
  88. data/rbi/prism/node.rbi +8722 -0
  89. data/rbi/prism/node_ext.rbi +107 -0
  90. data/rbi/prism/parse_result.rbi +404 -0
  91. data/rbi/prism/reflection.rbi +58 -0
  92. data/rbi/prism/string_query.rbi +12 -0
  93. data/rbi/prism/translation/parser.rbi +11 -0
  94. data/rbi/prism/translation/parser33.rbi +6 -0
  95. data/rbi/prism/translation/parser34.rbi +6 -0
  96. data/rbi/prism/translation/parser35.rbi +6 -0
  97. data/rbi/prism/translation/ripper.rbi +15 -0
  98. data/rbi/prism/visitor.rbi +473 -0
  99. data/rbi/prism.rbi +44 -7745
  100. data/sig/prism/compiler.rbs +9 -0
  101. data/sig/prism/dispatcher.rbs +16 -0
  102. data/sig/prism/dot_visitor.rbs +6 -0
  103. data/sig/prism/dsl.rbs +351 -0
  104. data/sig/prism/inspect_visitor.rbs +22 -0
  105. data/sig/prism/lex_compat.rbs +10 -0
  106. data/sig/prism/mutation_compiler.rbs +159 -0
  107. data/sig/prism/node.rbs +3614 -0
  108. data/sig/prism/node_ext.rbs +82 -0
  109. data/sig/prism/pack.rbs +43 -0
  110. data/sig/prism/parse_result.rbs +192 -0
  111. data/sig/prism/pattern.rbs +13 -0
  112. data/sig/prism/reflection.rbs +50 -0
  113. data/sig/prism/relocation.rbs +185 -0
  114. data/sig/prism/serialize.rbs +8 -0
  115. data/sig/prism/string_query.rbs +11 -0
  116. data/sig/prism/visitor.rbs +169 -0
  117. data/sig/prism.rbs +248 -4767
  118. data/src/diagnostic.c +672 -230
  119. data/src/encoding.c +211 -108
  120. data/src/node.c +7541 -1653
  121. data/src/options.c +135 -20
  122. data/src/pack.c +33 -17
  123. data/src/prettyprint.c +1543 -1485
  124. data/src/prism.c +7813 -3050
  125. data/src/regexp.c +225 -73
  126. data/src/serialize.c +101 -77
  127. data/src/static_literals.c +617 -0
  128. data/src/token_type.c +14 -13
  129. data/src/util/pm_buffer.c +187 -20
  130. data/src/util/pm_char.c +5 -5
  131. data/src/util/pm_constant_pool.c +39 -19
  132. data/src/util/pm_integer.c +670 -0
  133. data/src/util/pm_list.c +1 -1
  134. data/src/util/pm_newline_list.c +43 -5
  135. data/src/util/pm_string.c +213 -33
  136. data/src/util/pm_strncasecmp.c +13 -1
  137. data/src/util/pm_strpbrk.c +32 -6
  138. metadata +55 -19
  139. data/docs/ripper.md +0 -36
  140. data/include/prism/util/pm_state_stack.h +0 -42
  141. data/include/prism/util/pm_string_list.h +0 -44
  142. data/lib/prism/debug.rb +0 -206
  143. data/lib/prism/node_inspector.rb +0 -68
  144. data/lib/prism/translation/parser/rubocop.rb +0 -45
  145. data/rbi/prism_static.rbi +0 -207
  146. data/sig/prism_static.rbs +0 -201
  147. data/src/util/pm_state_stack.c +0 -25
  148. data/src/util/pm_string_list.c +0 -28
data/src/options.c CHANGED
@@ -1,5 +1,14 @@
1
1
  #include "prism/options.h"
2
2
 
3
+ /**
4
+ * Set the shebang callback option on the given options struct.
5
+ */
6
+ PRISM_EXPORTED_FUNCTION void
7
+ pm_options_shebang_callback_set(pm_options_t *options, pm_options_shebang_callback_t shebang_callback, void *shebang_callback_data) {
8
+ options->shebang_callback = shebang_callback;
9
+ options->shebang_callback_data = shebang_callback_data;
10
+ }
11
+
3
12
  /**
4
13
  * Set the filepath option on the given options struct.
5
14
  */
@@ -16,6 +25,14 @@ pm_options_encoding_set(pm_options_t *options, const char *encoding) {
16
25
  pm_string_constant_init(&options->encoding, encoding, strlen(encoding));
17
26
  }
18
27
 
28
+ /**
29
+ * Set the encoding_locked option on the given options struct.
30
+ */
31
+ PRISM_EXPORTED_FUNCTION void
32
+ pm_options_encoding_locked_set(pm_options_t *options, bool encoding_locked) {
33
+ options->encoding_locked = encoding_locked;
34
+ }
35
+
19
36
  /**
20
37
  * Set the line option on the given options struct.
21
38
  */
@@ -29,7 +46,23 @@ pm_options_line_set(pm_options_t *options, int32_t line) {
29
46
  */
30
47
  PRISM_EXPORTED_FUNCTION void
31
48
  pm_options_frozen_string_literal_set(pm_options_t *options, bool frozen_string_literal) {
32
- options->frozen_string_literal = frozen_string_literal;
49
+ options->frozen_string_literal = frozen_string_literal ? PM_OPTIONS_FROZEN_STRING_LITERAL_ENABLED : PM_OPTIONS_FROZEN_STRING_LITERAL_DISABLED;
50
+ }
51
+
52
+ /**
53
+ * Sets the command line option on the given options struct.
54
+ */
55
+ PRISM_EXPORTED_FUNCTION void
56
+ pm_options_command_line_set(pm_options_t *options, uint8_t command_line) {
57
+ options->command_line = command_line;
58
+ }
59
+
60
+ /**
61
+ * Checks if the given slice represents a number.
62
+ */
63
+ static inline bool
64
+ is_number(const char *string, size_t length) {
65
+ return pm_strspn_decimal_digit((const uint8_t *) string, (ptrdiff_t) length) == length;
33
66
  }
34
67
 
35
68
  /**
@@ -39,39 +72,97 @@ pm_options_frozen_string_literal_set(pm_options_t *options, bool frozen_string_l
39
72
  */
40
73
  PRISM_EXPORTED_FUNCTION bool
41
74
  pm_options_version_set(pm_options_t *options, const char *version, size_t length) {
42
- if (version == NULL && length == 0) {
75
+ if (version == NULL) {
43
76
  options->version = PM_OPTIONS_VERSION_LATEST;
44
77
  return true;
45
78
  }
46
79
 
47
- if (length == 5) {
48
- if (strncmp(version, "3.3.0", length) == 0) {
49
- options->version = PM_OPTIONS_VERSION_CRUBY_3_3_0;
80
+ if (length == 3) {
81
+ if (strncmp(version, "3.3", 3) == 0) {
82
+ options->version = PM_OPTIONS_VERSION_CRUBY_3_3;
83
+ return true;
84
+ }
85
+
86
+ if (strncmp(version, "3.4", 3) == 0) {
87
+ options->version = PM_OPTIONS_VERSION_CRUBY_3_4;
50
88
  return true;
51
89
  }
52
90
 
53
- if (strncmp(version, "3.4.0", length) == 0) {
91
+ if (strncmp(version, "3.5", 3) == 0) {
54
92
  options->version = PM_OPTIONS_VERSION_LATEST;
55
93
  return true;
56
94
  }
95
+
96
+ return false;
57
97
  }
58
98
 
59
- if (length == 6 && strncmp(version, "latest", length) == 0) {
60
- options->version = PM_OPTIONS_VERSION_LATEST;
61
- return true;
99
+ if (length >= 4) {
100
+ if (strncmp(version, "3.3.", 4) == 0 && is_number(version + 4, length - 4)) {
101
+ options->version = PM_OPTIONS_VERSION_CRUBY_3_3;
102
+ return true;
103
+ }
104
+
105
+ if (strncmp(version, "3.4.", 4) == 0 && is_number(version + 4, length - 4)) {
106
+ options->version = PM_OPTIONS_VERSION_CRUBY_3_4;
107
+ return true;
108
+ }
109
+
110
+ if (strncmp(version, "3.5.", 4) == 0 && is_number(version + 4, length - 4)) {
111
+ options->version = PM_OPTIONS_VERSION_LATEST;
112
+ return true;
113
+ }
114
+ }
115
+
116
+ if (length >= 6) {
117
+ if (strncmp(version, "latest", 7) == 0) { // 7 to compare the \0 as well
118
+ options->version = PM_OPTIONS_VERSION_LATEST;
119
+ return true;
120
+ }
62
121
  }
63
122
 
64
123
  return false;
65
124
  }
66
125
 
67
126
  /**
68
- * Allocate and zero out the scopes array on the given options struct.
127
+ * Set the main script option on the given options struct.
69
128
  */
70
129
  PRISM_EXPORTED_FUNCTION void
130
+ pm_options_main_script_set(pm_options_t *options, bool main_script) {
131
+ options->main_script = main_script;
132
+ }
133
+
134
+ /**
135
+ * Set the partial script option on the given options struct.
136
+ */
137
+ PRISM_EXPORTED_FUNCTION void
138
+ pm_options_partial_script_set(pm_options_t *options, bool partial_script) {
139
+ options->partial_script = partial_script;
140
+ }
141
+
142
+ /**
143
+ * Set the freeze option on the given options struct.
144
+ */
145
+ PRISM_EXPORTED_FUNCTION void
146
+ pm_options_freeze_set(pm_options_t *options, bool freeze) {
147
+ options->freeze = freeze;
148
+ }
149
+
150
+ // For some reason, GCC analyzer thinks we're leaking allocated scopes and
151
+ // locals here, even though we definitely aren't. This is a false positive.
152
+ // Ideally we wouldn't need to suppress this.
153
+ #if defined(__GNUC__) && (__GNUC__ >= 10)
154
+ #pragma GCC diagnostic push
155
+ #pragma GCC diagnostic ignored "-Wanalyzer-malloc-leak"
156
+ #endif
157
+
158
+ /**
159
+ * Allocate and zero out the scopes array on the given options struct.
160
+ */
161
+ PRISM_EXPORTED_FUNCTION bool
71
162
  pm_options_scopes_init(pm_options_t *options, size_t scopes_count) {
72
163
  options->scopes_count = scopes_count;
73
- options->scopes = calloc(scopes_count, sizeof(pm_options_scope_t));
74
- if (options->scopes == NULL) abort();
164
+ options->scopes = xcalloc(scopes_count, sizeof(pm_options_scope_t));
165
+ return options->scopes != NULL;
75
166
  }
76
167
 
77
168
  /**
@@ -86,11 +177,12 @@ pm_options_scope_get(const pm_options_t *options, size_t index) {
86
177
  * Create a new options scope struct. This will hold a set of locals that are in
87
178
  * scope surrounding the code that is being parsed.
88
179
  */
89
- PRISM_EXPORTED_FUNCTION void
180
+ PRISM_EXPORTED_FUNCTION bool
90
181
  pm_options_scope_init(pm_options_scope_t *scope, size_t locals_count) {
91
182
  scope->locals_count = locals_count;
92
- scope->locals = calloc(locals_count, sizeof(pm_string_t));
93
- if (scope->locals == NULL) abort();
183
+ scope->locals = xcalloc(locals_count, sizeof(pm_string_t));
184
+ scope->forwarding = PM_OPTIONS_SCOPE_FORWARDING_NONE;
185
+ return scope->locals != NULL;
94
186
  }
95
187
 
96
188
  /**
@@ -101,6 +193,14 @@ pm_options_scope_local_get(const pm_options_scope_t *scope, size_t index) {
101
193
  return &scope->locals[index];
102
194
  }
103
195
 
196
+ /**
197
+ * Set the forwarding option on the given scope struct.
198
+ */
199
+ PRISM_EXPORTED_FUNCTION void
200
+ pm_options_scope_forwarding_set(pm_options_scope_t *scope, uint8_t forwarding) {
201
+ scope->forwarding = forwarding;
202
+ }
203
+
104
204
  /**
105
205
  * Free the internal memory associated with the options.
106
206
  */
@@ -116,10 +216,10 @@ pm_options_free(pm_options_t *options) {
116
216
  pm_string_free(&scope->locals[local_index]);
117
217
  }
118
218
 
119
- free(scope->locals);
219
+ xfree(scope->locals);
120
220
  }
121
221
 
122
- free(options->scopes);
222
+ xfree(options->scopes);
123
223
  }
124
224
 
125
225
  /**
@@ -185,21 +285,32 @@ pm_options_read(pm_options_t *options, const char *data) {
185
285
  data += encoding_length;
186
286
  }
187
287
 
188
- options->frozen_string_literal = *data++;
288
+ options->frozen_string_literal = (int8_t) *data++;
289
+ options->command_line = (uint8_t) *data++;
189
290
  options->version = (pm_options_version_t) *data++;
291
+ options->encoding_locked = ((uint8_t) *data++) > 0;
292
+ options->main_script = ((uint8_t) *data++) > 0;
293
+ options->partial_script = ((uint8_t) *data++) > 0;
294
+ options->freeze = ((uint8_t) *data++) > 0;
190
295
 
191
296
  uint32_t scopes_count = pm_options_read_u32(data);
192
297
  data += 4;
193
298
 
194
299
  if (scopes_count > 0) {
195
- pm_options_scopes_init(options, scopes_count);
300
+ if (!pm_options_scopes_init(options, scopes_count)) return;
196
301
 
197
302
  for (size_t scope_index = 0; scope_index < scopes_count; scope_index++) {
198
303
  uint32_t locals_count = pm_options_read_u32(data);
199
304
  data += 4;
200
305
 
201
306
  pm_options_scope_t *scope = &options->scopes[scope_index];
202
- pm_options_scope_init(scope, locals_count);
307
+ if (!pm_options_scope_init(scope, locals_count)) {
308
+ pm_options_free(options);
309
+ return;
310
+ }
311
+
312
+ uint8_t forwarding = (uint8_t) *data++;
313
+ pm_options_scope_forwarding_set(&options->scopes[scope_index], forwarding);
203
314
 
204
315
  for (size_t local_index = 0; local_index < locals_count; local_index++) {
205
316
  uint32_t local_length = pm_options_read_u32(data);
@@ -211,3 +322,7 @@ pm_options_read(pm_options_t *options, const char *data) {
211
322
  }
212
323
  }
213
324
  }
325
+
326
+ #if defined(__GNUC__) && (__GNUC__ >= 10)
327
+ #pragma GCC diagnostic pop
328
+ #endif
data/src/pack.c CHANGED
@@ -1,16 +1,43 @@
1
1
  #include "prism/pack.h"
2
2
 
3
+ // We optionally support parsing String#pack templates. For systems that don't
4
+ // want or need this functionality, it can be turned off with the
5
+ // PRISM_EXCLUDE_PACK define.
6
+ #ifdef PRISM_EXCLUDE_PACK
7
+
8
+ void pm_pack_parse(void) {}
9
+
10
+ #else
11
+
3
12
  #include <stdbool.h>
4
13
  #include <errno.h>
5
14
 
6
15
  static uintmax_t
7
- strtoumaxc(const char **format);
16
+ strtoumaxc(const char **format) {
17
+ uintmax_t value = 0;
18
+ while (**format >= '0' && **format <= '9') {
19
+ if (value > UINTMAX_MAX / 10) {
20
+ errno = ERANGE;
21
+ }
22
+ value = value * 10 + ((uintmax_t) (**format - '0'));
23
+ (*format)++;
24
+ }
25
+ return value;
26
+ }
8
27
 
9
28
  PRISM_EXPORTED_FUNCTION pm_pack_result
10
- pm_pack_parse(pm_pack_variant variant, const char **format, const char *format_end,
11
- pm_pack_type *type, pm_pack_signed *signed_type, pm_pack_endian *endian, pm_pack_size *size,
12
- pm_pack_length_type *length_type, uint64_t *length, pm_pack_encoding *encoding) {
13
-
29
+ pm_pack_parse(
30
+ pm_pack_variant variant,
31
+ const char **format,
32
+ const char *format_end,
33
+ pm_pack_type *type,
34
+ pm_pack_signed *signed_type,
35
+ pm_pack_endian *endian,
36
+ pm_pack_size *size,
37
+ pm_pack_length_type *length_type,
38
+ uint64_t *length,
39
+ pm_pack_encoding *encoding
40
+ ) {
14
41
  if (*encoding == PM_PACK_ENCODING_START) {
15
42
  *encoding = PM_PACK_ENCODING_US_ASCII;
16
43
  }
@@ -479,15 +506,4 @@ pm_size_to_native(pm_pack_size size) {
479
506
  }
480
507
  }
481
508
 
482
- static uintmax_t
483
- strtoumaxc(const char **format) {
484
- uintmax_t value = 0;
485
- while (**format >= '0' && **format <= '9') {
486
- if (value > UINTMAX_MAX / 10) {
487
- errno = ERANGE;
488
- }
489
- value = value * 10 + ((uintmax_t) (**format - '0'));
490
- (*format)++;
491
- }
492
- return value;
493
- }
509
+ #endif