jruby-prism-parser 0.24.0-java → 1.4.0-java
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/BSDmakefile +58 -0
- data/CHANGELOG.md +269 -1
- data/CONTRIBUTING.md +0 -4
- data/Makefile +25 -18
- data/README.md +57 -6
- data/config.yml +1724 -140
- data/docs/build_system.md +39 -11
- data/docs/configuration.md +4 -0
- data/docs/cruby_compilation.md +1 -1
- data/docs/fuzzing.md +1 -1
- data/docs/parser_translation.md +14 -9
- data/docs/parsing_rules.md +4 -1
- data/docs/releasing.md +8 -10
- data/docs/relocation.md +34 -0
- data/docs/ripper_translation.md +72 -0
- data/docs/ruby_api.md +2 -1
- data/docs/serialization.md +29 -5
- data/ext/prism/api_node.c +3395 -1999
- data/ext/prism/api_pack.c +9 -0
- data/ext/prism/extconf.rb +55 -34
- data/ext/prism/extension.c +597 -346
- data/ext/prism/extension.h +6 -5
- data/include/prism/ast.h +2612 -455
- data/include/prism/defines.h +160 -2
- data/include/prism/diagnostic.h +188 -76
- data/include/prism/encoding.h +22 -4
- data/include/prism/node.h +89 -17
- data/include/prism/options.h +224 -12
- data/include/prism/pack.h +11 -0
- data/include/prism/parser.h +267 -66
- data/include/prism/prettyprint.h +8 -0
- data/include/prism/regexp.h +18 -8
- data/include/prism/static_literals.h +121 -0
- data/include/prism/util/pm_buffer.h +75 -2
- data/include/prism/util/pm_char.h +1 -2
- data/include/prism/util/pm_constant_pool.h +18 -9
- data/include/prism/util/pm_integer.h +126 -0
- data/include/prism/util/pm_list.h +1 -1
- data/include/prism/util/pm_newline_list.h +19 -0
- data/include/prism/util/pm_string.h +48 -8
- data/include/prism/version.h +3 -3
- data/include/prism.h +99 -5
- data/jruby-prism.jar +0 -0
- data/lib/prism/compiler.rb +11 -1
- data/lib/prism/desugar_compiler.rb +113 -74
- data/lib/prism/dispatcher.rb +45 -1
- data/lib/prism/dot_visitor.rb +201 -77
- data/lib/prism/dsl.rb +673 -461
- data/lib/prism/ffi.rb +233 -45
- data/lib/prism/inspect_visitor.rb +2389 -0
- data/lib/prism/lex_compat.rb +35 -16
- data/lib/prism/mutation_compiler.rb +24 -8
- data/lib/prism/node.rb +7731 -8460
- data/lib/prism/node_ext.rb +328 -32
- data/lib/prism/pack.rb +4 -0
- data/lib/prism/parse_result/comments.rb +34 -24
- data/lib/prism/parse_result/errors.rb +65 -0
- data/lib/prism/parse_result/newlines.rb +102 -12
- data/lib/prism/parse_result.rb +448 -44
- data/lib/prism/pattern.rb +28 -10
- data/lib/prism/polyfill/append_as_bytes.rb +15 -0
- data/lib/prism/polyfill/byteindex.rb +13 -0
- data/lib/prism/polyfill/unpack1.rb +14 -0
- data/lib/prism/reflection.rb +413 -0
- data/lib/prism/relocation.rb +504 -0
- data/lib/prism/serialize.rb +1940 -1198
- data/lib/prism/string_query.rb +30 -0
- data/lib/prism/translation/parser/builder.rb +61 -0
- data/lib/prism/translation/parser/compiler.rb +569 -195
- data/lib/prism/translation/parser/lexer.rb +516 -39
- data/lib/prism/translation/parser.rb +177 -12
- data/lib/prism/translation/parser33.rb +1 -1
- data/lib/prism/translation/parser34.rb +1 -1
- data/lib/prism/translation/parser35.rb +12 -0
- data/lib/prism/translation/ripper/sexp.rb +125 -0
- data/lib/prism/translation/ripper/shim.rb +5 -0
- data/lib/prism/translation/ripper.rb +3224 -462
- data/lib/prism/translation/ruby_parser.rb +194 -69
- data/lib/prism/translation.rb +4 -1
- data/lib/prism/version.rb +1 -1
- data/lib/prism/visitor.rb +13 -0
- data/lib/prism.rb +17 -27
- data/prism.gemspec +57 -17
- data/rbi/prism/compiler.rbi +12 -0
- data/rbi/prism/dsl.rbi +524 -0
- data/rbi/prism/inspect_visitor.rbi +12 -0
- data/rbi/prism/node.rbi +8722 -0
- data/rbi/prism/node_ext.rbi +107 -0
- data/rbi/prism/parse_result.rbi +404 -0
- data/rbi/prism/reflection.rbi +58 -0
- data/rbi/prism/string_query.rbi +12 -0
- data/rbi/prism/translation/parser.rbi +11 -0
- data/rbi/prism/translation/parser33.rbi +6 -0
- data/rbi/prism/translation/parser34.rbi +6 -0
- data/rbi/prism/translation/parser35.rbi +6 -0
- data/rbi/prism/translation/ripper.rbi +15 -0
- data/rbi/prism/visitor.rbi +473 -0
- data/rbi/prism.rbi +44 -7745
- data/sig/prism/compiler.rbs +9 -0
- data/sig/prism/dispatcher.rbs +16 -0
- data/sig/prism/dot_visitor.rbs +6 -0
- data/sig/prism/dsl.rbs +351 -0
- data/sig/prism/inspect_visitor.rbs +22 -0
- data/sig/prism/lex_compat.rbs +10 -0
- data/sig/prism/mutation_compiler.rbs +159 -0
- data/sig/prism/node.rbs +3614 -0
- data/sig/prism/node_ext.rbs +82 -0
- data/sig/prism/pack.rbs +43 -0
- data/sig/prism/parse_result.rbs +192 -0
- data/sig/prism/pattern.rbs +13 -0
- data/sig/prism/reflection.rbs +50 -0
- data/sig/prism/relocation.rbs +185 -0
- data/sig/prism/serialize.rbs +8 -0
- data/sig/prism/string_query.rbs +11 -0
- data/sig/prism/visitor.rbs +169 -0
- data/sig/prism.rbs +248 -4767
- data/src/diagnostic.c +672 -230
- data/src/encoding.c +211 -108
- data/src/node.c +7541 -1653
- data/src/options.c +135 -20
- data/src/pack.c +33 -17
- data/src/prettyprint.c +1543 -1485
- data/src/prism.c +7813 -3050
- data/src/regexp.c +225 -73
- data/src/serialize.c +101 -77
- data/src/static_literals.c +617 -0
- data/src/token_type.c +14 -13
- data/src/util/pm_buffer.c +187 -20
- data/src/util/pm_char.c +5 -5
- data/src/util/pm_constant_pool.c +39 -19
- data/src/util/pm_integer.c +670 -0
- data/src/util/pm_list.c +1 -1
- data/src/util/pm_newline_list.c +43 -5
- data/src/util/pm_string.c +213 -33
- data/src/util/pm_strncasecmp.c +13 -1
- data/src/util/pm_strpbrk.c +32 -6
- metadata +55 -19
- data/docs/ripper.md +0 -36
- data/include/prism/util/pm_state_stack.h +0 -42
- data/include/prism/util/pm_string_list.h +0 -44
- data/lib/prism/debug.rb +0 -206
- data/lib/prism/node_inspector.rb +0 -68
- data/lib/prism/translation/parser/rubocop.rb +0 -45
- data/rbi/prism_static.rbi +0 -207
- data/sig/prism_static.rbs +0 -201
- data/src/util/pm_state_stack.c +0 -25
- data/src/util/pm_string_list.c +0 -28
data/src/options.c
CHANGED
@@ -1,5 +1,14 @@
|
|
1
1
|
#include "prism/options.h"
|
2
2
|
|
3
|
+
/**
|
4
|
+
* Set the shebang callback option on the given options struct.
|
5
|
+
*/
|
6
|
+
PRISM_EXPORTED_FUNCTION void
|
7
|
+
pm_options_shebang_callback_set(pm_options_t *options, pm_options_shebang_callback_t shebang_callback, void *shebang_callback_data) {
|
8
|
+
options->shebang_callback = shebang_callback;
|
9
|
+
options->shebang_callback_data = shebang_callback_data;
|
10
|
+
}
|
11
|
+
|
3
12
|
/**
|
4
13
|
* Set the filepath option on the given options struct.
|
5
14
|
*/
|
@@ -16,6 +25,14 @@ pm_options_encoding_set(pm_options_t *options, const char *encoding) {
|
|
16
25
|
pm_string_constant_init(&options->encoding, encoding, strlen(encoding));
|
17
26
|
}
|
18
27
|
|
28
|
+
/**
|
29
|
+
* Set the encoding_locked option on the given options struct.
|
30
|
+
*/
|
31
|
+
PRISM_EXPORTED_FUNCTION void
|
32
|
+
pm_options_encoding_locked_set(pm_options_t *options, bool encoding_locked) {
|
33
|
+
options->encoding_locked = encoding_locked;
|
34
|
+
}
|
35
|
+
|
19
36
|
/**
|
20
37
|
* Set the line option on the given options struct.
|
21
38
|
*/
|
@@ -29,7 +46,23 @@ pm_options_line_set(pm_options_t *options, int32_t line) {
|
|
29
46
|
*/
|
30
47
|
PRISM_EXPORTED_FUNCTION void
|
31
48
|
pm_options_frozen_string_literal_set(pm_options_t *options, bool frozen_string_literal) {
|
32
|
-
options->frozen_string_literal = frozen_string_literal;
|
49
|
+
options->frozen_string_literal = frozen_string_literal ? PM_OPTIONS_FROZEN_STRING_LITERAL_ENABLED : PM_OPTIONS_FROZEN_STRING_LITERAL_DISABLED;
|
50
|
+
}
|
51
|
+
|
52
|
+
/**
|
53
|
+
* Sets the command line option on the given options struct.
|
54
|
+
*/
|
55
|
+
PRISM_EXPORTED_FUNCTION void
|
56
|
+
pm_options_command_line_set(pm_options_t *options, uint8_t command_line) {
|
57
|
+
options->command_line = command_line;
|
58
|
+
}
|
59
|
+
|
60
|
+
/**
|
61
|
+
* Checks if the given slice represents a number.
|
62
|
+
*/
|
63
|
+
static inline bool
|
64
|
+
is_number(const char *string, size_t length) {
|
65
|
+
return pm_strspn_decimal_digit((const uint8_t *) string, (ptrdiff_t) length) == length;
|
33
66
|
}
|
34
67
|
|
35
68
|
/**
|
@@ -39,39 +72,97 @@ pm_options_frozen_string_literal_set(pm_options_t *options, bool frozen_string_l
|
|
39
72
|
*/
|
40
73
|
PRISM_EXPORTED_FUNCTION bool
|
41
74
|
pm_options_version_set(pm_options_t *options, const char *version, size_t length) {
|
42
|
-
if (version == NULL
|
75
|
+
if (version == NULL) {
|
43
76
|
options->version = PM_OPTIONS_VERSION_LATEST;
|
44
77
|
return true;
|
45
78
|
}
|
46
79
|
|
47
|
-
if (length ==
|
48
|
-
if (strncmp(version, "3.3
|
49
|
-
options->version =
|
80
|
+
if (length == 3) {
|
81
|
+
if (strncmp(version, "3.3", 3) == 0) {
|
82
|
+
options->version = PM_OPTIONS_VERSION_CRUBY_3_3;
|
83
|
+
return true;
|
84
|
+
}
|
85
|
+
|
86
|
+
if (strncmp(version, "3.4", 3) == 0) {
|
87
|
+
options->version = PM_OPTIONS_VERSION_CRUBY_3_4;
|
50
88
|
return true;
|
51
89
|
}
|
52
90
|
|
53
|
-
if (strncmp(version, "3.
|
91
|
+
if (strncmp(version, "3.5", 3) == 0) {
|
54
92
|
options->version = PM_OPTIONS_VERSION_LATEST;
|
55
93
|
return true;
|
56
94
|
}
|
95
|
+
|
96
|
+
return false;
|
57
97
|
}
|
58
98
|
|
59
|
-
if (length
|
60
|
-
|
61
|
-
|
99
|
+
if (length >= 4) {
|
100
|
+
if (strncmp(version, "3.3.", 4) == 0 && is_number(version + 4, length - 4)) {
|
101
|
+
options->version = PM_OPTIONS_VERSION_CRUBY_3_3;
|
102
|
+
return true;
|
103
|
+
}
|
104
|
+
|
105
|
+
if (strncmp(version, "3.4.", 4) == 0 && is_number(version + 4, length - 4)) {
|
106
|
+
options->version = PM_OPTIONS_VERSION_CRUBY_3_4;
|
107
|
+
return true;
|
108
|
+
}
|
109
|
+
|
110
|
+
if (strncmp(version, "3.5.", 4) == 0 && is_number(version + 4, length - 4)) {
|
111
|
+
options->version = PM_OPTIONS_VERSION_LATEST;
|
112
|
+
return true;
|
113
|
+
}
|
114
|
+
}
|
115
|
+
|
116
|
+
if (length >= 6) {
|
117
|
+
if (strncmp(version, "latest", 7) == 0) { // 7 to compare the \0 as well
|
118
|
+
options->version = PM_OPTIONS_VERSION_LATEST;
|
119
|
+
return true;
|
120
|
+
}
|
62
121
|
}
|
63
122
|
|
64
123
|
return false;
|
65
124
|
}
|
66
125
|
|
67
126
|
/**
|
68
|
-
*
|
127
|
+
* Set the main script option on the given options struct.
|
69
128
|
*/
|
70
129
|
PRISM_EXPORTED_FUNCTION void
|
130
|
+
pm_options_main_script_set(pm_options_t *options, bool main_script) {
|
131
|
+
options->main_script = main_script;
|
132
|
+
}
|
133
|
+
|
134
|
+
/**
|
135
|
+
* Set the partial script option on the given options struct.
|
136
|
+
*/
|
137
|
+
PRISM_EXPORTED_FUNCTION void
|
138
|
+
pm_options_partial_script_set(pm_options_t *options, bool partial_script) {
|
139
|
+
options->partial_script = partial_script;
|
140
|
+
}
|
141
|
+
|
142
|
+
/**
|
143
|
+
* Set the freeze option on the given options struct.
|
144
|
+
*/
|
145
|
+
PRISM_EXPORTED_FUNCTION void
|
146
|
+
pm_options_freeze_set(pm_options_t *options, bool freeze) {
|
147
|
+
options->freeze = freeze;
|
148
|
+
}
|
149
|
+
|
150
|
+
// For some reason, GCC analyzer thinks we're leaking allocated scopes and
|
151
|
+
// locals here, even though we definitely aren't. This is a false positive.
|
152
|
+
// Ideally we wouldn't need to suppress this.
|
153
|
+
#if defined(__GNUC__) && (__GNUC__ >= 10)
|
154
|
+
#pragma GCC diagnostic push
|
155
|
+
#pragma GCC diagnostic ignored "-Wanalyzer-malloc-leak"
|
156
|
+
#endif
|
157
|
+
|
158
|
+
/**
|
159
|
+
* Allocate and zero out the scopes array on the given options struct.
|
160
|
+
*/
|
161
|
+
PRISM_EXPORTED_FUNCTION bool
|
71
162
|
pm_options_scopes_init(pm_options_t *options, size_t scopes_count) {
|
72
163
|
options->scopes_count = scopes_count;
|
73
|
-
options->scopes =
|
74
|
-
|
164
|
+
options->scopes = xcalloc(scopes_count, sizeof(pm_options_scope_t));
|
165
|
+
return options->scopes != NULL;
|
75
166
|
}
|
76
167
|
|
77
168
|
/**
|
@@ -86,11 +177,12 @@ pm_options_scope_get(const pm_options_t *options, size_t index) {
|
|
86
177
|
* Create a new options scope struct. This will hold a set of locals that are in
|
87
178
|
* scope surrounding the code that is being parsed.
|
88
179
|
*/
|
89
|
-
PRISM_EXPORTED_FUNCTION
|
180
|
+
PRISM_EXPORTED_FUNCTION bool
|
90
181
|
pm_options_scope_init(pm_options_scope_t *scope, size_t locals_count) {
|
91
182
|
scope->locals_count = locals_count;
|
92
|
-
scope->locals =
|
93
|
-
|
183
|
+
scope->locals = xcalloc(locals_count, sizeof(pm_string_t));
|
184
|
+
scope->forwarding = PM_OPTIONS_SCOPE_FORWARDING_NONE;
|
185
|
+
return scope->locals != NULL;
|
94
186
|
}
|
95
187
|
|
96
188
|
/**
|
@@ -101,6 +193,14 @@ pm_options_scope_local_get(const pm_options_scope_t *scope, size_t index) {
|
|
101
193
|
return &scope->locals[index];
|
102
194
|
}
|
103
195
|
|
196
|
+
/**
|
197
|
+
* Set the forwarding option on the given scope struct.
|
198
|
+
*/
|
199
|
+
PRISM_EXPORTED_FUNCTION void
|
200
|
+
pm_options_scope_forwarding_set(pm_options_scope_t *scope, uint8_t forwarding) {
|
201
|
+
scope->forwarding = forwarding;
|
202
|
+
}
|
203
|
+
|
104
204
|
/**
|
105
205
|
* Free the internal memory associated with the options.
|
106
206
|
*/
|
@@ -116,10 +216,10 @@ pm_options_free(pm_options_t *options) {
|
|
116
216
|
pm_string_free(&scope->locals[local_index]);
|
117
217
|
}
|
118
218
|
|
119
|
-
|
219
|
+
xfree(scope->locals);
|
120
220
|
}
|
121
221
|
|
122
|
-
|
222
|
+
xfree(options->scopes);
|
123
223
|
}
|
124
224
|
|
125
225
|
/**
|
@@ -185,21 +285,32 @@ pm_options_read(pm_options_t *options, const char *data) {
|
|
185
285
|
data += encoding_length;
|
186
286
|
}
|
187
287
|
|
188
|
-
options->frozen_string_literal = *data++;
|
288
|
+
options->frozen_string_literal = (int8_t) *data++;
|
289
|
+
options->command_line = (uint8_t) *data++;
|
189
290
|
options->version = (pm_options_version_t) *data++;
|
291
|
+
options->encoding_locked = ((uint8_t) *data++) > 0;
|
292
|
+
options->main_script = ((uint8_t) *data++) > 0;
|
293
|
+
options->partial_script = ((uint8_t) *data++) > 0;
|
294
|
+
options->freeze = ((uint8_t) *data++) > 0;
|
190
295
|
|
191
296
|
uint32_t scopes_count = pm_options_read_u32(data);
|
192
297
|
data += 4;
|
193
298
|
|
194
299
|
if (scopes_count > 0) {
|
195
|
-
pm_options_scopes_init(options, scopes_count);
|
300
|
+
if (!pm_options_scopes_init(options, scopes_count)) return;
|
196
301
|
|
197
302
|
for (size_t scope_index = 0; scope_index < scopes_count; scope_index++) {
|
198
303
|
uint32_t locals_count = pm_options_read_u32(data);
|
199
304
|
data += 4;
|
200
305
|
|
201
306
|
pm_options_scope_t *scope = &options->scopes[scope_index];
|
202
|
-
pm_options_scope_init(scope, locals_count)
|
307
|
+
if (!pm_options_scope_init(scope, locals_count)) {
|
308
|
+
pm_options_free(options);
|
309
|
+
return;
|
310
|
+
}
|
311
|
+
|
312
|
+
uint8_t forwarding = (uint8_t) *data++;
|
313
|
+
pm_options_scope_forwarding_set(&options->scopes[scope_index], forwarding);
|
203
314
|
|
204
315
|
for (size_t local_index = 0; local_index < locals_count; local_index++) {
|
205
316
|
uint32_t local_length = pm_options_read_u32(data);
|
@@ -211,3 +322,7 @@ pm_options_read(pm_options_t *options, const char *data) {
|
|
211
322
|
}
|
212
323
|
}
|
213
324
|
}
|
325
|
+
|
326
|
+
#if defined(__GNUC__) && (__GNUC__ >= 10)
|
327
|
+
#pragma GCC diagnostic pop
|
328
|
+
#endif
|
data/src/pack.c
CHANGED
@@ -1,16 +1,43 @@
|
|
1
1
|
#include "prism/pack.h"
|
2
2
|
|
3
|
+
// We optionally support parsing String#pack templates. For systems that don't
|
4
|
+
// want or need this functionality, it can be turned off with the
|
5
|
+
// PRISM_EXCLUDE_PACK define.
|
6
|
+
#ifdef PRISM_EXCLUDE_PACK
|
7
|
+
|
8
|
+
void pm_pack_parse(void) {}
|
9
|
+
|
10
|
+
#else
|
11
|
+
|
3
12
|
#include <stdbool.h>
|
4
13
|
#include <errno.h>
|
5
14
|
|
6
15
|
static uintmax_t
|
7
|
-
strtoumaxc(const char **format)
|
16
|
+
strtoumaxc(const char **format) {
|
17
|
+
uintmax_t value = 0;
|
18
|
+
while (**format >= '0' && **format <= '9') {
|
19
|
+
if (value > UINTMAX_MAX / 10) {
|
20
|
+
errno = ERANGE;
|
21
|
+
}
|
22
|
+
value = value * 10 + ((uintmax_t) (**format - '0'));
|
23
|
+
(*format)++;
|
24
|
+
}
|
25
|
+
return value;
|
26
|
+
}
|
8
27
|
|
9
28
|
PRISM_EXPORTED_FUNCTION pm_pack_result
|
10
|
-
pm_pack_parse(
|
11
|
-
|
12
|
-
|
13
|
-
|
29
|
+
pm_pack_parse(
|
30
|
+
pm_pack_variant variant,
|
31
|
+
const char **format,
|
32
|
+
const char *format_end,
|
33
|
+
pm_pack_type *type,
|
34
|
+
pm_pack_signed *signed_type,
|
35
|
+
pm_pack_endian *endian,
|
36
|
+
pm_pack_size *size,
|
37
|
+
pm_pack_length_type *length_type,
|
38
|
+
uint64_t *length,
|
39
|
+
pm_pack_encoding *encoding
|
40
|
+
) {
|
14
41
|
if (*encoding == PM_PACK_ENCODING_START) {
|
15
42
|
*encoding = PM_PACK_ENCODING_US_ASCII;
|
16
43
|
}
|
@@ -479,15 +506,4 @@ pm_size_to_native(pm_pack_size size) {
|
|
479
506
|
}
|
480
507
|
}
|
481
508
|
|
482
|
-
|
483
|
-
strtoumaxc(const char **format) {
|
484
|
-
uintmax_t value = 0;
|
485
|
-
while (**format >= '0' && **format <= '9') {
|
486
|
-
if (value > UINTMAX_MAX / 10) {
|
487
|
-
errno = ERANGE;
|
488
|
-
}
|
489
|
-
value = value * 10 + ((uintmax_t) (**format - '0'));
|
490
|
-
(*format)++;
|
491
|
-
}
|
492
|
-
return value;
|
493
|
-
}
|
509
|
+
#endif
|