prism 1.2.0 → 1.4.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/CHANGELOG.md +46 -1
- data/Makefile +1 -1
- data/config.yml +429 -2
- data/docs/build_system.md +8 -11
- data/docs/releasing.md +1 -1
- data/docs/relocation.md +34 -0
- data/docs/ruby_api.md +1 -1
- data/ext/prism/api_node.c +1824 -1305
- data/ext/prism/extconf.rb +13 -36
- data/ext/prism/extension.c +298 -109
- data/ext/prism/extension.h +4 -4
- data/include/prism/ast.h +442 -2
- data/include/prism/defines.h +26 -8
- data/include/prism/options.h +47 -1
- data/include/prism/util/pm_buffer.h +10 -0
- data/include/prism/version.h +2 -2
- data/include/prism.h +51 -4
- data/lib/prism/dot_visitor.rb +26 -0
- data/lib/prism/dsl.rb +14 -6
- data/lib/prism/ffi.rb +93 -28
- data/lib/prism/inspect_visitor.rb +4 -1
- data/lib/prism/node.rb +1886 -105
- data/lib/prism/parse_result/errors.rb +1 -1
- data/lib/prism/parse_result/newlines.rb +1 -1
- data/lib/prism/parse_result.rb +54 -2
- data/lib/prism/polyfill/append_as_bytes.rb +15 -0
- data/lib/prism/reflection.rb +4 -4
- data/lib/prism/relocation.rb +504 -0
- data/lib/prism/serialize.rb +1252 -765
- data/lib/prism/string_query.rb +30 -0
- data/lib/prism/translation/parser/builder.rb +61 -0
- data/lib/prism/translation/parser/compiler.rb +228 -162
- data/lib/prism/translation/parser/lexer.rb +435 -61
- data/lib/prism/translation/parser.rb +51 -3
- data/lib/prism/translation/parser35.rb +12 -0
- data/lib/prism/translation/ripper.rb +13 -3
- data/lib/prism/translation/ruby_parser.rb +17 -7
- data/lib/prism/translation.rb +1 -0
- data/lib/prism.rb +9 -7
- data/prism.gemspec +11 -1
- data/rbi/prism/dsl.rbi +10 -7
- data/rbi/prism/node.rbi +44 -17
- data/rbi/prism/parse_result.rbi +17 -0
- data/rbi/prism/string_query.rbi +12 -0
- data/rbi/prism/translation/parser35.rbi +6 -0
- data/rbi/prism.rbi +39 -36
- data/sig/prism/dsl.rbs +6 -4
- data/sig/prism/node.rbs +29 -15
- data/sig/prism/parse_result.rbs +10 -0
- data/sig/prism/relocation.rbs +185 -0
- data/sig/prism/serialize.rbs +4 -2
- data/sig/prism/string_query.rbs +11 -0
- data/sig/prism.rbs +22 -1
- data/src/diagnostic.c +2 -2
- data/src/node.c +39 -0
- data/src/options.c +31 -0
- data/src/prettyprint.c +62 -0
- data/src/prism.c +738 -199
- data/src/regexp.c +7 -3
- data/src/serialize.c +18 -0
- data/src/static_literals.c +1 -1
- data/src/util/pm_buffer.c +40 -0
- data/src/util/pm_char.c +1 -1
- data/src/util/pm_constant_pool.c +6 -2
- data/src/util/pm_string.c +1 -0
- data/src/util/pm_strncasecmp.c +13 -1
- metadata +13 -7
data/ext/prism/extension.c
CHANGED
@@ -23,12 +23,15 @@ VALUE rb_cPrismResult;
|
|
23
23
|
VALUE rb_cPrismParseResult;
|
24
24
|
VALUE rb_cPrismLexResult;
|
25
25
|
VALUE rb_cPrismParseLexResult;
|
26
|
+
VALUE rb_cPrismStringQuery;
|
27
|
+
VALUE rb_cPrismScope;
|
26
28
|
|
27
29
|
VALUE rb_cPrismDebugEncoding;
|
28
30
|
|
29
31
|
ID rb_id_option_command_line;
|
30
32
|
ID rb_id_option_encoding;
|
31
33
|
ID rb_id_option_filepath;
|
34
|
+
ID rb_id_option_freeze;
|
32
35
|
ID rb_id_option_frozen_string_literal;
|
33
36
|
ID rb_id_option_line;
|
34
37
|
ID rb_id_option_main_script;
|
@@ -36,6 +39,10 @@ ID rb_id_option_partial_script;
|
|
36
39
|
ID rb_id_option_scopes;
|
37
40
|
ID rb_id_option_version;
|
38
41
|
ID rb_id_source_for;
|
42
|
+
ID rb_id_forwarding_positionals;
|
43
|
+
ID rb_id_forwarding_keywords;
|
44
|
+
ID rb_id_forwarding_block;
|
45
|
+
ID rb_id_forwarding_all;
|
39
46
|
|
40
47
|
/******************************************************************************/
|
41
48
|
/* IO of Ruby code */
|
@@ -93,14 +100,53 @@ build_options_scopes(pm_options_t *options, VALUE scopes) {
|
|
93
100
|
for (size_t scope_index = 0; scope_index < scopes_count; scope_index++) {
|
94
101
|
VALUE scope = rb_ary_entry(scopes, scope_index);
|
95
102
|
|
96
|
-
//
|
97
|
-
//
|
98
|
-
|
99
|
-
|
103
|
+
// The scope can be either an array or it can be a Prism::Scope object.
|
104
|
+
// Parse out the correct values here from either.
|
105
|
+
VALUE locals;
|
106
|
+
uint8_t forwarding = PM_OPTIONS_SCOPE_FORWARDING_NONE;
|
107
|
+
|
108
|
+
if (RB_TYPE_P(scope, T_ARRAY)) {
|
109
|
+
locals = scope;
|
110
|
+
} else if (rb_obj_is_kind_of(scope, rb_cPrismScope)) {
|
111
|
+
locals = rb_ivar_get(scope, rb_intern("@locals"));
|
112
|
+
if (!RB_TYPE_P(locals, T_ARRAY)) {
|
113
|
+
rb_raise(rb_eTypeError, "wrong argument type %"PRIsVALUE" (expected Array)", rb_obj_class(locals));
|
114
|
+
}
|
115
|
+
|
116
|
+
VALUE names = rb_ivar_get(scope, rb_intern("@forwarding"));
|
117
|
+
if (!RB_TYPE_P(names, T_ARRAY)) {
|
118
|
+
rb_raise(rb_eTypeError, "wrong argument type %"PRIsVALUE" (expected Array)", rb_obj_class(names));
|
119
|
+
}
|
120
|
+
|
121
|
+
size_t names_count = RARRAY_LEN(names);
|
122
|
+
for (size_t name_index = 0; name_index < names_count; name_index++) {
|
123
|
+
VALUE name = rb_ary_entry(names, name_index);
|
124
|
+
|
125
|
+
// Check that the name is a symbol. If it's not, then raise
|
126
|
+
// a type error.
|
127
|
+
if (!RB_TYPE_P(name, T_SYMBOL)) {
|
128
|
+
rb_raise(rb_eTypeError, "wrong argument type %"PRIsVALUE" (expected Symbol)", rb_obj_class(name));
|
129
|
+
}
|
130
|
+
|
131
|
+
ID id = SYM2ID(name);
|
132
|
+
if (id == rb_id_forwarding_positionals) {
|
133
|
+
forwarding |= PM_OPTIONS_SCOPE_FORWARDING_POSITIONALS;
|
134
|
+
} else if (id == rb_id_forwarding_keywords) {
|
135
|
+
forwarding |= PM_OPTIONS_SCOPE_FORWARDING_KEYWORDS;
|
136
|
+
} else if (id == rb_id_forwarding_block) {
|
137
|
+
forwarding |= PM_OPTIONS_SCOPE_FORWARDING_BLOCK;
|
138
|
+
} else if (id == rb_id_forwarding_all) {
|
139
|
+
forwarding |= PM_OPTIONS_SCOPE_FORWARDING_ALL;
|
140
|
+
} else {
|
141
|
+
rb_raise(rb_eArgError, "invalid forwarding value: %" PRIsVALUE, name);
|
142
|
+
}
|
143
|
+
}
|
144
|
+
} else {
|
145
|
+
rb_raise(rb_eTypeError, "wrong argument type %"PRIsVALUE" (expected Array or Prism::Scope)", rb_obj_class(scope));
|
100
146
|
}
|
101
147
|
|
102
148
|
// Initialize the scope array.
|
103
|
-
size_t locals_count = RARRAY_LEN(
|
149
|
+
size_t locals_count = RARRAY_LEN(locals);
|
104
150
|
pm_options_scope_t *options_scope = &options->scopes[scope_index];
|
105
151
|
if (!pm_options_scope_init(options_scope, locals_count)) {
|
106
152
|
rb_raise(rb_eNoMemError, "failed to allocate memory");
|
@@ -108,7 +154,7 @@ build_options_scopes(pm_options_t *options, VALUE scopes) {
|
|
108
154
|
|
109
155
|
// Iterate over the locals and add them to the scope.
|
110
156
|
for (size_t local_index = 0; local_index < locals_count; local_index++) {
|
111
|
-
VALUE local = rb_ary_entry(
|
157
|
+
VALUE local = rb_ary_entry(locals, local_index);
|
112
158
|
|
113
159
|
// Check that the local is a symbol. If it's not, then raise a
|
114
160
|
// type error.
|
@@ -121,6 +167,9 @@ build_options_scopes(pm_options_t *options, VALUE scopes) {
|
|
121
167
|
const char *name = rb_id2name(SYM2ID(local));
|
122
168
|
pm_string_constant_init(scope_local, name, strlen(name));
|
123
169
|
}
|
170
|
+
|
171
|
+
// Now set the forwarding options.
|
172
|
+
pm_options_scope_forwarding_set(options_scope, forwarding);
|
124
173
|
}
|
125
174
|
}
|
126
175
|
|
@@ -179,6 +228,8 @@ build_options_i(VALUE key, VALUE value, VALUE argument) {
|
|
179
228
|
if (!NIL_P(value)) pm_options_main_script_set(options, RTEST(value));
|
180
229
|
} else if (key_id == rb_id_option_partial_script) {
|
181
230
|
if (!NIL_P(value)) pm_options_partial_script_set(options, RTEST(value));
|
231
|
+
} else if (key_id == rb_id_option_freeze) {
|
232
|
+
if (!NIL_P(value)) pm_options_freeze_set(options, RTEST(value));
|
182
233
|
} else {
|
183
234
|
rb_raise(rb_eArgError, "unknown keyword: %" PRIsVALUE, key);
|
184
235
|
}
|
@@ -343,6 +394,7 @@ dump(int argc, VALUE *argv, VALUE self) {
|
|
343
394
|
#endif
|
344
395
|
|
345
396
|
VALUE value = dump_input(&input, &options);
|
397
|
+
if (options.freeze) rb_obj_freeze(value);
|
346
398
|
|
347
399
|
#ifdef PRISM_BUILD_DEBUG
|
348
400
|
xfree(dup);
|
@@ -382,56 +434,90 @@ dump_file(int argc, VALUE *argv, VALUE self) {
|
|
382
434
|
/* Extracting values for the parse result */
|
383
435
|
/******************************************************************************/
|
384
436
|
|
437
|
+
/**
|
438
|
+
* The same as rb_class_new_instance, but accepts an additional boolean to
|
439
|
+
* indicate whether or not the resulting class instance should be frozen.
|
440
|
+
*/
|
441
|
+
static inline VALUE
|
442
|
+
rb_class_new_instance_freeze(int argc, const VALUE *argv, VALUE klass, bool freeze) {
|
443
|
+
VALUE value = rb_class_new_instance(argc, argv, klass);
|
444
|
+
if (freeze) rb_obj_freeze(value);
|
445
|
+
return value;
|
446
|
+
}
|
447
|
+
|
448
|
+
/**
|
449
|
+
* Create a new Location instance from the given parser and bounds.
|
450
|
+
*/
|
451
|
+
static inline VALUE
|
452
|
+
parser_location(const pm_parser_t *parser, VALUE source, bool freeze, const uint8_t *start, size_t length) {
|
453
|
+
VALUE argv[] = { source, LONG2FIX(start - parser->start), LONG2FIX(length) };
|
454
|
+
return rb_class_new_instance_freeze(3, argv, rb_cPrismLocation, freeze);
|
455
|
+
}
|
456
|
+
|
457
|
+
/**
|
458
|
+
* Create a new Location instance from the given parser and location.
|
459
|
+
*/
|
460
|
+
#define PARSER_LOCATION_LOC(parser, source, freeze, loc) \
|
461
|
+
parser_location(parser, source, freeze, loc.start, (size_t) (loc.end - loc.start))
|
462
|
+
|
463
|
+
/**
|
464
|
+
* Build a new Comment instance from the given parser and comment.
|
465
|
+
*/
|
466
|
+
static inline VALUE
|
467
|
+
parser_comment(const pm_parser_t *parser, VALUE source, bool freeze, const pm_comment_t *comment) {
|
468
|
+
VALUE argv[] = { PARSER_LOCATION_LOC(parser, source, freeze, comment->location) };
|
469
|
+
VALUE type = (comment->type == PM_COMMENT_EMBDOC) ? rb_cPrismEmbDocComment : rb_cPrismInlineComment;
|
470
|
+
return rb_class_new_instance_freeze(1, argv, type, freeze);
|
471
|
+
}
|
472
|
+
|
385
473
|
/**
|
386
474
|
* Extract the comments out of the parser into an array.
|
387
475
|
*/
|
388
476
|
static VALUE
|
389
|
-
parser_comments(pm_parser_t *parser, VALUE source) {
|
477
|
+
parser_comments(const pm_parser_t *parser, VALUE source, bool freeze) {
|
390
478
|
VALUE comments = rb_ary_new_capa(parser->comment_list.size);
|
391
479
|
|
392
|
-
for (
|
393
|
-
|
394
|
-
|
395
|
-
|
396
|
-
|
397
|
-
|
398
|
-
|
399
|
-
VALUE type = (comment->type == PM_COMMENT_EMBDOC) ? rb_cPrismEmbDocComment : rb_cPrismInlineComment;
|
400
|
-
VALUE comment_argv[] = { rb_class_new_instance(3, location_argv, rb_cPrismLocation) };
|
401
|
-
rb_ary_push(comments, rb_class_new_instance(1, comment_argv, type));
|
480
|
+
for (
|
481
|
+
const pm_comment_t *comment = (const pm_comment_t *) parser->comment_list.head;
|
482
|
+
comment != NULL;
|
483
|
+
comment = (const pm_comment_t *) comment->node.next
|
484
|
+
) {
|
485
|
+
VALUE value = parser_comment(parser, source, freeze, comment);
|
486
|
+
rb_ary_push(comments, value);
|
402
487
|
}
|
403
488
|
|
489
|
+
if (freeze) rb_obj_freeze(comments);
|
404
490
|
return comments;
|
405
491
|
}
|
406
492
|
|
493
|
+
/**
|
494
|
+
* Build a new MagicComment instance from the given parser and magic comment.
|
495
|
+
*/
|
496
|
+
static inline VALUE
|
497
|
+
parser_magic_comment(const pm_parser_t *parser, VALUE source, bool freeze, const pm_magic_comment_t *magic_comment) {
|
498
|
+
VALUE key_loc = parser_location(parser, source, freeze, magic_comment->key_start, magic_comment->key_length);
|
499
|
+
VALUE value_loc = parser_location(parser, source, freeze, magic_comment->value_start, magic_comment->value_length);
|
500
|
+
VALUE argv[] = { key_loc, value_loc };
|
501
|
+
return rb_class_new_instance_freeze(2, argv, rb_cPrismMagicComment, freeze);
|
502
|
+
}
|
503
|
+
|
407
504
|
/**
|
408
505
|
* Extract the magic comments out of the parser into an array.
|
409
506
|
*/
|
410
507
|
static VALUE
|
411
|
-
parser_magic_comments(pm_parser_t *parser, VALUE source) {
|
508
|
+
parser_magic_comments(const pm_parser_t *parser, VALUE source, bool freeze) {
|
412
509
|
VALUE magic_comments = rb_ary_new_capa(parser->magic_comment_list.size);
|
413
510
|
|
414
|
-
for (
|
415
|
-
|
416
|
-
|
417
|
-
|
418
|
-
|
419
|
-
|
420
|
-
|
421
|
-
VALUE value_loc_argv[] = {
|
422
|
-
source,
|
423
|
-
LONG2FIX(magic_comment->value_start - parser->start),
|
424
|
-
LONG2FIX(magic_comment->value_length)
|
425
|
-
};
|
426
|
-
|
427
|
-
VALUE magic_comment_argv[] = {
|
428
|
-
rb_class_new_instance(3, key_loc_argv, rb_cPrismLocation),
|
429
|
-
rb_class_new_instance(3, value_loc_argv, rb_cPrismLocation)
|
430
|
-
};
|
431
|
-
|
432
|
-
rb_ary_push(magic_comments, rb_class_new_instance(2, magic_comment_argv, rb_cPrismMagicComment));
|
511
|
+
for (
|
512
|
+
const pm_magic_comment_t *magic_comment = (const pm_magic_comment_t *) parser->magic_comment_list.head;
|
513
|
+
magic_comment != NULL;
|
514
|
+
magic_comment = (const pm_magic_comment_t *) magic_comment->node.next
|
515
|
+
) {
|
516
|
+
VALUE value = parser_magic_comment(parser, source, freeze, magic_comment);
|
517
|
+
rb_ary_push(magic_comments, value);
|
433
518
|
}
|
434
519
|
|
520
|
+
if (freeze) rb_obj_freeze(magic_comments);
|
435
521
|
return magic_comments;
|
436
522
|
}
|
437
523
|
|
@@ -440,17 +526,11 @@ parser_magic_comments(pm_parser_t *parser, VALUE source) {
|
|
440
526
|
* exists.
|
441
527
|
*/
|
442
528
|
static VALUE
|
443
|
-
parser_data_loc(const pm_parser_t *parser, VALUE source) {
|
529
|
+
parser_data_loc(const pm_parser_t *parser, VALUE source, bool freeze) {
|
444
530
|
if (parser->data_loc.end == NULL) {
|
445
531
|
return Qnil;
|
446
532
|
} else {
|
447
|
-
|
448
|
-
source,
|
449
|
-
LONG2FIX(parser->data_loc.start - parser->start),
|
450
|
-
LONG2FIX(parser->data_loc.end - parser->data_loc.start)
|
451
|
-
};
|
452
|
-
|
453
|
-
return rb_class_new_instance(3, argv, rb_cPrismLocation);
|
533
|
+
return PARSER_LOCATION_LOC(parser, source, freeze, parser->data_loc);
|
454
534
|
}
|
455
535
|
}
|
456
536
|
|
@@ -458,16 +538,17 @@ parser_data_loc(const pm_parser_t *parser, VALUE source) {
|
|
458
538
|
* Extract the errors out of the parser into an array.
|
459
539
|
*/
|
460
540
|
static VALUE
|
461
|
-
parser_errors(pm_parser_t *parser, rb_encoding *encoding, VALUE source) {
|
541
|
+
parser_errors(const pm_parser_t *parser, rb_encoding *encoding, VALUE source, bool freeze) {
|
462
542
|
VALUE errors = rb_ary_new_capa(parser->error_list.size);
|
463
|
-
pm_diagnostic_t *error;
|
464
543
|
|
465
|
-
for (
|
466
|
-
|
467
|
-
|
468
|
-
|
469
|
-
|
470
|
-
|
544
|
+
for (
|
545
|
+
const pm_diagnostic_t *error = (const pm_diagnostic_t *) parser->error_list.head;
|
546
|
+
error != NULL;
|
547
|
+
error = (const pm_diagnostic_t *) error->node.next
|
548
|
+
) {
|
549
|
+
VALUE type = ID2SYM(rb_intern(pm_diagnostic_id_human(error->diag_id)));
|
550
|
+
VALUE message = rb_obj_freeze(rb_enc_str_new_cstr(error->message, encoding));
|
551
|
+
VALUE location = PARSER_LOCATION_LOC(parser, source, freeze, error->location);
|
471
552
|
|
472
553
|
VALUE level = Qnil;
|
473
554
|
switch (error->level) {
|
@@ -484,16 +565,12 @@ parser_errors(pm_parser_t *parser, rb_encoding *encoding, VALUE source) {
|
|
484
565
|
rb_raise(rb_eRuntimeError, "Unknown level: %" PRIu8, error->level);
|
485
566
|
}
|
486
567
|
|
487
|
-
VALUE
|
488
|
-
|
489
|
-
|
490
|
-
rb_class_new_instance(3, location_argv, rb_cPrismLocation),
|
491
|
-
level
|
492
|
-
};
|
493
|
-
|
494
|
-
rb_ary_push(errors, rb_class_new_instance(4, error_argv, rb_cPrismParseError));
|
568
|
+
VALUE argv[] = { type, message, location, level };
|
569
|
+
VALUE value = rb_class_new_instance_freeze(4, argv, rb_cPrismParseError, freeze);
|
570
|
+
rb_ary_push(errors, value);
|
495
571
|
}
|
496
572
|
|
573
|
+
if (freeze) rb_obj_freeze(errors);
|
497
574
|
return errors;
|
498
575
|
}
|
499
576
|
|
@@ -501,16 +578,17 @@ parser_errors(pm_parser_t *parser, rb_encoding *encoding, VALUE source) {
|
|
501
578
|
* Extract the warnings out of the parser into an array.
|
502
579
|
*/
|
503
580
|
static VALUE
|
504
|
-
parser_warnings(pm_parser_t *parser, rb_encoding *encoding, VALUE source) {
|
581
|
+
parser_warnings(const pm_parser_t *parser, rb_encoding *encoding, VALUE source, bool freeze) {
|
505
582
|
VALUE warnings = rb_ary_new_capa(parser->warning_list.size);
|
506
|
-
pm_diagnostic_t *warning;
|
507
583
|
|
508
|
-
for (
|
509
|
-
|
510
|
-
|
511
|
-
|
512
|
-
|
513
|
-
|
584
|
+
for (
|
585
|
+
const pm_diagnostic_t *warning = (const pm_diagnostic_t *) parser->warning_list.head;
|
586
|
+
warning != NULL;
|
587
|
+
warning = (const pm_diagnostic_t *) warning->node.next
|
588
|
+
) {
|
589
|
+
VALUE type = ID2SYM(rb_intern(pm_diagnostic_id_human(warning->diag_id)));
|
590
|
+
VALUE message = rb_obj_freeze(rb_enc_str_new_cstr(warning->message, encoding));
|
591
|
+
VALUE location = PARSER_LOCATION_LOC(parser, source, freeze, warning->location);
|
514
592
|
|
515
593
|
VALUE level = Qnil;
|
516
594
|
switch (warning->level) {
|
@@ -524,16 +602,12 @@ parser_warnings(pm_parser_t *parser, rb_encoding *encoding, VALUE source) {
|
|
524
602
|
rb_raise(rb_eRuntimeError, "Unknown level: %" PRIu8, warning->level);
|
525
603
|
}
|
526
604
|
|
527
|
-
VALUE
|
528
|
-
|
529
|
-
|
530
|
-
rb_class_new_instance(3, location_argv, rb_cPrismLocation),
|
531
|
-
level
|
532
|
-
};
|
533
|
-
|
534
|
-
rb_ary_push(warnings, rb_class_new_instance(4, warning_argv, rb_cPrismParseWarning));
|
605
|
+
VALUE argv[] = { type, message, location, level };
|
606
|
+
VALUE value = rb_class_new_instance_freeze(4, argv, rb_cPrismParseWarning, freeze);
|
607
|
+
rb_ary_push(warnings, value);
|
535
608
|
}
|
536
609
|
|
610
|
+
if (freeze) rb_obj_freeze(warnings);
|
537
611
|
return warnings;
|
538
612
|
}
|
539
613
|
|
@@ -541,18 +615,18 @@ parser_warnings(pm_parser_t *parser, rb_encoding *encoding, VALUE source) {
|
|
541
615
|
* Create a new parse result from the given parser, value, encoding, and source.
|
542
616
|
*/
|
543
617
|
static VALUE
|
544
|
-
parse_result_create(VALUE class, pm_parser_t *parser, VALUE value, rb_encoding *encoding, VALUE source) {
|
618
|
+
parse_result_create(VALUE class, const pm_parser_t *parser, VALUE value, rb_encoding *encoding, VALUE source, bool freeze) {
|
545
619
|
VALUE result_argv[] = {
|
546
620
|
value,
|
547
|
-
parser_comments(parser, source),
|
548
|
-
parser_magic_comments(parser, source),
|
549
|
-
parser_data_loc(parser, source),
|
550
|
-
parser_errors(parser, encoding, source),
|
551
|
-
parser_warnings(parser, encoding, source),
|
621
|
+
parser_comments(parser, source, freeze),
|
622
|
+
parser_magic_comments(parser, source, freeze),
|
623
|
+
parser_data_loc(parser, source, freeze),
|
624
|
+
parser_errors(parser, encoding, source, freeze),
|
625
|
+
parser_warnings(parser, encoding, source, freeze),
|
552
626
|
source
|
553
627
|
};
|
554
628
|
|
555
|
-
return
|
629
|
+
return rb_class_new_instance_freeze(7, result_argv, class, freeze);
|
556
630
|
}
|
557
631
|
|
558
632
|
/******************************************************************************/
|
@@ -568,6 +642,7 @@ typedef struct {
|
|
568
642
|
VALUE source;
|
569
643
|
VALUE tokens;
|
570
644
|
rb_encoding *encoding;
|
645
|
+
bool freeze;
|
571
646
|
} parse_lex_data_t;
|
572
647
|
|
573
648
|
/**
|
@@ -579,10 +654,13 @@ static void
|
|
579
654
|
parse_lex_token(void *data, pm_parser_t *parser, pm_token_t *token) {
|
580
655
|
parse_lex_data_t *parse_lex_data = (parse_lex_data_t *) parser->lex_callback->data;
|
581
656
|
|
582
|
-
VALUE
|
583
|
-
|
584
|
-
|
585
|
-
)
|
657
|
+
VALUE value = pm_token_new(parser, token, parse_lex_data->encoding, parse_lex_data->source, parse_lex_data->freeze);
|
658
|
+
VALUE yields = rb_assoc_new(value, INT2FIX(parser->lex_state));
|
659
|
+
|
660
|
+
if (parse_lex_data->freeze) {
|
661
|
+
rb_obj_freeze(value);
|
662
|
+
rb_obj_freeze(yields);
|
663
|
+
}
|
586
664
|
|
587
665
|
rb_ary_push(parse_lex_data->tokens, yields);
|
588
666
|
}
|
@@ -602,14 +680,37 @@ parse_lex_encoding_changed_callback(pm_parser_t *parser) {
|
|
602
680
|
// one or two tokens, since the encoding can only change at the top of the
|
603
681
|
// file.
|
604
682
|
VALUE tokens = parse_lex_data->tokens;
|
683
|
+
VALUE next_tokens = rb_ary_new();
|
684
|
+
|
605
685
|
for (long index = 0; index < RARRAY_LEN(tokens); index++) {
|
606
686
|
VALUE yields = rb_ary_entry(tokens, index);
|
607
687
|
VALUE token = rb_ary_entry(yields, 0);
|
608
688
|
|
609
689
|
VALUE value = rb_ivar_get(token, rb_intern("@value"));
|
610
|
-
|
611
|
-
|
690
|
+
VALUE next_value = rb_str_dup(value);
|
691
|
+
|
692
|
+
rb_enc_associate(next_value, parse_lex_data->encoding);
|
693
|
+
if (parse_lex_data->freeze) rb_obj_freeze(next_value);
|
694
|
+
|
695
|
+
VALUE next_token_argv[] = {
|
696
|
+
parse_lex_data->source,
|
697
|
+
rb_ivar_get(token, rb_intern("@type")),
|
698
|
+
next_value,
|
699
|
+
rb_ivar_get(token, rb_intern("@location"))
|
700
|
+
};
|
701
|
+
|
702
|
+
VALUE next_token = rb_class_new_instance(4, next_token_argv, rb_cPrismToken);
|
703
|
+
VALUE next_yields = rb_assoc_new(next_token, rb_ary_entry(yields, 1));
|
704
|
+
|
705
|
+
if (parse_lex_data->freeze) {
|
706
|
+
rb_obj_freeze(next_token);
|
707
|
+
rb_obj_freeze(next_yields);
|
708
|
+
}
|
709
|
+
|
710
|
+
rb_ary_push(next_tokens, next_yields);
|
612
711
|
}
|
712
|
+
|
713
|
+
rb_ary_replace(parse_lex_data->tokens, next_tokens);
|
613
714
|
}
|
614
715
|
|
615
716
|
/**
|
@@ -629,7 +730,8 @@ parse_lex_input(pm_string_t *input, const pm_options_t *options, bool return_nod
|
|
629
730
|
parse_lex_data_t parse_lex_data = {
|
630
731
|
.source = source,
|
631
732
|
.tokens = rb_ary_new(),
|
632
|
-
.encoding = rb_utf8_encoding()
|
733
|
+
.encoding = rb_utf8_encoding(),
|
734
|
+
.freeze = options->freeze,
|
633
735
|
};
|
634
736
|
|
635
737
|
parse_lex_data_t *data = &parse_lex_data;
|
@@ -652,14 +754,22 @@ parse_lex_input(pm_string_t *input, const pm_options_t *options, bool return_nod
|
|
652
754
|
rb_ary_push(offsets, ULONG2NUM(parser.newline_list.offsets[index]));
|
653
755
|
}
|
654
756
|
|
757
|
+
if (options->freeze) {
|
758
|
+
rb_obj_freeze(source_string);
|
759
|
+
rb_obj_freeze(offsets);
|
760
|
+
rb_obj_freeze(source);
|
761
|
+
rb_obj_freeze(parse_lex_data.tokens);
|
762
|
+
}
|
763
|
+
|
655
764
|
VALUE result;
|
656
765
|
if (return_nodes) {
|
657
766
|
VALUE value = rb_ary_new_capa(2);
|
658
|
-
rb_ary_push(value, pm_ast_new(&parser, node, parse_lex_data.encoding, source));
|
767
|
+
rb_ary_push(value, pm_ast_new(&parser, node, parse_lex_data.encoding, source, options->freeze));
|
659
768
|
rb_ary_push(value, parse_lex_data.tokens);
|
660
|
-
|
769
|
+
if (options->freeze) rb_obj_freeze(value);
|
770
|
+
result = parse_result_create(rb_cPrismParseLexResult, &parser, value, parse_lex_data.encoding, source, options->freeze);
|
661
771
|
} else {
|
662
|
-
result = parse_result_create(rb_cPrismLexResult, &parser, parse_lex_data.tokens, parse_lex_data.encoding, source);
|
772
|
+
result = parse_result_create(rb_cPrismLexResult, &parser, parse_lex_data.tokens, parse_lex_data.encoding, source, options->freeze);
|
663
773
|
}
|
664
774
|
|
665
775
|
pm_node_destroy(&parser, node);
|
@@ -725,9 +835,13 @@ parse_input(pm_string_t *input, const pm_options_t *options) {
|
|
725
835
|
pm_node_t *node = pm_parse(&parser);
|
726
836
|
rb_encoding *encoding = rb_enc_find(parser.encoding->name);
|
727
837
|
|
728
|
-
VALUE source = pm_source_new(&parser, encoding);
|
729
|
-
VALUE value = pm_ast_new(&parser, node, encoding, source);
|
730
|
-
VALUE result = parse_result_create(rb_cPrismParseResult, &parser, value, encoding, source)
|
838
|
+
VALUE source = pm_source_new(&parser, encoding, options->freeze);
|
839
|
+
VALUE value = pm_ast_new(&parser, node, encoding, source, options->freeze);
|
840
|
+
VALUE result = parse_result_create(rb_cPrismParseResult, &parser, value, encoding, source, options->freeze);
|
841
|
+
|
842
|
+
if (options->freeze) {
|
843
|
+
rb_obj_freeze(source);
|
844
|
+
}
|
731
845
|
|
732
846
|
pm_node_destroy(&parser, node);
|
733
847
|
pm_parser_free(&parser);
|
@@ -749,6 +863,8 @@ parse_input(pm_string_t *input, const pm_options_t *options) {
|
|
749
863
|
* encoding or nil.
|
750
864
|
* * `filepath` - the filepath of the source being parsed. This should be a
|
751
865
|
* string or nil.
|
866
|
+
* * `freeze` - whether or not to deeply freeze the AST. This should be a
|
867
|
+
* boolean or nil.
|
752
868
|
* * `frozen_string_literal` - whether or not the frozen string literal pragma
|
753
869
|
* has been set. This should be a boolean or nil.
|
754
870
|
* * `line` - the line number that the parse starts on. This should be an
|
@@ -768,12 +884,12 @@ parse_input(pm_string_t *input, const pm_options_t *options) {
|
|
768
884
|
* parsed. This should be an array of arrays of symbols or nil. Scopes are
|
769
885
|
* ordered from the outermost scope to the innermost one.
|
770
886
|
* * `version` - the version of Ruby syntax that prism should used to parse Ruby
|
771
|
-
* code. By default prism assumes you want to parse with the latest
|
772
|
-
* of Ruby syntax (which you can trigger with `nil` or
|
773
|
-
* may also restrict the syntax to a specific version of
|
774
|
-
* To parse with the same syntax version that
|
775
|
-
* use `version: RUBY_VERSION`. Raises
|
776
|
-
* currently supported by Prism.
|
887
|
+
* code. By default prism assumes you want to parse with the latest
|
888
|
+
* version of Ruby syntax (which you can trigger with `nil` or
|
889
|
+
* `"latest"`). You may also restrict the syntax to a specific version of
|
890
|
+
* Ruby, e.g., with `"3.3.0"`. To parse with the same syntax version that
|
891
|
+
* the current Ruby is running use `version: RUBY_VERSION`. Raises
|
892
|
+
* ArgumentError if the version is not currently supported by Prism.
|
777
893
|
*/
|
778
894
|
static VALUE
|
779
895
|
parse(int argc, VALUE *argv, VALUE self) {
|
@@ -921,9 +1037,9 @@ parse_stream(int argc, VALUE *argv, VALUE self) {
|
|
921
1037
|
pm_node_t *node = pm_parse_stream(&parser, &buffer, (void *) stream, parse_stream_fgets, &options);
|
922
1038
|
rb_encoding *encoding = rb_enc_find(parser.encoding->name);
|
923
1039
|
|
924
|
-
VALUE source = pm_source_new(&parser, encoding);
|
925
|
-
VALUE value = pm_ast_new(&parser, node, encoding, source);
|
926
|
-
VALUE result = parse_result_create(rb_cPrismParseResult, &parser, value, encoding, source);
|
1040
|
+
VALUE source = pm_source_new(&parser, encoding, options.freeze);
|
1041
|
+
VALUE value = pm_ast_new(&parser, node, encoding, source, options.freeze);
|
1042
|
+
VALUE result = parse_result_create(rb_cPrismParseResult, &parser, value, encoding, source, options.freeze);
|
927
1043
|
|
928
1044
|
pm_node_destroy(&parser, node);
|
929
1045
|
pm_buffer_free(&buffer);
|
@@ -943,8 +1059,8 @@ parse_input_comments(pm_string_t *input, const pm_options_t *options) {
|
|
943
1059
|
pm_node_t *node = pm_parse(&parser);
|
944
1060
|
rb_encoding *encoding = rb_enc_find(parser.encoding->name);
|
945
1061
|
|
946
|
-
VALUE source = pm_source_new(&parser, encoding);
|
947
|
-
VALUE comments = parser_comments(&parser, source);
|
1062
|
+
VALUE source = pm_source_new(&parser, encoding, options->freeze);
|
1063
|
+
VALUE comments = parser_comments(&parser, source, options->freeze);
|
948
1064
|
|
949
1065
|
pm_node_destroy(&parser, node);
|
950
1066
|
pm_parser_free(&parser);
|
@@ -1133,6 +1249,68 @@ parse_file_failure_p(int argc, VALUE *argv, VALUE self) {
|
|
1133
1249
|
return RTEST(parse_file_success_p(argc, argv, self)) ? Qfalse : Qtrue;
|
1134
1250
|
}
|
1135
1251
|
|
1252
|
+
/******************************************************************************/
|
1253
|
+
/* String query methods */
|
1254
|
+
/******************************************************************************/
|
1255
|
+
|
1256
|
+
/**
|
1257
|
+
* Process the result of a call to a string query method and return an
|
1258
|
+
* appropriate value.
|
1259
|
+
*/
|
1260
|
+
static VALUE
|
1261
|
+
string_query(pm_string_query_t result) {
|
1262
|
+
switch (result) {
|
1263
|
+
case PM_STRING_QUERY_ERROR:
|
1264
|
+
rb_raise(rb_eArgError, "Invalid or non ascii-compatible encoding");
|
1265
|
+
return Qfalse;
|
1266
|
+
case PM_STRING_QUERY_FALSE:
|
1267
|
+
return Qfalse;
|
1268
|
+
case PM_STRING_QUERY_TRUE:
|
1269
|
+
return Qtrue;
|
1270
|
+
}
|
1271
|
+
return Qfalse;
|
1272
|
+
}
|
1273
|
+
|
1274
|
+
/**
|
1275
|
+
* call-seq:
|
1276
|
+
* Prism::StringQuery::local?(string) -> bool
|
1277
|
+
*
|
1278
|
+
* Returns true if the string constitutes a valid local variable name. Note that
|
1279
|
+
* this means the names that can be set through Binding#local_variable_set, not
|
1280
|
+
* necessarily the ones that can be set through a local variable assignment.
|
1281
|
+
*/
|
1282
|
+
static VALUE
|
1283
|
+
string_query_local_p(VALUE self, VALUE string) {
|
1284
|
+
const uint8_t *source = (const uint8_t *) check_string(string);
|
1285
|
+
return string_query(pm_string_query_local(source, RSTRING_LEN(string), rb_enc_get(string)->name));
|
1286
|
+
}
|
1287
|
+
|
1288
|
+
/**
|
1289
|
+
* call-seq:
|
1290
|
+
* Prism::StringQuery::constant?(string) -> bool
|
1291
|
+
*
|
1292
|
+
* Returns true if the string constitutes a valid constant name. Note that this
|
1293
|
+
* means the names that can be set through Module#const_set, not necessarily the
|
1294
|
+
* ones that can be set through a constant assignment.
|
1295
|
+
*/
|
1296
|
+
static VALUE
|
1297
|
+
string_query_constant_p(VALUE self, VALUE string) {
|
1298
|
+
const uint8_t *source = (const uint8_t *) check_string(string);
|
1299
|
+
return string_query(pm_string_query_constant(source, RSTRING_LEN(string), rb_enc_get(string)->name));
|
1300
|
+
}
|
1301
|
+
|
1302
|
+
/**
|
1303
|
+
* call-seq:
|
1304
|
+
* Prism::StringQuery::method_name?(string) -> bool
|
1305
|
+
*
|
1306
|
+
* Returns true if the string constitutes a valid method name.
|
1307
|
+
*/
|
1308
|
+
static VALUE
|
1309
|
+
string_query_method_name_p(VALUE self, VALUE string) {
|
1310
|
+
const uint8_t *source = (const uint8_t *) check_string(string);
|
1311
|
+
return string_query(pm_string_query_method_name(source, RSTRING_LEN(string), rb_enc_get(string)->name));
|
1312
|
+
}
|
1313
|
+
|
1136
1314
|
/******************************************************************************/
|
1137
1315
|
/* Initialization of the extension */
|
1138
1316
|
/******************************************************************************/
|
@@ -1170,12 +1348,15 @@ Init_prism(void) {
|
|
1170
1348
|
rb_cPrismParseResult = rb_define_class_under(rb_cPrism, "ParseResult", rb_cPrismResult);
|
1171
1349
|
rb_cPrismLexResult = rb_define_class_under(rb_cPrism, "LexResult", rb_cPrismResult);
|
1172
1350
|
rb_cPrismParseLexResult = rb_define_class_under(rb_cPrism, "ParseLexResult", rb_cPrismResult);
|
1351
|
+
rb_cPrismStringQuery = rb_define_class_under(rb_cPrism, "StringQuery", rb_cObject);
|
1352
|
+
rb_cPrismScope = rb_define_class_under(rb_cPrism, "Scope", rb_cObject);
|
1173
1353
|
|
1174
1354
|
// Intern all of the IDs eagerly that we support so that we don't have to do
|
1175
1355
|
// it every time we parse.
|
1176
1356
|
rb_id_option_command_line = rb_intern_const("command_line");
|
1177
1357
|
rb_id_option_encoding = rb_intern_const("encoding");
|
1178
1358
|
rb_id_option_filepath = rb_intern_const("filepath");
|
1359
|
+
rb_id_option_freeze = rb_intern_const("freeze");
|
1179
1360
|
rb_id_option_frozen_string_literal = rb_intern_const("frozen_string_literal");
|
1180
1361
|
rb_id_option_line = rb_intern_const("line");
|
1181
1362
|
rb_id_option_main_script = rb_intern_const("main_script");
|
@@ -1183,11 +1364,15 @@ Init_prism(void) {
|
|
1183
1364
|
rb_id_option_scopes = rb_intern_const("scopes");
|
1184
1365
|
rb_id_option_version = rb_intern_const("version");
|
1185
1366
|
rb_id_source_for = rb_intern("for");
|
1367
|
+
rb_id_forwarding_positionals = rb_intern("*");
|
1368
|
+
rb_id_forwarding_keywords = rb_intern("**");
|
1369
|
+
rb_id_forwarding_block = rb_intern("&");
|
1370
|
+
rb_id_forwarding_all = rb_intern("...");
|
1186
1371
|
|
1187
1372
|
/**
|
1188
1373
|
* The version of the prism library.
|
1189
1374
|
*/
|
1190
|
-
rb_define_const(rb_cPrism, "VERSION",
|
1375
|
+
rb_define_const(rb_cPrism, "VERSION", rb_str_freeze(rb_str_new_cstr(EXPECTED_PRISM_VERSION)));
|
1191
1376
|
|
1192
1377
|
// First, the functions that have to do with lexing and parsing.
|
1193
1378
|
rb_define_singleton_method(rb_cPrism, "lex", lex, -1);
|
@@ -1211,6 +1396,10 @@ Init_prism(void) {
|
|
1211
1396
|
rb_define_singleton_method(rb_cPrism, "dump_file", dump_file, -1);
|
1212
1397
|
#endif
|
1213
1398
|
|
1399
|
+
rb_define_singleton_method(rb_cPrismStringQuery, "local?", string_query_local_p, 1);
|
1400
|
+
rb_define_singleton_method(rb_cPrismStringQuery, "constant?", string_query_constant_p, 1);
|
1401
|
+
rb_define_singleton_method(rb_cPrismStringQuery, "method_name?", string_query_method_name_p, 1);
|
1402
|
+
|
1214
1403
|
// Next, initialize the other APIs.
|
1215
1404
|
Init_prism_api_node();
|
1216
1405
|
Init_prism_pack();
|