prism 1.2.0 → 1.4.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (68) hide show
  1. checksums.yaml +4 -4
  2. data/CHANGELOG.md +46 -1
  3. data/Makefile +1 -1
  4. data/config.yml +429 -2
  5. data/docs/build_system.md +8 -11
  6. data/docs/releasing.md +1 -1
  7. data/docs/relocation.md +34 -0
  8. data/docs/ruby_api.md +1 -1
  9. data/ext/prism/api_node.c +1824 -1305
  10. data/ext/prism/extconf.rb +13 -36
  11. data/ext/prism/extension.c +298 -109
  12. data/ext/prism/extension.h +4 -4
  13. data/include/prism/ast.h +442 -2
  14. data/include/prism/defines.h +26 -8
  15. data/include/prism/options.h +47 -1
  16. data/include/prism/util/pm_buffer.h +10 -0
  17. data/include/prism/version.h +2 -2
  18. data/include/prism.h +51 -4
  19. data/lib/prism/dot_visitor.rb +26 -0
  20. data/lib/prism/dsl.rb +14 -6
  21. data/lib/prism/ffi.rb +93 -28
  22. data/lib/prism/inspect_visitor.rb +4 -1
  23. data/lib/prism/node.rb +1886 -105
  24. data/lib/prism/parse_result/errors.rb +1 -1
  25. data/lib/prism/parse_result/newlines.rb +1 -1
  26. data/lib/prism/parse_result.rb +54 -2
  27. data/lib/prism/polyfill/append_as_bytes.rb +15 -0
  28. data/lib/prism/reflection.rb +4 -4
  29. data/lib/prism/relocation.rb +504 -0
  30. data/lib/prism/serialize.rb +1252 -765
  31. data/lib/prism/string_query.rb +30 -0
  32. data/lib/prism/translation/parser/builder.rb +61 -0
  33. data/lib/prism/translation/parser/compiler.rb +228 -162
  34. data/lib/prism/translation/parser/lexer.rb +435 -61
  35. data/lib/prism/translation/parser.rb +51 -3
  36. data/lib/prism/translation/parser35.rb +12 -0
  37. data/lib/prism/translation/ripper.rb +13 -3
  38. data/lib/prism/translation/ruby_parser.rb +17 -7
  39. data/lib/prism/translation.rb +1 -0
  40. data/lib/prism.rb +9 -7
  41. data/prism.gemspec +11 -1
  42. data/rbi/prism/dsl.rbi +10 -7
  43. data/rbi/prism/node.rbi +44 -17
  44. data/rbi/prism/parse_result.rbi +17 -0
  45. data/rbi/prism/string_query.rbi +12 -0
  46. data/rbi/prism/translation/parser35.rbi +6 -0
  47. data/rbi/prism.rbi +39 -36
  48. data/sig/prism/dsl.rbs +6 -4
  49. data/sig/prism/node.rbs +29 -15
  50. data/sig/prism/parse_result.rbs +10 -0
  51. data/sig/prism/relocation.rbs +185 -0
  52. data/sig/prism/serialize.rbs +4 -2
  53. data/sig/prism/string_query.rbs +11 -0
  54. data/sig/prism.rbs +22 -1
  55. data/src/diagnostic.c +2 -2
  56. data/src/node.c +39 -0
  57. data/src/options.c +31 -0
  58. data/src/prettyprint.c +62 -0
  59. data/src/prism.c +738 -199
  60. data/src/regexp.c +7 -3
  61. data/src/serialize.c +18 -0
  62. data/src/static_literals.c +1 -1
  63. data/src/util/pm_buffer.c +40 -0
  64. data/src/util/pm_char.c +1 -1
  65. data/src/util/pm_constant_pool.c +6 -2
  66. data/src/util/pm_string.c +1 -0
  67. data/src/util/pm_strncasecmp.c +13 -1
  68. metadata +13 -7
@@ -23,12 +23,15 @@ VALUE rb_cPrismResult;
23
23
  VALUE rb_cPrismParseResult;
24
24
  VALUE rb_cPrismLexResult;
25
25
  VALUE rb_cPrismParseLexResult;
26
+ VALUE rb_cPrismStringQuery;
27
+ VALUE rb_cPrismScope;
26
28
 
27
29
  VALUE rb_cPrismDebugEncoding;
28
30
 
29
31
  ID rb_id_option_command_line;
30
32
  ID rb_id_option_encoding;
31
33
  ID rb_id_option_filepath;
34
+ ID rb_id_option_freeze;
32
35
  ID rb_id_option_frozen_string_literal;
33
36
  ID rb_id_option_line;
34
37
  ID rb_id_option_main_script;
@@ -36,6 +39,10 @@ ID rb_id_option_partial_script;
36
39
  ID rb_id_option_scopes;
37
40
  ID rb_id_option_version;
38
41
  ID rb_id_source_for;
42
+ ID rb_id_forwarding_positionals;
43
+ ID rb_id_forwarding_keywords;
44
+ ID rb_id_forwarding_block;
45
+ ID rb_id_forwarding_all;
39
46
 
40
47
  /******************************************************************************/
41
48
  /* IO of Ruby code */
@@ -93,14 +100,53 @@ build_options_scopes(pm_options_t *options, VALUE scopes) {
93
100
  for (size_t scope_index = 0; scope_index < scopes_count; scope_index++) {
94
101
  VALUE scope = rb_ary_entry(scopes, scope_index);
95
102
 
96
- // Check that the scope is an array. If it's not, then raise a type
97
- // error.
98
- if (!RB_TYPE_P(scope, T_ARRAY)) {
99
- rb_raise(rb_eTypeError, "wrong argument type %"PRIsVALUE" (expected Array)", rb_obj_class(scope));
103
+ // The scope can be either an array or it can be a Prism::Scope object.
104
+ // Parse out the correct values here from either.
105
+ VALUE locals;
106
+ uint8_t forwarding = PM_OPTIONS_SCOPE_FORWARDING_NONE;
107
+
108
+ if (RB_TYPE_P(scope, T_ARRAY)) {
109
+ locals = scope;
110
+ } else if (rb_obj_is_kind_of(scope, rb_cPrismScope)) {
111
+ locals = rb_ivar_get(scope, rb_intern("@locals"));
112
+ if (!RB_TYPE_P(locals, T_ARRAY)) {
113
+ rb_raise(rb_eTypeError, "wrong argument type %"PRIsVALUE" (expected Array)", rb_obj_class(locals));
114
+ }
115
+
116
+ VALUE names = rb_ivar_get(scope, rb_intern("@forwarding"));
117
+ if (!RB_TYPE_P(names, T_ARRAY)) {
118
+ rb_raise(rb_eTypeError, "wrong argument type %"PRIsVALUE" (expected Array)", rb_obj_class(names));
119
+ }
120
+
121
+ size_t names_count = RARRAY_LEN(names);
122
+ for (size_t name_index = 0; name_index < names_count; name_index++) {
123
+ VALUE name = rb_ary_entry(names, name_index);
124
+
125
+ // Check that the name is a symbol. If it's not, then raise
126
+ // a type error.
127
+ if (!RB_TYPE_P(name, T_SYMBOL)) {
128
+ rb_raise(rb_eTypeError, "wrong argument type %"PRIsVALUE" (expected Symbol)", rb_obj_class(name));
129
+ }
130
+
131
+ ID id = SYM2ID(name);
132
+ if (id == rb_id_forwarding_positionals) {
133
+ forwarding |= PM_OPTIONS_SCOPE_FORWARDING_POSITIONALS;
134
+ } else if (id == rb_id_forwarding_keywords) {
135
+ forwarding |= PM_OPTIONS_SCOPE_FORWARDING_KEYWORDS;
136
+ } else if (id == rb_id_forwarding_block) {
137
+ forwarding |= PM_OPTIONS_SCOPE_FORWARDING_BLOCK;
138
+ } else if (id == rb_id_forwarding_all) {
139
+ forwarding |= PM_OPTIONS_SCOPE_FORWARDING_ALL;
140
+ } else {
141
+ rb_raise(rb_eArgError, "invalid forwarding value: %" PRIsVALUE, name);
142
+ }
143
+ }
144
+ } else {
145
+ rb_raise(rb_eTypeError, "wrong argument type %"PRIsVALUE" (expected Array or Prism::Scope)", rb_obj_class(scope));
100
146
  }
101
147
 
102
148
  // Initialize the scope array.
103
- size_t locals_count = RARRAY_LEN(scope);
149
+ size_t locals_count = RARRAY_LEN(locals);
104
150
  pm_options_scope_t *options_scope = &options->scopes[scope_index];
105
151
  if (!pm_options_scope_init(options_scope, locals_count)) {
106
152
  rb_raise(rb_eNoMemError, "failed to allocate memory");
@@ -108,7 +154,7 @@ build_options_scopes(pm_options_t *options, VALUE scopes) {
108
154
 
109
155
  // Iterate over the locals and add them to the scope.
110
156
  for (size_t local_index = 0; local_index < locals_count; local_index++) {
111
- VALUE local = rb_ary_entry(scope, local_index);
157
+ VALUE local = rb_ary_entry(locals, local_index);
112
158
 
113
159
  // Check that the local is a symbol. If it's not, then raise a
114
160
  // type error.
@@ -121,6 +167,9 @@ build_options_scopes(pm_options_t *options, VALUE scopes) {
121
167
  const char *name = rb_id2name(SYM2ID(local));
122
168
  pm_string_constant_init(scope_local, name, strlen(name));
123
169
  }
170
+
171
+ // Now set the forwarding options.
172
+ pm_options_scope_forwarding_set(options_scope, forwarding);
124
173
  }
125
174
  }
126
175
 
@@ -179,6 +228,8 @@ build_options_i(VALUE key, VALUE value, VALUE argument) {
179
228
  if (!NIL_P(value)) pm_options_main_script_set(options, RTEST(value));
180
229
  } else if (key_id == rb_id_option_partial_script) {
181
230
  if (!NIL_P(value)) pm_options_partial_script_set(options, RTEST(value));
231
+ } else if (key_id == rb_id_option_freeze) {
232
+ if (!NIL_P(value)) pm_options_freeze_set(options, RTEST(value));
182
233
  } else {
183
234
  rb_raise(rb_eArgError, "unknown keyword: %" PRIsVALUE, key);
184
235
  }
@@ -343,6 +394,7 @@ dump(int argc, VALUE *argv, VALUE self) {
343
394
  #endif
344
395
 
345
396
  VALUE value = dump_input(&input, &options);
397
+ if (options.freeze) rb_obj_freeze(value);
346
398
 
347
399
  #ifdef PRISM_BUILD_DEBUG
348
400
  xfree(dup);
@@ -382,56 +434,90 @@ dump_file(int argc, VALUE *argv, VALUE self) {
382
434
  /* Extracting values for the parse result */
383
435
  /******************************************************************************/
384
436
 
437
+ /**
438
+ * The same as rb_class_new_instance, but accepts an additional boolean to
439
+ * indicate whether or not the resulting class instance should be frozen.
440
+ */
441
+ static inline VALUE
442
+ rb_class_new_instance_freeze(int argc, const VALUE *argv, VALUE klass, bool freeze) {
443
+ VALUE value = rb_class_new_instance(argc, argv, klass);
444
+ if (freeze) rb_obj_freeze(value);
445
+ return value;
446
+ }
447
+
448
+ /**
449
+ * Create a new Location instance from the given parser and bounds.
450
+ */
451
+ static inline VALUE
452
+ parser_location(const pm_parser_t *parser, VALUE source, bool freeze, const uint8_t *start, size_t length) {
453
+ VALUE argv[] = { source, LONG2FIX(start - parser->start), LONG2FIX(length) };
454
+ return rb_class_new_instance_freeze(3, argv, rb_cPrismLocation, freeze);
455
+ }
456
+
457
+ /**
458
+ * Create a new Location instance from the given parser and location.
459
+ */
460
+ #define PARSER_LOCATION_LOC(parser, source, freeze, loc) \
461
+ parser_location(parser, source, freeze, loc.start, (size_t) (loc.end - loc.start))
462
+
463
+ /**
464
+ * Build a new Comment instance from the given parser and comment.
465
+ */
466
+ static inline VALUE
467
+ parser_comment(const pm_parser_t *parser, VALUE source, bool freeze, const pm_comment_t *comment) {
468
+ VALUE argv[] = { PARSER_LOCATION_LOC(parser, source, freeze, comment->location) };
469
+ VALUE type = (comment->type == PM_COMMENT_EMBDOC) ? rb_cPrismEmbDocComment : rb_cPrismInlineComment;
470
+ return rb_class_new_instance_freeze(1, argv, type, freeze);
471
+ }
472
+
385
473
  /**
386
474
  * Extract the comments out of the parser into an array.
387
475
  */
388
476
  static VALUE
389
- parser_comments(pm_parser_t *parser, VALUE source) {
477
+ parser_comments(const pm_parser_t *parser, VALUE source, bool freeze) {
390
478
  VALUE comments = rb_ary_new_capa(parser->comment_list.size);
391
479
 
392
- for (pm_comment_t *comment = (pm_comment_t *) parser->comment_list.head; comment != NULL; comment = (pm_comment_t *) comment->node.next) {
393
- VALUE location_argv[] = {
394
- source,
395
- LONG2FIX(comment->location.start - parser->start),
396
- LONG2FIX(comment->location.end - comment->location.start)
397
- };
398
-
399
- VALUE type = (comment->type == PM_COMMENT_EMBDOC) ? rb_cPrismEmbDocComment : rb_cPrismInlineComment;
400
- VALUE comment_argv[] = { rb_class_new_instance(3, location_argv, rb_cPrismLocation) };
401
- rb_ary_push(comments, rb_class_new_instance(1, comment_argv, type));
480
+ for (
481
+ const pm_comment_t *comment = (const pm_comment_t *) parser->comment_list.head;
482
+ comment != NULL;
483
+ comment = (const pm_comment_t *) comment->node.next
484
+ ) {
485
+ VALUE value = parser_comment(parser, source, freeze, comment);
486
+ rb_ary_push(comments, value);
402
487
  }
403
488
 
489
+ if (freeze) rb_obj_freeze(comments);
404
490
  return comments;
405
491
  }
406
492
 
493
+ /**
494
+ * Build a new MagicComment instance from the given parser and magic comment.
495
+ */
496
+ static inline VALUE
497
+ parser_magic_comment(const pm_parser_t *parser, VALUE source, bool freeze, const pm_magic_comment_t *magic_comment) {
498
+ VALUE key_loc = parser_location(parser, source, freeze, magic_comment->key_start, magic_comment->key_length);
499
+ VALUE value_loc = parser_location(parser, source, freeze, magic_comment->value_start, magic_comment->value_length);
500
+ VALUE argv[] = { key_loc, value_loc };
501
+ return rb_class_new_instance_freeze(2, argv, rb_cPrismMagicComment, freeze);
502
+ }
503
+
407
504
  /**
408
505
  * Extract the magic comments out of the parser into an array.
409
506
  */
410
507
  static VALUE
411
- parser_magic_comments(pm_parser_t *parser, VALUE source) {
508
+ parser_magic_comments(const pm_parser_t *parser, VALUE source, bool freeze) {
412
509
  VALUE magic_comments = rb_ary_new_capa(parser->magic_comment_list.size);
413
510
 
414
- for (pm_magic_comment_t *magic_comment = (pm_magic_comment_t *) parser->magic_comment_list.head; magic_comment != NULL; magic_comment = (pm_magic_comment_t *) magic_comment->node.next) {
415
- VALUE key_loc_argv[] = {
416
- source,
417
- LONG2FIX(magic_comment->key_start - parser->start),
418
- LONG2FIX(magic_comment->key_length)
419
- };
420
-
421
- VALUE value_loc_argv[] = {
422
- source,
423
- LONG2FIX(magic_comment->value_start - parser->start),
424
- LONG2FIX(magic_comment->value_length)
425
- };
426
-
427
- VALUE magic_comment_argv[] = {
428
- rb_class_new_instance(3, key_loc_argv, rb_cPrismLocation),
429
- rb_class_new_instance(3, value_loc_argv, rb_cPrismLocation)
430
- };
431
-
432
- rb_ary_push(magic_comments, rb_class_new_instance(2, magic_comment_argv, rb_cPrismMagicComment));
511
+ for (
512
+ const pm_magic_comment_t *magic_comment = (const pm_magic_comment_t *) parser->magic_comment_list.head;
513
+ magic_comment != NULL;
514
+ magic_comment = (const pm_magic_comment_t *) magic_comment->node.next
515
+ ) {
516
+ VALUE value = parser_magic_comment(parser, source, freeze, magic_comment);
517
+ rb_ary_push(magic_comments, value);
433
518
  }
434
519
 
520
+ if (freeze) rb_obj_freeze(magic_comments);
435
521
  return magic_comments;
436
522
  }
437
523
 
@@ -440,17 +526,11 @@ parser_magic_comments(pm_parser_t *parser, VALUE source) {
440
526
  * exists.
441
527
  */
442
528
  static VALUE
443
- parser_data_loc(const pm_parser_t *parser, VALUE source) {
529
+ parser_data_loc(const pm_parser_t *parser, VALUE source, bool freeze) {
444
530
  if (parser->data_loc.end == NULL) {
445
531
  return Qnil;
446
532
  } else {
447
- VALUE argv[] = {
448
- source,
449
- LONG2FIX(parser->data_loc.start - parser->start),
450
- LONG2FIX(parser->data_loc.end - parser->data_loc.start)
451
- };
452
-
453
- return rb_class_new_instance(3, argv, rb_cPrismLocation);
533
+ return PARSER_LOCATION_LOC(parser, source, freeze, parser->data_loc);
454
534
  }
455
535
  }
456
536
 
@@ -458,16 +538,17 @@ parser_data_loc(const pm_parser_t *parser, VALUE source) {
458
538
  * Extract the errors out of the parser into an array.
459
539
  */
460
540
  static VALUE
461
- parser_errors(pm_parser_t *parser, rb_encoding *encoding, VALUE source) {
541
+ parser_errors(const pm_parser_t *parser, rb_encoding *encoding, VALUE source, bool freeze) {
462
542
  VALUE errors = rb_ary_new_capa(parser->error_list.size);
463
- pm_diagnostic_t *error;
464
543
 
465
- for (error = (pm_diagnostic_t *) parser->error_list.head; error != NULL; error = (pm_diagnostic_t *) error->node.next) {
466
- VALUE location_argv[] = {
467
- source,
468
- LONG2FIX(error->location.start - parser->start),
469
- LONG2FIX(error->location.end - error->location.start)
470
- };
544
+ for (
545
+ const pm_diagnostic_t *error = (const pm_diagnostic_t *) parser->error_list.head;
546
+ error != NULL;
547
+ error = (const pm_diagnostic_t *) error->node.next
548
+ ) {
549
+ VALUE type = ID2SYM(rb_intern(pm_diagnostic_id_human(error->diag_id)));
550
+ VALUE message = rb_obj_freeze(rb_enc_str_new_cstr(error->message, encoding));
551
+ VALUE location = PARSER_LOCATION_LOC(parser, source, freeze, error->location);
471
552
 
472
553
  VALUE level = Qnil;
473
554
  switch (error->level) {
@@ -484,16 +565,12 @@ parser_errors(pm_parser_t *parser, rb_encoding *encoding, VALUE source) {
484
565
  rb_raise(rb_eRuntimeError, "Unknown level: %" PRIu8, error->level);
485
566
  }
486
567
 
487
- VALUE error_argv[] = {
488
- ID2SYM(rb_intern(pm_diagnostic_id_human(error->diag_id))),
489
- rb_enc_str_new_cstr(error->message, encoding),
490
- rb_class_new_instance(3, location_argv, rb_cPrismLocation),
491
- level
492
- };
493
-
494
- rb_ary_push(errors, rb_class_new_instance(4, error_argv, rb_cPrismParseError));
568
+ VALUE argv[] = { type, message, location, level };
569
+ VALUE value = rb_class_new_instance_freeze(4, argv, rb_cPrismParseError, freeze);
570
+ rb_ary_push(errors, value);
495
571
  }
496
572
 
573
+ if (freeze) rb_obj_freeze(errors);
497
574
  return errors;
498
575
  }
499
576
 
@@ -501,16 +578,17 @@ parser_errors(pm_parser_t *parser, rb_encoding *encoding, VALUE source) {
501
578
  * Extract the warnings out of the parser into an array.
502
579
  */
503
580
  static VALUE
504
- parser_warnings(pm_parser_t *parser, rb_encoding *encoding, VALUE source) {
581
+ parser_warnings(const pm_parser_t *parser, rb_encoding *encoding, VALUE source, bool freeze) {
505
582
  VALUE warnings = rb_ary_new_capa(parser->warning_list.size);
506
- pm_diagnostic_t *warning;
507
583
 
508
- for (warning = (pm_diagnostic_t *) parser->warning_list.head; warning != NULL; warning = (pm_diagnostic_t *) warning->node.next) {
509
- VALUE location_argv[] = {
510
- source,
511
- LONG2FIX(warning->location.start - parser->start),
512
- LONG2FIX(warning->location.end - warning->location.start)
513
- };
584
+ for (
585
+ const pm_diagnostic_t *warning = (const pm_diagnostic_t *) parser->warning_list.head;
586
+ warning != NULL;
587
+ warning = (const pm_diagnostic_t *) warning->node.next
588
+ ) {
589
+ VALUE type = ID2SYM(rb_intern(pm_diagnostic_id_human(warning->diag_id)));
590
+ VALUE message = rb_obj_freeze(rb_enc_str_new_cstr(warning->message, encoding));
591
+ VALUE location = PARSER_LOCATION_LOC(parser, source, freeze, warning->location);
514
592
 
515
593
  VALUE level = Qnil;
516
594
  switch (warning->level) {
@@ -524,16 +602,12 @@ parser_warnings(pm_parser_t *parser, rb_encoding *encoding, VALUE source) {
524
602
  rb_raise(rb_eRuntimeError, "Unknown level: %" PRIu8, warning->level);
525
603
  }
526
604
 
527
- VALUE warning_argv[] = {
528
- ID2SYM(rb_intern(pm_diagnostic_id_human(warning->diag_id))),
529
- rb_enc_str_new_cstr(warning->message, encoding),
530
- rb_class_new_instance(3, location_argv, rb_cPrismLocation),
531
- level
532
- };
533
-
534
- rb_ary_push(warnings, rb_class_new_instance(4, warning_argv, rb_cPrismParseWarning));
605
+ VALUE argv[] = { type, message, location, level };
606
+ VALUE value = rb_class_new_instance_freeze(4, argv, rb_cPrismParseWarning, freeze);
607
+ rb_ary_push(warnings, value);
535
608
  }
536
609
 
610
+ if (freeze) rb_obj_freeze(warnings);
537
611
  return warnings;
538
612
  }
539
613
 
@@ -541,18 +615,18 @@ parser_warnings(pm_parser_t *parser, rb_encoding *encoding, VALUE source) {
541
615
  * Create a new parse result from the given parser, value, encoding, and source.
542
616
  */
543
617
  static VALUE
544
- parse_result_create(VALUE class, pm_parser_t *parser, VALUE value, rb_encoding *encoding, VALUE source) {
618
+ parse_result_create(VALUE class, const pm_parser_t *parser, VALUE value, rb_encoding *encoding, VALUE source, bool freeze) {
545
619
  VALUE result_argv[] = {
546
620
  value,
547
- parser_comments(parser, source),
548
- parser_magic_comments(parser, source),
549
- parser_data_loc(parser, source),
550
- parser_errors(parser, encoding, source),
551
- parser_warnings(parser, encoding, source),
621
+ parser_comments(parser, source, freeze),
622
+ parser_magic_comments(parser, source, freeze),
623
+ parser_data_loc(parser, source, freeze),
624
+ parser_errors(parser, encoding, source, freeze),
625
+ parser_warnings(parser, encoding, source, freeze),
552
626
  source
553
627
  };
554
628
 
555
- return rb_class_new_instance(7, result_argv, class);
629
+ return rb_class_new_instance_freeze(7, result_argv, class, freeze);
556
630
  }
557
631
 
558
632
  /******************************************************************************/
@@ -568,6 +642,7 @@ typedef struct {
568
642
  VALUE source;
569
643
  VALUE tokens;
570
644
  rb_encoding *encoding;
645
+ bool freeze;
571
646
  } parse_lex_data_t;
572
647
 
573
648
  /**
@@ -579,10 +654,13 @@ static void
579
654
  parse_lex_token(void *data, pm_parser_t *parser, pm_token_t *token) {
580
655
  parse_lex_data_t *parse_lex_data = (parse_lex_data_t *) parser->lex_callback->data;
581
656
 
582
- VALUE yields = rb_assoc_new(
583
- pm_token_new(parser, token, parse_lex_data->encoding, parse_lex_data->source),
584
- INT2FIX(parser->lex_state)
585
- );
657
+ VALUE value = pm_token_new(parser, token, parse_lex_data->encoding, parse_lex_data->source, parse_lex_data->freeze);
658
+ VALUE yields = rb_assoc_new(value, INT2FIX(parser->lex_state));
659
+
660
+ if (parse_lex_data->freeze) {
661
+ rb_obj_freeze(value);
662
+ rb_obj_freeze(yields);
663
+ }
586
664
 
587
665
  rb_ary_push(parse_lex_data->tokens, yields);
588
666
  }
@@ -602,14 +680,37 @@ parse_lex_encoding_changed_callback(pm_parser_t *parser) {
602
680
  // one or two tokens, since the encoding can only change at the top of the
603
681
  // file.
604
682
  VALUE tokens = parse_lex_data->tokens;
683
+ VALUE next_tokens = rb_ary_new();
684
+
605
685
  for (long index = 0; index < RARRAY_LEN(tokens); index++) {
606
686
  VALUE yields = rb_ary_entry(tokens, index);
607
687
  VALUE token = rb_ary_entry(yields, 0);
608
688
 
609
689
  VALUE value = rb_ivar_get(token, rb_intern("@value"));
610
- rb_enc_associate(value, parse_lex_data->encoding);
611
- ENC_CODERANGE_CLEAR(value);
690
+ VALUE next_value = rb_str_dup(value);
691
+
692
+ rb_enc_associate(next_value, parse_lex_data->encoding);
693
+ if (parse_lex_data->freeze) rb_obj_freeze(next_value);
694
+
695
+ VALUE next_token_argv[] = {
696
+ parse_lex_data->source,
697
+ rb_ivar_get(token, rb_intern("@type")),
698
+ next_value,
699
+ rb_ivar_get(token, rb_intern("@location"))
700
+ };
701
+
702
+ VALUE next_token = rb_class_new_instance(4, next_token_argv, rb_cPrismToken);
703
+ VALUE next_yields = rb_assoc_new(next_token, rb_ary_entry(yields, 1));
704
+
705
+ if (parse_lex_data->freeze) {
706
+ rb_obj_freeze(next_token);
707
+ rb_obj_freeze(next_yields);
708
+ }
709
+
710
+ rb_ary_push(next_tokens, next_yields);
612
711
  }
712
+
713
+ rb_ary_replace(parse_lex_data->tokens, next_tokens);
613
714
  }
614
715
 
615
716
  /**
@@ -629,7 +730,8 @@ parse_lex_input(pm_string_t *input, const pm_options_t *options, bool return_nod
629
730
  parse_lex_data_t parse_lex_data = {
630
731
  .source = source,
631
732
  .tokens = rb_ary_new(),
632
- .encoding = rb_utf8_encoding()
733
+ .encoding = rb_utf8_encoding(),
734
+ .freeze = options->freeze,
633
735
  };
634
736
 
635
737
  parse_lex_data_t *data = &parse_lex_data;
@@ -652,14 +754,22 @@ parse_lex_input(pm_string_t *input, const pm_options_t *options, bool return_nod
652
754
  rb_ary_push(offsets, ULONG2NUM(parser.newline_list.offsets[index]));
653
755
  }
654
756
 
757
+ if (options->freeze) {
758
+ rb_obj_freeze(source_string);
759
+ rb_obj_freeze(offsets);
760
+ rb_obj_freeze(source);
761
+ rb_obj_freeze(parse_lex_data.tokens);
762
+ }
763
+
655
764
  VALUE result;
656
765
  if (return_nodes) {
657
766
  VALUE value = rb_ary_new_capa(2);
658
- rb_ary_push(value, pm_ast_new(&parser, node, parse_lex_data.encoding, source));
767
+ rb_ary_push(value, pm_ast_new(&parser, node, parse_lex_data.encoding, source, options->freeze));
659
768
  rb_ary_push(value, parse_lex_data.tokens);
660
- result = parse_result_create(rb_cPrismParseLexResult, &parser, value, parse_lex_data.encoding, source);
769
+ if (options->freeze) rb_obj_freeze(value);
770
+ result = parse_result_create(rb_cPrismParseLexResult, &parser, value, parse_lex_data.encoding, source, options->freeze);
661
771
  } else {
662
- result = parse_result_create(rb_cPrismLexResult, &parser, parse_lex_data.tokens, parse_lex_data.encoding, source);
772
+ result = parse_result_create(rb_cPrismLexResult, &parser, parse_lex_data.tokens, parse_lex_data.encoding, source, options->freeze);
663
773
  }
664
774
 
665
775
  pm_node_destroy(&parser, node);
@@ -725,9 +835,13 @@ parse_input(pm_string_t *input, const pm_options_t *options) {
725
835
  pm_node_t *node = pm_parse(&parser);
726
836
  rb_encoding *encoding = rb_enc_find(parser.encoding->name);
727
837
 
728
- VALUE source = pm_source_new(&parser, encoding);
729
- VALUE value = pm_ast_new(&parser, node, encoding, source);
730
- VALUE result = parse_result_create(rb_cPrismParseResult, &parser, value, encoding, source) ;
838
+ VALUE source = pm_source_new(&parser, encoding, options->freeze);
839
+ VALUE value = pm_ast_new(&parser, node, encoding, source, options->freeze);
840
+ VALUE result = parse_result_create(rb_cPrismParseResult, &parser, value, encoding, source, options->freeze);
841
+
842
+ if (options->freeze) {
843
+ rb_obj_freeze(source);
844
+ }
731
845
 
732
846
  pm_node_destroy(&parser, node);
733
847
  pm_parser_free(&parser);
@@ -749,6 +863,8 @@ parse_input(pm_string_t *input, const pm_options_t *options) {
749
863
  * encoding or nil.
750
864
  * * `filepath` - the filepath of the source being parsed. This should be a
751
865
  * string or nil.
866
+ * * `freeze` - whether or not to deeply freeze the AST. This should be a
867
+ * boolean or nil.
752
868
  * * `frozen_string_literal` - whether or not the frozen string literal pragma
753
869
  * has been set. This should be a boolean or nil.
754
870
  * * `line` - the line number that the parse starts on. This should be an
@@ -768,12 +884,12 @@ parse_input(pm_string_t *input, const pm_options_t *options) {
768
884
  * parsed. This should be an array of arrays of symbols or nil. Scopes are
769
885
  * ordered from the outermost scope to the innermost one.
770
886
  * * `version` - the version of Ruby syntax that prism should used to parse Ruby
771
- * code. By default prism assumes you want to parse with the latest version
772
- * of Ruby syntax (which you can trigger with `nil` or `"latest"`). You
773
- * may also restrict the syntax to a specific version of Ruby, e.g., with `"3.3.0"`.
774
- * To parse with the same syntax version that the current Ruby is running
775
- * use `version: RUBY_VERSION`. Raises ArgumentError if the version is not
776
- * currently supported by Prism.
887
+ * code. By default prism assumes you want to parse with the latest
888
+ * version of Ruby syntax (which you can trigger with `nil` or
889
+ * `"latest"`). You may also restrict the syntax to a specific version of
890
+ * Ruby, e.g., with `"3.3.0"`. To parse with the same syntax version that
891
+ * the current Ruby is running use `version: RUBY_VERSION`. Raises
892
+ * ArgumentError if the version is not currently supported by Prism.
777
893
  */
778
894
  static VALUE
779
895
  parse(int argc, VALUE *argv, VALUE self) {
@@ -921,9 +1037,9 @@ parse_stream(int argc, VALUE *argv, VALUE self) {
921
1037
  pm_node_t *node = pm_parse_stream(&parser, &buffer, (void *) stream, parse_stream_fgets, &options);
922
1038
  rb_encoding *encoding = rb_enc_find(parser.encoding->name);
923
1039
 
924
- VALUE source = pm_source_new(&parser, encoding);
925
- VALUE value = pm_ast_new(&parser, node, encoding, source);
926
- VALUE result = parse_result_create(rb_cPrismParseResult, &parser, value, encoding, source);
1040
+ VALUE source = pm_source_new(&parser, encoding, options.freeze);
1041
+ VALUE value = pm_ast_new(&parser, node, encoding, source, options.freeze);
1042
+ VALUE result = parse_result_create(rb_cPrismParseResult, &parser, value, encoding, source, options.freeze);
927
1043
 
928
1044
  pm_node_destroy(&parser, node);
929
1045
  pm_buffer_free(&buffer);
@@ -943,8 +1059,8 @@ parse_input_comments(pm_string_t *input, const pm_options_t *options) {
943
1059
  pm_node_t *node = pm_parse(&parser);
944
1060
  rb_encoding *encoding = rb_enc_find(parser.encoding->name);
945
1061
 
946
- VALUE source = pm_source_new(&parser, encoding);
947
- VALUE comments = parser_comments(&parser, source);
1062
+ VALUE source = pm_source_new(&parser, encoding, options->freeze);
1063
+ VALUE comments = parser_comments(&parser, source, options->freeze);
948
1064
 
949
1065
  pm_node_destroy(&parser, node);
950
1066
  pm_parser_free(&parser);
@@ -1133,6 +1249,68 @@ parse_file_failure_p(int argc, VALUE *argv, VALUE self) {
1133
1249
  return RTEST(parse_file_success_p(argc, argv, self)) ? Qfalse : Qtrue;
1134
1250
  }
1135
1251
 
1252
+ /******************************************************************************/
1253
+ /* String query methods */
1254
+ /******************************************************************************/
1255
+
1256
+ /**
1257
+ * Process the result of a call to a string query method and return an
1258
+ * appropriate value.
1259
+ */
1260
+ static VALUE
1261
+ string_query(pm_string_query_t result) {
1262
+ switch (result) {
1263
+ case PM_STRING_QUERY_ERROR:
1264
+ rb_raise(rb_eArgError, "Invalid or non ascii-compatible encoding");
1265
+ return Qfalse;
1266
+ case PM_STRING_QUERY_FALSE:
1267
+ return Qfalse;
1268
+ case PM_STRING_QUERY_TRUE:
1269
+ return Qtrue;
1270
+ }
1271
+ return Qfalse;
1272
+ }
1273
+
1274
+ /**
1275
+ * call-seq:
1276
+ * Prism::StringQuery::local?(string) -> bool
1277
+ *
1278
+ * Returns true if the string constitutes a valid local variable name. Note that
1279
+ * this means the names that can be set through Binding#local_variable_set, not
1280
+ * necessarily the ones that can be set through a local variable assignment.
1281
+ */
1282
+ static VALUE
1283
+ string_query_local_p(VALUE self, VALUE string) {
1284
+ const uint8_t *source = (const uint8_t *) check_string(string);
1285
+ return string_query(pm_string_query_local(source, RSTRING_LEN(string), rb_enc_get(string)->name));
1286
+ }
1287
+
1288
+ /**
1289
+ * call-seq:
1290
+ * Prism::StringQuery::constant?(string) -> bool
1291
+ *
1292
+ * Returns true if the string constitutes a valid constant name. Note that this
1293
+ * means the names that can be set through Module#const_set, not necessarily the
1294
+ * ones that can be set through a constant assignment.
1295
+ */
1296
+ static VALUE
1297
+ string_query_constant_p(VALUE self, VALUE string) {
1298
+ const uint8_t *source = (const uint8_t *) check_string(string);
1299
+ return string_query(pm_string_query_constant(source, RSTRING_LEN(string), rb_enc_get(string)->name));
1300
+ }
1301
+
1302
+ /**
1303
+ * call-seq:
1304
+ * Prism::StringQuery::method_name?(string) -> bool
1305
+ *
1306
+ * Returns true if the string constitutes a valid method name.
1307
+ */
1308
+ static VALUE
1309
+ string_query_method_name_p(VALUE self, VALUE string) {
1310
+ const uint8_t *source = (const uint8_t *) check_string(string);
1311
+ return string_query(pm_string_query_method_name(source, RSTRING_LEN(string), rb_enc_get(string)->name));
1312
+ }
1313
+
1136
1314
  /******************************************************************************/
1137
1315
  /* Initialization of the extension */
1138
1316
  /******************************************************************************/
@@ -1170,12 +1348,15 @@ Init_prism(void) {
1170
1348
  rb_cPrismParseResult = rb_define_class_under(rb_cPrism, "ParseResult", rb_cPrismResult);
1171
1349
  rb_cPrismLexResult = rb_define_class_under(rb_cPrism, "LexResult", rb_cPrismResult);
1172
1350
  rb_cPrismParseLexResult = rb_define_class_under(rb_cPrism, "ParseLexResult", rb_cPrismResult);
1351
+ rb_cPrismStringQuery = rb_define_class_under(rb_cPrism, "StringQuery", rb_cObject);
1352
+ rb_cPrismScope = rb_define_class_under(rb_cPrism, "Scope", rb_cObject);
1173
1353
 
1174
1354
  // Intern all of the IDs eagerly that we support so that we don't have to do
1175
1355
  // it every time we parse.
1176
1356
  rb_id_option_command_line = rb_intern_const("command_line");
1177
1357
  rb_id_option_encoding = rb_intern_const("encoding");
1178
1358
  rb_id_option_filepath = rb_intern_const("filepath");
1359
+ rb_id_option_freeze = rb_intern_const("freeze");
1179
1360
  rb_id_option_frozen_string_literal = rb_intern_const("frozen_string_literal");
1180
1361
  rb_id_option_line = rb_intern_const("line");
1181
1362
  rb_id_option_main_script = rb_intern_const("main_script");
@@ -1183,11 +1364,15 @@ Init_prism(void) {
1183
1364
  rb_id_option_scopes = rb_intern_const("scopes");
1184
1365
  rb_id_option_version = rb_intern_const("version");
1185
1366
  rb_id_source_for = rb_intern("for");
1367
+ rb_id_forwarding_positionals = rb_intern("*");
1368
+ rb_id_forwarding_keywords = rb_intern("**");
1369
+ rb_id_forwarding_block = rb_intern("&");
1370
+ rb_id_forwarding_all = rb_intern("...");
1186
1371
 
1187
1372
  /**
1188
1373
  * The version of the prism library.
1189
1374
  */
1190
- rb_define_const(rb_cPrism, "VERSION", rb_str_new2(EXPECTED_PRISM_VERSION));
1375
+ rb_define_const(rb_cPrism, "VERSION", rb_str_freeze(rb_str_new_cstr(EXPECTED_PRISM_VERSION)));
1191
1376
 
1192
1377
  // First, the functions that have to do with lexing and parsing.
1193
1378
  rb_define_singleton_method(rb_cPrism, "lex", lex, -1);
@@ -1211,6 +1396,10 @@ Init_prism(void) {
1211
1396
  rb_define_singleton_method(rb_cPrism, "dump_file", dump_file, -1);
1212
1397
  #endif
1213
1398
 
1399
+ rb_define_singleton_method(rb_cPrismStringQuery, "local?", string_query_local_p, 1);
1400
+ rb_define_singleton_method(rb_cPrismStringQuery, "constant?", string_query_constant_p, 1);
1401
+ rb_define_singleton_method(rb_cPrismStringQuery, "method_name?", string_query_method_name_p, 1);
1402
+
1214
1403
  // Next, initialize the other APIs.
1215
1404
  Init_prism_api_node();
1216
1405
  Init_prism_pack();