RubyGems - rbs - Versions diffs - 1.6.2 → 1.7.0.beta.1 - Mend

rbs 1.6.2 → 1.7.0.beta.1

Files changed (57) hide show

checksums.yaml +4 -4
data/.github/workflows/ruby.yml +0 -4
data/.gitignore +1 -0
data/CHANGELOG.md +6 -0
data/Gemfile +1 -0
data/Rakefile +7 -22
data/core/kernel.rbs +4 -4
data/core/trace_point.rbs +1 -1
data/ext/rbs/extension/constants.c +140 -0
data/ext/rbs/extension/constants.h +72 -0
data/ext/rbs/extension/extconf.rb +3 -0
data/ext/rbs/extension/lexer.c +1070 -0
data/ext/rbs/extension/lexer.h +145 -0
data/ext/rbs/extension/location.c +295 -0
data/ext/rbs/extension/location.h +59 -0
data/ext/rbs/extension/main.c +9 -0
data/ext/rbs/extension/parser.c +2418 -0
data/ext/rbs/extension/parser.h +23 -0
data/ext/rbs/extension/parserstate.c +313 -0
data/ext/rbs/extension/parserstate.h +141 -0
data/ext/rbs/extension/rbs_extension.h +40 -0
data/ext/rbs/extension/ruby_objs.c +585 -0
data/ext/rbs/extension/ruby_objs.h +46 -0
data/ext/rbs/extension/unescape.c +65 -0
data/goodcheck.yml +1 -1
data/lib/rbs/ast/comment.rb +0 -12
data/lib/rbs/buffer.rb +4 -0
data/lib/rbs/cli.rb +5 -8
data/lib/rbs/collection/sources/git.rb +18 -3
data/lib/rbs/errors.rb +14 -1
data/lib/rbs/location.rb +221 -217
data/lib/rbs/location_aux.rb +108 -0
data/lib/rbs/locator.rb +10 -7
data/lib/rbs/parser_aux.rb +24 -0
data/lib/rbs/types.rb +2 -3
data/lib/rbs/version.rb +1 -1
data/lib/rbs/writer.rb +4 -2
data/lib/rbs.rb +3 -7
data/rbs.gemspec +2 -1
data/sig/ancestor_builder.rbs +2 -2
data/sig/annotation.rbs +2 -2
data/sig/comment.rbs +7 -7
data/sig/constant_table.rbs +1 -1
data/sig/declarations.rbs +9 -9
data/sig/definition.rbs +1 -1
data/sig/definition_builder.rbs +2 -2
data/sig/errors.rbs +30 -25
data/sig/location.rbs +42 -79
data/sig/locator.rbs +2 -2
data/sig/members.rbs +7 -7
data/sig/method_types.rbs +3 -3
data/sig/parser.rbs +11 -21
data/sig/types.rbs +45 -27
data/sig/writer.rbs +1 -1
data/stdlib/json/0/json.rbs +3 -3
metadata +24 -6
data/lib/rbs/parser.rb +0 -3614

data/ext/rbs/extension/parser.h ADDED Viewed

@@ -0,0 +1,23 @@
+#ifndef RBS__PARSER_H
+#define RBS__PARSER_H
+#include "ruby.h"
+#include "parserstate.h"
+/**
+ * RBS::Parser class
+ * */
+extern VALUE RBS_Parser;
+/**
+ * RBS::Parser::KEYWORDS constant, which stores a hash from keyword string to token type fixnum
+ * */
+extern VALUE RBS_Parser_KEYWORDS;
+/**
+ * Parser entry points. Each one takes a parserstate (see parserstate.h) and returns a Ruby VALUE.
+ * NOTE(review): presumably they parse a type, a method type and a whole signature respectively -- confirm against parser.c.
+ * */
+VALUE parse_type(parserstate *state);
+VALUE parse_method_type(parserstate *state);
+VALUE parse_signature(parserstate *state);
+/**
+ * Declared with `(void)` so that this is a real prototype and calls passing arguments are rejected.
+ * NOTE(review): presumably defines RBS_Parser and RBS_Parser_KEYWORDS -- confirm against parser.c.
+ * */
+void rbs__init_parser(void);
+#endif

data/ext/rbs/extension/parserstate.c ADDED Viewed

@@ -0,0 +1,313 @@
+#include "rbs_extension.h"
+/* True when `table` is a reset marker, i.e. its size is 0 (only alloc_reset_table() creates such tables). */
+#define RESET_TABLE_P(table) ((table)->size == 0)
+/**
+ * Allocate a table with room for 10 IDs and no entries.
+ *
+ * The struct is zero-initialized, so `next` is NULL until the caller links the table.
+ * Raises NoMemoryError through rb_memerror() when an allocation fails, instead of
+ * writing through a NULL pointer.
+ *
+ * @returns the new table; parser_pop_typevar_table() releases it with free().
+ **/
+id_table *alloc_empty_table() {
+  id_table *table = calloc(1, sizeof *table);
+  if (table == NULL) {
+    rb_memerror();
+  }
+  table->ids = calloc(10, sizeof(ID));
+  if (table->ids == NULL) {
+    // Do not leak the struct when only the ID array could not be allocated.
+    free(table);
+    rb_memerror();
+  }
+  table->size = 10;
+  table->count = 0;
+  return table;
+}
+/**
+ * Allocate a reset marker table, i.e. a table whose `size` is 0 (what RESET_TABLE_P tests for).
+ *
+ * The struct is zero-initialized so that `count`, `ids` and `next` are 0/NULL rather than
+ * indeterminate. Raises NoMemoryError through rb_memerror() when the allocation fails.
+ *
+ * @returns the new marker table; the caller links it through `next`.
+ **/
+id_table *alloc_reset_table() {
+  id_table *table = calloc(1, sizeof *table);
+  if (table == NULL) {
+    rb_memerror();
+  }
+  table->size = 0;
+  return table;
+}
+/**
+ * Push a fresh, empty type variable table on top of `state->vars`.
+ * When `reset` is set, a reset marker table is pushed first, so it ends up directly below the new table.
+ *
+ * @returns the new empty table, which is now `state->vars`.
+ **/
+id_table *parser_push_typevar_table(parserstate *state, bool reset) {
+  if (reset) {
+    id_table *marker = alloc_reset_table();
+    marker->next = state->vars;
+    state->vars = marker;
+  }
+  id_table *fresh = alloc_empty_table();
+  fresh->next = state->vars;
+  state->vars = fresh;
+  return fresh;
+}
+/**
+ * Pop and free the table on top of `state->vars`.
+ * If the table that becomes the top afterwards is a reset marker, it is popped and freed as well.
+ *
+ * Raises RuntimeError when there is no table to pop.
+ **/
+void parser_pop_typevar_table(parserstate *state) {
+  id_table *top = state->vars;
+  if (top == NULL) {
+    rb_raise(rb_eRuntimeError, "Cannot pop empty table");
+  }
+  state->vars = top->next;
+  free(top->ids);
+  free(top);
+  // A reset marker only exists together with the table pushed right after it.
+  id_table *marker = state->vars;
+  if (marker != NULL && RESET_TABLE_P(marker)) {
+    state->vars = marker->next;
+    free(marker);
+  }
+}
+/**
+ * Append `id` to the table on top of `state->vars`, growing its array by 10 slots when it is full.
+ *
+ * Raises RuntimeError when no table has been pushed or when the top table is a reset marker,
+ * and NoMemoryError (through rb_memerror()) when the array cannot be grown. The table is left
+ * untouched if growing fails.
+ **/
+void parser_insert_typevar(parserstate *state, ID id) {
+  id_table *table = state->vars;
+  if (table == NULL) {
+    // RESET_TABLE_P dereferences the table, so an empty stack has to be rejected first.
+    rb_raise(rb_eRuntimeError, "Cannot insert to empty table stack");
+  }
+  if (RESET_TABLE_P(table)) {
+    rb_raise(rb_eRuntimeError, "Cannot insert to reset table");
+  }
+  if (table->size == table->count) {
+    // expand
+    size_t new_size = table->size + 10;
+    ID *new_ids = calloc(new_size, sizeof(ID));
+    if (new_ids == NULL) {
+      rb_memerror();
+    }
+    memcpy(new_ids, table->ids, sizeof(ID) * table->count);
+    free(table->ids);
+    table->ids = new_ids;
+    table->size = new_size;
+  }
+  table->ids[table->count++] = id;
+}
+/**
+ * Look up `id` in the tables chained from `state->vars`, starting with the top one.
+ * The search ends at the first reset marker table or at the end of the chain.
+ *
+ * @returns true if some visited table contains `id`, false otherwise.
+ **/
+bool parser_typevar_member(parserstate *state, ID id) {
+  for (id_table *scope = state->vars; scope != NULL; scope = scope->next) {
+    if (RESET_TABLE_P(scope)) {
+      break;
+    }
+    size_t idx = 0;
+    while (idx < scope->count) {
+      if (scope->ids[idx] == id) {
+        return true;
+      }
+      idx++;
+    }
+  }
+  return false;
+}
+/* Print one token of the parser window as `<label> = <type> (<start char>...<end char>)`. */
+static void print_parser_token_row(const char *label, token tok) {
+  printf("%s = %s (%d...%d)\n", label, token_type_str(tok.type), tok.range.start.char_pos, tok.range.end.char_pos);
+}
+/**
+ * Debug helper: print the buffer with pp(), then the current token and the three lookahead tokens to stdout.
+ **/
+void print_parser(parserstate *state) {
+  pp(state->buffer);
+  // The labels carry their own left padding so that the `=` signs line up.
+  print_parser_token_row("  current_token", state->current_token);
+  print_parser_token_row("     next_token", state->next_token);
+  print_parser_token_row("    next_token2", state->next_token2);
+  print_parser_token_row("    next_token3", state->next_token3);
+}
+/**
+ * Shift the token window by one: next_token becomes current_token, and so on.
+ * next_token3 is then refilled from the lexer, unless it already is pEOF. tCOMMENT tokens are
+ * dropped and tLINECOMMENT tokens are recorded with insert_comment_line(); lexing continues
+ * until any other token (or pEOF) has been read.
+ **/
+void parser_advance(parserstate *state) {
+  state->current_token = state->next_token;
+  state->next_token = state->next_token2;
+  state->next_token2 = state->next_token3;
+  while (state->next_token3.type != pEOF) {
+    state->next_token3 = rbsparser_next_token(state->lexstate);
+    if (state->next_token3.type == tLINECOMMENT) {
+      insert_comment_line(state, state->next_token3);
+      continue;
+    }
+    if (state->next_token3.type != tCOMMENT) {
+      // A token the parser has to see: stop refilling.
+      break;
+    }
+  }
+}
+/**
+ * Advance by one token only when the _next_ token has the given `type`.
+ * After a successful call `state->current_token.type == type` holds; otherwise the state is untouched.
+ *
+ * @returns true if the parser advanced, false otherwise.
+ **/
+bool parser_advance_if(parserstate *state, enum TokenType type) {
+  bool matched = state->next_token.type == type;
+  if (matched) {
+    parser_advance(state);
+  }
+  return matched;
+}
+/**
+ * Advance by one token unconditionally, then report a syntax error through raise_syntax_error()
+ * if the new current token does not have the given `type`.
+ **/
+void parser_advance_assert(parserstate *state, enum TokenType type) {
+  parser_advance(state);
+  if (state->current_token.type == type) {
+    return;
+  }
+  raise_syntax_error(state, state->current_token, "expected a token `%s`", token_type_str(type));
+}
+/**
+ * Debug helper: print the type name of `tok` and its character range to stdout.
+ **/
+void print_token(token tok) {
+  const char *type_name = token_type_str(tok.type);
+  printf("%s char=%d...%d\n", type_name, tok.range.start.char_pos, tok.range.end.char_pos);
+}
+/**
+ * Record the line comment token `tok`.
+ * If a known comment ends on the line directly above `tok`, the token is appended to it;
+ * otherwise a new comment is allocated and becomes `state->last_comment`.
+ **/
+void insert_comment_line(parserstate *state, token tok) {
+  comment *adjacent = comment_get_comment(state->last_comment, tok.range.start.line - 1);
+  if (adjacent == NULL) {
+    state->last_comment = alloc_comment(tok, state->last_comment);
+    return;
+  }
+  comment_insert_new_line(adjacent, tok);
+}
+/**
+ * Find the comment that ends on the line directly above `subject_line`.
+ *
+ * @returns the comment converted with comment_to_ruby(), or Qnil when there is none.
+ **/
+VALUE get_comment(parserstate *state, int subject_line) {
+  comment *attached = comment_get_comment(state->last_comment, subject_line - 1);
+  return attached ? comment_to_ruby(attached, state->buffer) : Qnil;
+}
+/**
+ * Allocate a comment that holds the single line `comment_token` and link it in front of `last_comment`.
+ *
+ * Raises NoMemoryError through rb_memerror() when the allocation fails, instead of writing
+ * through a NULL pointer.
+ *
+ * @returns the new comment; free_comment() releases it together with the comments linked behind it.
+ **/
+comment *alloc_comment(token comment_token, comment *last_comment) {
+  comment *new_comment = calloc(1, sizeof *new_comment);
+  if (new_comment == NULL) {
+    rb_memerror();
+  }
+  // calloc already zeroed line_size, line_count and tokens.
+  new_comment->next_comment = last_comment;
+  new_comment->start = comment_token.range.start;
+  new_comment->end = comment_token.range.end;
+  comment_insert_new_line(new_comment, comment_token);
+  return new_comment;
+}
+/**
+ * Free `com` and every comment reachable from it through `next_comment`.
+ *
+ * The list is walked iteratively, so the stack depth does not grow with the number of
+ * comments. Passing NULL is allowed and does nothing.
+ **/
+void free_comment(comment *com) {
+  while (com != NULL) {
+    // Read the link before the node is released.
+    comment *next = com->next_comment;
+    free(com->tokens);
+    free(com);
+    com = next;
+  }
+}
+/**
+ * Append the line token `comment_token` to `com`, growing the token array by 10 slots when it is full.
+ * The first inserted line sets `com->start`; every inserted line moves `com->end` to its own end.
+ *
+ * Raises NoMemoryError through rb_memerror() when the array cannot be grown; `com` is left
+ * unchanged in that case.
+ **/
+void comment_insert_new_line(comment *com, token comment_token) {
+  if (com->line_count == 0) {
+    com->start = comment_token.range.start;
+  }
+  if (com->line_count == com->line_size) {
+    size_t new_size = com->line_size + 10;
+    token *new_tokens = calloc(new_size, sizeof(token));
+    if (new_tokens == NULL) {
+      rb_memerror();
+    }
+    if (com->tokens) {
+      memcpy(new_tokens, com->tokens, sizeof(token) * com->line_count);
+      free(com->tokens);
+    }
+    com->tokens = new_tokens;
+    com->line_size = new_size;
+  }
+  com->tokens[com->line_count++] = comment_token;
+  com->end = comment_token.range.end;
+}
+/**
+ * Starting at `com`, follow `next_comment` links looking for the comment whose last line is `line`.
+ * The walk gives up at the first comment that ends before `line`.
+ *
+ * @returns the matching comment, or NULL when there is none.
+ **/
+comment *comment_get_comment(comment *com, int line) {
+  for (comment *cur = com; cur != NULL; cur = cur->next_comment) {
+    if (cur->end.line < line) {
+      return NULL;
+    }
+    if (cur->end.line == line) {
+      return cur;
+    }
+  }
+  return NULL;
+}
+/**
+ * Build the Ruby comment object for `com`.
+ *
+ * For every line token the leading `#` is dropped, then one following space if there is one,
+ * and the rest of the line plus "\n" is appended to a new string in the encoding of the
+ * buffer content. The string and the location spanning `com->start`..`com->end` are handed
+ * to rbs_ast_comment().
+ *
+ * @param com    comment whose lines are converted
+ * @param buffer Ruby object whose `content` method returns the source string
+ * @returns the value returned by rbs_ast_comment()
+ **/
+VALUE comment_to_ruby(comment *com, VALUE buffer) {
+  VALUE content = rb_funcall(buffer, rb_intern("content"), 0);
+  rb_encoding *enc = rb_enc_get(content);
+  VALUE string = rb_enc_str_new_cstr("", enc);
+  int hash_bytes = rb_enc_codelen('#', enc);
+  int space_bytes = rb_enc_codelen(' ', enc);
+  for (size_t i = 0; i < com->line_count; i++) {
+    token tok = com->tokens[i];
+    char *comment_start = RSTRING_PTR(content) + tok.range.start.byte_pos + hash_bytes;
+    int comment_bytes = RANGE_BYTES(tok.range) - hash_bytes;
+    // Only decode a character when the comment has a body; a bare `#` has nothing to strip.
+    if (comment_bytes > 0) {
+      // Keep the full code point: narrowing it to `unsigned char` makes every character whose
+      // code point is 0x20 modulo 256 (e.g. U+0120) look like a space and cuts it in half.
+      unsigned int c = rb_enc_mbc_to_codepoint(comment_start, RSTRING_END(content), enc);
+      if (c == ' ') {
+        comment_start += space_bytes;
+        comment_bytes -= space_bytes;
+      }
+    }
+    rb_str_cat(string, comment_start, comment_bytes);
+    rb_str_cat_cstr(string, "\n");
+  }
+  return rbs_ast_comment(
+    string,
+    rbs_location_pp(buffer, &com->start, &com->end)
+  );
+}
+/**
+ * Allocate a parserstate (and its lexstate) for the string returned by `buffer.content`.
+ *
+ * The lexer starts at the given `line` and `column`. parser_advance() is called three times so
+ * that the three lookahead tokens are filled while current_token is still NullToken. When
+ * `variables` is not nil, a table with a reset marker is pushed and every element of
+ * `variables` is inserted into it as a type variable.
+ *
+ * Raises NoMemoryError through rb_memerror() when an allocation fails.
+ *
+ * @param buffer    Ruby object responding to `content`
+ * @param line      initial line of the lexer position
+ * @param column    initial column of the lexer position
+ * @param variables nil, or an Array of Symbols
+ * @returns the new parserstate; release it with free_parser().
+ **/
+parserstate *alloc_parser(VALUE buffer, int line, int column, VALUE variables) {
+  VALUE string = rb_funcall(buffer, rb_intern("content"), 0);
+  lexstate *lexer = calloc(1, sizeof *lexer);
+  if (lexer == NULL) {
+    rb_memerror();
+  }
+  parserstate *parser = calloc(1, sizeof *parser);
+  if (parser == NULL) {
+    // Do not leak the lexer when only the parser could not be allocated.
+    free(lexer);
+    rb_memerror();
+  }
+  lexer->string = string;
+  lexer->current.line = line;
+  lexer->current.column = column;
+  lexer->start = lexer->current;
+  lexer->first_token_of_line = lexer->current.column == 0;
+  parser->lexstate = lexer;
+  parser->buffer = buffer;
+  parser->current_token = NullToken;
+  parser->next_token = NullToken;
+  parser->next_token2 = NullToken;
+  parser->next_token3 = NullToken;
+  parser_advance(parser);
+  parser_advance(parser);
+  parser_advance(parser);
+  if (!NIL_P(variables)) {
+    parser_push_typevar_table(parser, true);
+    for (long i = 0; i < rb_array_len(variables); i++) {
+      VALUE symbol = rb_ary_entry(variables, i);
+      parser_insert_typevar(parser, SYM2ID(symbol));
+    }
+  }
+  return parser;
+}
+/**
+ * Release everything owned by `parser`: its lexstate, its comments, the type variable tables
+ * still linked on `parser->vars`, and the parserstate itself. Passing NULL does nothing.
+ *
+ * alloc_parser() pushes tables when it is given variables, and nothing else pops them, so
+ * they have to be released here.
+ **/
+void free_parser(parserstate *parser) {
+  if (parser == NULL) {
+    return;
+  }
+  free(parser->lexstate);
+  if (parser->last_comment) {
+    free_comment(parser->last_comment);
+  }
+  id_table *table = parser->vars;
+  while (table != NULL) {
+    id_table *next = table->next;
+    // A reset marker table never owns an `ids` array, so only regular tables free one.
+    if (!RESET_TABLE_P(table)) {
+      free(table->ids);
+    }
+    free(table);
+    table = next;
+  }
+  free(parser);
+}

data/ext/rbs/extension/parserstate.h ADDED Viewed

@@ -0,0 +1,141 @@
+#ifndef RBS__PARSERSTATE_H
+#define RBS__PARSERSTATE_H
+#include <stdbool.h>
+#include "lexer.h"
+#include "location.h"
+/**
+ * id_table represents a set of IDs.
+ * This is used to manage the set of bound variables.
+ * Tables are chained through `next`; a table whose `size` is 0 is a _reset_ entry
+ * (see parser_push_typevar_table).
+ * */
+typedef struct id_table {
+  size_t size;            /* Number of slots allocated in `ids`; 0 marks a reset entry */
+  size_t count;           /* Number of IDs stored in `ids` */
+  ID *ids;                /* The stored IDs */
+  struct id_table *next;  /* The table that was on top when this one was pushed */
+} id_table;
+/**
+ * comment represents a sequence of comment lines.
+ *
+ *     # Comment for the method.
+ *     #
+ *     # ```rb
+ *     # object.foo()  # Do something
+ *     # ```
+ *     #
+ *     def foo: () -> void
+ *
+ * A comment object represents the six lines of comments.
+ * Each line is kept as its token; comments are chained through `next_comment`.
+ * */
+typedef struct comment {
+  position start;                /* Start position of the first line token */
+  position end;                  /* End position of the last inserted line token */
+  size_t line_size;              /* Number of slots allocated in `tokens` */
+  size_t line_count;             /* Number of line tokens stored in `tokens` */
+  token *tokens;                 /* The line tokens, in insertion order */
+  struct comment *next_comment;  /* The comment that was the last one when this was allocated */
+} comment;
+/**
+ * An RBS parser is an LL(3) parser: besides the current token it keeps three lookahead tokens.
+ * */
+typedef struct {
+  lexstate *lexstate;     /* Lexer state the tokens are read from */
+  token current_token;    /* The token the parser is currently at */
+  token next_token;       /* The first lookahead token */
+  token next_token2;      /* The second lookahead token */
+  token next_token3;      /* The third lookahead token */
+  VALUE buffer;           /* Ruby object whose `content` method returns the source string */
+  id_table *vars;         /* Known type variables */
+  comment *last_comment;  /* Last read comment */
+} parserstate;
+comment *alloc_comment(token comment_token, comment *last_comment);  /* New comment holding `comment_token`, linked in front of `last_comment` */
+void free_comment(comment *com);                                     /* Frees `com` and the comments linked behind it */
+void comment_insert_new_line(comment *com, token comment_token);     /* Appends a line token and moves `end` to its end */
+comment *comment_get_comment(comment *com, int line);                /* Finds the comment whose last line is `line`, or NULL */
+VALUE comment_to_ruby(comment *com, VALUE buffer);                   /* Converts `com` to a Ruby object via rbs_ast_comment() */
+/**
+ * Push a new, empty table entry and return it.
+ * Setting `reset` also inserts a _reset_ entry below the new table, which stops searching.
+ *
+ * ```
+ * class Foo[A]
+ *          ^^^                      <= push new table with reset
+ *   def foo: [B] () -> [A, B]
+ *            ^^^                    <= push new table without reset
+ *
+ *   class Baz[C]
+ *            ^^^                    <= push new table with reset
+ *   end
+ * end
+ * ```
+ * */
+id_table *parser_push_typevar_table(parserstate *state, bool reset);
+void parser_pop_typevar_table(parserstate *state);  /* Pops the latest table, and the reset entry right below it if there is one */
+/**
+ * Insert new type variable into the latest table.
+ * Raises a RuntimeError if the latest table is a reset table.
+ * */
+void parser_insert_typevar(parserstate *state, ID id);
+/**
+ * Returns true if given type variable is recorded in the table.
+ * If not found, it goes one table up, if it's not a reset table.
+ * Or returns false, if it's a reset table or there are no more tables.
+ * */
+bool parser_typevar_member(parserstate *state, ID id);
+/**
+ * Allocate new parserstate object.
+ * The arguments are the buffer, the line and column the lexer starts at, and either nil or
+ * an Array of Symbols to be registered as type variables.
+ * The three lookahead tokens are already read when this returns.
+ *
+ * ```
+ * alloc_parser(buffer, 0, 1, variables)    // New parserstate with variables
+ * alloc_parser(buffer, 3, 5, Qnil)         // New parserstate without variables
+ * ```
+ * */
+parserstate *alloc_parser(VALUE buffer, int line, int column, VALUE variables);
+void free_parser(parserstate *parser);  /* Frees the lexstate, the comments and the parserstate itself */
+/**
+ * Advance one token.
+ * Comment tokens are never made visible as lookahead; line comments are recorded with insert_comment_line.
+ * */
+void parser_advance(parserstate *state);
+/**
+ * Advance one token, and assert the current token type.
+ * Raises a syntax error if `current_token.type != type` after advancing.
+ * */
+void parser_advance_assert(parserstate *state, enum TokenType type);
+/**
+ * Advance one token if the next_token is a token of the type.
+ * Returns true if the token advanced, false otherwise.
+ * */
+bool parser_advance_if(parserstate *state, enum TokenType type);
+void print_parser(parserstate *state);  /* Debug output: prints the buffer, the current token and the lookahead tokens */
+/**
+ * Insert new comment line token.
+ * The token extends the comment that ends on the line directly above it, or starts a new comment.
+ * */
+void insert_comment_line(parserstate *state, token token);
+/**
+ * Returns an RBS::Comment object associated with a subject at `subject_line`,
+ * or nil if no comment ends on the line directly above `subject_line`.
+ *
+ * ```rbs
+ * # Comment1
+ * class Foo           # This is the subject line for Comment1
+ *
+ *   # Comment2
+ *   %a{annotation}    # This is the subject line for Comment2
+ *   def foo: () -> void
+ * end
+ * ```
+ * */
+VALUE get_comment(parserstate *state, int subject_line);
+#endif