herb 0.7.4-aarch64-linux-gnu → 0.8.0-aarch64-linux-gnu
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/Makefile +8 -5
- data/config.yml +40 -20
- data/ext/herb/error_helpers.c +57 -3
- data/ext/herb/error_helpers.h +1 -1
- data/ext/herb/extconf.rb +1 -0
- data/ext/herb/extension.c +10 -24
- data/ext/herb/extension_helpers.c +12 -18
- data/ext/herb/extension_helpers.h +4 -4
- data/ext/herb/nodes.c +72 -37
- data/herb.gemspec +0 -2
- data/lib/herb/3.0/herb.so +0 -0
- data/lib/herb/3.1/herb.so +0 -0
- data/lib/herb/3.2/herb.so +0 -0
- data/lib/herb/3.3/herb.so +0 -0
- data/lib/herb/3.4/herb.so +0 -0
- data/lib/herb/ast/helpers.rb +11 -0
- data/lib/herb/ast/node.rb +15 -6
- data/lib/herb/ast/nodes.rb +609 -392
- data/lib/herb/cli.rb +31 -0
- data/lib/herb/colors.rb +82 -0
- data/lib/herb/engine/compiler.rb +140 -14
- data/lib/herb/engine/debug_visitor.rb +1 -5
- data/lib/herb/engine/parser_error_overlay.rb +1 -1
- data/lib/herb/engine.rb +18 -20
- data/lib/herb/errors.rb +166 -56
- data/lib/herb/location.rb +2 -2
- data/lib/herb/project.rb +86 -21
- data/lib/herb/token.rb +14 -2
- data/lib/herb/version.rb +1 -1
- data/lib/herb.rb +1 -0
- data/sig/herb/ast/helpers.rbs +3 -0
- data/sig/herb/ast/node.rbs +12 -5
- data/sig/herb/ast/nodes.rbs +124 -62
- data/sig/herb/colors.rbs +35 -0
- data/sig/herb/engine/compiler.rbs +23 -1
- data/sig/herb/errors.rbs +74 -20
- data/sig/herb/token.rbs +8 -0
- data/sig/herb_c_extension.rbs +1 -1
- data/sig/serialized_ast_errors.rbs +8 -0
- data/src/analyze.c +461 -249
- data/src/analyze_helpers.c +5 -0
- data/src/analyze_missing_end.c +147 -0
- data/src/analyze_transform.c +196 -0
- data/src/analyzed_ruby.c +23 -2
- data/src/ast_node.c +14 -17
- data/src/ast_nodes.c +179 -181
- data/src/ast_pretty_print.c +232 -232
- data/src/element_source.c +7 -6
- data/src/errors.c +272 -152
- data/src/extract.c +92 -34
- data/src/herb.c +37 -49
- data/src/html_util.c +34 -96
- data/src/include/analyze.h +10 -2
- data/src/include/analyze_helpers.h +3 -0
- data/src/include/analyzed_ruby.h +4 -2
- data/src/include/ast_node.h +4 -4
- data/src/include/ast_nodes.h +68 -67
- data/src/include/ast_pretty_print.h +2 -2
- data/src/include/element_source.h +3 -1
- data/src/include/errors.h +42 -26
- data/src/include/extract.h +4 -4
- data/src/include/herb.h +6 -7
- data/src/include/html_util.h +4 -5
- data/src/include/lexer.h +1 -3
- data/src/include/lexer_peek_helpers.h +21 -19
- data/src/include/lexer_struct.h +12 -10
- data/src/include/location.h +10 -13
- data/src/include/macros.h +4 -0
- data/src/include/parser.h +12 -6
- data/src/include/parser_helpers.h +26 -16
- data/src/include/position.h +3 -14
- data/src/include/pretty_print.h +38 -28
- data/src/include/prism_helpers.h +1 -1
- data/src/include/range.h +4 -13
- data/src/include/token.h +5 -11
- data/src/include/token_struct.h +2 -2
- data/src/include/utf8.h +3 -2
- data/src/include/util/hb_arena.h +31 -0
- data/src/include/util/hb_arena_debug.h +8 -0
- data/src/include/util/hb_array.h +33 -0
- data/src/include/util/hb_buffer.h +34 -0
- data/src/include/util/hb_string.h +29 -0
- data/src/include/util/hb_system.h +9 -0
- data/src/include/util.h +3 -14
- data/src/include/version.h +1 -1
- data/src/include/visitor.h +1 -1
- data/src/io.c +7 -4
- data/src/lexer.c +62 -88
- data/src/lexer_peek_helpers.c +42 -38
- data/src/location.c +9 -37
- data/src/main.c +19 -23
- data/src/parser.c +373 -313
- data/src/parser_helpers.c +60 -54
- data/src/parser_match_tags.c +316 -0
- data/src/pretty_print.c +88 -117
- data/src/prism_helpers.c +7 -7
- data/src/range.c +2 -35
- data/src/token.c +36 -87
- data/src/utf8.c +4 -4
- data/src/util/hb_arena.c +179 -0
- data/src/util/hb_arena_debug.c +237 -0
- data/src/{array.c → util/hb_array.c} +26 -27
- data/src/util/hb_buffer.c +203 -0
- data/src/util/hb_string.c +85 -0
- data/src/util/hb_system.c +30 -0
- data/src/util.c +29 -99
- data/src/visitor.c +54 -54
- data/templates/ext/herb/error_helpers.c.erb +3 -3
- data/templates/ext/herb/error_helpers.h.erb +1 -1
- data/templates/ext/herb/nodes.c.erb +11 -6
- data/templates/java/error_helpers.c.erb +75 -0
- data/templates/java/error_helpers.h.erb +20 -0
- data/templates/java/nodes.c.erb +97 -0
- data/templates/java/nodes.h.erb +23 -0
- data/templates/java/org/herb/ast/Errors.java.erb +121 -0
- data/templates/java/org/herb/ast/NodeVisitor.java.erb +14 -0
- data/templates/java/org/herb/ast/Nodes.java.erb +220 -0
- data/templates/java/org/herb/ast/Visitor.java.erb +56 -0
- data/templates/javascript/packages/core/src/visitor.ts.erb +29 -1
- data/templates/javascript/packages/node/extension/error_helpers.cpp.erb +8 -8
- data/templates/javascript/packages/node/extension/error_helpers.h.erb +1 -1
- data/templates/javascript/packages/node/extension/nodes.cpp.erb +9 -9
- data/templates/javascript/packages/node/extension/nodes.h.erb +1 -1
- data/templates/lib/herb/ast/nodes.rb.erb +28 -16
- data/templates/lib/herb/errors.rb.erb +17 -12
- data/templates/rust/src/ast/nodes.rs.erb +220 -0
- data/templates/rust/src/errors.rs.erb +216 -0
- data/templates/rust/src/nodes.rs.erb +374 -0
- data/templates/src/analyze_missing_end.c.erb +36 -0
- data/templates/src/analyze_transform.c.erb +24 -0
- data/templates/src/ast_nodes.c.erb +14 -16
- data/templates/src/ast_pretty_print.c.erb +36 -36
- data/templates/src/errors.c.erb +36 -38
- data/templates/src/include/ast_nodes.h.erb +11 -10
- data/templates/src/include/ast_pretty_print.h.erb +2 -2
- data/templates/src/include/errors.h.erb +9 -9
- data/templates/src/parser_match_tags.c.erb +38 -0
- data/templates/src/visitor.c.erb +4 -4
- data/templates/template.rb +22 -3
- data/templates/wasm/error_helpers.cpp.erb +9 -9
- data/templates/wasm/error_helpers.h.erb +1 -1
- data/templates/wasm/nodes.cpp.erb +9 -9
- data/templates/wasm/nodes.h.erb +1 -1
- data/vendor/prism/Rakefile +4 -1
- data/vendor/prism/config.yml +2 -1
- data/vendor/prism/include/prism/ast.h +31 -1
- data/vendor/prism/include/prism/diagnostic.h +1 -0
- data/vendor/prism/include/prism/version.h +3 -3
- data/vendor/prism/src/diagnostic.c +3 -1
- data/vendor/prism/src/prism.c +130 -71
- data/vendor/prism/src/util/pm_string.c +6 -8
- data/vendor/prism/templates/include/prism/ast.h.erb +2 -0
- data/vendor/prism/templates/java/org/prism/Loader.java.erb +2 -2
- data/vendor/prism/templates/javascript/src/deserialize.js.erb +2 -2
- data/vendor/prism/templates/lib/prism/serialize.rb.erb +2 -2
- data/vendor/prism/templates/sig/prism.rbs.erb +4 -0
- data/vendor/prism/templates/src/diagnostic.c.erb +1 -0
- metadata +34 -21
- data/lib/herb/libherb/array.rb +0 -51
- data/lib/herb/libherb/ast_node.rb +0 -50
- data/lib/herb/libherb/buffer.rb +0 -56
- data/lib/herb/libherb/extract_result.rb +0 -20
- data/lib/herb/libherb/lex_result.rb +0 -32
- data/lib/herb/libherb/libherb.rb +0 -52
- data/lib/herb/libherb/parse_result.rb +0 -20
- data/lib/herb/libherb/token.rb +0 -46
- data/lib/herb/libherb.rb +0 -35
- data/src/buffer.c +0 -232
- data/src/include/array.h +0 -33
- data/src/include/buffer.h +0 -39
- data/src/include/json.h +0 -28
- data/src/include/memory.h +0 -12
- data/src/json.c +0 -205
- data/src/memory.c +0 -53
- data/src/position.c +0 -33
data/src/pretty_print.c
CHANGED
|
@@ -3,146 +3,149 @@
|
|
|
3
3
|
#include "include/ast_node.h"
|
|
4
4
|
#include "include/ast_nodes.h"
|
|
5
5
|
#include "include/ast_pretty_print.h"
|
|
6
|
-
#include "include/buffer.h"
|
|
7
6
|
#include "include/errors.h"
|
|
8
7
|
#include "include/token_struct.h"
|
|
9
8
|
#include "include/util.h"
|
|
9
|
+
#include "include/util/hb_buffer.h"
|
|
10
|
+
#include "include/util/hb_string.h"
|
|
10
11
|
|
|
11
12
|
#include <stdbool.h>
|
|
12
13
|
#include <stdio.h>
|
|
13
14
|
#include <stdlib.h>
|
|
14
15
|
|
|
15
|
-
void pretty_print_indent(
|
|
16
|
+
void pretty_print_indent(hb_buffer_T* buffer, const size_t indent) {
|
|
16
17
|
for (size_t i = 0; i < indent; i++) {
|
|
17
|
-
|
|
18
|
+
hb_buffer_append(buffer, " ");
|
|
18
19
|
}
|
|
19
20
|
}
|
|
20
21
|
|
|
21
|
-
void pretty_print_newline(const size_t indent, const size_t relative_indent,
|
|
22
|
+
void pretty_print_newline(const size_t indent, const size_t relative_indent, hb_buffer_T* buffer) {
|
|
22
23
|
pretty_print_indent(buffer, indent);
|
|
23
24
|
pretty_print_indent(buffer, relative_indent);
|
|
24
|
-
|
|
25
|
+
hb_buffer_append(buffer, "\n");
|
|
25
26
|
}
|
|
26
27
|
|
|
27
28
|
void pretty_print_label(
|
|
28
|
-
|
|
29
|
+
hb_string_T name,
|
|
29
30
|
const size_t indent,
|
|
30
31
|
const size_t relative_indent,
|
|
31
32
|
const bool last_property,
|
|
32
|
-
|
|
33
|
+
hb_buffer_T* buffer
|
|
33
34
|
) {
|
|
34
35
|
pretty_print_indent(buffer, indent);
|
|
35
36
|
pretty_print_indent(buffer, relative_indent);
|
|
36
37
|
|
|
37
38
|
if (last_property) {
|
|
38
|
-
|
|
39
|
+
hb_buffer_append(buffer, "└── ");
|
|
39
40
|
} else {
|
|
40
|
-
|
|
41
|
+
hb_buffer_append(buffer, "├── ");
|
|
41
42
|
}
|
|
42
43
|
|
|
43
|
-
|
|
44
|
-
|
|
44
|
+
hb_buffer_append_string(buffer, name);
|
|
45
|
+
hb_buffer_append(buffer, ": ");
|
|
45
46
|
}
|
|
46
47
|
|
|
47
48
|
void pretty_print_quoted_property(
|
|
48
|
-
|
|
49
|
-
|
|
49
|
+
hb_string_T name,
|
|
50
|
+
hb_string_T value,
|
|
50
51
|
const size_t indent,
|
|
51
52
|
const size_t relative_indent,
|
|
52
53
|
const bool last_property,
|
|
53
|
-
|
|
54
|
+
hb_buffer_T* buffer
|
|
54
55
|
) {
|
|
55
|
-
|
|
56
|
+
hb_string_T quoted = quoted_string(value);
|
|
56
57
|
pretty_print_property(name, quoted, indent, relative_indent, last_property, buffer);
|
|
57
|
-
free(quoted);
|
|
58
|
+
free(quoted.data);
|
|
58
59
|
}
|
|
59
60
|
|
|
60
61
|
void pretty_print_boolean_property(
|
|
61
|
-
|
|
62
|
+
hb_string_T name,
|
|
62
63
|
bool value,
|
|
63
64
|
const size_t indent,
|
|
64
65
|
const size_t relative_indent,
|
|
65
66
|
const bool last_property,
|
|
66
|
-
|
|
67
|
+
hb_buffer_T* buffer
|
|
67
68
|
) {
|
|
68
|
-
pretty_print_property(name, value ? "true" : "false", indent, relative_indent, last_property, buffer);
|
|
69
|
+
pretty_print_property(name, hb_string(value ? "true" : "false"), indent, relative_indent, last_property, buffer);
|
|
69
70
|
}
|
|
70
71
|
|
|
71
72
|
void pretty_print_property(
|
|
72
|
-
|
|
73
|
-
|
|
73
|
+
hb_string_T name,
|
|
74
|
+
hb_string_T value,
|
|
74
75
|
const size_t indent,
|
|
75
76
|
const size_t relative_indent,
|
|
76
77
|
const bool last_property,
|
|
77
|
-
|
|
78
|
+
hb_buffer_T* buffer
|
|
78
79
|
) {
|
|
79
80
|
pretty_print_label(name, indent, relative_indent, last_property, buffer);
|
|
80
|
-
|
|
81
|
-
|
|
81
|
+
hb_buffer_append_string(buffer, value);
|
|
82
|
+
hb_buffer_append(buffer, "\n");
|
|
82
83
|
}
|
|
83
84
|
|
|
84
85
|
void pretty_print_size_t_property(
|
|
85
86
|
size_t value,
|
|
86
|
-
|
|
87
|
+
hb_string_T name,
|
|
87
88
|
const size_t indent,
|
|
88
89
|
const size_t relative_indent,
|
|
89
90
|
const bool last_property,
|
|
90
|
-
|
|
91
|
+
hb_buffer_T* buffer
|
|
91
92
|
) {
|
|
92
93
|
pretty_print_label(name, indent, relative_indent, last_property, buffer);
|
|
93
|
-
|
|
94
|
-
|
|
95
|
-
|
|
96
|
-
|
|
94
|
+
|
|
95
|
+
char size_string[21];
|
|
96
|
+
snprintf(size_string, 21, "%zu", value);
|
|
97
|
+
|
|
98
|
+
hb_buffer_append(buffer, size_string);
|
|
99
|
+
hb_buffer_append(buffer, "\n");
|
|
97
100
|
}
|
|
98
101
|
|
|
99
102
|
void pretty_print_array(
|
|
100
|
-
|
|
101
|
-
|
|
103
|
+
hb_string_T name,
|
|
104
|
+
hb_array_T* array,
|
|
102
105
|
const size_t indent,
|
|
103
106
|
const size_t relative_indent,
|
|
104
107
|
const bool last_property,
|
|
105
|
-
|
|
108
|
+
hb_buffer_T* buffer
|
|
106
109
|
) {
|
|
107
110
|
if (array == NULL) {
|
|
108
|
-
pretty_print_property(name, "∅", indent, relative_indent, last_property, buffer);
|
|
111
|
+
pretty_print_property(name, hb_string("∅"), indent, relative_indent, last_property, buffer);
|
|
109
112
|
|
|
110
113
|
return;
|
|
111
114
|
}
|
|
112
115
|
|
|
113
|
-
if (
|
|
114
|
-
pretty_print_property(name, "[]", indent, relative_indent, last_property, buffer);
|
|
116
|
+
if (hb_array_size(array) == 0) {
|
|
117
|
+
pretty_print_property(name, hb_string("[]"), indent, relative_indent, last_property, buffer);
|
|
115
118
|
|
|
116
119
|
return;
|
|
117
120
|
}
|
|
118
121
|
|
|
119
122
|
pretty_print_label(name, indent, relative_indent, last_property, buffer);
|
|
120
123
|
|
|
121
|
-
|
|
124
|
+
hb_buffer_append(buffer, "(");
|
|
122
125
|
|
|
123
126
|
char count[16];
|
|
124
|
-
sprintf(count, "%zu",
|
|
125
|
-
|
|
126
|
-
|
|
127
|
+
sprintf(count, "%zu", hb_array_size(array));
|
|
128
|
+
hb_buffer_append(buffer, count);
|
|
129
|
+
hb_buffer_append(buffer, ")\n");
|
|
127
130
|
|
|
128
131
|
if (indent < 20) {
|
|
129
|
-
for (size_t i = 0; i <
|
|
130
|
-
AST_NODE_T* child =
|
|
132
|
+
for (size_t i = 0; i < hb_array_size(array); i++) {
|
|
133
|
+
AST_NODE_T* child = hb_array_get(array, i);
|
|
131
134
|
pretty_print_indent(buffer, indent);
|
|
132
135
|
pretty_print_indent(buffer, relative_indent + 1);
|
|
133
136
|
|
|
134
|
-
if (i ==
|
|
135
|
-
|
|
137
|
+
if (i == hb_array_size(array) - 1) {
|
|
138
|
+
hb_buffer_append(buffer, "└── ");
|
|
136
139
|
} else {
|
|
137
|
-
|
|
140
|
+
hb_buffer_append(buffer, "├── ");
|
|
138
141
|
}
|
|
139
142
|
|
|
140
143
|
ast_pretty_print_node(child, indent + 1, relative_indent + 1, buffer);
|
|
141
144
|
|
|
142
|
-
if (i !=
|
|
145
|
+
if (i != hb_array_size(array) - 1) { pretty_print_newline(indent + 1, relative_indent, buffer); }
|
|
143
146
|
}
|
|
144
147
|
}
|
|
145
|
-
|
|
148
|
+
hb_buffer_append(buffer, "\n");
|
|
146
149
|
}
|
|
147
150
|
|
|
148
151
|
void pretty_print_errors(
|
|
@@ -150,97 +153,92 @@ void pretty_print_errors(
|
|
|
150
153
|
const size_t indent,
|
|
151
154
|
const size_t relative_indent,
|
|
152
155
|
const bool last_property,
|
|
153
|
-
|
|
156
|
+
hb_buffer_T* buffer
|
|
154
157
|
) {
|
|
155
|
-
if (node->errors != NULL &&
|
|
158
|
+
if (node->errors != NULL && hb_array_size(node->errors) > 0) {
|
|
156
159
|
error_pretty_print_array("errors", node->errors, indent, relative_indent, last_property, buffer);
|
|
157
|
-
|
|
160
|
+
hb_buffer_append(buffer, "\n");
|
|
158
161
|
}
|
|
159
162
|
}
|
|
160
163
|
|
|
161
|
-
void pretty_print_location(location_T
|
|
162
|
-
|
|
164
|
+
void pretty_print_location(location_T location, hb_buffer_T* buffer) {
|
|
165
|
+
hb_buffer_append(buffer, "(location: (");
|
|
163
166
|
char location_string[128];
|
|
164
167
|
sprintf(
|
|
165
168
|
location_string,
|
|
166
|
-
"%
|
|
167
|
-
|
|
168
|
-
|
|
169
|
-
|
|
170
|
-
|
|
169
|
+
"%u,%u)-(%u,%u",
|
|
170
|
+
location.start.line,
|
|
171
|
+
location.start.column,
|
|
172
|
+
location.end.line,
|
|
173
|
+
location.end.column
|
|
171
174
|
);
|
|
172
|
-
|
|
173
|
-
|
|
175
|
+
hb_buffer_append(buffer, location_string);
|
|
176
|
+
hb_buffer_append(buffer, "))");
|
|
174
177
|
}
|
|
175
178
|
|
|
176
179
|
void pretty_print_position_property(
|
|
177
180
|
position_T* position,
|
|
178
|
-
|
|
181
|
+
hb_string_T name,
|
|
179
182
|
const size_t indent,
|
|
180
183
|
const size_t relative_indent,
|
|
181
184
|
const bool last_property,
|
|
182
|
-
|
|
185
|
+
hb_buffer_T* buffer
|
|
183
186
|
) {
|
|
184
187
|
pretty_print_label(name, indent, relative_indent, last_property, buffer);
|
|
185
188
|
|
|
186
189
|
if (position != NULL) {
|
|
187
|
-
|
|
190
|
+
hb_buffer_append(buffer, "(");
|
|
188
191
|
|
|
189
192
|
char position_string[128];
|
|
190
193
|
|
|
191
|
-
sprintf(
|
|
192
|
-
position_string,
|
|
193
|
-
"%zu:%zu",
|
|
194
|
-
(position->line) ? position->line : 0,
|
|
195
|
-
(position->column) ? position->column : 0
|
|
196
|
-
);
|
|
194
|
+
sprintf(position_string, "%u:%u", (position->line) ? position->line : 0, (position->column) ? position->column : 0);
|
|
197
195
|
|
|
198
|
-
|
|
199
|
-
|
|
196
|
+
hb_buffer_append(buffer, position_string);
|
|
197
|
+
hb_buffer_append(buffer, ")");
|
|
200
198
|
} else {
|
|
201
|
-
|
|
199
|
+
hb_buffer_append(buffer, "∅");
|
|
202
200
|
}
|
|
203
201
|
|
|
204
|
-
|
|
202
|
+
hb_buffer_append(buffer, "\n");
|
|
205
203
|
}
|
|
206
204
|
|
|
207
205
|
void pretty_print_token_property(
|
|
208
206
|
token_T* token,
|
|
209
|
-
|
|
207
|
+
hb_string_T name,
|
|
210
208
|
const size_t indent,
|
|
211
209
|
const size_t relative_indent,
|
|
212
210
|
const bool last_property,
|
|
213
|
-
|
|
211
|
+
hb_buffer_T* buffer
|
|
214
212
|
) {
|
|
215
213
|
pretty_print_label(name, indent, relative_indent, last_property, buffer);
|
|
216
214
|
|
|
217
215
|
if (token != NULL && token->value != NULL) {
|
|
218
|
-
|
|
219
|
-
|
|
220
|
-
free(quoted);
|
|
216
|
+
hb_string_T quoted = quoted_string(hb_string(token->value));
|
|
217
|
+
hb_buffer_append_string(buffer, quoted);
|
|
218
|
+
free(quoted.data);
|
|
221
219
|
|
|
222
|
-
|
|
220
|
+
hb_buffer_append(buffer, " ");
|
|
223
221
|
pretty_print_location(token->location, buffer);
|
|
224
222
|
} else {
|
|
225
|
-
|
|
223
|
+
hb_buffer_append(buffer, "∅");
|
|
226
224
|
}
|
|
227
225
|
|
|
228
|
-
|
|
226
|
+
hb_buffer_append(buffer, "\n");
|
|
229
227
|
}
|
|
230
228
|
|
|
231
229
|
void pretty_print_string_property(
|
|
232
|
-
|
|
233
|
-
|
|
230
|
+
hb_string_T string,
|
|
231
|
+
hb_string_T name,
|
|
234
232
|
const size_t indent,
|
|
235
233
|
const size_t relative_indent,
|
|
236
234
|
const bool last_property,
|
|
237
|
-
|
|
235
|
+
hb_buffer_T* buffer
|
|
238
236
|
) {
|
|
239
|
-
|
|
240
|
-
|
|
241
|
-
|
|
237
|
+
hb_string_T value = hb_string("∅");
|
|
238
|
+
hb_string_T escaped = { .data = NULL, .length = 0 };
|
|
239
|
+
hb_string_T quoted;
|
|
242
240
|
|
|
243
|
-
if (string
|
|
241
|
+
if (!hb_string_is_empty(string)) {
|
|
244
242
|
escaped = escape_newlines(string);
|
|
245
243
|
quoted = quoted_string(escaped);
|
|
246
244
|
value = quoted;
|
|
@@ -248,35 +246,8 @@ void pretty_print_string_property(
|
|
|
248
246
|
|
|
249
247
|
pretty_print_property(name, value, indent, relative_indent, last_property, buffer);
|
|
250
248
|
|
|
251
|
-
if (string
|
|
252
|
-
if (escaped
|
|
253
|
-
if (quoted
|
|
249
|
+
if (!hb_string_is_empty(string)) {
|
|
250
|
+
if (!hb_string_is_empty(escaped)) { free(escaped.data); }
|
|
251
|
+
if (!hb_string_is_empty(quoted)) { free(quoted.data); }
|
|
254
252
|
}
|
|
255
253
|
}
|
|
256
|
-
|
|
257
|
-
void pretty_print_analyzed_ruby(analyzed_ruby_T* analyzed, const char* source) {
|
|
258
|
-
printf(
|
|
259
|
-
"------------------------\nanalyzed (%p)\n------------------------\n%s\n------------------------\n if: %i\n "
|
|
260
|
-
" elsif: %i\n else: %i\n end: %i\n block: %i\n block_closing: %i\n case: %i\n when: %i\n for: "
|
|
261
|
-
"%i\n while: %i\n "
|
|
262
|
-
" until: %i\n begin: %i\n "
|
|
263
|
-
"rescue: %i\n ensure: %i\n unless: %i\n==================\n\n",
|
|
264
|
-
(void*) analyzed,
|
|
265
|
-
source,
|
|
266
|
-
analyzed->has_if_node,
|
|
267
|
-
analyzed->has_elsif_node,
|
|
268
|
-
analyzed->has_else_node,
|
|
269
|
-
analyzed->has_end,
|
|
270
|
-
analyzed->has_block_node,
|
|
271
|
-
analyzed->has_block_closing,
|
|
272
|
-
analyzed->has_case_node,
|
|
273
|
-
analyzed->has_when_node,
|
|
274
|
-
analyzed->has_for_node,
|
|
275
|
-
analyzed->has_while_node,
|
|
276
|
-
analyzed->has_until_node,
|
|
277
|
-
analyzed->has_begin_node,
|
|
278
|
-
analyzed->has_rescue_node,
|
|
279
|
-
analyzed->has_ensure_node,
|
|
280
|
-
analyzed->has_unless_node
|
|
281
|
-
);
|
|
282
|
-
}
|
data/src/prism_helpers.c
CHANGED
|
@@ -16,15 +16,15 @@ const char* pm_error_level_to_string(pm_error_level_t level) {
|
|
|
16
16
|
}
|
|
17
17
|
}
|
|
18
18
|
|
|
19
|
-
position_T
|
|
20
|
-
position_T
|
|
19
|
+
position_T position_from_source_with_offset(const char* source, size_t offset) {
|
|
20
|
+
position_T position = { .line = 1, .column = 0 };
|
|
21
21
|
|
|
22
22
|
for (size_t i = 0; i < offset; i++) {
|
|
23
23
|
if (is_newline(source[i])) {
|
|
24
|
-
position
|
|
25
|
-
position
|
|
24
|
+
position.line++;
|
|
25
|
+
position.column = 0;
|
|
26
26
|
} else {
|
|
27
|
-
position
|
|
27
|
+
position.column++;
|
|
28
28
|
}
|
|
29
29
|
}
|
|
30
30
|
|
|
@@ -40,8 +40,8 @@ RUBY_PARSE_ERROR_T* ruby_parse_error_from_prism_error(
|
|
|
40
40
|
size_t start_offset = (size_t) (error->location.start - parser->start);
|
|
41
41
|
size_t end_offset = (size_t) (error->location.end - parser->start);
|
|
42
42
|
|
|
43
|
-
position_T
|
|
44
|
-
position_T
|
|
43
|
+
position_T start = position_from_source_with_offset(source, start_offset);
|
|
44
|
+
position_T end = position_from_source_with_offset(source, end_offset);
|
|
45
45
|
|
|
46
46
|
return ruby_parse_error_init(
|
|
47
47
|
error->message,
|
data/src/range.c
CHANGED
|
@@ -1,38 +1,5 @@
|
|
|
1
1
|
#include "include/range.h"
|
|
2
2
|
|
|
3
|
-
|
|
4
|
-
return
|
|
5
|
-
}
|
|
6
|
-
|
|
7
|
-
range_T* range_init(const size_t from, const size_t to) {
|
|
8
|
-
range_T* range = calloc(1, range_sizeof());
|
|
9
|
-
|
|
10
|
-
range->from = from;
|
|
11
|
-
range->to = to;
|
|
12
|
-
|
|
13
|
-
return range;
|
|
14
|
-
}
|
|
15
|
-
|
|
16
|
-
size_t range_from(const range_T* range) {
|
|
17
|
-
return range->from;
|
|
18
|
-
}
|
|
19
|
-
|
|
20
|
-
size_t range_to(const range_T* range) {
|
|
21
|
-
return range->to;
|
|
22
|
-
}
|
|
23
|
-
|
|
24
|
-
size_t range_length(range_T* range) {
|
|
25
|
-
return range_to(range) - range_from(range);
|
|
26
|
-
}
|
|
27
|
-
|
|
28
|
-
range_T* range_copy(range_T* range) {
|
|
29
|
-
if (!range) { return NULL; }
|
|
30
|
-
|
|
31
|
-
return range_init(range_from(range), range_to(range));
|
|
32
|
-
}
|
|
33
|
-
|
|
34
|
-
void range_free(range_T* range) {
|
|
35
|
-
if (range == NULL) { return; }
|
|
36
|
-
|
|
37
|
-
free(range);
|
|
3
|
+
uint32_t range_length(range_T range) {
|
|
4
|
+
return range.to - range.from;
|
|
38
5
|
}
|
data/src/token.c
CHANGED
|
@@ -1,37 +1,35 @@
|
|
|
1
1
|
#include "include/token.h"
|
|
2
|
-
#include "include/json.h"
|
|
3
2
|
#include "include/lexer.h"
|
|
4
3
|
#include "include/position.h"
|
|
4
|
+
#include "include/range.h"
|
|
5
5
|
#include "include/token_struct.h"
|
|
6
6
|
#include "include/util.h"
|
|
7
7
|
|
|
8
|
+
#include <stdbool.h>
|
|
8
9
|
#include <stdio.h>
|
|
9
10
|
#include <stdlib.h>
|
|
10
11
|
#include <string.h>
|
|
11
12
|
|
|
12
|
-
|
|
13
|
-
|
|
14
|
-
}
|
|
15
|
-
|
|
16
|
-
token_T* token_init(const char* value, const token_type_T type, lexer_T* lexer) {
|
|
17
|
-
token_T* token = calloc(1, token_sizeof());
|
|
13
|
+
token_T* token_init(hb_string_T value, const token_type_T type, lexer_T* lexer) {
|
|
14
|
+
token_T* token = calloc(1, sizeof(token_T));
|
|
18
15
|
|
|
19
16
|
if (type == TOKEN_NEWLINE) {
|
|
20
17
|
lexer->current_line++;
|
|
21
18
|
lexer->current_column = 0;
|
|
22
19
|
}
|
|
23
20
|
|
|
24
|
-
|
|
25
|
-
token->value = herb_strdup(value);
|
|
26
|
-
} else {
|
|
27
|
-
token->value = NULL;
|
|
28
|
-
}
|
|
21
|
+
token->value = hb_string_to_c_string_using_malloc(value);
|
|
29
22
|
|
|
30
23
|
token->type = type;
|
|
31
|
-
token->range =
|
|
32
|
-
|
|
33
|
-
|
|
34
|
-
|
|
24
|
+
token->range = (range_T) { .from = lexer->previous_position, .to = lexer->current_position };
|
|
25
|
+
|
|
26
|
+
location_from(
|
|
27
|
+
&token->location,
|
|
28
|
+
lexer->previous_line,
|
|
29
|
+
lexer->previous_column,
|
|
30
|
+
lexer->current_line,
|
|
31
|
+
lexer->current_column
|
|
32
|
+
);
|
|
35
33
|
|
|
36
34
|
lexer->previous_line = lexer->current_line;
|
|
37
35
|
lexer->previous_column = lexer->current_column;
|
|
@@ -82,93 +80,42 @@ const char* token_type_to_string(const token_type_T type) {
|
|
|
82
80
|
return "Unknown token_type_T";
|
|
83
81
|
}
|
|
84
82
|
|
|
85
|
-
|
|
83
|
+
hb_string_T token_to_string(const token_T* token) {
|
|
86
84
|
const char* type_string = token_type_to_string(token->type);
|
|
87
|
-
const char* template = "#<Herb::Token type=\"%s\" value=\"
|
|
85
|
+
const char* template = "#<Herb::Token type=\"%s\" value=\"%.*s\" range=[%u, %u] start=(%u:%u) end=(%u:%u)>";
|
|
88
86
|
|
|
89
87
|
char* string = calloc(strlen(type_string) + strlen(template) + strlen(token->value) + 16, sizeof(char));
|
|
90
|
-
|
|
88
|
+
hb_string_T escaped;
|
|
91
89
|
|
|
92
90
|
if (token->type == TOKEN_EOF) {
|
|
93
|
-
escaped = herb_strdup("<EOF>");
|
|
91
|
+
escaped = hb_string(herb_strdup("<EOF>"));
|
|
94
92
|
} else {
|
|
95
|
-
escaped = escape_newlines(token->value);
|
|
93
|
+
escaped = escape_newlines(hb_string(token->value));
|
|
96
94
|
}
|
|
97
95
|
|
|
98
96
|
sprintf(
|
|
99
97
|
string,
|
|
100
98
|
template,
|
|
101
99
|
type_string,
|
|
102
|
-
escaped,
|
|
103
|
-
|
|
104
|
-
token->range
|
|
105
|
-
token->
|
|
106
|
-
token->location
|
|
107
|
-
token->location
|
|
108
|
-
token->location
|
|
100
|
+
escaped.length,
|
|
101
|
+
escaped.data,
|
|
102
|
+
token->range.from,
|
|
103
|
+
token->range.to,
|
|
104
|
+
token->location.start.line,
|
|
105
|
+
token->location.start.column,
|
|
106
|
+
token->location.end.line,
|
|
107
|
+
token->location.end.column
|
|
109
108
|
);
|
|
110
109
|
|
|
111
|
-
free(escaped);
|
|
112
|
-
|
|
113
|
-
return string;
|
|
114
|
-
}
|
|
115
|
-
|
|
116
|
-
char* token_to_json(const token_T* token) {
|
|
117
|
-
buffer_T json = buffer_new();
|
|
118
|
-
|
|
119
|
-
json_start_root_object(&json);
|
|
120
|
-
json_add_string(&json, "type", token_type_to_string(token->type));
|
|
121
|
-
json_add_string(&json, "value", token->value);
|
|
122
|
-
|
|
123
|
-
buffer_T range = buffer_new();
|
|
124
|
-
json_start_array(&json, "range");
|
|
125
|
-
json_add_size_t(&range, NULL, token->range->from);
|
|
126
|
-
json_add_size_t(&range, NULL, token->range->to);
|
|
127
|
-
buffer_concat(&json, &range);
|
|
128
|
-
buffer_free(&range);
|
|
129
|
-
json_end_array(&json);
|
|
130
|
-
|
|
131
|
-
buffer_T start = buffer_new();
|
|
132
|
-
json_start_object(&json, "start");
|
|
133
|
-
json_add_size_t(&start, "line", token->location->start->line);
|
|
134
|
-
json_add_size_t(&start, "column", token->location->start->column);
|
|
135
|
-
buffer_concat(&json, &start);
|
|
136
|
-
buffer_free(&start);
|
|
137
|
-
json_end_object(&json);
|
|
138
|
-
|
|
139
|
-
buffer_T end = buffer_new();
|
|
140
|
-
json_start_object(&json, "end");
|
|
141
|
-
json_add_size_t(&end, "line", token->location->end->line);
|
|
142
|
-
json_add_size_t(&end, "column", token->location->end->column);
|
|
143
|
-
buffer_concat(&json, &end);
|
|
144
|
-
buffer_free(&end);
|
|
145
|
-
json_end_object(&json);
|
|
146
|
-
|
|
147
|
-
json_end_object(&json);
|
|
148
|
-
|
|
149
|
-
return buffer_value(&json);
|
|
150
|
-
}
|
|
151
|
-
|
|
152
|
-
char* token_value(const token_T* token) {
|
|
153
|
-
return token->value;
|
|
154
|
-
}
|
|
155
|
-
|
|
156
|
-
int token_type(const token_T* token) {
|
|
157
|
-
return token->type;
|
|
158
|
-
}
|
|
110
|
+
free(escaped.data);
|
|
159
111
|
|
|
160
|
-
|
|
161
|
-
return token->location->start;
|
|
162
|
-
}
|
|
163
|
-
|
|
164
|
-
position_T* token_end_position(token_T* token) {
|
|
165
|
-
return token->location->end;
|
|
112
|
+
return hb_string(string);
|
|
166
113
|
}
|
|
167
114
|
|
|
168
115
|
token_T* token_copy(token_T* token) {
|
|
169
116
|
if (!token) { return NULL; }
|
|
170
117
|
|
|
171
|
-
token_T* new_token = calloc(1,
|
|
118
|
+
token_T* new_token = calloc(1, sizeof(token_T));
|
|
172
119
|
|
|
173
120
|
if (!new_token) { return NULL; }
|
|
174
121
|
|
|
@@ -184,18 +131,20 @@ token_T* token_copy(token_T* token) {
|
|
|
184
131
|
}
|
|
185
132
|
|
|
186
133
|
new_token->type = token->type;
|
|
187
|
-
new_token->range =
|
|
188
|
-
new_token->location =
|
|
134
|
+
new_token->range = token->range;
|
|
135
|
+
new_token->location = token->location;
|
|
189
136
|
|
|
190
137
|
return new_token;
|
|
191
138
|
}
|
|
192
139
|
|
|
140
|
+
bool token_value_empty(const token_T* token) {
|
|
141
|
+
return token == NULL || token->value == NULL || token->value[0] == '\0';
|
|
142
|
+
}
|
|
143
|
+
|
|
193
144
|
void token_free(token_T* token) {
|
|
194
145
|
if (!token) { return; }
|
|
195
146
|
|
|
196
147
|
if (token->value != NULL) { free(token->value); }
|
|
197
|
-
if (token->range != NULL) { range_free(token->range); }
|
|
198
|
-
if (token->location != NULL) { location_free(token->location); }
|
|
199
148
|
|
|
200
149
|
free(token);
|
|
201
150
|
}
|
data/src/utf8.c
CHANGED
|
@@ -5,7 +5,7 @@
|
|
|
5
5
|
// 110xxxxx = 2 bytes
|
|
6
6
|
// 1110xxxx = 3 bytes
|
|
7
7
|
// 11110xxx = 4 bytes
|
|
8
|
-
|
|
8
|
+
uint32_t utf8_char_byte_length(unsigned char first_byte) {
|
|
9
9
|
if ((first_byte & 0x80) == 0) {
|
|
10
10
|
return 1;
|
|
11
11
|
} else if ((first_byte & 0xE0) == 0xC0) {
|
|
@@ -24,18 +24,18 @@ bool utf8_is_valid_continuation_byte(unsigned char byte) {
|
|
|
24
24
|
return (byte & 0xC0) == 0x80;
|
|
25
25
|
}
|
|
26
26
|
|
|
27
|
-
|
|
27
|
+
uint32_t utf8_sequence_length(const char* str, size_t position, size_t max_length) {
|
|
28
28
|
if (position >= max_length) { return 0; }
|
|
29
29
|
|
|
30
30
|
unsigned char first_byte = (unsigned char) str[position];
|
|
31
|
-
|
|
31
|
+
uint32_t expected_length = utf8_char_byte_length(first_byte);
|
|
32
32
|
|
|
33
33
|
if (position + expected_length > max_length) {
|
|
34
34
|
return 1; // Not enough bytes, treat as single byte
|
|
35
35
|
}
|
|
36
36
|
|
|
37
37
|
if (expected_length > 1) {
|
|
38
|
-
for (
|
|
38
|
+
for (uint32_t i = 1; i < expected_length; i++) {
|
|
39
39
|
if (!utf8_is_valid_continuation_byte((unsigned char) str[position + i])) {
|
|
40
40
|
return 1; // Invalid continuation byte, treat first byte as single byte
|
|
41
41
|
}
|