lrama 0.5.9 → 0.5.10
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/.github/workflows/test.yaml +5 -0
- data/.gitignore +7 -4
- data/Gemfile +9 -5
- data/Rakefile +13 -0
- data/Steepfile +9 -3
- data/lib/lrama/context.rb +1 -3
- data/lib/lrama/counterexamples/path.rb +0 -46
- data/lib/lrama/counterexamples/production_path.rb +17 -0
- data/lib/lrama/counterexamples/start_path.rb +21 -0
- data/lib/lrama/counterexamples/transition_path.rb +17 -0
- data/lib/lrama/counterexamples.rb +3 -0
- data/lib/lrama/grammar/code/initial_action_code.rb +28 -0
- data/lib/lrama/grammar/code/no_reference_code.rb +24 -0
- data/lib/lrama/grammar/code/printer_code.rb +34 -0
- data/lib/lrama/grammar/code/rule_action.rb +62 -0
- data/lib/lrama/grammar/code.rb +9 -93
- data/lib/lrama/grammar/counter.rb +15 -0
- data/lib/lrama/grammar/error_token.rb +3 -3
- data/lib/lrama/grammar/parameterizing_rules/builder/base.rb +28 -0
- data/lib/lrama/grammar/parameterizing_rules/builder/list.rb +20 -0
- data/lib/lrama/grammar/parameterizing_rules/builder/nonempty_list.rb +20 -0
- data/lib/lrama/grammar/parameterizing_rules/builder/option.rb +20 -0
- data/lib/lrama/grammar/parameterizing_rules/builder/separated_list.rb +28 -0
- data/lib/lrama/grammar/parameterizing_rules/builder/separated_nonempty_list.rb +27 -0
- data/lib/lrama/grammar/parameterizing_rules/builder.rb +43 -0
- data/lib/lrama/grammar/printer.rb +3 -3
- data/lib/lrama/grammar/reference.rb +7 -16
- data/lib/lrama/grammar/rule.rb +18 -2
- data/lib/lrama/grammar/rule_builder.rb +179 -0
- data/lib/lrama/grammar.rb +109 -324
- data/lib/lrama/lexer/location.rb +22 -0
- data/lib/lrama/lexer/token/parameterizing.rb +18 -3
- data/lib/lrama/lexer/token/tag.rb +4 -0
- data/lib/lrama/lexer/token/user_code.rb +54 -4
- data/lib/lrama/lexer/token.rb +22 -4
- data/lib/lrama/lexer.rb +31 -29
- data/lib/lrama/options.rb +1 -2
- data/lib/lrama/output.rb +2 -2
- data/lib/lrama/parser.rb +420 -343
- data/lib/lrama/report/profile.rb +1 -12
- data/lib/lrama/version.rb +1 -1
- data/parser.y +106 -49
- data/rbs_collection.lock.yaml +5 -1
- data/rbs_collection.yaml +1 -0
- data/sig/lrama/grammar/code/printer_code.rbs +15 -0
- data/sig/lrama/grammar/code.rbs +24 -0
- data/sig/lrama/grammar/counter.rbs +11 -0
- data/sig/lrama/grammar/parameterizing_rules/builder.rbs +10 -0
- data/sig/lrama/grammar/precedence.rbs +11 -0
- data/sig/lrama/grammar/printer.rbs +11 -0
- data/sig/lrama/grammar/reference.rbs +5 -5
- data/sig/lrama/grammar/rule.rbs +13 -0
- data/sig/lrama/grammar/rule_builder.rbs +41 -0
- data/sig/lrama/lexer/location.rbs +14 -0
- data/sig/lrama/lexer/token/parameterizing.rbs +7 -0
- data/sig/lrama/lexer/token/tag.rbs +1 -0
- data/sig/lrama/lexer/token/user_code.rbs +8 -1
- data/sig/lrama/lexer/token.rbs +8 -3
- data/sig/stdlib/strscan/string_scanner.rbs +5 -0
- data/template/bison/yacc.c +5 -0
- metadata +29 -2
data/lib/lrama/lexer/token.rb
CHANGED
@@ -1,20 +1,38 @@
|
|
1
1
|
module Lrama
|
2
2
|
class Lexer
|
3
|
-
class Token < Struct.new(:s_value, :alias_name, keyword_init: true)
|
3
|
+
class Token < Struct.new(:s_value, :alias_name, :location, keyword_init: true)
|
4
4
|
|
5
|
-
attr_accessor :
|
5
|
+
attr_accessor :referred
|
6
6
|
|
7
7
|
def to_s
|
8
|
-
"#{super}
|
8
|
+
"#{super} location: #{location}"
|
9
9
|
end
|
10
10
|
|
11
11
|
def referred_by?(string)
|
12
|
-
[self.s_value, self.alias_name].include?(string)
|
12
|
+
[self.s_value, self.alias_name].compact.include?(string)
|
13
13
|
end
|
14
14
|
|
15
15
|
def ==(other)
|
16
16
|
self.class == other.class && self.s_value == other.s_value
|
17
17
|
end
|
18
|
+
|
19
|
+
def first_line
|
20
|
+
location.first_line
|
21
|
+
end
|
22
|
+
alias :line :first_line
|
23
|
+
|
24
|
+
def first_column
|
25
|
+
location.first_column
|
26
|
+
end
|
27
|
+
alias :column :first_column
|
28
|
+
|
29
|
+
def last_line
|
30
|
+
location.last_line
|
31
|
+
end
|
32
|
+
|
33
|
+
def last_column
|
34
|
+
location.last_column
|
35
|
+
end
|
18
36
|
end
|
19
37
|
end
|
20
38
|
end
|
data/lib/lrama/lexer.rb
CHANGED
@@ -1,4 +1,5 @@
|
|
1
1
|
require "strscan"
|
2
|
+
require "lrama/lexer/location"
|
2
3
|
require "lrama/lexer/token"
|
3
4
|
|
4
5
|
module Lrama
|
@@ -7,7 +8,7 @@ module Lrama
|
|
7
8
|
attr_accessor :status
|
8
9
|
attr_accessor :end_symbol
|
9
10
|
|
10
|
-
SYMBOLS = %
|
11
|
+
SYMBOLS = ['%{', '%}', '%%', '{', '}', '\[', '\]', '\(', '\)', '\,', ':', '\|', ';']
|
11
12
|
PERCENT_TOKENS = %w(
|
12
13
|
%union
|
13
14
|
%token
|
@@ -31,8 +32,8 @@ module Lrama
|
|
31
32
|
|
32
33
|
def initialize(text)
|
33
34
|
@scanner = StringScanner.new(text)
|
34
|
-
@head = @scanner.pos
|
35
|
-
@line = 1
|
35
|
+
@head_column = @head = @scanner.pos
|
36
|
+
@head_line = @line = 1
|
36
37
|
@status = :initial
|
37
38
|
@end_symbol = nil
|
38
39
|
end
|
@@ -54,6 +55,13 @@ module Lrama
|
|
54
55
|
@scanner.pos - @head
|
55
56
|
end
|
56
57
|
|
58
|
+
def location
|
59
|
+
Location.new(
|
60
|
+
first_line: @head_line, first_column: @head_column,
|
61
|
+
last_line: @line, last_column: column
|
62
|
+
)
|
63
|
+
end
|
64
|
+
|
57
65
|
def lex_token
|
58
66
|
while !@scanner.eos? do
|
59
67
|
case
|
@@ -63,9 +71,8 @@ module Lrama
|
|
63
71
|
# noop
|
64
72
|
when @scanner.scan(/\/\*/)
|
65
73
|
lex_comment
|
66
|
-
when @scanner.scan(
|
67
|
-
@scanner
|
68
|
-
newline
|
74
|
+
when @scanner.scan(/\/\/.*(?<newline>\n)?/)
|
75
|
+
newline if @scanner[:newline]
|
69
76
|
else
|
70
77
|
break
|
71
78
|
end
|
@@ -84,17 +91,17 @@ module Lrama
|
|
84
91
|
when @scanner.scan(/[\?\+\*]/)
|
85
92
|
return [@scanner.matched, @scanner.matched]
|
86
93
|
when @scanner.scan(/<\w+>/)
|
87
|
-
return [:TAG,
|
94
|
+
return [:TAG, Lrama::Lexer::Token::Tag.new(s_value: @scanner.matched, location: location)]
|
88
95
|
when @scanner.scan(/'.'/)
|
89
|
-
return [:CHARACTER,
|
96
|
+
return [:CHARACTER, Lrama::Lexer::Token::Char.new(s_value: @scanner.matched, location: location)]
|
90
97
|
when @scanner.scan(/'\\\\'|'\\b'|'\\t'|'\\f'|'\\r'|'\\n'|'\\v'|'\\13'/)
|
91
|
-
return [:CHARACTER,
|
92
|
-
when @scanner.scan(/"/)
|
93
|
-
return [:STRING, %Q(
|
98
|
+
return [:CHARACTER, Lrama::Lexer::Token::Char.new(s_value: @scanner.matched, location: location)]
|
99
|
+
when @scanner.scan(/".*?"/)
|
100
|
+
return [:STRING, %Q(#{@scanner.matched})]
|
94
101
|
when @scanner.scan(/\d+/)
|
95
102
|
return [:INTEGER, Integer(@scanner.matched)]
|
96
103
|
when @scanner.scan(/([a-zA-Z_.][-a-zA-Z0-9_.]*)/)
|
97
|
-
token =
|
104
|
+
token = Lrama::Lexer::Token::Ident.new(s_value: @scanner.matched, location: location)
|
98
105
|
type =
|
99
106
|
if @scanner.check(/\s*(\[\s*[a-zA-Z_.][-a-zA-Z0-9_.]*\s*\])?\s*:/)
|
100
107
|
:IDENT_COLON
|
@@ -118,25 +125,27 @@ module Lrama
|
|
118
125
|
when @scanner.scan(/}/)
|
119
126
|
if nested == 0 && @end_symbol == '}'
|
120
127
|
@scanner.unscan
|
121
|
-
return [:C_DECLARATION,
|
128
|
+
return [:C_DECLARATION, Lrama::Lexer::Token::UserCode.new(s_value: code, location: location)]
|
122
129
|
else
|
123
130
|
code += @scanner.matched
|
124
131
|
nested -= 1
|
125
132
|
end
|
126
133
|
when @scanner.check(/#{@end_symbol}/)
|
127
|
-
return [:C_DECLARATION,
|
134
|
+
return [:C_DECLARATION, Lrama::Lexer::Token::UserCode.new(s_value: code, location: location)]
|
128
135
|
when @scanner.scan(/\n/)
|
129
136
|
code += @scanner.matched
|
130
137
|
newline
|
131
|
-
when @scanner.scan(/"/)
|
132
|
-
|
133
|
-
|
134
|
-
|
135
|
-
|
136
|
-
matched = @scanner.scan_until(/'/)
|
137
|
-
code += %Q('#{matched})
|
138
|
+
when @scanner.scan(/".*?"/)
|
139
|
+
code += %Q(#{@scanner.matched})
|
140
|
+
@line += @scanner.matched.count("\n")
|
141
|
+
when @scanner.scan(/'.*?'/)
|
142
|
+
code += %Q(#{@scanner.matched})
|
138
143
|
else
|
139
|
-
|
144
|
+
if @scanner.scan(/[^\"'\{\}\n#{@end_symbol}]+/)
|
145
|
+
code += @scanner.matched
|
146
|
+
else
|
147
|
+
code += @scanner.getch
|
148
|
+
end
|
140
149
|
end
|
141
150
|
end
|
142
151
|
raise ParseError, "Unexpected code: #{code}."
|
@@ -158,13 +167,6 @@ module Lrama
|
|
158
167
|
end
|
159
168
|
end
|
160
169
|
|
161
|
-
def setup_token(token)
|
162
|
-
token.line = @head_line
|
163
|
-
token.column = @head_column
|
164
|
-
|
165
|
-
token
|
166
|
-
end
|
167
|
-
|
168
170
|
def newline
|
169
171
|
@line += 1
|
170
172
|
@head = @scanner.pos + 1
|
data/lib/lrama/options.rb
CHANGED
@@ -4,7 +4,7 @@ module Lrama
|
|
4
4
|
attr_accessor :skeleton, :header, :header_file,
|
5
5
|
:report_file, :outfile,
|
6
6
|
:error_recovery, :grammar_file,
|
7
|
-
:
|
7
|
+
:trace_opts, :report_opts, :y,
|
8
8
|
:debug
|
9
9
|
|
10
10
|
def initialize
|
@@ -15,7 +15,6 @@ module Lrama
|
|
15
15
|
@outfile = "y.tab.c"
|
16
16
|
@error_recovery = false
|
17
17
|
@grammar_file = nil
|
18
|
-
@report_file = nil
|
19
18
|
@trace_opts = nil
|
20
19
|
@report_opts = nil
|
21
20
|
@y = STDIN
|
data/lib/lrama/output.rb
CHANGED