shex 0.6.2 → 0.7.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/README.md +108 -97
- data/VERSION +1 -1
- data/etc/doap.ttl +1 -1
- data/lib/shex/algebra/and.rb +3 -12
- data/lib/shex/algebra/each_of.rb +2 -12
- data/lib/shex/algebra/import.rb +6 -0
- data/lib/shex/algebra/not.rb +3 -10
- data/lib/shex/algebra/one_of.rb +2 -12
- data/lib/shex/algebra/operator.rb +28 -15
- data/lib/shex/algebra/or.rb +3 -12
- data/lib/shex/algebra/schema.rb +2 -9
- data/lib/shex/algebra/shape.rb +4 -2
- data/lib/shex/algebra/shape_expression.rb +29 -0
- data/lib/shex/algebra/start.rb +2 -10
- data/lib/shex/algebra/stem.rb +5 -1
- data/lib/shex/algebra/stem_range.rb +3 -1
- data/lib/shex/algebra/triple_constraint.rb +1 -1
- data/lib/shex/algebra/triple_expression.rb +18 -0
- data/lib/shex/algebra.rb +0 -1
- data/lib/shex/meta.rb +325 -9859
- data/lib/shex/parser.rb +559 -474
- data/lib/shex/terminals.rb +5 -25
- data/lib/shex.rb +4 -1
- metadata +57 -23
data/lib/shex/parser.rb
CHANGED
@@ -1,6 +1,6 @@
|
|
1
1
|
# -*- encoding: utf-8 -*-
|
2
2
|
require 'ebnf'
|
3
|
-
require 'ebnf/
|
3
|
+
require 'ebnf/peg/parser'
|
4
4
|
require 'shex/meta'
|
5
5
|
|
6
6
|
module ShEx
|
@@ -10,9 +10,8 @@ module ShEx
|
|
10
10
|
# @see https://www.w3.org/2005/01/yacker/uploads/ShEx3?lang=perl&markup=html#productions
|
11
11
|
# @see https://en.wikipedia.org/wiki/LR_parser
|
12
12
|
class Parser
|
13
|
-
include ShEx::Meta
|
14
13
|
include ShEx::Terminals
|
15
|
-
include EBNF::
|
14
|
+
include EBNF::PEG::Parser
|
16
15
|
include RDF::Util::Logger
|
17
16
|
|
18
17
|
##
|
@@ -27,679 +26,798 @@ module ShEx
|
|
27
26
|
# @return [String]
|
28
27
|
attr_accessor :input
|
29
28
|
|
30
|
-
##
|
31
|
-
# The current input tokens being processed.
|
32
|
-
#
|
33
|
-
# @return [Array<Token>]
|
34
|
-
attr_reader :tokens
|
35
|
-
|
36
29
|
##
|
37
30
|
# The internal representation of the result using hierarchy of RDF objects and ShEx::Operator
|
38
31
|
# objects.
|
39
32
|
# @return [Array]
|
40
|
-
# @see https://
|
33
|
+
# @see https://ruby-rdf.github.io/sparql/SPARQL/Algebra
|
41
34
|
attr_accessor :result
|
42
35
|
|
43
36
|
# Terminals passed to lexer. Order matters!
|
44
|
-
terminal(:CODE, CODE, unescape: true) do |
|
37
|
+
terminal(:CODE, CODE, unescape: true) do |value|
|
45
38
|
# { foo %}
|
46
39
|
# Keep surrounding whitespace for now
|
47
|
-
|
40
|
+
value[1..-2].sub(/%\s*$/, '') # Drop {} and %
|
48
41
|
end
|
49
|
-
terminal(:REPEAT_RANGE, REPEAT_RANGE) do |
|
50
|
-
card =
|
51
|
-
card[1] =
|
52
|
-
|
42
|
+
terminal(:REPEAT_RANGE, REPEAT_RANGE) do |value|
|
43
|
+
card = value[1..-2].split(',').map {|v| v =~ /^\d+$/ ? v.to_i : v}
|
44
|
+
card[1] = value.include?(',') ? '*' : card[0] if card.length == 1
|
45
|
+
{min: card[0], max: card[1]}
|
53
46
|
end
|
54
|
-
terminal(:BLANK_NODE_LABEL, BLANK_NODE_LABEL) do |
|
55
|
-
|
47
|
+
terminal(:BLANK_NODE_LABEL, BLANK_NODE_LABEL) do |value|
|
48
|
+
bnode(value[2..-1])
|
56
49
|
end
|
57
|
-
terminal(:IRIREF, IRIREF, unescape: true) do |
|
50
|
+
terminal(:IRIREF, IRIREF, unescape: true) do |value|
|
58
51
|
begin
|
59
|
-
|
52
|
+
iri(value[1..-2])
|
60
53
|
rescue ArgumentError => e
|
61
54
|
raise Error, e.message
|
62
55
|
end
|
63
56
|
end
|
64
|
-
terminal(:DOUBLE, DOUBLE) do |
|
57
|
+
terminal(:DOUBLE, DOUBLE) do |value|
|
65
58
|
# Note that a Turtle Double may begin with a '.[eE]', so tack on a leading
|
66
59
|
# zero if necessary
|
67
|
-
value =
|
68
|
-
|
60
|
+
value = value.sub(/\.([eE])/, '.0\1')
|
61
|
+
literal(value, datatype: RDF::XSD.double)
|
69
62
|
end
|
70
|
-
terminal(:DECIMAL, DECIMAL) do |
|
63
|
+
terminal(:DECIMAL, DECIMAL) do |value|
|
71
64
|
# Note that a Turtle Decimal may begin with a '.', so tack on a leading
|
72
65
|
# zero if necessary
|
73
|
-
value
|
74
|
-
#value = "0#{token.value}" if token.value[0,1] == "."
|
75
|
-
input[:literal] = literal(value, datatype: RDF::XSD.decimal)
|
66
|
+
literal(value, datatype: RDF::XSD.decimal)
|
76
67
|
end
|
77
|
-
terminal(:INTEGER, INTEGER) do |
|
78
|
-
|
68
|
+
terminal(:INTEGER, INTEGER) do |value|
|
69
|
+
literal(value, datatype: RDF::XSD.integer)
|
79
70
|
end
|
80
|
-
terminal(:PNAME_LN, PNAME_LN, unescape: true) do |
|
81
|
-
prefix, suffix =
|
82
|
-
|
83
|
-
|
71
|
+
terminal(:PNAME_LN, PNAME_LN, unescape: true) do |value|
|
72
|
+
prefix, suffix = value.split(":", 2)
|
73
|
+
error(nil, "Compact IRI missing prefix definition: #{prefix}", production: :PNAME_LN) unless prefix(prefix)
|
74
|
+
ns(prefix, suffix)
|
84
75
|
end
|
85
|
-
terminal(:PNAME_NS, PNAME_NS) do |
|
86
|
-
|
87
|
-
|
88
|
-
input[:iri] = ns(prefix, nil)
|
89
|
-
input[:prefix] = prefix && prefix.to_sym
|
76
|
+
terminal(:PNAME_NS, PNAME_NS) do |value|
|
77
|
+
value[0..-2]
|
90
78
|
end
|
91
|
-
terminal(:ATPNAME_LN, ATPNAME_LN, unescape: true) do |
|
92
|
-
prefix, suffix =
|
79
|
+
terminal(:ATPNAME_LN, ATPNAME_LN, unescape: true) do |value, parent_prod|
|
80
|
+
prefix, suffix = value.split(":", 2)
|
93
81
|
prefix.sub!(/^@#{WS}*/, '')
|
94
|
-
|
95
|
-
error(nil, "Compact IRI missing prefix definition: #{token.value}", production: :ATPNAME_LN) unless input[:shapeLabel].absolute?
|
82
|
+
ns(prefix, suffix)
|
96
83
|
end
|
97
|
-
terminal(:ATPNAME_NS, ATPNAME_NS) do |
|
98
|
-
prefix =
|
84
|
+
terminal(:ATPNAME_NS, ATPNAME_NS) do |value|
|
85
|
+
prefix = value[0..-2]
|
99
86
|
prefix.sub!(/^@\s*/, '')
|
100
87
|
|
101
|
-
|
102
|
-
end
|
103
|
-
terminal(:LANGTAG, LANGTAG) do |
|
104
|
-
|
105
|
-
end
|
106
|
-
terminal(:LANG_STRING_LITERAL_LONG1, LANG_STRING_LITERAL_LONG1, unescape: true) do |
|
107
|
-
|
108
|
-
|
109
|
-
|
110
|
-
|
111
|
-
|
112
|
-
|
113
|
-
|
114
|
-
|
115
|
-
|
116
|
-
|
117
|
-
end
|
118
|
-
terminal(:
|
119
|
-
|
120
|
-
|
121
|
-
|
122
|
-
|
123
|
-
|
124
|
-
|
125
|
-
|
126
|
-
|
127
|
-
|
128
|
-
|
129
|
-
|
130
|
-
|
131
|
-
|
132
|
-
|
133
|
-
|
134
|
-
|
135
|
-
|
136
|
-
|
137
|
-
# String terminals
|
138
|
-
terminal(nil, STR_EXPR, map: STR_MAP) do |prod, token, input|
|
139
|
-
case token.value
|
140
|
-
when '*' then input[:cardinality] = {min: 0, max: "*"}
|
141
|
-
when '+' then input[:cardinality] = {min: 1, max: "*"}
|
142
|
-
when '?' then input[:cardinality] = {min: 0, max: 1}
|
143
|
-
when '!' then input[:not] = token.value
|
144
|
-
when '^' then input[:inverse] = token.value
|
145
|
-
when '.' then input[:dot] = token.value
|
146
|
-
when 'true', 'false' then input[:literal] = RDF::Literal::Boolean.new(token.value)
|
147
|
-
when '~' then input[:pattern] = token.value
|
148
|
-
when 'BNODE', 'IRI',
|
149
|
-
'NONLITERAL' then input[:nonLiteralKind] = token.value.downcase.to_sym
|
150
|
-
when 'CLOSED' then input[:closed] = token.value.downcase.to_sym
|
151
|
-
when 'EXTERNAL' then input[:external] = token.value.downcase.to_sym
|
152
|
-
when 'FRACTIONDIGITS',
|
153
|
-
'TOTALDIGITS' then input[:numericLength] = token.value.downcase.to_sym
|
154
|
-
when 'LITERAL' then input[:shapeAtomLiteral] = token.value.downcase.to_sym
|
155
|
-
when 'LENGTH',
|
156
|
-
'MINLENGTH',
|
157
|
-
'MAXLENGTH' then input[:stringLength] = token.value.downcase.to_sym
|
158
|
-
when 'MININCLUSIVE',
|
159
|
-
'MINEXCLUSIVE',
|
160
|
-
'MAXINCLUSIVE',
|
161
|
-
'MAXEXCLUSIVE' then input[:numericRange] = token.value.downcase.to_sym
|
162
|
-
when 'NOT' then input[:not] = token.value.downcase.to_sym
|
163
|
-
when 'START' then input[:start] = token.value.downcase.to_sym
|
164
|
-
else
|
165
|
-
#raise "Unexpected MC terminal: #{token.inspect}"
|
166
|
-
end
|
88
|
+
ns(prefix, nil)
|
89
|
+
end
|
90
|
+
terminal(:LANGTAG, LANGTAG) do |value|
|
91
|
+
value[1..-1]
|
92
|
+
end
|
93
|
+
terminal(:LANG_STRING_LITERAL_LONG1, LANG_STRING_LITERAL_LONG1, unescape: true) do |value|
|
94
|
+
s, _, l = value[3..-1].rpartition("'''@")
|
95
|
+
[s, language: l]
|
96
|
+
end
|
97
|
+
terminal(:LANG_STRING_LITERAL_LONG2, LANG_STRING_LITERAL_LONG2, unescape: true) do |value|
|
98
|
+
s, _, l = value[3..-1].rpartition('"""@')
|
99
|
+
[s, language: l]
|
100
|
+
end
|
101
|
+
terminal(:LANG_STRING_LITERAL1, LANG_STRING_LITERAL1, unescape: true) do |value|
|
102
|
+
s, _, l = value[1..-1].rpartition("'@")
|
103
|
+
[s, language: l]
|
104
|
+
end
|
105
|
+
terminal(:LANG_STRING_LITERAL2, LANG_STRING_LITERAL2, unescape: true) do |value|
|
106
|
+
s, _, l = value[1..-1].rpartition('"@')
|
107
|
+
[s, language: l]
|
108
|
+
end
|
109
|
+
terminal(:STRING_LITERAL_LONG1, STRING_LITERAL_LONG1, unescape: true) do |value|
|
110
|
+
value[3..-4]
|
111
|
+
end
|
112
|
+
terminal(:STRING_LITERAL_LONG2, STRING_LITERAL_LONG2, unescape: true) do |value|
|
113
|
+
value[3..-4]
|
114
|
+
end
|
115
|
+
terminal(:STRING_LITERAL1, STRING_LITERAL1, unescape: true) do |value|
|
116
|
+
value[1..-2]
|
117
|
+
end
|
118
|
+
terminal(:STRING_LITERAL2, STRING_LITERAL2, unescape: true) do |value|
|
119
|
+
value[1..-2]
|
120
|
+
end
|
121
|
+
terminal(:REGEXP, REGEXP)
|
122
|
+
terminal(:RDF_TYPE, RDF_TYPE) do |value|
|
123
|
+
(a = RDF.type.dup; a.lexical = 'a'; a)
|
167
124
|
end
|
168
125
|
|
169
126
|
# Productions
|
170
127
|
# [1] shexDoc ::= directive* ((notStartAction | startActions) statement*)?
|
171
|
-
|
172
|
-
|
173
|
-
|
128
|
+
start_production(:shexDoc, as_hash: true, clear_packrat: true)
|
129
|
+
production(:shexDoc) do |value|
|
174
130
|
expressions = []
|
175
|
-
|
176
|
-
|
177
|
-
|
178
|
-
expressions
|
179
|
-
|
131
|
+
prefixes = []
|
132
|
+
|
133
|
+
# directive *
|
134
|
+
expressions += value[:_shexDoc_1]
|
135
|
+
|
136
|
+
# ((notStartAction | startActions) statement*)?
|
137
|
+
if value = value[:_shexDoc_2]
|
138
|
+
# These may start with codeDecl or start. otherwise, they are all shapes
|
139
|
+
expressions += Array(value[:_shexDoc_4])
|
140
|
+
expressions += Array(value[:_shexDoc_5])
|
141
|
+
end
|
142
|
+
|
143
|
+
# Extract declarations, startacts and start from expressions
|
144
|
+
declarations, expressions = expressions.partition {|op| op.is_a?(Array)}
|
145
|
+
prefixes, bases = declarations.partition {|op| op.first == :prefix}
|
146
|
+
semacts, expressions = expressions.partition {|op| op.is_a?(Algebra::SemAct)}
|
147
|
+
starts, expressions = expressions.partition {|op| op.is_a?(Algebra::Start)}
|
180
148
|
|
181
|
-
|
182
|
-
|
149
|
+
operands = []
|
150
|
+
operands += bases unless bases.empty?
|
151
|
+
unless prefixes.empty?
|
152
|
+
operands << [:prefix, prefixes.map {|p| p[1,2]}]
|
153
|
+
end
|
154
|
+
operands += semacts
|
155
|
+
operands += starts
|
156
|
+
operands << expressions.unshift(:shapes) unless expressions.empty?
|
157
|
+
Algebra::Schema.new(*operands, **self.options)
|
183
158
|
end
|
159
|
+
start_production(:_shexDoc_2, as_hash: true)
|
160
|
+
start_production(:_shexDoc_3, as_hash: true)
|
184
161
|
|
185
|
-
# [2] directive ::= baseDecl | prefixDecl
|
162
|
+
# [2] directive ::= baseDecl | prefixDecl | importDecl
|
186
163
|
|
187
164
|
# [3] baseDecl ::= "BASE" IRIREF
|
188
|
-
|
189
|
-
|
165
|
+
start_production(:baseDecl, as_hash: true, insensitive_strings: :lower)
|
166
|
+
production(:baseDecl) do |value|
|
167
|
+
self.base_uri = iri(value[:IRIREF])
|
168
|
+
[:base, self.base_uri]
|
190
169
|
end
|
191
170
|
|
192
171
|
# [4] prefixDecl ::= "PREFIX" PNAME_NS IRIREF
|
193
|
-
|
194
|
-
|
195
|
-
|
196
|
-
(
|
172
|
+
start_production(:prefixDecl, as_hash: true, insensitive_strings: :lower)
|
173
|
+
production(:prefixDecl) do |value|
|
174
|
+
pfx = value[:PNAME_NS]
|
175
|
+
prefix(pfx, value[:IRIREF])
|
176
|
+
[:prefix, pfx.to_s, value[:IRIREF]]
|
177
|
+
end
|
178
|
+
|
179
|
+
# [4] importDecl ::= "IMPORT" IRIREF
|
180
|
+
start_production(:importDecl, as_hash: true, insensitive_strings: :lower)
|
181
|
+
production(:importDecl) do |value|
|
182
|
+
Algebra::Import.new(value[:IRIREF], **self.options)
|
197
183
|
end
|
198
184
|
|
199
185
|
# [5] notStartAction ::= start | shapeExprDecl
|
200
|
-
# [6] start ::= "
|
201
|
-
|
202
|
-
|
186
|
+
# [6] start ::= "START" '=' inlineShapeExpression
|
187
|
+
start_production(:start, as_hash: true, insensitive_strings: :lower)
|
188
|
+
production(:start) do |value|
|
189
|
+
Algebra::Start.new(value[:inlineShapeExpression], **self.options)
|
203
190
|
end
|
191
|
+
|
204
192
|
# [7] startActions ::= codeDecl+
|
205
193
|
|
206
194
|
# [8] statement ::= directive | notStartAction
|
207
195
|
|
208
|
-
# [9] shapeExprDecl ::=
|
209
|
-
|
210
|
-
|
211
|
-
|
196
|
+
# [9] shapeExprDecl ::= shapeExprLabel (shapeExpression | "EXTERNAL")
|
197
|
+
start_production(:shapeExprDecl, as_hash: true)
|
198
|
+
production(:shapeExprDecl) do |value|
|
199
|
+
id = value[:shapeExprLabel]
|
200
|
+
expression = case value[:_shapeExprDecl_1]
|
212
201
|
when Algebra::NodeConstraint, Algebra::Or, Algebra::And, Algebra::Not, Algebra::Shape, RDF::Resource
|
213
|
-
|
202
|
+
value[:_shapeExprDecl_1]
|
203
|
+
when /external/i
|
204
|
+
Algebra::External.new(**options)
|
214
205
|
else
|
215
|
-
|
206
|
+
Algebra::Shape.new(**options)
|
216
207
|
end
|
217
208
|
expression.id = id if id && !expression.is_a?(RDF::Resource)
|
218
209
|
|
219
|
-
|
210
|
+
expression
|
220
211
|
end
|
221
212
|
|
222
|
-
# [10] shapeExpression
|
223
|
-
|
224
|
-
|
225
|
-
production(:shapeExpression) do |input, data, callback|
|
226
|
-
expression = Array(data[:shapeExpression]).first || data[:shape]
|
227
|
-
expression = Algebra::Not.new(expression) if data[:not]
|
228
|
-
(input[:shapeExpression] ||= []) << expression
|
213
|
+
# [10] shapeExpression ::= shapeOr
|
214
|
+
production(:shapeExpression) do |value|
|
215
|
+
value.first[:shapeOr]
|
229
216
|
end
|
230
217
|
|
231
218
|
# [11] inlineShapeExpression ::= inlineShapeOr
|
232
|
-
|
233
|
-
|
234
|
-
start_production(:shapeOrA) do |input, data, callback|
|
235
|
-
data[:shapeExpression] = input.delete(:shapeExpression)
|
236
|
-
data[:shapeExpression] ||= Array(input.delete(:shape)) if input[:shape]
|
237
|
-
data[:shapeExpression] = [Algebra::Not.new(*data[:shapeExpression])] if input.delete(:not)
|
219
|
+
production(:inlineShapeExpression) do |value|
|
220
|
+
value.first[:inlineShapeOr]
|
238
221
|
end
|
239
|
-
|
240
|
-
|
241
|
-
|
242
|
-
|
243
|
-
|
244
|
-
|
245
|
-
|
246
|
-
|
247
|
-
|
248
|
-
|
249
|
-
shape_and(input, data)
|
222
|
+
|
223
|
+
# [12] shapeOr ::= shapeAnd ("OR" shapeAnd)*
|
224
|
+
start_production(:shapeOr, as_hash: true)
|
225
|
+
production(:shapeOr) do |value|
|
226
|
+
if value[:_shapeOr_1].empty?
|
227
|
+
value[:shapeAnd]
|
228
|
+
else
|
229
|
+
lhs = value[:_shapeOr_1].map {|v| v.last[:shapeAnd]}
|
230
|
+
Algebra::Or.new(value[:shapeAnd], *lhs, **self.options)
|
231
|
+
end
|
250
232
|
end
|
233
|
+
start_production(:_shapeOr_2, insensitive_strings: :lower)
|
251
234
|
|
252
235
|
# [13] inlineShapeOr ::= inlineShapeAnd ("OR" inlineShapeAnd)*
|
253
|
-
|
254
|
-
|
255
|
-
|
256
|
-
|
257
|
-
input.merge!(data.dup.keep_if {|k, v| [:closed, :extraPropertySet, :codeDecl].include?(k)})
|
258
|
-
expression = if Array(data[:shapeExpression]).length > 1
|
259
|
-
Algebra::Or.new(*data[:shapeExpression])
|
236
|
+
start_production(:inlineShapeOr, as_hash: true)
|
237
|
+
production(:inlineShapeOr) do |value|
|
238
|
+
if value[:_inlineShapeOr_1].empty?
|
239
|
+
value[:inlineShapeAnd]
|
260
240
|
else
|
261
|
-
|
241
|
+
lhs = value[:_inlineShapeOr_1].map {|v| v.last[:inlineShapeAnd]}
|
242
|
+
Algebra::Or.new(value[:inlineShapeAnd], *lhs, **self.options)
|
262
243
|
end
|
263
|
-
(input[:shapeExpression] ||= []) << expression if expression
|
264
|
-
rescue ArgumentError => e
|
265
|
-
error(nil, "Argument Error on OR: #{e.message}")
|
266
244
|
end
|
267
|
-
|
245
|
+
start_production(:_inlineShapeOr_2, insensitive_strings: :lower)
|
268
246
|
|
269
247
|
# [14] shapeAnd ::= shapeNot ("AND" shapeNot)*
|
270
|
-
|
271
|
-
|
272
|
-
|
273
|
-
|
274
|
-
|
275
|
-
|
276
|
-
|
277
|
-
def shape_and(input, data)
|
278
|
-
input.merge!(data.dup.keep_if {|k, v| [:closed, :extraPropertySet, :codeDecl].include?(k)})
|
279
|
-
expressions = Array(data[:shapeExpression]).inject([]) do |memo, expr|
|
280
|
-
#memo.concat(expr.is_a?(Algebra::And) ? expr.operands : [expr])
|
281
|
-
memo.concat([expr])
|
248
|
+
start_production(:shapeAnd, as_hash: true)
|
249
|
+
production(:shapeAnd) do |value|
|
250
|
+
if value[:_shapeAnd_1].empty?
|
251
|
+
value[:shapeNot]
|
252
|
+
else
|
253
|
+
lhs = value[:_shapeAnd_1].map {|v| v.last[:shapeNot]}
|
254
|
+
Algebra::And.new(value[:shapeNot], *lhs, **self.options)
|
282
255
|
end
|
256
|
+
end
|
257
|
+
start_production(:_shapeAnd_2, insensitive_strings: :lower)
|
283
258
|
|
284
|
-
|
285
|
-
|
259
|
+
# [15] inlineShapeAnd ::= inlineShapeNot ("AND" inlineShapeNot)*
|
260
|
+
start_production(:inlineShapeAnd, as_hash: true)
|
261
|
+
production(:inlineShapeAnd) do |value|
|
262
|
+
if value[:_inlineShapeAnd_1].empty?
|
263
|
+
value[:inlineShapeNot]
|
286
264
|
else
|
287
|
-
|
265
|
+
lhs = value[:_inlineShapeAnd_1].map {|v| v.last[:inlineShapeNot]}
|
266
|
+
Algebra::And.new(value[:inlineShapeNot], *lhs, **self.options)
|
288
267
|
end
|
289
|
-
(input[:shapeExpression] ||= []) << expression if expression
|
290
|
-
rescue ArgumentError => e
|
291
|
-
error(nil, "Argument Error on AND: #{e.message}")
|
292
268
|
end
|
293
|
-
|
269
|
+
start_production(:_inlineShapeAnd_2, insensitive_strings: :lower)
|
294
270
|
|
295
271
|
# [16] shapeNot ::= "NOT"? shapeAtom
|
296
|
-
|
297
|
-
|
272
|
+
start_production(:shapeNot, as_hash: true)
|
273
|
+
production(:shapeNot) do |value|
|
274
|
+
atom = value[:shapeAtom]
|
275
|
+
value[:_shapeNot_1] ? Algebra::Not.new(atom || Algebra::Shape.new(**options), **self.options) : atom
|
298
276
|
end
|
277
|
+
start_production(:_shapeNot_1, insensitive_strings: :lower)
|
278
|
+
|
299
279
|
# [17] inlineShapeNot ::= "NOT"? inlineShapeAtom
|
300
|
-
|
301
|
-
|
280
|
+
start_production(:inlineShapeNot, as_hash: true)
|
281
|
+
production(:inlineShapeNot) do |value|
|
282
|
+
atom = value[:inlineShapeAtom]
|
283
|
+
value[:_inlineShapeNot_1] ? Algebra::Not.new(atom || Algebra::Shape.new(**options), **self.options) : atom
|
302
284
|
end
|
303
|
-
|
304
|
-
input.merge!(data.dup.keep_if {|k, v| [:closed, :extraPropertySet, :codeDecl].include?(k)})
|
305
|
-
expression = Array(data[:shapeExpression]).first
|
306
|
-
expression = Algebra::Not.new(expression) if data[:not]
|
307
|
-
#error(nil, "Expected an atom for NOT") unless expression
|
308
|
-
(input[:shapeExpression] ||= []) << expression if expression
|
309
|
-
end
|
310
|
-
private :shape_not
|
285
|
+
start_production(:_inlineShapeNot_1, insensitive_strings: :lower)
|
311
286
|
|
312
|
-
# [18] shapeAtom ::=
|
313
|
-
# |
|
287
|
+
# [18] shapeAtom ::= nonLitNodeConstraint shapeOrRef?
|
288
|
+
# | litNodeConstraint
|
289
|
+
# | shapeOrRef nonLitNodeConstraint?
|
314
290
|
# | "(" shapeExpression ")"
|
315
291
|
# | '.' # no constraint
|
316
|
-
production(:shapeAtom) do |
|
317
|
-
|
292
|
+
production(:shapeAtom) do |value|
|
293
|
+
expressions = case
|
294
|
+
when value.is_a?(Algebra::Operator)
|
295
|
+
[value]
|
296
|
+
when value == '.' then []
|
297
|
+
when value[:nonLitNodeConstraint]
|
298
|
+
[value[:nonLitNodeConstraint], value[:_shapeAtom_4]].compact
|
299
|
+
when value[:shapeOrRef]
|
300
|
+
[value[:shapeOrRef], value[:_shapeAtom_5]].compact
|
301
|
+
when value[:_shapeAtom_3]
|
302
|
+
value[:_shapeAtom_3]
|
303
|
+
else []
|
304
|
+
end
|
305
|
+
|
306
|
+
case expressions.length
|
307
|
+
when 0 then nil
|
308
|
+
when 1 then expressions.first
|
309
|
+
else Algebra::And.new(*expressions, **self.options)
|
310
|
+
end
|
318
311
|
end
|
312
|
+
start_production(:_shapeAtom_1, as_hash: true)
|
313
|
+
start_production(:_shapeAtom_2, as_hash: true)
|
314
|
+
production(:_shapeAtom_3) do |value|
|
315
|
+
value[1][:shapeExpression]
|
316
|
+
end
|
317
|
+
|
318
|
+
# [19] shapeAtomNoRef ::= nonLitNodeConstraint shapeOrRef?
|
319
|
+
# | litNodeConstraint
|
320
|
+
# | shapeDefinition nonLitNodeConstraint?
|
321
|
+
# | "(" shapeExpression ")"
|
322
|
+
# | '.' # no constraint
|
323
|
+
production(:shapeAtomNoRef) do |value|
|
324
|
+
expressions = case
|
325
|
+
when value.is_a?(Algebra::Operator)
|
326
|
+
[value]
|
327
|
+
when value == '.' then []
|
328
|
+
when value[:nonLitNodeConstraint]
|
329
|
+
[value[:nonLitNodeConstraint], value[:_shapeAtomNoRef_4]].compact
|
330
|
+
when value[:shapeDefinition]
|
331
|
+
[value[:shapeDefinition], value[:_shapeAtomNoRef_5]].compact
|
332
|
+
when value[:_shapeAtomNoRef_3]
|
333
|
+
value[:_shapeAtomNoRef_3]
|
334
|
+
else []
|
335
|
+
end
|
319
336
|
|
320
|
-
|
321
|
-
|
322
|
-
|
323
|
-
|
324
|
-
|
325
|
-
|
337
|
+
case expressions.length
|
338
|
+
when 0 then nil
|
339
|
+
when 1 then expressions.first
|
340
|
+
else Algebra::And.new(*expressions, **self.options)
|
341
|
+
end
|
342
|
+
end
|
343
|
+
start_production(:_shapeAtomNoRef_1, as_hash: true)
|
344
|
+
start_production(:_shapeAtomNoRef_2, as_hash: true)
|
345
|
+
production(:_shapeAtomNoRef_3) do |value|
|
346
|
+
value[1][:shapeExpression]
|
326
347
|
end
|
327
348
|
|
328
|
-
# [20] inlineShapeAtom ::=
|
329
|
-
# |
|
349
|
+
# [20] inlineShapeAtom ::= nonLitNodeConstraint inlineShapeOrRef?
|
350
|
+
# | litNodeConstraint
|
351
|
+
# | inlineShapeOrRef nonLitNodeConstraint?
|
330
352
|
# | "(" shapeExpression ")"
|
331
353
|
# | '.' # no constraint
|
332
|
-
production(:inlineShapeAtom) do |
|
333
|
-
|
334
|
-
|
335
|
-
|
336
|
-
|
337
|
-
|
338
|
-
|
354
|
+
production(:inlineShapeAtom) do |value|
|
355
|
+
expressions = case
|
356
|
+
when value == '.' then []
|
357
|
+
when value.is_a?(Algebra::Operator)
|
358
|
+
[value]
|
359
|
+
when value[:nonLitNodeConstraint]
|
360
|
+
[value[:nonLitNodeConstraint], value[:_inlineShapeAtom_4]].compact
|
361
|
+
when value[:inlineShapeOrRef]
|
362
|
+
[value[:inlineShapeOrRef], value[:__inlineShapeAtom_5]].compact
|
363
|
+
when value[:_inlineShapeAtom_3]
|
364
|
+
value[:_inlineShapeAtom_3]
|
365
|
+
else []
|
366
|
+
end
|
339
367
|
|
340
|
-
|
341
|
-
expression = case expression.length
|
368
|
+
case expressions.length
|
342
369
|
when 0 then nil
|
343
|
-
when 1 then
|
344
|
-
else
|
370
|
+
when 1 then expressions.first
|
371
|
+
else Algebra::And.new(*expressions, **self.options)
|
345
372
|
end
|
346
|
-
|
347
|
-
(input[:shapeExpression] ||= []) << expression if expression
|
348
373
|
end
|
349
|
-
|
374
|
+
start_production(:_inlineShapeAtom_1, as_hash: true)
|
375
|
+
start_production(:_inlineShapeAtom_2, as_hash: true)
|
376
|
+
production(:_inlineShapeAtom_3) do |value|
|
377
|
+
value[1][:shapeExpression]
|
378
|
+
end
|
350
379
|
|
351
380
|
# [21] shapeOrRef ::= shapeDefinition | shapeRef
|
352
|
-
production(:shapeOrRef) do |input, data, callback|
|
353
|
-
shape_or_ref(input, data)
|
354
|
-
end
|
355
381
|
# [22] inlineShapeOrRef ::= inlineShapeDefinition | shapeRef
|
356
|
-
production(:inlineShapeOrRef) do |input, data, callback|
|
357
|
-
shape_or_ref(input, data)
|
358
|
-
end
|
359
|
-
def shape_or_ref(input, data)
|
360
|
-
input.merge!(data.dup.keep_if {|k, v| [:closed, :extraPropertySet, :codeDecl].include?(k)})
|
361
|
-
input[:shapeOrRef] = data[:shape] if data[:shape]
|
362
|
-
rescue ArgumentError => e
|
363
|
-
error(nil, "Argument Error on ShapeOrRef: #{e.message}")
|
364
|
-
end
|
365
|
-
private :shape_or_ref
|
366
382
|
|
367
|
-
# [23] shapeRef ::= ATPNAME_LN | ATPNAME_NS | '@'
|
368
|
-
production(:shapeRef) do |
|
369
|
-
|
383
|
+
# [23] shapeRef ::= ATPNAME_LN | ATPNAME_NS | '@' shapeExprLabel
|
384
|
+
production(:shapeRef) do |value|
|
385
|
+
value.is_a?(Array) ? value.last[:shapeExprLabel] : value
|
370
386
|
end
|
371
387
|
|
372
388
|
# [24] litNodeConstraint ::= "LITERAL" xsFacet*
|
373
389
|
# | datatype xsFacet*
|
374
390
|
# | valueSet xsFacet*
|
375
391
|
# | numericFacet+
|
376
|
-
|
377
|
-
|
378
|
-
|
379
|
-
|
380
|
-
|
381
|
-
|
382
|
-
|
392
|
+
start_production(:_litNodeConstraint_1, as_hash: true, insensitive_strings: :lower)
|
393
|
+
production(:_litNodeConstraint_1) do |value|
|
394
|
+
# LITERAL" xsFacet*
|
395
|
+
facets = value[:_litNodeConstraint_5]
|
396
|
+
validate_facets(facets, :litNodeConstraint)
|
397
|
+
Algebra::NodeConstraint.new(:literal, *facets, **self.options)
|
398
|
+
end
|
399
|
+
start_production(:_litNodeConstraint_2, as_hash: true)
|
400
|
+
production(:_litNodeConstraint_2) do |value|
|
401
|
+
# datatype xsFacet*
|
402
|
+
facets = value[:_litNodeConstraint_6]
|
403
|
+
validate_facets(facets, :litNodeConstraint)
|
404
|
+
|
405
|
+
# Numeric Facet Constraints can only be used when datatype is derived from the set of SPARQL 1.1 Operand Data Types
|
406
|
+
l = RDF::Literal("0", datatype: value[:datatype])
|
407
|
+
facets.each do |f|
|
408
|
+
error(nil, "#{f.first} constraint may only be used once on a numeric datatype (#{value[:datatype]})", production: :litNodeConstraint) if
|
409
|
+
f.to_s.match(/digits|inclusive|exclusive/) &&
|
410
|
+
!l.is_a?(RDF::Literal::Numeric)
|
383
411
|
end
|
384
412
|
|
385
|
-
attrs = []
|
386
|
-
attrs
|
387
|
-
|
388
|
-
|
389
|
-
|
390
|
-
|
391
|
-
|
392
|
-
|
413
|
+
attrs = [[:datatype, value[:datatype]]] + facets
|
414
|
+
Algebra::NodeConstraint.new(*attrs.compact, **self.options)
|
415
|
+
end
|
416
|
+
start_production(:_litNodeConstraint_3, as_hash: true)
|
417
|
+
production(:_litNodeConstraint_3) do |value|
|
418
|
+
# valueSet xsFacet*
|
419
|
+
facets = value[:_litNodeConstraint_7]
|
420
|
+
validate_facets(facets, :litNodeConstraint)
|
421
|
+
attrs = value[:valueSet]+ facets
|
422
|
+
Algebra::NodeConstraint.new(*attrs.compact, **self.options)
|
423
|
+
end
|
424
|
+
production(:_litNodeConstraint_4) do |value|
|
425
|
+
# numericFacet+
|
426
|
+
validate_facets(value, :litNodeConstraint)
|
427
|
+
Algebra::NodeConstraint.new(*value, **self.options)
|
393
428
|
end
|
394
429
|
|
395
430
|
# [25] nonLitNodeConstraint ::= nonLiteralKind stringFacet*
|
396
431
|
# | stringFacet+
|
397
|
-
|
398
|
-
|
399
|
-
|
400
|
-
|
401
|
-
|
402
|
-
attrs
|
403
|
-
|
404
|
-
|
432
|
+
start_production(:_nonLitNodeConstraint_1, as_hash: true)
|
433
|
+
production(:_nonLitNodeConstraint_1) do |value|
|
434
|
+
# nonLiteralKind stringFacet*
|
435
|
+
facets = Array(value[:_nonLitNodeConstraint_3])
|
436
|
+
validate_facets(facets, :nonLitNodeConstraint)
|
437
|
+
attrs = Array(value[:nonLiteralKind]) + facets
|
438
|
+
Algebra::NodeConstraint.new(*attrs.compact, **self.options)
|
439
|
+
end
|
440
|
+
production(:_nonLitNodeConstraint_2) do |value|
|
441
|
+
# stringFacet+
|
442
|
+
validate_facets(value, :nonLitNodeConstraint)
|
443
|
+
Algebra::NodeConstraint.new(*value, **self.options)
|
444
|
+
end
|
445
|
+
|
446
|
+
def validate_facets(facets, prod)
|
447
|
+
facets.each do |facet|
|
448
|
+
if facets.count {|f| f.first == facet.first} > 1
|
449
|
+
error(nil, "#{facet.first} constraint may only be used once in a Node Constraint", production: prod)
|
450
|
+
end
|
451
|
+
end
|
405
452
|
end
|
453
|
+
private :validate_facets
|
406
454
|
|
407
455
|
# [26] nonLiteralKind ::= "IRI" | "BNODE" | "NONLITERAL"
|
456
|
+
start_production(:nonLiteralKind, insensitive_strings: :lower)
|
457
|
+
production(:nonLiteralKind) do |value|
|
458
|
+
value.to_sym
|
459
|
+
end
|
408
460
|
|
409
461
|
# [27] xsFacet ::= stringFacet | numericFacet
|
410
462
|
# [28] stringFacet ::= stringLength INTEGER
|
411
463
|
# | REGEXP
|
412
|
-
production(:stringFacet) do |
|
413
|
-
|
414
|
-
|
415
|
-
|
416
|
-
|
417
|
-
|
418
|
-
[data[:stringLength], data[:literal]]
|
419
|
-
elsif re = data[:regexp]
|
420
|
-
unless re =~ %r(^/(.*)/([smix]*)$)
|
421
|
-
error(nil, "#{re.inspect} regular expression must be in the form /pattern/flags?", production: :stringFacet)
|
464
|
+
production(:stringFacet) do |value|
|
465
|
+
if value.is_a?(Array) # stringLength
|
466
|
+
value
|
467
|
+
else
|
468
|
+
unless value =~ %r(^/(.*)/([smix]*)$)
|
469
|
+
error(nil, "#{value.inspect} regular expression must be in the form /pattern/flags?", production: :stringFacet)
|
422
470
|
end
|
471
|
+
|
423
472
|
flags = $2 unless $2.to_s.empty?
|
424
473
|
pattern = $1.gsub('\\/', '/').gsub(UCHAR) do
|
425
474
|
[($1 || $2).hex].pack('U*')
|
426
475
|
end.force_encoding(Encoding::UTF_8)
|
427
476
|
|
428
477
|
# Any other escaped character is a syntax error
|
429
|
-
if pattern.match(%r([^\\]\\[^nrt/\\|\.?*+\[\]\(\){}$#x2D#x5B#x5D#x5E-]))
|
478
|
+
if pattern.match?(%r([^\\]\\[^nrt/\\|\.?*+\[\]\(\){}$#x2D#x5B#x5D#x5E-]))
|
430
479
|
error(nil, "Regexp contains illegal escape: #{pattern.inspect}", production: :stringFacet)
|
431
480
|
end
|
432
481
|
|
433
482
|
[:pattern, pattern, flags].compact
|
434
483
|
end
|
435
484
|
end
|
485
|
+
start_production(:_stringFacet_1, as_hash: true)
|
486
|
+
production(:_stringFacet_1) do |value|
|
487
|
+
[value[:stringLength].to_sym, value[:INTEGER]]
|
488
|
+
end
|
436
489
|
|
437
490
|
# [29] stringLength ::= "LENGTH" | "MINLENGTH" | "MAXLENGTH"
|
491
|
+
start_production(:stringLength, insensitive_strings: :lower)
|
438
492
|
|
439
|
-
# [30] numericFacet ::= numericRange
|
493
|
+
# [30] numericFacet ::= numericRange numericLiteral
|
440
494
|
# | numericLength INTEGER
|
441
|
-
|
442
|
-
|
443
|
-
|
444
|
-
|
445
|
-
|
446
|
-
|
447
|
-
|
448
|
-
[data[:numericLength], data[:literal]]
|
449
|
-
end
|
495
|
+
start_production(:_numericFacet_1, as_hash: true)
|
496
|
+
production(:_numericFacet_1) do |value|
|
497
|
+
[value[:numericRange].to_sym, value[:numericLiteral]]
|
498
|
+
end
|
499
|
+
start_production(:_numericFacet_2, as_hash: true)
|
500
|
+
production(:_numericFacet_2) do |value|
|
501
|
+
[value[:numericLength].to_sym, value[:INTEGER]]
|
450
502
|
end
|
451
503
|
|
452
504
|
# [31] numericRange ::= "MININCLUSIVE" | "MINEXCLUSIVE" | "MAXINCLUSIVE" | "MAXEXCLUSIVE"
|
505
|
+
start_production(:numericRange, insensitive_strings: :lower)
|
506
|
+
|
453
507
|
# [32] numericLength ::= "TOTALDIGITS" | "FRACTIONDIGITS"
|
508
|
+
start_production(:numericLength, insensitive_strings: :lower)
|
454
509
|
|
455
510
|
# [33] shapeDefinition ::= (includeSet | extraPropertySet | "CLOSED")* '{' tripleExpression? '}' annotation* semanticActions
|
456
|
-
|
457
|
-
|
511
|
+
start_production(:shapeDefinition, as_hash: true)
|
512
|
+
production(:shapeDefinition) do |value|
|
513
|
+
shape_definition(
|
514
|
+
value[:_shapeDefinition_1],
|
515
|
+
value[:_shapeDefinition_2],
|
516
|
+
value[:_shapeDefinition_3],
|
517
|
+
value[:semanticActions])
|
458
518
|
end
|
519
|
+
start_production(:_shapeDefinition_4, insensitive_strings: :lower)
|
520
|
+
|
459
521
|
# [34] inlineShapeDefinition ::= (includeSet | extraPropertySet | "CLOSED")* '{' tripleExpression? '}'
|
460
|
-
|
461
|
-
|
462
|
-
|
463
|
-
|
464
|
-
|
465
|
-
|
466
|
-
|
467
|
-
|
522
|
+
start_production(:inlineShapeDefinition, as_hash: true)
|
523
|
+
production(:inlineShapeDefinition) do |value|
|
524
|
+
shape_definition(
|
525
|
+
value[:_inlineShapeDefinition_1],
|
526
|
+
value[:_inlineShapeDefinition_2])
|
527
|
+
end
|
528
|
+
def shape_definition(extra_closed, expression, annotations = [], semact = [])
|
529
|
+
closed = extra_closed.any? {|v| v.to_s == 'closed'}
|
530
|
+
extra = extra_closed.reject {|v| v.to_s == 'closed'}
|
531
|
+
attrs = extra
|
532
|
+
attrs << :closed if closed
|
468
533
|
attrs << expression if expression
|
469
|
-
attrs +=
|
470
|
-
attrs +=
|
534
|
+
attrs += annotations
|
535
|
+
attrs += semact
|
471
536
|
|
472
|
-
|
537
|
+
Algebra::Shape.new(*attrs, **self.options)
|
473
538
|
end
|
474
539
|
private :shape_definition
|
475
540
|
|
476
541
|
# [35] extraPropertySet ::= "EXTRA" predicate+
|
477
|
-
|
478
|
-
|
542
|
+
start_production(:extraPropertySet, insensitive_strings: :lower)
|
543
|
+
production(:extraPropertySet) do |value|
|
544
|
+
value.last[:_extraPropertySet_1].unshift(:extra)
|
479
545
|
end
|
480
546
|
|
481
547
|
# [36] tripleExpression ::= oneOfTripleExpr
|
482
|
-
|
483
|
-
|
484
|
-
expression = if Array(data[:tripleExpression]).length > 1
|
485
|
-
Algebra::OneOf.new(*data[:tripleExpression])
|
486
|
-
else
|
487
|
-
Array(data[:tripleExpression]).first
|
488
|
-
end
|
489
|
-
input[:tripleExpression] = expression if expression
|
548
|
+
production(:tripleExpression) do |value|
|
549
|
+
value.first[:oneOfTripleExpr]
|
490
550
|
end
|
491
551
|
|
492
|
-
# [
|
493
|
-
|
494
|
-
|
495
|
-
|
496
|
-
|
497
|
-
|
498
|
-
|
499
|
-
|
552
|
+
# [37] oneOfTripleExpr ::= groupTripleExpr ('|' groupTripleExpr)*
|
553
|
+
start_production(:oneOfTripleExpr, as_hash: true)
|
554
|
+
production(:oneOfTripleExpr) do |value|
|
555
|
+
expressions = [value[:groupTripleExpr]] + value[:_oneOfTripleExpr_1]
|
556
|
+
expressions.length == 1 ? expressions.first : Algebra::OneOf.new(*expressions, **self.options)
|
557
|
+
end
|
558
|
+
production(:_oneOfTripleExpr_2) do |value|
|
559
|
+
value.last[:groupTripleExpr]
|
500
560
|
end
|
501
561
|
|
502
|
-
# [
|
503
|
-
|
504
|
-
|
505
|
-
|
506
|
-
|
507
|
-
|
562
|
+
# [40] groupTripleExpr ::= unaryTripleExpr (';' unaryTripleExpr?)*
|
563
|
+
start_production(:groupTripleExpr, as_hash: true)
|
564
|
+
production(:groupTripleExpr) do |value|
|
565
|
+
expressions = [value[:unaryTripleExpr]] + value[:_groupTripleExpr_1]
|
566
|
+
expressions.length == 1 ? expressions.first : Algebra::EachOf.new(*expressions, **self.options)
|
567
|
+
end
|
568
|
+
production(:_groupTripleExpr_2) do |value|
|
569
|
+
value.last[:_groupTripleExpr_3]
|
508
570
|
end
|
509
571
|
|
510
|
-
# [
|
511
|
-
|
512
|
-
|
572
|
+
# [43] unaryTripleExpr ::= ('$' tripleExprLabel)? (tripleConstraint | bracketedTripleExpr) | include
|
573
|
+
start_production(:_unaryTripleExpr_1, as_hash: true)
|
574
|
+
production(:_unaryTripleExpr_1) do |value|
|
575
|
+
expression = value[:_unaryTripleExpr_3]
|
576
|
+
expression.id = value[:_unaryTripleExpr_2] if expression && value[:_unaryTripleExpr_2]
|
577
|
+
|
578
|
+
expression
|
579
|
+
end
|
580
|
+
production(:_unaryTripleExpr_4) do |value|
|
581
|
+
# '$' tripleExprLabel
|
582
|
+
value.last[:tripleExprLabel]
|
513
583
|
end
|
514
584
|
|
515
|
-
# [44] bracketedTripleExpr ::= '('
|
516
|
-
|
517
|
-
|
518
|
-
case expression =
|
519
|
-
when Algebra::
|
585
|
+
# [44] bracketedTripleExpr ::= '(' tripleExpression ')' cardinality? annotation* semanticActions
|
586
|
+
start_production(:bracketedTripleExpr, as_hash: true)
|
587
|
+
production(:bracketedTripleExpr) do |value|
|
588
|
+
case expression = value[:tripleExpression]
|
589
|
+
when Algebra::TripleExpression
|
520
590
|
else
|
521
|
-
error(nil, "Bracketed Expression requires
|
591
|
+
error(nil, "Bracketed Expression requires contained triple expression", production: :bracketedTripleExpr)
|
522
592
|
end
|
523
|
-
cardinality =
|
593
|
+
cardinality = value[:_bracketedTripleExpr_1] || {}
|
524
594
|
attrs = [
|
525
595
|
([:min, cardinality[:min]] if cardinality[:min]),
|
526
596
|
([:max, cardinality[:max]] if cardinality[:max])
|
527
597
|
].compact
|
528
|
-
attrs +=
|
529
|
-
attrs += Array(
|
598
|
+
attrs += value[:semanticActions]
|
599
|
+
attrs += Array(value[:_bracketedTripleExpr_2])
|
530
600
|
|
531
601
|
expression.operands.concat(attrs)
|
532
|
-
|
602
|
+
expression
|
533
603
|
end
|
534
604
|
|
535
|
-
# [45] tripleConstraint ::= senseFlags? predicate
|
536
|
-
|
537
|
-
|
605
|
+
# [45] tripleConstraint ::= senseFlags? predicate inlineShapeExpression cardinality? annotation* semanticActions
|
606
|
+
start_production(:tripleConstraint, as_hash: true)
|
607
|
+
production(:tripleConstraint) do |value|
|
608
|
+
cardinality = value[:_tripleConstraint_2] || {}
|
538
609
|
attrs = [
|
539
|
-
(:inverse if
|
540
|
-
[:predicate,
|
541
|
-
|
610
|
+
(:inverse if value[:_tripleConstraint_1]),
|
611
|
+
[:predicate, value[:predicate]],
|
612
|
+
value[:inlineShapeExpression],
|
542
613
|
([:min, cardinality[:min]] if cardinality[:min]),
|
543
614
|
([:max, cardinality[:max]] if cardinality[:max])
|
544
615
|
].compact
|
545
|
-
attrs +=
|
546
|
-
attrs +=
|
616
|
+
attrs += value[:_tripleConstraint_3]
|
617
|
+
attrs += value[:semanticActions]
|
547
618
|
|
548
|
-
|
619
|
+
Algebra::TripleConstraint.new(*attrs, **self.options) # unless attrs.empty?
|
549
620
|
end
|
550
621
|
|
551
622
|
# [46] cardinality ::= '*' | '+' | '?' | REPEAT_RANGE
|
623
|
+
production(:cardinality) do |value|
|
624
|
+
case value
|
625
|
+
when '*' then {min: 0, max: "*"}
|
626
|
+
when '+' then {min: 1, max: "*"}
|
627
|
+
when '?' then {min: 0, max: 1}
|
628
|
+
else value
|
629
|
+
end
|
630
|
+
end
|
631
|
+
|
552
632
|
# [47] senseFlags ::= '^'
|
553
633
|
# [48] valueSet ::= '[' valueSetValue* ']'
|
634
|
+
production(:valueSet) do |value|
|
635
|
+
value[1][:_valueSet_1]
|
636
|
+
end
|
554
637
|
|
555
638
|
# [49] valueSetValue ::= iriRange | literalRange | languageRange | '.' exclusion+
|
556
|
-
production(:valueSetValue) do |
|
557
|
-
|
558
|
-
|
559
|
-
|
560
|
-
|
561
|
-
|
562
|
-
|
563
|
-
|
564
|
-
|
565
|
-
|
566
|
-
|
567
|
-
|
568
|
-
|
569
|
-
|
570
|
-
|
571
|
-
|
572
|
-
|
573
|
-
|
574
|
-
|
575
|
-
|
639
|
+
production(:valueSetValue) do |value|
|
640
|
+
Algebra::Value.new(value, **self.options)
|
641
|
+
end
|
642
|
+
production(:_valueSetValue_1) do |value|
|
643
|
+
# All exclusions must be consistent IRI/Literal/Language
|
644
|
+
value = value.last[:_valueSetValue_2]
|
645
|
+
case value.first
|
646
|
+
when Algebra::IriStem, RDF::URI
|
647
|
+
unless value.all? {|e| e.is_a?(Algebra::IriStem) || e.is_a?(RDF::URI)}
|
648
|
+
error(nil, "Exclusions must all be IRI type")
|
649
|
+
end
|
650
|
+
Algebra::IriStemRange.new(:wildcard, value.unshift(:exclusions), **self.options)
|
651
|
+
when Algebra::LiteralStem, RDF::Literal
|
652
|
+
unless value.all? {|e| e.is_a?(Algebra::LiteralStem) || e.is_a?(RDF::Literal)}
|
653
|
+
error(nil, "Exclusions must all be Literal type")
|
654
|
+
end
|
655
|
+
Algebra::LiteralStemRange.new(:wildcard, value.unshift(:exclusions), **self.options)
|
656
|
+
else
|
657
|
+
unless value.all? {|e| e.is_a?(Algebra::LanguageStem) || e.is_a?(String)}
|
658
|
+
error(nil, "Exclusions must all be Language type")
|
576
659
|
end
|
660
|
+
Algebra::LanguageStemRange.new(:wildcard, value.unshift(:exclusions), **self.options)
|
577
661
|
end
|
578
|
-
(input[:valueSetValue] ||= []) << Algebra::Value.new(range)
|
579
662
|
end
|
580
663
|
|
581
|
-
# [50] exclusion ::= '-' (iri | literal | LANGTAG) '~'?
|
582
|
-
|
583
|
-
|
584
|
-
|
585
|
-
|
586
|
-
when
|
587
|
-
when
|
664
|
+
# [50] exclusion ::= '.' '-' (iri | literal | LANGTAG) '~'?
|
665
|
+
start_production(:exclusion, as_hash: true)
|
666
|
+
production(:exclusion) do |value|
|
667
|
+
if value[:_exclusion_2]
|
668
|
+
case value[:_exclusion_1]
|
669
|
+
when RDF::URI then Algebra::IriStem.new(value[:_exclusion_1], **self.options)
|
670
|
+
when RDF::Literal then Algebra::LiteralStem.new(value[:_exclusion_1], **self.options)
|
671
|
+
else Algebra::LanguageStem.new(value[:_exclusion_1], **self.options)
|
588
672
|
end
|
589
673
|
else
|
590
|
-
|
674
|
+
value[:_exclusion_1]
|
591
675
|
end
|
592
676
|
end
|
593
677
|
|
594
678
|
# [51] iriRange ::= iri ('~' iriExclusion*)?
|
595
|
-
production(:iriRange) do |
|
596
|
-
|
597
|
-
|
598
|
-
|
599
|
-
|
600
|
-
|
601
|
-
|
602
|
-
|
679
|
+
production(:iriRange) do |value|
|
680
|
+
iri = value.first[:iri]
|
681
|
+
if value.last[:_iriRange_1]
|
682
|
+
exclusions = value.last[:_iriRange_1].last[:_iriRange_3]
|
683
|
+
if exclusions.empty?
|
684
|
+
Algebra::IriStem.new(iri, **self.options)
|
685
|
+
else
|
686
|
+
Algebra::IriStemRange.new(iri, exclusions.unshift(:exclusions), **self.options)
|
687
|
+
end
|
603
688
|
else
|
604
|
-
|
689
|
+
iri
|
605
690
|
end
|
606
691
|
end
|
607
692
|
|
608
693
|
# [52] iriExclusion ::= '-' iri '~'?
|
609
|
-
|
610
|
-
|
611
|
-
|
694
|
+
start_production(:iriExclusion, as_hash: true)
|
695
|
+
production(:iriExclusion) do |value|
|
696
|
+
value[:_iriExclusion_1] ? Algebra::IriStem.new(value[:iri], **self.options) : value[:iri]
|
612
697
|
end
|
613
698
|
|
614
699
|
# [53] literalRange ::= literal ('~' literalExclusion*)?
|
615
|
-
production(:literalRange) do |
|
616
|
-
|
617
|
-
|
618
|
-
|
619
|
-
|
620
|
-
|
621
|
-
|
622
|
-
|
700
|
+
production(:literalRange) do |value|
|
701
|
+
lit = value.first[:literal]
|
702
|
+
if value.last[:_literalRange_1]
|
703
|
+
exclusions = value.last[:_literalRange_1].last[:_literalRange_3]
|
704
|
+
if exclusions.empty?
|
705
|
+
Algebra::LiteralStem.new(lit, **self.options)
|
706
|
+
else
|
707
|
+
Algebra::LiteralStemRange.new(lit, exclusions.unshift(:exclusions), **self.options)
|
708
|
+
end
|
623
709
|
else
|
624
|
-
|
710
|
+
lit
|
625
711
|
end
|
626
712
|
end
|
627
713
|
|
628
714
|
# [54] literalExclusion ::= '-' literal '~'?
|
629
|
-
|
630
|
-
|
631
|
-
|
715
|
+
start_production(:literalExclusion, as_hash: true)
|
716
|
+
production(:literalExclusion) do |value|
|
717
|
+
val = value[:literal]
|
718
|
+
value[:_literalExclusion_1] ? Algebra::LiteralStem.new(val, **self.options) : val
|
632
719
|
end
|
633
720
|
|
634
721
|
# [55] languageRange ::= LANGTAG ('~' languageExclusion*)?
|
635
|
-
|
636
|
-
|
637
|
-
|
638
|
-
|
639
|
-
|
640
|
-
|
641
|
-
|
642
|
-
|
722
|
+
# | '@' '~' languageExclusion*
|
723
|
+
start_production(:_languageRange_1, as_hash: true)
|
724
|
+
production(:_languageRange_1) do |value|
|
725
|
+
exclusions = value[:_languageRange_3] if value[:_languageRange_3]
|
726
|
+
pattern = !!value[:_languageRange_3]
|
727
|
+
if pattern && exclusions.empty?
|
728
|
+
Algebra::LanguageStem.new(value[:LANGTAG], **self.options)
|
729
|
+
elsif pattern
|
730
|
+
Algebra::LanguageStemRange.new(value[:LANGTAG], exclusions.unshift(:exclusions), **self.options)
|
731
|
+
else
|
732
|
+
Algebra::Language.new(value[:LANGTAG], **self.options)
|
733
|
+
end
|
734
|
+
end
|
735
|
+
start_production(:_languageRange_2, as_hash: true)
|
736
|
+
production(:_languageRange_2) do |value|
|
737
|
+
exclusions = value[:_languageRange_6]
|
738
|
+
if exclusions.empty?
|
739
|
+
Algebra::LanguageStem.new('', **self.options)
|
643
740
|
else
|
644
|
-
Algebra::
|
741
|
+
Algebra::LanguageStemRange.new('', exclusions.unshift(:exclusions), **self.options)
|
645
742
|
end
|
646
743
|
end
|
744
|
+
production(:_languageRange_4) do |value|
|
745
|
+
value.last[:_languageRange_5]
|
746
|
+
end
|
647
747
|
|
648
|
-
# [56] languageExclusion ::= '-'
|
649
|
-
|
650
|
-
|
651
|
-
|
748
|
+
# [56] languageExclusion ::= '-' LANGTAG '~'?
|
749
|
+
start_production(:languageExclusion, as_hash: true)
|
750
|
+
production(:languageExclusion) do |value|
|
751
|
+
val = value[:LANGTAG]
|
752
|
+
value[:_languageExclusion_1] ? Algebra::LanguageStem.new(val, **self.options) : val
|
652
753
|
end
|
653
754
|
|
654
|
-
# [57] include ::= '&'
|
655
|
-
production(:include) do |
|
656
|
-
|
755
|
+
# [57] include ::= '&' tripleExprLabel
|
756
|
+
production(:include) do |value|
|
757
|
+
value.last[:tripleExprLabel]
|
657
758
|
end
|
658
759
|
|
659
760
|
# [58] annotation ::= '//' predicate (iri | literal)
|
660
|
-
|
661
|
-
|
662
|
-
(
|
761
|
+
start_production(:annotation, as_hash: true)
|
762
|
+
production(:annotation) do |value|
|
763
|
+
Algebra::Annotation.new([:predicate, value[:predicate]], value[:_annotation_1], **self.options)
|
663
764
|
end
|
664
765
|
|
665
766
|
# [59] semanticActions ::= codeDecl*
|
666
767
|
|
667
768
|
# [60] codeDecl ::= '%' iri (CODE | "%")
|
668
|
-
|
669
|
-
|
769
|
+
start_production(:codeDecl, as_hash: true)
|
770
|
+
production(:codeDecl) do |value|
|
771
|
+
code = value[:_codeDecl_1] unless value[:_codeDecl_1] == '%'
|
772
|
+
Algebra::SemAct.new(*[value[:iri], code].compact, **self.options)
|
670
773
|
end
|
671
774
|
|
672
775
|
# [13t] literal ::= rdfLiteral | numericLiteral | booleanLiteral
|
673
776
|
|
674
777
|
# [61] predicate ::= iri | RDF_TYPE
|
675
|
-
production(:predicate) do |
|
676
|
-
|
778
|
+
production(:predicate) do |value|
|
779
|
+
value
|
677
780
|
end
|
678
781
|
|
679
782
|
# [62] datatype ::= iri
|
680
|
-
production(:datatype) do |
|
681
|
-
|
783
|
+
production(:datatype) do |value|
|
784
|
+
value.first[:iri]
|
682
785
|
end
|
683
786
|
|
684
|
-
# [63]
|
685
|
-
|
686
|
-
|
787
|
+
# [63] shapeExprLabel ::= iri | blankNode
|
788
|
+
# [16t] numericLiteral ::= INTEGER | DECIMAL | DOUBLE
|
789
|
+
# [65] rdfLiteral ::= langString | string ('^^' datatype)?
|
790
|
+
production(:rdfLiteral) do |value|
|
791
|
+
literal(*value)
|
792
|
+
end
|
793
|
+
start_production(:_rdfLiteral_1, as_hash: true)
|
794
|
+
production(:_rdfLiteral_1) do |value|
|
795
|
+
[value[:string], {datatype: value[:_rdfLiteral_2]}]
|
796
|
+
end
|
797
|
+
production(:_rdfLiteral_3) do |value|
|
798
|
+
value.last[:datatype]
|
687
799
|
end
|
688
800
|
|
689
|
-
# [
|
690
|
-
|
691
|
-
production(:
|
692
|
-
|
801
|
+
# [134s] booleanLiteral ::= "true" | "false"
|
802
|
+
start_production(:booleanLiteral, insensitive_strings: :lower)
|
803
|
+
production(:booleanLiteral) do |value|
|
804
|
+
literal(value == 'true')
|
693
805
|
end
|
694
806
|
|
695
|
-
# [134s] booleanLiteral ::= 'true' | 'false'
|
696
807
|
# [135s] string ::= STRING_LITERAL1 | STRING_LITERAL_LONG1
|
697
808
|
# | STRING_LITERAL2 | STRING_LITERAL_LONG2
|
698
809
|
# [66] langString ::= LANG_STRING_LITERAL1 | LANG_STRING_LITERAL_LONG1
|
699
810
|
# | LANG_STRING_LITERAL2 | LANG_STRING_LITERAL_LONG2
|
700
811
|
# [136s] iri ::= IRIREF | prefixedName
|
701
812
|
# [1372] prefixedName ::= PNAME_LN | PNAME_NS
|
813
|
+
production(:prefixedName) do |value|
|
814
|
+
value.is_a?(RDF::URI) ? value : ns(value, '')
|
815
|
+
end
|
816
|
+
|
702
817
|
# [138s] blankNode ::= BLANK_NODE_LABEL
|
818
|
+
production(:blankNode) do |value|
|
819
|
+
value.first[:BLANK_NODE_LABEL]
|
820
|
+
end
|
703
821
|
|
704
822
|
##
|
705
823
|
# Initializes a new parser instance.
|
@@ -758,7 +876,7 @@ module ShEx
|
|
758
876
|
@result.to_sxp
|
759
877
|
end
|
760
878
|
|
761
|
-
alias_method :
|
879
|
+
alias_method :peg_parse, :parse
|
762
880
|
|
763
881
|
# Parse query
|
764
882
|
#
|
@@ -777,50 +895,17 @@ module ShEx
|
|
777
895
|
# @raise [ShEx::StructureError, ArgumentError] on structural problems with schema
|
778
896
|
# @see https://www.w3.org/TR/sparql11-query/#sparqlAlgebra
|
779
897
|
# @see https://axel.deri.ie/sparqltutorial/ESWC2007_SPARQL_Tutorial_unit2b.pdf
|
780
|
-
def parse(prod =
|
781
|
-
|
898
|
+
def parse(prod = :shexDoc)
|
899
|
+
@result = peg_parse(@input,
|
782
900
|
prod.to_sym,
|
783
|
-
|
784
|
-
first: FIRST,
|
785
|
-
follow: FOLLOW,
|
901
|
+
ShEx::Meta::RULES,
|
786
902
|
whitespace: WS,
|
787
|
-
**@options
|
788
|
-
) do |context, *data|
|
789
|
-
case context
|
790
|
-
when :trace
|
791
|
-
if options[:logger]
|
792
|
-
level, lineno, depth, *args = data
|
793
|
-
case level
|
794
|
-
when 0
|
795
|
-
log_error(*args, depth: depth, lineno: lineno)
|
796
|
-
when 1
|
797
|
-
log_warn(*args, depth: depth, lineno: lineno)
|
798
|
-
when 2
|
799
|
-
log_info(*args, depth: depth, lineno: lineno)
|
800
|
-
else
|
801
|
-
log_debug(*args, depth: depth, lineno: lineno)
|
802
|
-
end
|
803
|
-
end
|
804
|
-
end
|
805
|
-
end
|
806
|
-
|
807
|
-
# The last thing on the @prod_data stack is the result
|
808
|
-
@result = case
|
809
|
-
when !prod_data.is_a?(Hash)
|
810
|
-
prod_data
|
811
|
-
when prod_data.empty?
|
812
|
-
nil
|
813
|
-
when prod_data[:schema]
|
814
|
-
prod_data[:schema]
|
815
|
-
else
|
816
|
-
key = prod_data.keys.first
|
817
|
-
[key] + Array(prod_data[key]) # Creates [:key, [:triple], ...]
|
818
|
-
end
|
903
|
+
**@options)
|
819
904
|
|
820
905
|
# Validate resulting expression
|
821
906
|
@result.validate! if @result && validate?
|
822
907
|
@result
|
823
|
-
rescue EBNF::
|
908
|
+
rescue EBNF::PEG::Parser::Error, EBNF::LL1::Lexer::Error => e
|
824
909
|
raise ShEx::ParseError, e.message, e.backtrace
|
825
910
|
end
|
826
911
|
|