omextra 0.0.0.dev472__py3-none-any.whl → 0.0.0.dev473__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -0,0 +1,16 @@
1
+ Copyright 2020 Charles Yeomans
2
+
3
+ Permission is hereby granted, free of charge, to any person obtaining a copy of this software
4
+ and associated documentation files (the "Software"), to deal in the Software without
5
+ restriction, including without limitation the rights to use, copy, modify, merge, publish,
6
+ distribute, sublicense, and/or sell copies of the Software, and to permit persons to whom the
7
+ Software is furnished to do so, subject to the following conditions:
8
+
9
+ The above copyright notice and this permission notice shall be included in all copies or
10
+ substantial portions of the Software.
11
+
12
+ THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING
13
+ BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
14
+ NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM,
15
+ DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
16
+ OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
@@ -0,0 +1,69 @@
1
+ """
2
+ Parser generator for ABNF grammars.
3
+
4
+ Originally based on library by Charles Yeomans (see LICENSE file):
5
+
6
+ https://github.com/declaresub/abnf/tree/561ced67c0a8afc869ad0de5b39dbe4f6e71b0d8/src/abnf
7
+
8
+ It has however been nearly entirely rewritten.
9
+ """
10
+
11
+
12
+ from .base import ( # noqa
13
+ Match,
14
+ longest_match,
15
+
16
+ Parser,
17
+
18
+ Rule,
19
+ Grammar,
20
+
21
+ iter_parse,
22
+ parse,
23
+ )
24
+
25
+ from .core import ( # noqa
26
+ CORE_RULES,
27
+ )
28
+
29
+ from .errors import ( # noqa
30
+ AbnfError,
31
+ AbnfGrammarParseError,
32
+ )
33
+
34
+ from .meta import ( # noqa
35
+ META_GRAMMAR_RULES,
36
+ META_GRAMMAR,
37
+
38
+ parse_grammar,
39
+ )
40
+
41
+ from .parsers import ( # noqa
42
+ Literal,
43
+ StringLiteral,
44
+ CaseInsensitiveStringLiteral,
45
+ RangeLiteral,
46
+ literal,
47
+
48
+ Concat,
49
+ concat,
50
+
51
+ Repeat,
52
+ Option,
53
+ repeat,
54
+
55
+ Either,
56
+ either,
57
+
58
+ RuleRef,
59
+ rule,
60
+ )
61
+
62
+ from .utils import ( # noqa
63
+ strip_insignificant_match_rules,
64
+ only_match_rules,
65
+
66
+ parse_rules,
67
+
68
+ fix_grammar_ws,
69
+ )
@@ -0,0 +1,293 @@
1
+ """
2
+ TODO:
3
+ - cache lol
4
+ - get greedier
5
+ - match-powered optimizer
6
+ - greedily compile regexes
7
+ - error reporting
8
+ """
9
+ import abc
10
+ import io
11
+ import itertools
12
+ import typing as ta
13
+
14
+ from omlish import check
15
+ from omlish import lang
16
+
17
+ from .errors import AbnfError
18
+
19
+
20
+ with lang.auto_proxy_import(globals()):
21
+ from . import parsers
22
+
23
+
24
+ ##
25
+
26
+
27
+ @ta.final
28
+ class Match(ta.NamedTuple):
29
+ parser: 'Parser'
30
+ start: int
31
+ end: int
32
+ children: tuple['Match', ...]
33
+
34
+ @property
35
+ def length(self) -> int:
36
+ return self.end - self.start
37
+
38
+ #
39
+
40
+ def __repr__(self) -> str:
41
+ return (
42
+ f'{self.__class__.__name__}('
43
+ f'{self.parser._match_repr()}, ' # noqa
44
+ f'{self.start}, {self.end}'
45
+ f'{f", {self.children!r}" if self.children else ""})'
46
+ )
47
+
48
+ def render_to(
49
+ self,
50
+ write: ta.Callable[[str], ta.Any],
51
+ *,
52
+ indent: int | None = None,
53
+ _level: int = 0,
54
+ ) -> None:
55
+ ix: str | None = (' ' * (indent * _level)) if indent is not None else None
56
+ if ix:
57
+ write(ix)
58
+ p = self.parser
59
+ if isinstance(p, (parsers.StringLiteral, parsers.CaseInsensitiveStringLiteral)):
60
+ write(f'literal<{self.start}-{self.end}>({p.value!r})')
61
+ elif isinstance(p, parsers.RangeLiteral):
62
+ write(f'literal<{self.start}-{self.end}>({p.value.lo!r}-{p.value.hi!r})')
63
+ else:
64
+ write(f'{p.__class__.__name__.lower()}<{self.start}-{self.end}>')
65
+ if isinstance(p, parsers.RuleRef):
66
+ write(f':{p.name}')
67
+ if self.children:
68
+ write('(')
69
+ if ix is not None:
70
+ write('\n')
71
+ for i, c in enumerate(self.children):
72
+ if i and ix is None:
73
+ write(', ')
74
+ c.render_to(write, indent=indent, _level=_level + 1)
75
+ if ix is not None:
76
+ write(',\n')
77
+ if ix:
78
+ write(ix)
79
+ write(')')
80
+
81
+ def render(
82
+ self,
83
+ *,
84
+ indent: int | None = None,
85
+ ) -> str:
86
+ sb = io.StringIO()
87
+ self.render_to(sb.write, indent=indent)
88
+ return sb.getvalue()
89
+
90
+ def __str__(self) -> str:
91
+ return self.render()
92
+
93
+ #
94
+
95
+ def map_children(self, fn: ta.Callable[['Match'], 'Match']) -> 'Match':
96
+ return self._replace(children=tuple(map(fn, self.children)))
97
+
98
+ def flat_map_children(self, fn: ta.Callable[['Match'], ta.Iterable['Match']]) -> 'Match':
99
+ return self._replace(children=tuple(itertools.chain.from_iterable(map(fn, self.children))))
100
+
101
+
102
+ def longest_match(ms: ta.Iterable[Match]) -> Match | None:
103
+ bm: Match | None = None
104
+ bl = 0
105
+ for m in ms:
106
+ l = m.length
107
+ if bm is None or l > bl:
108
+ bm, bl = m, l
109
+ return bm
110
+
111
+
112
+ ##
113
+
114
+
115
+ class Parser(lang.Abstract, lang.PackageSealed):
116
+ def _match_repr(self) -> str:
117
+ return f'{self.__class__.__name__}@{id(self)}'
118
+
119
+ @abc.abstractmethod
120
+ def _iter_parse(self, ctx: '_Context', start: int) -> ta.Iterator[Match]:
121
+ raise NotImplementedError
122
+
123
+
124
+ ##
125
+
126
+
127
+ class Rule(lang.Final):
128
+ def __init__(
129
+ self,
130
+ name: str,
131
+ parser: Parser,
132
+ *,
133
+ insignificant: bool = False,
134
+ ) -> None:
135
+ super().__init__()
136
+
137
+ self._name = check.non_empty_str(name)
138
+ self._name_f = name.casefold()
139
+ self._parser = check.isinstance(parser, Parser)
140
+ self._insignificant = insignificant
141
+
142
+ def __repr__(self) -> str:
143
+ return f'{self.__class__.__name__}({self._name!r})'
144
+
145
+ @property
146
+ def name(self) -> str:
147
+ return self._name
148
+
149
+ @property
150
+ def name_f(self) -> str:
151
+ return self._name_f
152
+
153
+ @property
154
+ def parser(self) -> Parser:
155
+ return self._parser
156
+
157
+ @property
158
+ def insignificant(self) -> bool:
159
+ return self._insignificant
160
+
161
+
162
+ class Grammar(lang.Final):
163
+ def __init__(
164
+ self,
165
+ *rules: Rule,
166
+ root: Rule | str | None = None,
167
+ ) -> None:
168
+ super().__init__()
169
+
170
+ rules_set: set[Rule] = set()
171
+ rules_by_name: dict[str, Rule] = {}
172
+ rules_by_name_f: dict[str, Rule] = {}
173
+ rules_by_parser: dict[Parser, Rule] = {}
174
+ for gr in rules:
175
+ check.not_in(gr, rules_set)
176
+ check.not_in(gr._name, rules_by_name) # noqa
177
+ check.not_in(gr._name_f, rules_by_name_f) # noqa
178
+ check.not_in(gr._parser, rules_by_parser) # noqa
179
+ rules_by_name[gr._name] = gr # noqa
180
+ rules_by_name_f[gr._name_f] = gr # noqa
181
+ rules_by_parser[gr._parser] = gr # noqa
182
+ self._rules = rules_set
183
+ self._rules_by_name: ta.Mapping[str, Rule] = rules_by_name
184
+ self._rules_by_name_f: ta.Mapping[str, Rule] = rules_by_name_f
185
+ self._rules_by_parser: ta.Mapping[Parser, Rule] = rules_by_parser
186
+
187
+ if isinstance(root, str):
188
+ root = rules_by_name_f[root.casefold()]
189
+ self._root = root
190
+
191
+ @property
192
+ def root(self) -> Rule | None:
193
+ return self._root
194
+
195
+ def rule(self, name: str) -> Rule | None:
196
+ return self._rules_by_name_f.get(name.casefold())
197
+
198
+ def iter_parse(
199
+ self,
200
+ source: str,
201
+ root: Rule | str | None = None,
202
+ *,
203
+ start: int = 0,
204
+ ) -> ta.Iterator[Match]:
205
+ if root is None:
206
+ if (root := self._root) is None:
207
+ raise AbnfError('No root or default root specified')
208
+ else:
209
+ if isinstance(root, str):
210
+ root = self._rules_by_name_f[root.casefold()]
211
+ else:
212
+ root = check.in_(check.isinstance(root, Rule), self._rules)
213
+
214
+ ctx = _Context(self, source)
215
+ return ctx.iter_parse(root._parser, start) # noqa
216
+
217
+ def parse(
218
+ self,
219
+ source: str,
220
+ root: str | None = None,
221
+ *,
222
+ start: int = 0,
223
+ ) -> Match | None:
224
+ return longest_match(self.iter_parse(
225
+ source,
226
+ root,
227
+ start=start,
228
+ ))
229
+
230
+
231
+ ##
232
+
233
+
234
+ class _Context(lang.Final):
235
+ def __init__(self, grammar: Grammar, source: str) -> None:
236
+ super().__init__()
237
+
238
+ self._grammar = grammar
239
+ self._source = source
240
+
241
+ @property
242
+ def grammar(self) -> Grammar:
243
+ return self._grammar
244
+
245
+ @property
246
+ def source(self) -> str:
247
+ return self._source
248
+
249
+ def iter_parse(self, parser: Parser, start: int) -> ta.Iterator[Match]:
250
+ return parser._iter_parse(self, start) # noqa
251
+
252
+
253
+ ##
254
+
255
+
256
+ def iter_parse(
257
+ obj: Grammar | Rule | Parser,
258
+ src: str,
259
+ *,
260
+ root: str | None = None,
261
+ start: int = 0,
262
+ ) -> ta.Iterator[Match]:
263
+ if isinstance(obj, Grammar):
264
+ gram = obj
265
+ elif isinstance(obj, Rule):
266
+ check.none(root)
267
+ gram = Grammar(obj, root=obj)
268
+ elif isinstance(obj, Parser):
269
+ check.none(root)
270
+ gram = Grammar(Rule('root', obj), root='root')
271
+ else:
272
+ raise TypeError(obj)
273
+
274
+ return gram.iter_parse(
275
+ src,
276
+ root,
277
+ start=start,
278
+ )
279
+
280
+
281
+ def parse(
282
+ obj: Grammar | Rule | Parser,
283
+ src: str,
284
+ *,
285
+ root: str | None = None,
286
+ start: int = 0,
287
+ ) -> Match | None:
288
+ return longest_match(iter_parse(
289
+ obj,
290
+ src,
291
+ root=root,
292
+ start=start,
293
+ ))
@@ -0,0 +1,141 @@
1
+ """
2
+ https://datatracker.ietf.org/doc/html/rfc5234
3
+ """
4
+ import typing as ta
5
+
6
+ from .base import Grammar
7
+ from .base import Rule
8
+ from .parsers import concat
9
+ from .parsers import either
10
+ from .parsers import literal
11
+ from .parsers import repeat
12
+ from .parsers import rule
13
+
14
+
15
+ ##
16
+
17
+
18
+ CORE_RULES: ta.Sequence[Rule] = [
19
+
20
+ Rule(
21
+ 'ALPHA',
22
+ either(
23
+ literal('\x41', '\x5a'),
24
+ literal('\x61', '\x7a'),
25
+ ),
26
+ ),
27
+
28
+ Rule(
29
+ 'BIT',
30
+ either(
31
+ literal('0'),
32
+ literal('1'),
33
+ ),
34
+ ),
35
+
36
+ Rule(
37
+ 'CHAR',
38
+ literal('\x01', '\x7f'),
39
+ ),
40
+
41
+ Rule(
42
+ 'CTL',
43
+ either(
44
+ literal('\x00', '\x1f'),
45
+ literal('\x7f', case_sensitive=True),
46
+ ),
47
+ ),
48
+
49
+ Rule(
50
+ 'CR',
51
+ literal('\x0d', case_sensitive=True),
52
+ insignificant=True,
53
+ ),
54
+
55
+ Rule(
56
+ 'CRLF',
57
+ concat(
58
+ rule('CR'),
59
+ rule('LF'),
60
+ ),
61
+ insignificant=True,
62
+ ),
63
+
64
+ Rule(
65
+ 'DIGIT',
66
+ literal('\x30', '\x39'),
67
+ ),
68
+
69
+ Rule(
70
+ 'DQUOTE',
71
+ literal('\x22', case_sensitive=True),
72
+ ),
73
+
74
+ Rule(
75
+ 'HEXDIG',
76
+ either(
77
+ rule('DIGIT'),
78
+ literal('A'),
79
+ literal('B'),
80
+ literal('C'),
81
+ literal('D'),
82
+ literal('E'),
83
+ literal('F'),
84
+ ),
85
+ ),
86
+
87
+ Rule(
88
+ 'HTAB',
89
+ literal('\x09', case_sensitive=True),
90
+ insignificant=True,
91
+ ),
92
+
93
+ Rule(
94
+ 'LF',
95
+ literal('\x0a', case_sensitive=True),
96
+ insignificant=True,
97
+ ),
98
+
99
+ Rule(
100
+ 'LWSP',
101
+ repeat(
102
+ either(
103
+ rule('WSP'),
104
+ concat(
105
+ rule('CRLF'),
106
+ rule('WSP'),
107
+ ),
108
+ ),
109
+ ),
110
+ insignificant=True,
111
+ ),
112
+
113
+ Rule(
114
+ 'OCTET',
115
+ literal('\x00', '\xff'),
116
+ ),
117
+
118
+ Rule(
119
+ 'SP',
120
+ literal('\x20', case_sensitive=True),
121
+ insignificant=True,
122
+ ),
123
+
124
+ Rule(
125
+ 'VCHAR',
126
+ literal('\x21', '\x7e'),
127
+ ),
128
+
129
+ Rule(
130
+ 'WSP',
131
+ either(
132
+ rule('SP'),
133
+ rule('HTAB'),
134
+ ),
135
+ insignificant=True,
136
+ ),
137
+
138
+ ]
139
+
140
+
141
+ CORE_GRAMMAR = Grammar(*CORE_RULES)
@@ -0,0 +1,6 @@
1
+ class AbnfError(Exception):
2
+ pass
3
+
4
+
5
+ class AbnfGrammarParseError(AbnfError):
6
+ pass