math_ml 0.14 → 1.0.0
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +7 -0
- data/LICENSE +339 -0
- data/lib/math_ml/element.rb +233 -225
- data/lib/math_ml/latex/builtin/symbol.rb +546 -546
- data/lib/math_ml/latex/builtin.rb +3 -3
- data/lib/math_ml/latex.rb +1140 -1103
- data/lib/math_ml/string.rb +17 -16
- data/lib/math_ml/symbol/character_reference.rb +2100 -2101
- data/lib/math_ml/symbol/entity_reference.rb +2100 -2100
- data/lib/math_ml/symbol/utf8.rb +2100 -2102
- data/lib/math_ml/util.rb +350 -339
- data/lib/math_ml.rb +14 -14
- metadata +43 -75
- data/Rakefile +0 -60
- data/Rakefile.utirake +0 -392
- data/spec/math_ml/element_spec.rb +0 -32
- data/spec/math_ml/latex/macro_spec.rb +0 -122
- data/spec/math_ml/latex/parser_spec.rb +0 -580
- data/spec/math_ml/latex/scanner_spec.rb +0 -202
- data/spec/math_ml/string_spec.rb +0 -29
- data/spec/math_ml/util_spec.rb +0 -700
- data/spec/math_ml_spec.rb +0 -14
- data/spec/util.rb +0 -43
data/lib/math_ml/util.rb
CHANGED
@@ -6,345 +6,356 @@
|
|
6
6
|
# You can redistribute it and/or modify it under GPL2.
|
7
7
|
#
|
8
8
|
|
9
|
-
require
|
9
|
+
require 'math_ml'
|
10
10
|
|
11
11
|
module MathML::Util
|
12
|
-
|
13
|
-
|
14
|
-
|
15
|
-
|
16
|
-
|
17
|
-
|
18
|
-
|
19
|
-
|
20
|
-
|
21
|
-
|
22
|
-
|
23
|
-
|
24
|
-
|
25
|
-
|
26
|
-
|
27
|
-
|
28
|
-
|
29
|
-
|
30
|
-
|
31
|
-
|
32
|
-
|
33
|
-
|
34
|
-
|
35
|
-
|
36
|
-
|
37
|
-
|
38
|
-
|
39
|
-
|
40
|
-
|
41
|
-
|
42
|
-
|
43
|
-
|
44
|
-
|
45
|
-
|
46
|
-
|
47
|
-
|
48
|
-
|
49
|
-
|
50
|
-
|
51
|
-
|
52
|
-
|
53
|
-
|
54
|
-
|
55
|
-
|
56
|
-
|
57
|
-
|
58
|
-
|
59
|
-
|
60
|
-
|
61
|
-
|
62
|
-
|
63
|
-
|
64
|
-
|
65
|
-
|
66
|
-
|
67
|
-
|
68
|
-
|
69
|
-
|
70
|
-
|
71
|
-
|
72
|
-
|
73
|
-
|
74
|
-
|
75
|
-
|
76
|
-
|
77
|
-
|
78
|
-
|
79
|
-
|
80
|
-
|
81
|
-
|
82
|
-
|
83
|
-
|
84
|
-
|
85
|
-
|
86
|
-
|
87
|
-
|
88
|
-
|
89
|
-
|
90
|
-
|
91
|
-
|
92
|
-
|
93
|
-
|
94
|
-
|
95
|
-
|
96
|
-
|
97
|
-
|
98
|
-
|
99
|
-
|
100
|
-
|
101
|
-
|
102
|
-
|
103
|
-
|
104
|
-
|
105
|
-
|
106
|
-
|
107
|
-
|
108
|
-
|
109
|
-
|
110
|
-
|
111
|
-
|
112
|
-
|
113
|
-
|
114
|
-
|
115
|
-
|
116
|
-
|
117
|
-
|
118
|
-
|
119
|
-
|
120
|
-
|
121
|
-
|
122
|
-
|
123
|
-
|
124
|
-
|
125
|
-
|
126
|
-
|
127
|
-
|
128
|
-
|
129
|
-
|
130
|
-
|
131
|
-
|
132
|
-
|
133
|
-
|
134
|
-
|
135
|
-
|
136
|
-
|
137
|
-
|
138
|
-
|
139
|
-
|
140
|
-
|
141
|
-
|
142
|
-
|
143
|
-
|
144
|
-
|
145
|
-
|
146
|
-
|
147
|
-
|
148
|
-
|
149
|
-
|
150
|
-
|
151
|
-
|
152
|
-
|
153
|
-
|
154
|
-
|
155
|
-
|
156
|
-
|
157
|
-
|
158
|
-
|
159
|
-
|
160
|
-
|
161
|
-
|
162
|
-
|
163
|
-
|
164
|
-
|
165
|
-
|
166
|
-
|
167
|
-
|
168
|
-
|
169
|
-
|
170
|
-
|
171
|
-
|
172
|
-
|
173
|
-
|
174
|
-
|
175
|
-
|
176
|
-
|
177
|
-
|
178
|
-
|
179
|
-
|
180
|
-
|
181
|
-
|
182
|
-
|
183
|
-
|
184
|
-
|
185
|
-
|
186
|
-
|
187
|
-
|
188
|
-
|
189
|
-
|
190
|
-
|
191
|
-
|
192
|
-
|
193
|
-
|
194
|
-
|
195
|
-
|
196
|
-
|
197
|
-
|
198
|
-
|
199
|
-
|
200
|
-
|
201
|
-
|
202
|
-
|
203
|
-
|
204
|
-
|
205
|
-
|
206
|
-
|
207
|
-
|
208
|
-
|
209
|
-
|
210
|
-
|
211
|
-
|
212
|
-
|
213
|
-
|
214
|
-
|
215
|
-
|
216
|
-
|
217
|
-
|
218
|
-
|
219
|
-
|
220
|
-
|
221
|
-
|
222
|
-
|
223
|
-
|
224
|
-
|
225
|
-
|
226
|
-
|
227
|
-
|
228
|
-
|
229
|
-
|
230
|
-
|
231
|
-
|
232
|
-
|
233
|
-
|
234
|
-
|
235
|
-
|
236
|
-
|
237
|
-
|
238
|
-
|
239
|
-
|
240
|
-
|
241
|
-
|
242
|
-
|
243
|
-
|
244
|
-
|
245
|
-
|
246
|
-
|
247
|
-
|
248
|
-
|
249
|
-
|
250
|
-
|
251
|
-
|
252
|
-
|
253
|
-
|
254
|
-
|
255
|
-
|
256
|
-
|
257
|
-
|
258
|
-
|
259
|
-
|
260
|
-
|
261
|
-
|
262
|
-
|
263
|
-
|
264
|
-
|
265
|
-
|
266
|
-
|
267
|
-
|
268
|
-
|
269
|
-
|
270
|
-
|
271
|
-
|
272
|
-
|
273
|
-
|
274
|
-
|
275
|
-
|
276
|
-
|
277
|
-
|
278
|
-
|
279
|
-
|
280
|
-
|
281
|
-
|
282
|
-
|
283
|
-
|
284
|
-
|
285
|
-
|
286
|
-
|
287
|
-
|
288
|
-
|
289
|
-
|
290
|
-
|
291
|
-
|
292
|
-
|
293
|
-
|
294
|
-
|
295
|
-
|
296
|
-
|
297
|
-
|
298
|
-
|
299
|
-
|
300
|
-
|
301
|
-
|
302
|
-
|
303
|
-
|
304
|
-
|
305
|
-
|
306
|
-
|
307
|
-
|
308
|
-
|
309
|
-
|
310
|
-
|
311
|
-
|
312
|
-
|
313
|
-
|
314
|
-
|
315
|
-
|
316
|
-
|
317
|
-
|
318
|
-
|
319
|
-
|
320
|
-
|
321
|
-
|
322
|
-
|
323
|
-
|
324
|
-
|
325
|
-
|
326
|
-
|
327
|
-
|
328
|
-
|
329
|
-
|
330
|
-
|
331
|
-
|
332
|
-
|
333
|
-
|
334
|
-
|
335
|
-
|
336
|
-
|
337
|
-
|
338
|
-
|
339
|
-
|
340
|
-
|
341
|
-
|
342
|
-
|
343
|
-
|
344
|
-
|
345
|
-
|
346
|
-
|
347
|
-
|
348
|
-
|
349
|
-
|
12
|
+
# Maps each XML-special character to the name of its predefined entity.
ESCAPES = {
  '<' => 'lt',
  '>' => 'gt',
  '&' => 'amp',
  '"' => 'quot',
  "'" => 'apos'
}
# An empty negative lookahead: a pattern that can never match anything.
INVALID_RE = /(?!)/
# An eqnarray environment; group 1 captures the text between \begin and \end.
EQNARRAY_RE = /\\begin\s*\{eqnarray\}(#{MathML::LaTeX::MBEC}*?)\\end\s*\{eqnarray\}/
# A backslash command followed by at most one space or tab. Group 1 is the
# command including its backslash, group 2 is the bare command name.
SINGLE_COMMAND_RE = /(\\([a-zA-Z]+))[ \t]?/
|
20
|
+
|
21
|
+
# Replaces the XML-special characters listed in ESCAPES with entity references.
#
# @param s [String] text to escape
# @param br [Boolean] when true, "<br />" is additionally inserted in front of
#   every newline of the escaped text
# @return [String] a new string; +s+ itself is not modified
def self.escapeXML(s, br = false)
  escaped = s.gsub(/[<>&"']/) { |char| "&#{ESCAPES[char]};" }
  return escaped unless br

  escaped.gsub(/\n/, "<br />\n")
end
|
25
|
+
|
26
|
+
# Instance-level convenience for classes that mix in this module: forwards both
# arguments unchanged to MathML::Util.escapeXML and returns its result.
#
# @param s [String] text to escape
# @param br [Boolean] passed through as the second argument
def escapeXML(s, br = false)
  MathML::Util.escapeXML(s, br)
end
|
29
|
+
|
30
|
+
# Combines one or more regular expressions into a single alternation.
#
# +a+ may be nil, a single Regexp, or an arbitrarily nested array. Members that
# are not Regexp instances are ignored.
#
# When no Regexp remains the never-matching INVALID_RE is returned. Previously
# a non-empty argument without any Regexp (for example ['x'] or [nil]) produced
# an empty pattern, which matches at every position.
#
# @param a [Regexp, Array, nil] pattern(s) to combine
# @return [Regexp] the alternation of all given patterns, or INVALID_RE
def self.collect_regexp(a)
  regexps = [a].flatten.grep(Regexp)
  return INVALID_RE if regexps.empty?

  # Regexp#to_s wraps each pattern in its own option group, so the flags of the
  # individual members survive being joined.
  Regexp.new(regexps.join('|'))
end
|
42
|
+
|
43
|
+
# Instance-level convenience for classes that mix in this module: forwards +a+
# unchanged to MathML::Util.collect_regexp and returns its result.
#
# @param a [Regexp, Array, nil] pattern(s) to combine
def collect_regexp(a)
  MathML::Util.collect_regexp(a)
end
|
46
|
+
|
47
|
+
# Holds eight parallel lists, all starting out empty. SimpleLaTeX#encode
# appends the extracted source snippets to the *src_list arrays; the matching
# math_list, dmath_list, escape_list and user_list arrays hold the
# corresponding converted values.
class MathData
  attr_reader :math_list, :msrc_list,
              :dmath_list, :dsrc_list,
              :escape_list, :esrc_list,
              :user_list, :usrc_list

  def initialize
    @math_list, @msrc_list = [], []
    @dmath_list, @dsrc_list = [], []
    @escape_list, @esrc_list = [], []
    @user_list, @usrc_list = [], []
  end

  # Appends every list of +s+ to the list of the same name in this object.
  #
  # @param s [#math_list, ...] object exposing the same eight list readers
  # @return [Array] this object's usrc_list (the list updated last)
  def update(s)
    %i[
      math_list msrc_list dmath_list dsrc_list
      escape_list esrc_list user_list usrc_list
    ].each do |list_name|
      instance_variable_get("@#{list_name}").concat(s.public_send(list_name))
    end
    @usrc_list
  end
end
|
72
|
+
|
73
|
+
class SimpleLaTeX
|
74
|
+
include MathML::Util
|
75
|
+
@@default_latex = nil
|
76
|
+
# Option defaults; #initialize merges the caller's options over this hash.
DEFAULT = {
  # Marker written on both sides of every placeholder produced by #encode.
  delimiter: "\001",
  # Inline math environments: $...$ and \(...\).
  math_env_list: [
    /\$((?:\\.|[^\\$])#{MathML::LaTeX::MBEC}*?)\$/m,
    /\\\((#{MathML::LaTeX::MBEC}*?)\\\)/m
  ],
  # Display math environments: $$...$$ and \[...\].
  dmath_env_list: [
    /\$\$(#{MathML::LaTeX::MBEC}*?)\$\$/m,
    /\\\[(#{MathML::LaTeX::MBEC}*?)\\\]/m
  ],
  # Escape sequences: a backslash followed by any single character.
  escape_list: [
    /\\(.)/m
  ],
  # Patterns whose matches #encode copies to the output untouched.
  through_list: [],
  # NOTE(review): not read anywhere in the code visible here - confirm whether
  # this option is still in use.
  escape_any: false,
  # When true, no parser is created by #initialize and #encode skips parsing.
  without_parse: false
}
|
93
|
+
|
94
|
+
# Builds the working parameter set from DEFAULT overridden by +options+.
#
# A MathML::LaTeX::Parser is created unless one was supplied under :parser or
# :without_parse is set. Each *_list option is compiled into a single regexp
# stored under :math_envs, :dmath_envs, :escapes and :throughs, and all four
# hook procs are cleared.
#
# @param options [Hash] overrides for the keys of DEFAULT, plus :parser
def initialize(options = {})
  @params = DEFAULT.merge(options)
  @params[:parser] ||= MathML::LaTeX::Parser.new unless @params[:without_parse]

  {
    math_envs: :math_env_list,
    dmath_envs: :dmath_env_list,
    escapes: :escape_list,
    throughs: :through_list
  }.each do |compiled_key, list_key|
    @params[compiled_key] = collect_regexp(@params[list_key])
  end

  reset_encode_proc
  reset_rescue_proc
  reset_decode_proc
  reset_unencode_proc
end
|
107
|
+
|
108
|
+
# Removes the encode hook: its trigger pattern becomes the never-matching
# INVALID_RE and the stored proc is cleared.
#
# @return [nil]
def reset_encode_proc
  @encode_proc_re = INVALID_RE
  @encode_proc = nil
end
|
112
|
+
|
113
|
+
# Registers the hook that #encode uses when it is called without its own
# patterns or block.
#
# @param re [Array<Regexp>] patterns that trigger the hook; they are combined
#   with collect_regexp
# @yield [scanner] see #encode for how the hook is invoked
# @return [Proc, nil] the stored block
def set_encode_proc(*re, &block)
  @encode_proc_re = collect_regexp(re)
  @encode_proc = block
end
|
117
|
+
|
118
|
+
# Clears the parse-error hook, so that parse errors are rendered with
# #error_to_html again.
#
# @return [nil]
def reset_rescue_proc
  @rescue_proc = nil
end
|
121
|
+
|
122
|
+
# Registers the hook called with the ParseError whenever parsing fails; its
# return value is stored in place of the parsed result.
#
# @yield [error] the MathML::LaTeX::ParseError that was raised
# @return [Proc, nil] the stored block
def set_rescue_proc(&block)
  @rescue_proc = block
end
|
125
|
+
|
126
|
+
# Clears the default hook used by #decode.
#
# @return [nil]
def reset_decode_proc
  @decode_proc = nil
end
|
129
|
+
|
130
|
+
# Registers the hook #decode falls back to when it is called without a block.
#
# @yield [value, info] see #decode for the arguments
# @return [Proc, nil] the stored block
def set_decode_proc(&block)
  @decode_proc = block
end
|
133
|
+
|
134
|
+
# Registers the hook #unencode falls back to when it is called without a block.
#
# @yield [source, info] see #unencode for the arguments
# @return [Proc, nil] the stored block
def set_unencode_proc(&block)
  @unencode_proc = block
end
|
137
|
+
|
138
|
+
# Clears the default hook used by #unencode.
#
# @return [nil]
def reset_unencode_proc
  @unencode_proc = nil
end
|
141
|
+
|
142
|
+
# Replaces math environments, escape sequences and hook-matched spans of +src+
# with delimiter-wrapped placeholders, recording the originals in a MathData.
#
# A placeholder is <delimiter><kind><index><delimiter>. Kind is "d" (display
# math), "m" (inline math), "u" (hook result) or "e" (escape); index is the
# position in the matching MathData source list. Text matched by the :throughs
# pattern is copied to the output unchanged. Unless :without_parse is set, the
# collected math sources are parsed before returning.
#
# @param src [String] text to scan
# @param proc_re [Array] optionally a leading MathData to keep appending to,
#   followed by the patterns that trigger the hook (default: the patterns given
#   to #set_encode_proc)
# @yield [scanner] called with the StringScanner positioned at the start of a
#   hook match. The hook consumes what it handles and returns the value to
#   store, or nil/false to leave the matched text as it is. Defaults to the
#   proc given to #set_encode_proc.
# @return [Array(String, MathData)] the encoded text and the collected data
def encode(src, *proc_re, &proc)
  data = proc_re.first.is_a?(MathData) ? proc_re.shift : MathData.new

  proc_re = proc_re.empty? ? @encode_proc_re : collect_regexp(proc_re)
  proc ||= @encode_proc
  delimiter = @params[:delimiter]

  # Group 1 is the plain text in front of the match. The nested groups identify
  # which alternative matched: 6 = through, 5 = through or display math,
  # 4 = ... or inline math, 3 = ... or hook pattern, 2 = ... or escape.
  # Built once, since none of its parts change while scanning.
  pattern = /
    (.*?)
    (((((#{@params[:throughs]})|
    #{@params[:dmath_envs]})|
    #{@params[:math_envs]})|
    #{proc_re})|
    #{@params[:escapes]})
  /mx

  s = StringScanner.new(src)
  encoded = +''

  until s.eos?
    if s.scan(pattern)
      encoded << s[1]
      if s[6]
        encoded << s[6]
      elsif s[5] || s[4]
        env_src = s[5] || s[4]
        if @params[:dmath_envs] =~ env_src
          encoded << "#{delimiter}d#{data.dsrc_list.size}#{delimiter}"
          data.dsrc_list << env_src
        else
          encoded << "#{delimiter}m#{data.msrc_list.size}#{delimiter}"
          data.msrc_list << env_src
        end
      elsif s[3]
        # StringScanner#pos and #peek work in bytes, so the length of the match
        # has to be measured in bytes as well.
        size = s[3].bytesize
        s.pos = left = s.pos - size
        # Without a hook proc the matched text is treated like a declined match.
        if proc && (r = proc.call(s))
          right = s.pos
          encoded << "#{delimiter}u#{data.user_list.size}#{delimiter}"
          data.user_list << r
          # left/right are byte offsets; slice by bytes so that multibyte text
          # earlier in the string does not shift the recorded source.
          data.usrc_list << s.string.byteslice(left...right)
        else
          encoded << s.peek(size)
          s.pos = s.pos + size
        end
      elsif s[2]
        encoded << "#{delimiter}e#{data.escape_list.size}#{delimiter}"
        # Re-match to obtain the escaped character through $+ (the last group
        # that took part in the match).
        @params[:escapes] =~ s[2]
        data.esrc_list << s[2]
        data.escape_list << escapeXML($+, true)
      end
    else
      # Nothing left to replace: copy the remainder and finish.
      encoded << s.rest
      s.terminate
    end
  end

  parse(data, @params[:parser]) unless @params[:without_parse]

  [encoded, data]
end
|
204
|
+
|
205
|
+
# Renders a parse error as an HTML fragment: the escaped message, followed by a
# <code> element holding the escaped text parsed so far and, inside <strong>,
# the escaped remainder. Newlines in both parts get "<br />" in front of them.
#
# @param e [#message, #done, #rest] the error to render
# @return [String] the HTML fragment
def error_to_html(e)
  message = escapeXML(e.message)
  done = escapeXML(e.done).gsub(/\n/, "<br />\n")
  rest = escapeXML(e.rest).gsub(/\n/, "<br />\n")
  "<br />\n#{message}<br />\n<code>#{done}<strong>#{rest}</strong></code><br />"
end
|
209
|
+
|
210
|
+
# Returns the parser stored under :parser, creating and storing a
# MathML::LaTeX::Parser first when none is present yet.
#
# @return [Object] the stored parser
def latex_parser
  @params[:parser] ||= MathML::LaTeX::Parser.new
end
|
214
|
+
|
215
|
+
# Parses every collected source that has no parsed counterpart yet.
#
# For inline math, entries of data.msrc_list from index data.math_list.size
# onwards are matched against :math_envs and the last captured group is handed
# to parser.parse; display math does the same with dsrc_list/dmath_list,
# :dmath_envs and parser.parse(text, true). On a ParseError the slot receives
# the result of the rescue hook if one is set, otherwise #error_to_html.
#
# @param data [MathData] lists to complete in place
# @param parser [#parse, nil] parser to use; defaults to #latex_parser
def parse(data, parser = nil)
  parser ||= latex_parser
  recover = ->(error) { @rescue_proc ? @rescue_proc.call(error) : error_to_html(error) }

  (data.math_list.size...data.msrc_list.size).each do |idx|
    begin
      @params[:math_envs] =~ data.msrc_list[idx]
      data.math_list[idx] = parser.parse($+)
    rescue MathML::LaTeX::ParseError => e
      data.math_list[idx] = recover.call(e)
    end
  end
  (data.dmath_list.size...data.dsrc_list.size).each do |idx|
    begin
      @params[:dmath_envs] =~ data.dsrc_list[idx]
      data.dmath_list[idx] = parser.parse($+, true)
    rescue MathML::LaTeX::ParseError => e
      data.dmath_list[idx] = recover.call(e)
    end
  end
end
|
238
|
+
|
239
|
+
# Substitutes every placeholder in +encoded+ with its stored value.
#
# Math placeholders ("m"/"d") become the parsed entry, or - when
# +without_parsed+ is true - the XML-escaped source with line breaks. Escape
# and user placeholders always become their stored entry.
#
# @param encoded [String, nil] text produced by #encode
# @param data [MathData] data returned alongside +encoded+
# @param without_parsed [Boolean] use escaped sources instead of parsed math
# @yield [value, info] optional hook (defaults to the #set_decode_proc hook);
#   info has :type (:dmath, :escape, :math or :user), :index and :src. A truthy
#   result replaces the value.
# @return [String, nil] the decoded text, or nil when +encoded+ is nil
def decode(encoded, data, without_parsed = false, &proc)
  return nil if encoded.nil?

  hook = proc || @decode_proc
  mark = Regexp.escape(@params[:delimiter])
  encoded.gsub(/#{mark}([demu])(\d+)#{mark}/) do
    kind = $1
    index = $2.to_i
    type, value, source =
      case kind
      when 'd'
        [:dmath,
         without_parsed ? escapeXML(data.dsrc_list[index], true) : data.dmath_list[index],
         data.dsrc_list[index]]
      when 'e'
        [:escape, data.escape_list[index], data.esrc_list[index]]
      when 'm'
        [:math,
         without_parsed ? escapeXML(data.msrc_list[index], true) : data.math_list[index],
         data.msrc_list[index]]
      when 'u'
        [:user, data.user_list[index], data.usrc_list[index]]
      end
    next value unless hook

    hook.call(value, type: type, index: index, src: source) || value
  end
end
|
263
|
+
|
264
|
+
# Substitutes only the placeholders of one kind, leaving all others in place.
#
# @param type [Symbol] :math, :dmath, :escape or :user; anything else makes
#   the method return nil
# @param encoded [String, nil] text produced by #encode
# @param data [MathData] data returned alongside +encoded+
# @yield [value, info] optional hook; info has :type, :index and :src. A falsy
#   result writes the placeholder back instead of the value.
# @return [String, nil] the partially decoded text, or nil when +encoded+ is
#   nil or +type+ is unknown
def decode_partial(type, encoded, data, &proc)
  return nil if encoded.nil?

  kind, head = { math: 'm', dmath: 'd', escape: 'e', user: 'u' }.find { |sym, _| sym === type }
  return unless kind

  mark = Regexp.escape(@params[:delimiter])
  encoded.gsub(/#{mark}#{head}(\d+)#{mark}/) do
    index = $1.to_i
    value, source =
      case kind
      when :dmath then [data.dmath_list[index], data.dsrc_list[index]]
      when :escape then [data.escape_list[index], data.esrc_list[index]]
      when :math then [data.math_list[index], data.msrc_list[index]]
      when :user then [data.user_list[index], data.usrc_list[index]]
      end
    next value unless proc

    proc.call(value, type: kind, index: index, src: source) ||
      "#{@params[:delimiter]}#{head}#{index}#{@params[:delimiter]}"
  end
end
|
300
|
+
|
301
|
+
def unencode(encoded, data, without_escape = false, &proc)
|
302
|
+
return nil if encoded.nil?
|
303
|
+
|
304
|
+
proc ||= @unencode_proc
|
305
|
+
encoded.gsub(/#{Regexp.escape(@params[:delimiter])}([demu])(\d+)#{Regexp.escape(@params[:delimiter])}/) do
|
306
|
+
i = $2.to_i
|
307
|
+
t, s =
|
308
|
+
case $1
|
309
|
+
when 'd'
|
310
|
+
[:dmath, data.dsrc_list[i]]
|
311
|
+
when 'e'
|
312
|
+
[:escape, data.esrc_list[i]]
|
313
|
+
when 'm'
|
314
|
+
[:math, data.msrc_list[i]]
|
315
|
+
when 'u'
|
316
|
+
[:user, data.usrc_list[i]]
|
317
|
+
end
|
318
|
+
s = escapeXML(s, true) unless without_escape
|
319
|
+
if proc
|
320
|
+
proc.call(s, type: t, index: i) || s
|
321
|
+
else
|
322
|
+
s
|
323
|
+
end
|
324
|
+
end
|
325
|
+
end
|
326
|
+
|
327
|
+
# Encodes +src+ with a shared instance built from the default options; the
# instance is created on first use and kept for later calls.
#
# @param src [String] text to encode
# @return [Array] whatever the instance-level #encode returns
def self.encode(src)
  (@@default_latex ||= new).encode(src)
end
|
331
|
+
|
332
|
+
# Decodes +src+ with the shared default instance.
#
# The instance is created here when it does not exist yet. Previously this
# method relied on SimpleLaTeX.encode having been called first and otherwise
# failed with NoMethodError on nil.
#
# @param src [String, nil] text produced by encode
# @param data [MathData] data returned alongside +src+
# @return [String, nil] whatever the instance-level #decode returns
def self.decode(src, data)
  @@default_latex ||= new
  @@default_latex.decode(src, data)
end
|
335
|
+
|
336
|
+
# Parses the body of an eqnarray environment by wrapping it in a three-column
# array environment and parsing that with the second parse argument set to true.
#
# On a ParseError a new error is built whose done/rest texts show the
# eqnarray delimiters instead of the substituted array ones; it is passed to
# the rescue hook if one is set, otherwise rendered with #error_to_html.
#
# @param src [String] text between \begin{eqnarray} and \end{eqnarray}
# @param parser [#parse, nil] parser to use; defaults to #latex_parser
# @return [Object] the parse result, or the error-handling result
def parse_eqnarray(src, parser = nil)
  wrapped = "\\begin{array}{ccc}#{src}\\end{array}"
  parser ||= latex_parser
  begin
    parser.parse(wrapped, true)
  rescue MathML::LaTeX::ParseError => e
    restored = MathML::LaTeX::ParseError.new(
      e.message,
      e.rest.sub(/\\end\{array\}\z/, '\end{eqnarray}'),
      e.done.sub(/\A\\begin\{array\}\{ccc\}/, '\begin{eqnarray}')
    )
    @rescue_proc ? @rescue_proc.call(restored) : error_to_html(restored)
  end
end
|
350
|
+
|
351
|
+
# Parses the first backslash command found in +src+.
#
# @param src [String] text containing a command such as "\alpha"
# @param parser [#parse, nil] parser to use; defaults to #latex_parser
# @return [Object] the parse result, or - when the parser raises a ParseError -
#   the bare command name without its backslash
def parse_single_command(src, parser = nil)
  command = src[SINGLE_COMMAND_RE, 1]
  parser ||= latex_parser
  begin
    parser.parse(command)
  rescue MathML::LaTeX::ParseError
    src[SINGLE_COMMAND_RE, 2]
  end
end
|
360
|
+
end
|
350
361
|
end
|