markly 0.6.1 → 0.8.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (52) hide show
  1. checksums.yaml +4 -4
  2. checksums.yaml.gz.sig +0 -0
  3. data/conduct.md +133 -0
  4. data/ext/markly/arena.c +9 -8
  5. data/ext/markly/autolink.c +217 -134
  6. data/ext/markly/blocks.c +40 -4
  7. data/ext/markly/cmark-gfm-core-extensions.h +11 -11
  8. data/ext/markly/cmark-gfm-extension_api.h +1 -0
  9. data/ext/markly/cmark-gfm.h +18 -2
  10. data/ext/markly/cmark-gfm_version.h +2 -2
  11. data/ext/markly/cmark.c +3 -3
  12. data/ext/markly/commonmark.c +33 -38
  13. data/ext/markly/ext_scanners.c +360 -640
  14. data/ext/markly/extconf.rb +8 -1
  15. data/ext/markly/footnotes.c +23 -0
  16. data/ext/markly/footnotes.h +2 -0
  17. data/ext/markly/html.c +60 -23
  18. data/ext/markly/inlines.c +216 -61
  19. data/ext/markly/latex.c +6 -4
  20. data/ext/markly/man.c +7 -11
  21. data/ext/markly/map.c +11 -4
  22. data/ext/markly/map.h +5 -2
  23. data/ext/markly/markly.c +582 -586
  24. data/ext/markly/markly.h +1 -1
  25. data/ext/markly/node.c +76 -10
  26. data/ext/markly/node.h +49 -1
  27. data/ext/markly/parser.h +1 -0
  28. data/ext/markly/plaintext.c +12 -29
  29. data/ext/markly/references.c +1 -0
  30. data/ext/markly/render.c +15 -7
  31. data/ext/markly/scanners.c +13916 -20242
  32. data/ext/markly/scanners.h +8 -0
  33. data/ext/markly/scanners.re +47 -8
  34. data/ext/markly/strikethrough.c +1 -1
  35. data/ext/markly/table.c +143 -74
  36. data/ext/markly/xml.c +2 -1
  37. data/lib/markly/flags.rb +16 -0
  38. data/lib/markly/node/inspect.rb +59 -53
  39. data/lib/markly/node.rb +125 -58
  40. data/lib/markly/renderer/generic.rb +136 -0
  41. data/lib/markly/renderer/html.rb +301 -0
  42. data/lib/markly/version.rb +7 -1
  43. data/lib/markly.rb +38 -32
  44. data/license.md +39 -0
  45. data/readme.md +36 -0
  46. data.tar.gz.sig +0 -0
  47. metadata +63 -31
  48. metadata.gz.sig +0 -0
  49. data/bin/markly +0 -94
  50. data/lib/markly/markly.so +0 -0
  51. data/lib/markly/renderer/html_renderer.rb +0 -281
  52. data/lib/markly/renderer.rb +0 -133
data/lib/markly/node.rb CHANGED
@@ -1,72 +1,139 @@
1
1
  # frozen_string_literal: true
2
2
 
3
+ # Released under the MIT License.
4
+ # Copyright, 2016-2019, by Garen Torikian.
5
+ # Copyright, 2016-2017, by Yuki Izumi.
6
+ # Copyright, 2017, by Goro Fuji.
7
+ # Copyright, 2018, by Jerry van Leeuwen.
8
+ # Copyright, 2020-2023, by Samuel Williams.
9
+
3
10
  require_relative 'node/inspect'
4
11
 
5
12
  module Markly
6
- class Node
7
- include Enumerable
8
- include Inspect
9
-
10
- # Public: An iterator that "walks the tree," descending into children recursively.
11
- #
12
- # blk - A {Proc} representing the action to take for each child
13
- def walk(&block)
14
- return enum_for(:walk) unless block_given?
13
+ class Node
14
+ include Enumerable
15
+ include Inspect
15
16
 
16
- yield self
17
- each do |child|
18
- child.walk(&block)
19
- end
20
- end
17
+ # Public: An iterator that "walks the tree," descending into children recursively.
18
+ #
19
+ # blk - A {Proc} representing the action to take for each child
20
+ def walk(&block)
21
+ return enum_for(:walk) unless block_given?
21
22
 
22
- # Public: Convert the node to an HTML string.
23
- #
24
- # options - A {Symbol} or {Array of Symbol}s indicating the render options
25
- # extensions - An {Array of Symbol}s indicating the extensions to use
26
- #
27
- # Returns a {String}.
28
- def to_html(flags: DEFAULT, extensions: [])
29
- _render_html(flags, extensions).force_encoding('utf-8')
30
- end
23
+ yield self
24
+ each do |child|
25
+ child.walk(&block)
26
+ end
27
+ end
31
28
 
32
- # Public: Convert the node to a CommonMark string.
33
- #
34
- # options - A {Symbol} or {Array of Symbol}s indicating the render options
35
- # width - Column to wrap the output at
36
- #
37
- # Returns a {String}.
38
- def to_commonmark(flags: DEFAULT, width: 120)
39
- _render_commonmark(flags, width).force_encoding('utf-8')
40
- end
29
+ # Public: Convert the node to an HTML string.
30
+ #
31
+ # options - A {Symbol} or {Array of Symbol}s indicating the render options
32
+ # extensions - An {Array of Symbol}s indicating the extensions to use
33
+ #
34
+ # Returns a {String}.
35
+ def to_html(flags: DEFAULT, extensions: [])
36
+ _render_html(flags, extensions).force_encoding('utf-8')
37
+ end
41
38
 
42
- alias to_markdown to_commonmark
39
+ # Public: Convert the node to a CommonMark string.
40
+ #
41
+ # options - A {Symbol} or {Array of Symbol}s indicating the render options
42
+ # width - Column to wrap the output at
43
+ #
44
+ # Returns a {String}.
45
+ def to_commonmark(flags: DEFAULT, width: 120)
46
+ _render_commonmark(flags, width).force_encoding('utf-8')
47
+ end
43
48
 
44
- # Public: Convert the node to a plain text string.
45
- #
46
- # options - A {Symbol} or {Array of Symbol}s indicating the render options
47
- # width - Column to wrap the output at
48
- #
49
- # Returns a {String}.
50
- def to_plaintext(flags: DEFAULT, width: 120)
51
- _render_plaintext(flags, width).force_encoding('utf-8')
52
- end
49
+ alias to_markdown to_commonmark
53
50
 
54
- # Public: Iterate over the children (if any) of the current pointer.
55
- def each
56
- return enum_for(:each) unless block_given?
51
+ # Public: Convert the node to a plain text string.
52
+ #
53
+ # options - A {Symbol} or {Array of Symbol}s indicating the render options
54
+ # width - Column to wrap the output at
55
+ #
56
+ # Returns a {String}.
57
+ def to_plaintext(flags: DEFAULT, width: 120)
58
+ _render_plaintext(flags, width).force_encoding('utf-8')
59
+ end
57
60
 
58
- child = first_child
59
- while child
60
- nextchild = child.next
61
- yield child
62
- child = nextchild
63
- end
64
- end
61
+ # Public: Iterate over the children (if any) of the current pointer.
62
+ def each
63
+ return enum_for(:each) unless block_given?
65
64
 
66
- # Deprecated: Please use `each` instead
67
- def each_child(&block)
68
- warn '[DEPRECATION] `each_child` is deprecated. Please use `each` instead.'
69
- each(&block)
70
- end
71
- end
65
+ child = first_child
66
+ while child
67
+ next_child = child.next
68
+ yield child
69
+ child = next_child
70
+ end
71
+ end
72
+
73
+ def find_header(title)
74
+ each do |child|
75
+ if child.type == :header && child.first_child.string_content == title
76
+ return child
77
+ end
78
+ end
79
+ end
80
+
81
+ # Delete all nodes until the block returns true.
82
+ #
83
+ # @returns [Markly::Node] the node that returned true.
84
+ def delete_until
85
+ current = self
86
+ while current
87
+ return current if yield(current)
88
+ next_node = current.next
89
+ current.delete
90
+ current = next_node
91
+ end
92
+ end
93
+
94
+ # Replace a section (header + content) with a new node.
95
+ #
96
+ # @parameter title [String] the title of the section to replace.
97
+ # @parameter new_node [Markly::Node] the node to replace the section with.
98
+ # @parameter replace_header [Boolean] whether to replace the header itself or not.
99
+ # @parameter remove_subsections [Boolean] whether to remove subsections or not.
100
+ def replace_section(new_node, replace_header: true, remove_subsections: true)
101
+ # Delete until the next heading:
102
+ self.next&.delete_until do |node|
103
+ node.type == :heading && (!remove_subsections || node.header_level <= self.header_level)
104
+ end
105
+
106
+ self.append_after(new_node) if new_node
107
+ self.delete if replace_header
108
+ end
109
+
110
+ def next_heading
111
+ current = self.next
112
+ while current
113
+ if current.type == :heading
114
+ return current
115
+ end
116
+ current = current.next
117
+ end
118
+ end
119
+
120
+ # Append the given node after the current node.
121
+ #
122
+ # It's okay to provide a document node, it's children will be appended.
123
+ #
124
+ # @parameter node [Markly::Node] the node to append.
125
+ def append_after(node)
126
+ if node.type == :document
127
+ node = node.first_child
128
+ end
129
+
130
+ current = self
131
+ while node
132
+ next_node = node.next
133
+ current.insert_after(node)
134
+ current = node
135
+ node = next_node
136
+ end
137
+ end
138
+ end
72
139
  end
@@ -0,0 +1,136 @@
1
+ # frozen_string_literal: true
2
+
3
+ # Released under the MIT License.
4
+ # Copyright, 2015-2019, by Garen Torikian.
5
+ # Copyright, 2016-2017, by Yuki Izumi.
6
+ # Copyright, 2020-2023, by Samuel Williams.
7
+
8
+ require 'set'
9
+ require 'stringio'
10
+
11
+ module Markly
12
+ module Renderer
13
+ class Generic
14
+ def initialize(flags: DEFAULT, extensions: [])
15
+ @flags = flags
16
+ @stream = StringIO.new(+'')
17
+ @need_blocksep = false
18
+ @in_tight = false
19
+ @in_plain = false
20
+ @tagfilter = extensions.include?(:tagfilter)
21
+ end
22
+
23
+ attr_accessor :in_tight
24
+ attr_accessor :in_plain
25
+
26
+ def out(*args)
27
+ args.each do |arg|
28
+ if arg == :children
29
+ @node.each { |child| out(child) }
30
+ elsif arg.is_a?(Array)
31
+ arg.each { |x| render(x) }
32
+ elsif arg.is_a?(Node)
33
+ render(arg)
34
+ else
35
+ @stream.write(arg)
36
+ end
37
+ end
38
+ end
39
+
40
+ def render(node)
41
+ @node = node
42
+ if node.type == :document
43
+ document(node)
44
+ @stream.string
45
+ elsif @in_plain && node.type != :text && node.type != :softbreak
46
+ node.each { |child| render(child) }
47
+ else
48
+ send(node.type, node)
49
+ end
50
+ end
51
+
52
+ def document(_node)
53
+ out(:children)
54
+ end
55
+
56
+ def code_block(node)
57
+ code_block(node)
58
+ end
59
+
60
+ def reference_def(_node); end
61
+
62
+ def cr
63
+ return if @stream.string.empty? || @stream.string[-1] == "\n"
64
+
65
+ out("\n")
66
+ end
67
+
68
+ def blocksep
69
+ out("\n")
70
+ end
71
+
72
+ def containersep
73
+ cr unless @in_tight
74
+ end
75
+
76
+ def block
77
+ cr
78
+ yield
79
+ cr
80
+ end
81
+
82
+ def container(starter, ender)
83
+ out(starter)
84
+ yield
85
+ out(ender)
86
+ end
87
+
88
+ def plain
89
+ old_in_plain = @in_plain
90
+ @in_plain = true
91
+ yield
92
+ @in_plain = old_in_plain
93
+ end
94
+
95
+ private
96
+
97
+ def escape_href(str)
98
+ @node.html_escape_href(str)
99
+ end
100
+
101
+ def escape_html(str)
102
+ @node.html_escape_html(str)
103
+ end
104
+
105
+ def tagfilter(str)
106
+ if @tagfilter
107
+ str.gsub(
108
+ %r{
109
+ <
110
+ (
111
+ title|textarea|style|xmp|iframe|
112
+ noembed|noframes|script|plaintext
113
+ )
114
+ (?=\s|>|/>)
115
+ }xi,
116
+ '&lt;\1'
117
+ )
118
+ else
119
+ str
120
+ end
121
+ end
122
+
123
+ def source_position(node)
124
+ return '' unless flag_enabled?(SOURCE_POSITION)
125
+
126
+ s = node.source_position
127
+ " data-sourcepos=\"#{s[:start_line]}:#{s[:start_column]}-" \
128
+ "#{s[:end_line]}:#{s[:end_column]}\""
129
+ end
130
+
131
+ def flag_enabled?(flag)
132
+ (@flags & flag) != 0
133
+ end
134
+ end
135
+ end
136
+ end
@@ -0,0 +1,301 @@
1
+ # frozen_string_literal: true
2
+
3
+ # Released under the MIT License.
4
+ # Copyright, 2015-2020, by Garen Torikian.
5
+ # Copyright, 2015, by Nick Wellnhofer.
6
+ # Copyright, 2017, by Yuki Izumi.
7
+ # Copyright, 2017-2019, by Ashe Connor.
8
+ # Copyright, 2018, by Michael Camilleri.
9
+ # Copyright, 2020-2023, by Samuel Williams.
10
+
11
+ require_relative 'generic'
12
+ require 'cgi'
13
+
14
+ module Markly
15
+ module Renderer
16
+ class HTML < Generic
17
+ def initialize(ids: false, tight: false, **options)
18
+ super(**options)
19
+
20
+ @ids = ids
21
+ @section = nil
22
+ @tight = tight
23
+
24
+ @footnotes = {}
25
+ end
26
+
27
+ def document(_)
28
+ @section = false
29
+ super
30
+ out("</ol>\n</section>\n") if @written_footnote_ix
31
+ out("</section>") if @section
32
+ end
33
+
34
+ def id_for(node)
35
+ if @ids
36
+ id = node.to_plaintext.chomp.downcase.gsub(/\s+/, '-')
37
+
38
+ return " id=\"#{CGI.escape_html id}\""
39
+ end
40
+ end
41
+
42
+ def header(node)
43
+ block do
44
+ if @ids
45
+ out('</section>') if @section
46
+ @section = true
47
+ out("<section#{id_for(node)}>")
48
+ end
49
+
50
+ out('<h', node.header_level, "#{source_position(node)}>", :children,
51
+ '</h', node.header_level, '>')
52
+ end
53
+ end
54
+
55
+ def paragraph(node)
56
+ if @tight && node.parent.type != :blockquote
57
+ out(:children)
58
+ else
59
+ block do
60
+ container("<p#{source_position(node)}>", '</p>') do
61
+ out(:children)
62
+ if node.parent.type == :footnote_definition && node.next.nil?
63
+ out(' ')
64
+ out_footnote_backref
65
+ end
66
+ end
67
+ end
68
+ end
69
+ end
70
+
71
+ def list(node)
72
+ old_tight = @tight
73
+ @tight = node.list_tight
74
+
75
+ block do
76
+ if node.list_type == :bullet_list
77
+ container("<ul#{source_position(node)}>\n", '</ul>') do
78
+ out(:children)
79
+ end
80
+ else
81
+ start = if node.list_start == 1
82
+ "<ol#{source_position(node)}>\n"
83
+ else
84
+ "<ol start=\"#{node.list_start}\"#{source_position(node)}>\n"
85
+ end
86
+ container(start, '</ol>') do
87
+ out(:children)
88
+ end
89
+ end
90
+ end
91
+
92
+ @tight = old_tight
93
+ end
94
+
95
+ def list_item(node)
96
+ block do
97
+ tasklist_data = tasklist(node)
98
+ container("<li#{source_position(node)}#{tasklist_data}>#{' ' if tasklist?(node)}", '</li>') do
99
+ out(:children)
100
+ end
101
+ end
102
+ end
103
+
104
+ def tasklist(node)
105
+ return '' unless tasklist?(node)
106
+
107
+ state = if checked?(node)
108
+ 'checked="" disabled=""'
109
+ else
110
+ 'disabled=""'
111
+ end
112
+ "><input type=\"checkbox\" #{state} /"
113
+ end
114
+
115
+ def blockquote(node)
116
+ block do
117
+ container("<blockquote#{source_position(node)}>\n", '</blockquote>') do
118
+ out(:children)
119
+ end
120
+ end
121
+ end
122
+
123
+ def hrule(node)
124
+ block do
125
+ out("<hr#{source_position(node)} />")
126
+ end
127
+ end
128
+
129
+ def code_block(node)
130
+ block do
131
+ if flag_enabled?(GITHUB_PRE_LANG)
132
+ out("<pre#{source_position(node)}")
133
+ out(' lang="', node.fence_info.split(/\s+/)[0], '"') if node.fence_info && !node.fence_info.empty?
134
+ out('><code>')
135
+ else
136
+ out("<pre#{source_position(node)}><code")
137
+ if node.fence_info && !node.fence_info.empty?
138
+ out(' class="language-', node.fence_info.split(/\s+/)[0], '">')
139
+ else
140
+ out('>')
141
+ end
142
+ end
143
+ out(escape_html(node.string_content))
144
+ out('</code></pre>')
145
+ end
146
+ end
147
+
148
+ def html(node)
149
+ block do
150
+ if flag_enabled?(UNSAFE)
151
+ out(tagfilter(node.string_content))
152
+ else
153
+ out('<!-- raw HTML omitted -->')
154
+ end
155
+ end
156
+ end
157
+
158
+ def inline_html(node)
159
+ if flag_enabled?(UNSAFE)
160
+ out(tagfilter(node.string_content))
161
+ else
162
+ out('<!-- raw HTML omitted -->')
163
+ end
164
+ end
165
+
166
+ def emph(node)
167
+ out('<em>', :children, '</em>')
168
+ end
169
+
170
+ def strong(node)
171
+ if node.parent.nil? || node.parent.type == node.type
172
+ out(:children)
173
+ else
174
+ out('<strong>', :children, '</strong>')
175
+ end
176
+ end
177
+
178
+ def link(node)
179
+ out('<a href="', node.url.nil? ? '' : escape_href(node.url), '"')
180
+ out(' title="', escape_html(node.title), '"') if node.title && !node.title.empty?
181
+ out('>', :children, '</a>')
182
+ end
183
+
184
+ def image(node)
185
+ out('<img src="', escape_href(node.url), '"')
186
+ plain do
187
+ out(' alt="', :children, '"')
188
+ end
189
+ out(' title="', escape_html(node.title), '"') if node.title && !node.title.empty?
190
+ out(' />')
191
+ end
192
+
193
+ def text(node)
194
+ out(escape_html(node.string_content))
195
+ end
196
+
197
+ def code(node)
198
+ out('<code>')
199
+ out(escape_html(node.string_content))
200
+ out('</code>')
201
+ end
202
+
203
+ def linebreak(_node)
204
+ out("<br />\n")
205
+ end
206
+
207
+ def softbreak(_)
208
+ if flag_enabled?(HARD_BREAKS)
209
+ out("<br />\n")
210
+ elsif flag_enabled?(NO_BREAKS)
211
+ out(' ')
212
+ else
213
+ out("\n")
214
+ end
215
+ end
216
+
217
+ def table(node)
218
+ @alignments = node.table_alignments
219
+ @needs_close_tbody = false
220
+ out("<table#{source_position(node)}>\n", :children)
221
+ out("</tbody>\n") if @needs_close_tbody
222
+ out("</table>\n")
223
+ end
224
+
225
+ def table_header(node)
226
+ @column_index = 0
227
+
228
+ @in_header = true
229
+ out("<thead>\n<tr#{source_position(node)}>\n", :children, "</tr>\n</thead>\n")
230
+ @in_header = false
231
+ end
232
+
233
+ def table_row(node)
234
+ @column_index = 0
235
+ if !@in_header && !@needs_close_tbody
236
+ @needs_close_tbody = true
237
+ out("<tbody>\n")
238
+ end
239
+ out("<tr#{source_position(node)}>\n", :children, "</tr>\n")
240
+ end
241
+
242
+ def table_cell(node)
243
+ align = case @alignments[@column_index]
244
+ when :left then ' align="left"'
245
+ when :right then ' align="right"'
246
+ when :center then ' align="center"'
247
+ else; ''
248
+ end
249
+ out(@in_header ? "<th#{align}#{source_position(node)}>" : "<td#{align}#{source_position(node)}>", :children, @in_header ? "</th>\n" : "</td>\n")
250
+ @column_index += 1
251
+ end
252
+
253
+ def strikethrough(_)
254
+ out('<del>', :children, '</del>')
255
+ end
256
+
257
+ def footnote_reference(node)
258
+ label = node.parent_footnote_def.string_content
259
+
260
+ out("<sup class=\"footnote-ref\"><a href=\"#fn-#{label}\" id=\"fnref-#{label}\" data-footnote-ref>#{node.string_content}</a></sup>")
261
+ # out(node.to_html)
262
+ end
263
+
264
+ def footnote_definition(node)
265
+ unless @footnote_ix
266
+ out("<section class=\"footnotes\" data-footnotes>\n<ol>\n")
267
+ @footnote_ix = 0
268
+ end
269
+
270
+ @footnote_ix += 1
271
+ label = node.string_content
272
+ @footnotes[@footnote_ix] = label
273
+
274
+ out("<li id=\"fn-#{label}\">\n", :children)
275
+ out("\n") if out_footnote_backref
276
+ out("</li>\n")
277
+ # </ol>
278
+ # </section>
279
+ end
280
+
281
+ private
282
+
283
+ def out_footnote_backref
284
+ return false if @written_footnote_ix == @footnote_ix
285
+
286
+ @written_footnote_ix = @footnote_ix
287
+
288
+ out("<a href=\"#fnref-#{@footnotes[@footnote_ix]}\" class=\"footnote-backref\" data-footnote-backref data-footnote-backref-idx=\"#{@footnote_ix}\" aria-label=\"Back to reference #{@footnote_ix}\">↩</a>")
289
+ true
290
+ end
291
+
292
+ def tasklist?(node)
293
+ node.type_string == 'tasklist'
294
+ end
295
+
296
+ def checked?(node)
297
+ node.tasklist_item_checked?
298
+ end
299
+ end
300
+ end
301
+ end
@@ -1,5 +1,11 @@
1
1
  # frozen_string_literal: true
2
2
 
3
+ # Released under the MIT License.
4
+ # Copyright, 2015-2020, by Garen Torikian.
5
+ # Copyright, 2016-2017, by Yuki Izumi.
6
+ # Copyright, 2017-2018, by Ashe Connor.
7
+ # Copyright, 2020-2023, by Samuel Williams.
8
+
3
9
  module Markly
4
- VERSION = '0.6.1'
10
+ VERSION = '0.8.0'
5
11
  end