commonmarker 0.23.10 → 2.1.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/Cargo.lock +1156 -0
- data/Cargo.toml +7 -0
- data/README.md +237 -172
- data/ext/commonmarker/Cargo.toml +20 -0
- data/ext/commonmarker/extconf.rb +3 -6
- data/ext/commonmarker/src/lib.rs +103 -0
- data/ext/commonmarker/src/node.rs +1221 -0
- data/ext/commonmarker/src/options.rs +220 -0
- data/ext/commonmarker/src/plugins/syntax_highlighting.rs +166 -0
- data/ext/commonmarker/src/plugins.rs +6 -0
- data/ext/commonmarker/src/utils.rs +8 -0
- data/lib/commonmarker/config.rb +92 -40
- data/lib/commonmarker/constants.rb +7 -0
- data/lib/commonmarker/extension.rb +14 -0
- data/lib/commonmarker/node/ast.rb +8 -0
- data/lib/commonmarker/node/inspect.rb +14 -4
- data/lib/commonmarker/node.rb +29 -47
- data/lib/commonmarker/renderer.rb +1 -127
- data/lib/commonmarker/utils.rb +22 -0
- data/lib/commonmarker/version.rb +2 -2
- data/lib/commonmarker.rb +27 -25
- metadata +38 -191
- data/Rakefile +0 -109
- data/bin/commonmarker +0 -118
- data/commonmarker.gemspec +0 -38
- data/ext/commonmarker/arena.c +0 -104
- data/ext/commonmarker/autolink.c +0 -508
- data/ext/commonmarker/autolink.h +0 -8
- data/ext/commonmarker/blocks.c +0 -1622
- data/ext/commonmarker/buffer.c +0 -278
- data/ext/commonmarker/buffer.h +0 -116
- data/ext/commonmarker/case_fold_switch.inc +0 -4327
- data/ext/commonmarker/chunk.h +0 -135
- data/ext/commonmarker/cmark-gfm-core-extensions.h +0 -54
- data/ext/commonmarker/cmark-gfm-extension_api.h +0 -737
- data/ext/commonmarker/cmark-gfm-extensions_export.h +0 -42
- data/ext/commonmarker/cmark-gfm.h +0 -833
- data/ext/commonmarker/cmark-gfm_export.h +0 -42
- data/ext/commonmarker/cmark-gfm_version.h +0 -7
- data/ext/commonmarker/cmark.c +0 -55
- data/ext/commonmarker/cmark_ctype.c +0 -44
- data/ext/commonmarker/cmark_ctype.h +0 -33
- data/ext/commonmarker/commonmark.c +0 -514
- data/ext/commonmarker/commonmarker.c +0 -1308
- data/ext/commonmarker/commonmarker.h +0 -16
- data/ext/commonmarker/config.h +0 -76
- data/ext/commonmarker/core-extensions.c +0 -27
- data/ext/commonmarker/entities.inc +0 -2138
- data/ext/commonmarker/ext_scanners.c +0 -879
- data/ext/commonmarker/ext_scanners.h +0 -24
- data/ext/commonmarker/footnotes.c +0 -63
- data/ext/commonmarker/footnotes.h +0 -27
- data/ext/commonmarker/houdini.h +0 -57
- data/ext/commonmarker/houdini_href_e.c +0 -100
- data/ext/commonmarker/houdini_html_e.c +0 -66
- data/ext/commonmarker/houdini_html_u.c +0 -149
- data/ext/commonmarker/html.c +0 -502
- data/ext/commonmarker/html.h +0 -27
- data/ext/commonmarker/inlines.c +0 -1788
- data/ext/commonmarker/inlines.h +0 -29
- data/ext/commonmarker/iterator.c +0 -159
- data/ext/commonmarker/iterator.h +0 -26
- data/ext/commonmarker/latex.c +0 -468
- data/ext/commonmarker/linked_list.c +0 -37
- data/ext/commonmarker/man.c +0 -274
- data/ext/commonmarker/map.c +0 -129
- data/ext/commonmarker/map.h +0 -44
- data/ext/commonmarker/node.c +0 -1045
- data/ext/commonmarker/node.h +0 -167
- data/ext/commonmarker/parser.h +0 -59
- data/ext/commonmarker/plaintext.c +0 -218
- data/ext/commonmarker/plugin.c +0 -36
- data/ext/commonmarker/plugin.h +0 -34
- data/ext/commonmarker/references.c +0 -43
- data/ext/commonmarker/references.h +0 -26
- data/ext/commonmarker/registry.c +0 -63
- data/ext/commonmarker/registry.h +0 -24
- data/ext/commonmarker/render.c +0 -213
- data/ext/commonmarker/render.h +0 -62
- data/ext/commonmarker/scanners.c +0 -14056
- data/ext/commonmarker/scanners.h +0 -70
- data/ext/commonmarker/scanners.re +0 -341
- data/ext/commonmarker/strikethrough.c +0 -167
- data/ext/commonmarker/strikethrough.h +0 -9
- data/ext/commonmarker/syntax_extension.c +0 -149
- data/ext/commonmarker/syntax_extension.h +0 -34
- data/ext/commonmarker/table.c +0 -917
- data/ext/commonmarker/table.h +0 -12
- data/ext/commonmarker/tagfilter.c +0 -60
- data/ext/commonmarker/tagfilter.h +0 -8
- data/ext/commonmarker/tasklist.c +0 -156
- data/ext/commonmarker/tasklist.h +0 -8
- data/ext/commonmarker/utf8.c +0 -317
- data/ext/commonmarker/utf8.h +0 -35
- data/ext/commonmarker/xml.c +0 -182
- data/lib/commonmarker/renderer/html_renderer.rb +0 -256
data/Cargo.toml
ADDED
data/README.md
CHANGED
@@ -1,11 +1,13 @@
|
|
1
|
-
#
|
1
|
+
# Commonmarker
|
2
2
|
|
3
|
-
|
3
|
+
Ruby wrapper for Rust's [comrak](https://github.com/kivikakk/comrak) crate.
|
4
4
|
|
5
|
-
|
6
|
-
GitHub's fork of the reference parser for CommonMark. It passes all of the C tests, and is therefore spec-complete. It also includes extensions to the CommonMark spec as documented in the [GitHub Flavored Markdown spec](http://github.github.com/gfm/), such as support for tables, strikethroughs, and autolinking.
|
5
|
+
It passes all of the CommonMark test suite, and is therefore spec-complete. It also includes extensions to the CommonMark spec as documented in the [GitHub Flavored Markdown spec](http://github.github.com/gfm/), such as support for tables, strikethroughs, and autolinking.
|
7
6
|
|
8
|
-
|
7
|
+
> [!NOTE]
|
8
|
+
> By default, several extensions not in any spec have been enabled, for the sake of end user convenience when generating HTML.
|
9
|
+
>
|
10
|
+
> For more information on the available options and extensions, see [the documentation below](#options-and-plugins).
|
9
11
|
|
10
12
|
## Installation
|
11
13
|
|
@@ -23,47 +25,79 @@ Or install it yourself as:
|
|
23
25
|
|
24
26
|
## Usage
|
25
27
|
|
28
|
+
This gem expects to receive UTF-8 strings. Ensure your strings are the right encoding before passing them into `Commonmarker`.
|
29
|
+
|
26
30
|
### Converting to HTML
|
27
31
|
|
28
|
-
Call `
|
32
|
+
Call `to_html` on a string to convert it to HTML:
|
29
33
|
|
30
|
-
```
|
34
|
+
```ruby
|
31
35
|
require 'commonmarker'
|
32
|
-
|
33
|
-
|
36
|
+
Commonmarker.to_html('"Hi *there*"', options: {
|
37
|
+
parse: { smart: true }
|
38
|
+
})
|
39
|
+
# => <p>“Hi <em>there</em>”</p>\n
|
34
40
|
```
|
35
41
|
|
36
|
-
The second argument is optional--[see below](#options) for more information.
|
42
|
+
(The second argument is optional--[see below](#options-and-plugins) for more information.)
|
37
43
|
|
38
44
|
### Generating a document
|
39
45
|
|
40
|
-
You can also parse a string to receive a `
|
46
|
+
You can also parse a string to receive a `:document` node. You can then print that node to HTML, iterate over the children, and do other fun node stuff. For example:
|
41
47
|
|
42
|
-
```
|
48
|
+
```ruby
|
43
49
|
require 'commonmarker'
|
44
50
|
|
45
|
-
doc =
|
46
|
-
|
51
|
+
doc = Commonmarker.parse("*Hello* world", options: {
|
52
|
+
parse: { smart: true }
|
53
|
+
})
|
54
|
+
puts(doc.to_html) # => <p><em>Hello</em> world</p>\n
|
47
55
|
|
48
56
|
doc.walk do |node|
|
49
|
-
puts node.type # [:document, :paragraph, :
|
57
|
+
puts node.type # => [:document, :paragraph, :emph, :text, :text]
|
50
58
|
end
|
51
59
|
```
|
52
60
|
|
53
|
-
The second argument is optional--[see below](#options) for more information.
|
61
|
+
(The second argument is optional--[see below](#options-and-plugins) for more information.)
|
62
|
+
|
63
|
+
When it comes to modifying the document, you can perform the following operations:
|
64
|
+
|
65
|
+
- `insert_before`
|
66
|
+
- `insert_after`
|
67
|
+
- `prepend_child`
|
68
|
+
- `append_child`
|
69
|
+
- `delete`
|
70
|
+
|
71
|
+
You can also get the source position of a node by calling `source_position`:
|
72
|
+
|
73
|
+
```ruby
|
74
|
+
doc = Commonmarker.parse("*Hello* world")
|
75
|
+
puts doc.first_child.first_child.source_position
|
76
|
+
# => {:start_line=>1, :start_column=>1, :end_line=>1, :end_column=>7}
|
77
|
+
```
|
78
|
+
|
79
|
+
You can also modify the following attributes:
|
80
|
+
|
81
|
+
- `url`
|
82
|
+
- `title`
|
83
|
+
- `header_level`
|
84
|
+
- `list_type`
|
85
|
+
- `list_start`
|
86
|
+
- `list_tight`
|
87
|
+
- `fence_info`
|
54
88
|
|
55
|
-
#### Example:
|
89
|
+
#### Example: Walking the AST
|
56
90
|
|
57
91
|
You can use `walk` or `each` to iterate over nodes:
|
58
92
|
|
59
93
|
- `walk` will iterate on a node and recursively iterate on a node's children.
|
60
|
-
- `each` will iterate on a node
|
94
|
+
- `each` will iterate on a node's direct children, but no further.
|
61
95
|
|
62
|
-
```
|
96
|
+
```ruby
|
63
97
|
require 'commonmarker'
|
64
98
|
|
65
|
-
# parse
|
66
|
-
doc =
|
99
|
+
# parse some string
|
100
|
+
doc = Commonmarker.parse("# The site\n\n [GitHub](https://www.github.com)")
|
67
101
|
|
68
102
|
# Walk tree and print out URLs for links
|
69
103
|
doc.walk do |node|
|
@@ -71,17 +105,7 @@ doc.walk do |node|
|
|
71
105
|
printf("URL = %s\n", node.url)
|
72
106
|
end
|
73
107
|
end
|
74
|
-
|
75
|
-
# Capitalize all regular text in headers
|
76
|
-
doc.walk do |node|
|
77
|
-
if node.type == :header
|
78
|
-
node.each do |subnode|
|
79
|
-
if subnode.type == :text
|
80
|
-
subnode.string_content = subnode.string_content.upcase
|
81
|
-
end
|
82
|
-
end
|
83
|
-
end
|
84
|
-
end
|
108
|
+
# => URL = https://www.github.com
|
85
109
|
|
86
110
|
# Transform links to regular text
|
87
111
|
doc.walk do |node|
|
@@ -90,169 +114,199 @@ doc.walk do |node|
|
|
90
114
|
node.delete
|
91
115
|
end
|
92
116
|
end
|
117
|
+
# => <h1><a href=\"#the-site\"></a>The site</h1>\n<p>GitHub</p>\n
|
93
118
|
```
|
94
119
|
|
95
|
-
|
120
|
+
#### Example: Converting a document back into raw CommonMark
|
96
121
|
|
97
|
-
You can
|
122
|
+
You can use `to_commonmark` on a node to render it as raw text:
|
98
123
|
|
99
|
-
```
|
100
|
-
|
101
|
-
|
102
|
-
|
103
|
-
|
104
|
-
end
|
124
|
+
```ruby
|
125
|
+
require 'commonmarker'
|
126
|
+
|
127
|
+
# parse some string
|
128
|
+
doc = Commonmarker.parse("# The site\n\n [GitHub](https://www.github.com)")
|
105
129
|
|
106
|
-
|
107
|
-
|
108
|
-
|
109
|
-
|
110
|
-
|
111
|
-
end
|
130
|
+
# Transform links to regular text
|
131
|
+
doc.walk do |node|
|
132
|
+
if node.type == :link
|
133
|
+
node.insert_before(node.first_child)
|
134
|
+
node.delete
|
112
135
|
end
|
113
136
|
end
|
114
137
|
|
115
|
-
|
116
|
-
|
117
|
-
|
118
|
-
# Print any warnings to STDERR
|
119
|
-
renderer.warnings.each do |w|
|
120
|
-
STDERR.write("#{w}\n")
|
121
|
-
end
|
138
|
+
doc.to_commonmark
|
139
|
+
# => # The site\n\nGitHub\n
|
122
140
|
```
|
123
141
|
|
124
|
-
## Options
|
142
|
+
## Options and plugins
|
125
143
|
|
126
|
-
|
144
|
+
### Options
|
127
145
|
|
128
|
-
|
129
|
-
|
130
|
-
| Name | Description
|
131
|
-
| ----------------------------- | -----------
|
132
|
-
| `:DEFAULT` | The default parsing system.
|
133
|
-
| `:SOURCEPOS` | Include source position in nodes
|
134
|
-
| `:UNSAFE` | Allow raw/custom HTML and unsafe links.
|
135
|
-
| `:VALIDATE_UTF8` | Replace illegal sequences with the replacement character `U+FFFD`.
|
136
|
-
| `:SMART` | Use smart punctuation (curly quotes, etc.).
|
137
|
-
| `:LIBERAL_HTML_TAG` | Support liberal parsing of inline HTML tags.
|
138
|
-
| `:FOOTNOTES` | Parse footnotes.
|
139
|
-
| `:STRIKETHROUGH_DOUBLE_TILDE` | Parse strikethroughs by double tildes (compatibility with [redcarpet](https://github.com/vmg/redcarpet))
|
140
|
-
|
141
|
-
### Render options
|
146
|
+
Commonmarker accepts the same parse, render, and extensions options that comrak does, as a hash dictionary with symbol keys:
|
142
147
|
|
143
|
-
|
144
|
-
|
145
|
-
|
146
|
-
|
147
|
-
|
148
|
-
| `:UNSAFE` | Allow raw/custom HTML and unsafe links. |
|
149
|
-
| `:NOBREAKS` | Translate `\n` in the source to a single whitespace. |
|
150
|
-
| `:VALIDATE_UTF8` | Replace illegal sequences with the replacement character `U+FFFD`. |
|
151
|
-
| `:SMART` | Use smart punctuation (curly quotes, etc.). |
|
152
|
-
| `:GITHUB_PRE_LANG` | Use GitHub-style `<pre lang>` for fenced code blocks. |
|
153
|
-
| `:LIBERAL_HTML_TAG` | Support liberal parsing of inline HTML tags. |
|
154
|
-
| `:FOOTNOTES` | Render footnotes. |
|
155
|
-
| `:STRIKETHROUGH_DOUBLE_TILDE` | Parse strikethroughs by double tildes (compatibility with [redcarpet](https://github.com/vmg/redcarpet)) |
|
156
|
-
| `:TABLE_PREFER_STYLE_ATTRIBUTES` | Use `style` insted of `align` for table cells. |
|
157
|
-
| `:FULL_INFO_STRING` | Include full info strings of code blocks in separate attribute. |
|
158
|
-
|
159
|
-
### Passing options
|
160
|
-
|
161
|
-
To apply a single option, pass it in as a symbol argument:
|
162
|
-
|
163
|
-
``` ruby
|
164
|
-
CommonMarker.render_doc("\"Hello,\" said the spider.", :SMART)
|
165
|
-
# <p>“Hello,” said the spider.</p>\n
|
148
|
+
```ruby
|
149
|
+
Commonmarker.to_html('"Hi *there*"', options:{
|
150
|
+
parse: { smart: true },
|
151
|
+
render: { hardbreaks: false}
|
152
|
+
})
|
166
153
|
```
|
167
154
|
|
168
|
-
|
155
|
+
Note that there is a distinction in comrak for "parse" options and "render" options, which are represented in the tables below. As well, if you wish to disable any-non boolean option, pass in `nil`.
|
169
156
|
|
170
|
-
|
171
|
-
CommonMarker.render_html("\"'Shelob' is my name.\"", [:HARDBREAKS, :SOURCEPOS])
|
172
|
-
```
|
157
|
+
### Parse options
|
173
158
|
|
174
|
-
|
159
|
+
| Name | Description | Default |
|
160
|
+
| --------------------------- | ------------------------------------------------------------------------------------------------------------------------------------------- | ------- |
|
161
|
+
| `smart` | Punctuation (quotes, full-stops and hyphens) are converted into 'smart' punctuation. | `false` |
|
162
|
+
| `default_info_string` | The default info string for fenced code blocks. | `""` |
|
163
|
+
| `relaxed_tasklist_matching` | Enables relaxing of the tasklist extension matching, allowing any non-space to be used for the "checked" state instead of only `x` and `X`. | `false` |
|
164
|
+
| `relaxed_autolinks` | Enable relaxing of the autolink extension parsing, allowing links to be recognized when in brackets, as well as permitting any url scheme. | `false` |
|
175
165
|
|
176
|
-
|
166
|
+
### Render options
|
177
167
|
|
178
|
-
|
168
|
+
| Name | Description | Default |
|
169
|
+
| -------------------- | ------------------------------------------------------------------------------------------------------ | ------- |
|
170
|
+
| `hardbreaks` | [Soft line breaks](http://spec.commonmark.org/0.27/#soft-line-breaks) translate into hard line breaks. | `true` |
|
171
|
+
| `github_pre_lang` | GitHub-style `<pre lang="xyz">` is used for fenced code blocks with info tags. | `true` |
|
172
|
+
| `full_info_string` | Gives info string data after a space in a `data-meta` attribute on code blocks. | `false` |
|
173
|
+
| `width` | The wrap column when outputting CommonMark. | `80` |
|
174
|
+
| `unsafe` | Allow rendering of raw HTML and potentially dangerous links. | `false` |
|
175
|
+
| `escape` | Escape raw HTML instead of clobbering it. | `false` |
|
176
|
+
| `sourcepos` | Include source position attribute in HTML and XML output. | `false` |
|
177
|
+
| `escaped_char_spans` | Wrap escaped characters in span tags. | `true` |
|
178
|
+
| `ignore_setext` | Ignores setext-style headings. | `false` |
|
179
|
+
| `ignore_empty_links` | Ignores empty links, leaving the Markdown text in place. | `false` |
|
180
|
+
| `gfm_quirks` | Outputs HTML with GFM-style quirks; namely, not nesting `<strong>` inlines. | `false` |
|
181
|
+
| `prefer_fenced` | Always output fenced code blocks, even where an indented one could be used. | `false` |
|
182
|
+
|
183
|
+
As well, there are several extensions which you can toggle in the same manner:
|
179
184
|
|
180
|
-
|
185
|
+
```ruby
|
186
|
+
Commonmarker.to_html('"Hi *there*"', options: {
|
187
|
+
extension: { footnotes: true, description_lists: true },
|
188
|
+
render: { hardbreaks: false }
|
189
|
+
})
|
190
|
+
```
|
181
191
|
|
182
|
-
|
183
|
-
|
184
|
-
|
185
|
-
|
186
|
-
|
192
|
+
### Extension options
|
193
|
+
|
194
|
+
| Name | Description | Default |
|
195
|
+
| ----------------------------- | ------------------------------------------------------------------------------------------------------------------- | ------- |
|
196
|
+
| `strikethrough` | Enables the [strikethrough extension](https://github.github.com/gfm/#strikethrough-extension-) from the GFM spec. | `true` |
|
197
|
+
| `tagfilter` | Enables the [tagfilter extension](https://github.github.com/gfm/#disallowed-raw-html-extension-) from the GFM spec. | `true` |
|
198
|
+
| `table` | Enables the [table extension](https://github.github.com/gfm/#tables-extension-) from the GFM spec. | `true` |
|
199
|
+
| `autolink` | Enables the [autolink extension](https://github.github.com/gfm/#autolinks-extension-) from the GFM spec. | `true` |
|
200
|
+
| `tasklist` | Enables the [task list extension](https://github.github.com/gfm/#task-list-items-extension-) from the GFM spec. | `true` |
|
201
|
+
| `superscript` | Enables the superscript Comrak extension. | `false` |
|
202
|
+
| `header_ids` | Enables the header IDs Comrak extension. from the GFM spec. | `""` |
|
203
|
+
| `footnotes` | Enables the footnotes extension per `cmark-gfm`. | `false` |
|
204
|
+
| `description_lists` | Enables the description lists extension. | `false` |
|
205
|
+
| `front_matter_delimiter` | Enables the front matter extension. | `""` |
|
206
|
+
| `multiline_block_quotes` | Enables the multiline block quotes extension. | `false` |
|
207
|
+
| `math_dollars`, `math_code` | Enables the math extension. | `false` |
|
208
|
+
| `shortcodes` | Enables the shortcodes extension. | `true` |
|
209
|
+
| `wikilinks_title_before_pipe` | Enables the wikilinks extension, placing the title before the dividing pipe. | `false` |
|
210
|
+
| `wikilinks_title_after_pipe` | Enables the shortcodes extension, placing the title after the dividing pipe. | `false` |
|
211
|
+
| `underline` | Enables the underline extension. | `false` |
|
212
|
+
| `spoiler` | Enables the spoiler extension. | `false` |
|
213
|
+
| `greentext` | Enables the greentext extension. | `false` |
|
214
|
+
| `subscript` | Enables the subscript extension. | `false` |
|
215
|
+
| `alerts` | Enables the alerts extension. | `false` |
|
216
|
+
|
217
|
+
For more information on these options, see [the comrak documentation](https://github.com/kivikakk/comrak#usage).
|
218
|
+
|
219
|
+
### Plugins
|
220
|
+
|
221
|
+
In addition to the possibilities provided by generic CommonMark rendering, Commonmarker also supports plugins as a means of
|
222
|
+
providing further niceties.
|
223
|
+
|
224
|
+
#### Syntax Highlighter Plugin
|
225
|
+
|
226
|
+
The library comes with [a set of pre-existing themes](https://docs.rs/syntect/5.0.0/syntect/highlighting/struct.ThemeSet.html#implementations) for highlighting code:
|
227
|
+
|
228
|
+
- `"base16-ocean.dark"`
|
229
|
+
- `"base16-eighties.dark"`
|
230
|
+
- `"base16-mocha.dark"`
|
231
|
+
- `"base16-ocean.light"`
|
232
|
+
- `"InspiredGitHub"`
|
233
|
+
- `"Solarized (dark)"`
|
234
|
+
- `"Solarized (light)"`
|
235
|
+
|
236
|
+
````ruby
|
237
|
+
code = <<~CODE
|
238
|
+
```ruby
|
239
|
+
def hello
|
240
|
+
puts "hello"
|
241
|
+
end
|
242
|
+
```
|
243
|
+
CODE
|
187
244
|
|
188
|
-
|
245
|
+
# pass in a theme name from a pre-existing set
|
246
|
+
puts Commonmarker.to_html(code, plugins: { syntax_highlighter: { theme: "InspiredGitHub" } })
|
189
247
|
|
190
|
-
|
248
|
+
# <pre style="background-color:#ffffff;" lang="ruby"><code>
|
249
|
+
# <span style="font-weight:bold;color:#a71d5d;">def </span><span style="font-weight:bold;color:#795da3;">hello
|
250
|
+
# </span><span style="color:#62a35c;">puts </span><span style="color:#183691;">"hello"
|
251
|
+
# </span><span style="font-weight:bold;color:#a71d5d;">end
|
252
|
+
# </span>
|
253
|
+
# </code></pre>
|
254
|
+
````
|
191
255
|
|
192
|
-
|
256
|
+
By default, the plugin uses the `"base16-ocean.dark"` theme to syntax highlight code.
|
193
257
|
|
194
|
-
|
258
|
+
To disable this plugin, set the value to `nil`:
|
195
259
|
|
196
|
-
|
197
|
-
|
198
|
-
|
260
|
+
````ruby
|
261
|
+
code = <<~CODE
|
262
|
+
```ruby
|
263
|
+
def hello
|
264
|
+
puts "hello"
|
265
|
+
end
|
266
|
+
```
|
267
|
+
CODE
|
199
268
|
|
200
|
-
|
201
|
-
```
|
269
|
+
Commonmarker.to_html(code, plugins: { syntax_highlighter: nil })
|
202
270
|
|
203
|
-
|
271
|
+
# <pre lang="ruby"><code>def hello
|
272
|
+
# puts "hello"
|
273
|
+
# end
|
274
|
+
# </code></pre>
|
275
|
+
````
|
204
276
|
|
205
|
-
|
277
|
+
To output CSS classes instead of `style` attributes, set the `theme` key to `""`:
|
206
278
|
|
207
|
-
|
208
|
-
|
209
|
-
|
210
|
-
|
211
|
-
|
212
|
-
|
213
|
-
|
214
|
-
<paragraph>
|
215
|
-
<emph>
|
216
|
-
<text xml:space="preserve">Hello</text>
|
217
|
-
</emph>
|
218
|
-
<text xml:space="preserve"> world!</text>
|
219
|
-
</paragraph>
|
220
|
-
</document>
|
221
|
-
```
|
279
|
+
````ruby
|
280
|
+
code = <<~CODE
|
281
|
+
```ruby
|
282
|
+
def hello
|
283
|
+
puts "hello"
|
284
|
+
end
|
285
|
+
CODE
|
222
286
|
|
223
|
-
|
287
|
+
Commonmarker.to_html(code, plugins: { syntax_highlighter: { theme: "" } })
|
224
288
|
|
225
|
-
|
289
|
+
# <pre class="syntax-highlighting"><code><span class="source ruby"><span class="meta function ruby"><span class="keyword control def ruby">def</span></span><span class="meta function ruby"> # <span class="entity name function ruby">hello</span></span>
|
290
|
+
# <span class="support function builtin ruby">puts</span> <span class="string quoted double ruby"><span class="punctuation definition string begin ruby">"</span>hello<span class="punctuation definition string end ruby">"</span></span>
|
291
|
+
# <span class="keyword control ruby">end</span>\n</span></code></pre>
|
292
|
+
````
|
226
293
|
|
227
|
-
|
228
|
-
doc = CommonMarker.render_doc('*Hello* world!', :DEFAULT)
|
229
|
-
puts(doc.to_plaintext)
|
294
|
+
To use a custom theme, you can provide a `path` to a directory containing `.tmtheme` files to load:
|
230
295
|
|
231
|
-
|
296
|
+
```ruby
|
297
|
+
Commonmarker.to_html(code, plugins: { syntax_highlighter: { theme: "Monokai", path: "./themes" } })
|
232
298
|
```
|
233
299
|
|
234
|
-
|
235
|
-
|
236
|
-
Commonmark will be generated when calling `to_commonmark` or using `--to=commonmark` on the command line.
|
237
|
-
|
238
|
-
``` ruby
|
239
|
-
text = <<-TEXT
|
240
|
-
1. I am a numeric list.
|
241
|
-
2. I continue the list.
|
242
|
-
* Suddenly, an unordered list!
|
243
|
-
* What fun!
|
244
|
-
TEXT
|
300
|
+
## Output formats
|
245
301
|
|
246
|
-
|
247
|
-
puts(doc.to_commonmark)
|
302
|
+
Commonmarker can currently only generate output in one format: HTML.
|
248
303
|
|
249
|
-
|
250
|
-
2. I continue the list.
|
304
|
+
### HTML
|
251
305
|
|
252
|
-
|
306
|
+
```ruby
|
307
|
+
puts Commonmarker.to_html('*Hello* world!')
|
253
308
|
|
254
|
-
|
255
|
-
- What fun\!
|
309
|
+
# <p><em>Hello</em> world!</p>
|
256
310
|
```
|
257
311
|
|
258
312
|
## Developing locally
|
@@ -264,25 +318,36 @@ script/bootstrap
|
|
264
318
|
bundle exec rake compile
|
265
319
|
```
|
266
320
|
|
267
|
-
If there were no errors, you're done! Otherwise, make sure to follow the
|
321
|
+
If there were no errors, you're done! Otherwise, make sure to follow the comrak dependency instructions.
|
268
322
|
|
269
323
|
## Benchmarks
|
270
324
|
|
271
|
-
Some rough benchmarks:
|
272
|
-
|
273
325
|
```
|
274
|
-
|
275
|
-
|
276
|
-
|
277
|
-
|
278
|
-
|
279
|
-
|
280
|
-
|
281
|
-
|
282
|
-
|
283
|
-
|
284
|
-
|
285
|
-
|
286
|
-
|
287
|
-
|
326
|
+
❯ bundle exec rake benchmark
|
327
|
+
input size = 11064832 bytes
|
328
|
+
|
329
|
+
ruby 3.3.0 (2023-12-25 revision 5124f9ac75) [arm64-darwin23]
|
330
|
+
Warming up --------------------------------------
|
331
|
+
Markly.render_html 1.000 i/100ms
|
332
|
+
Markly::Node#to_html 1.000 i/100ms
|
333
|
+
Commonmarker.to_html 1.000 i/100ms
|
334
|
+
Commonmarker::Node.to_html
|
335
|
+
1.000 i/100ms
|
336
|
+
Kramdown::Document#to_html
|
337
|
+
1.000 i/100ms
|
338
|
+
Calculating -------------------------------------
|
339
|
+
Markly.render_html 15.606 (±25.6%) i/s - 71.000 in 5.047132s
|
340
|
+
Markly::Node#to_html 15.692 (±25.5%) i/s - 72.000 in 5.095810s
|
341
|
+
Commonmarker.to_html 4.482 (± 0.0%) i/s - 23.000 in 5.137680s
|
342
|
+
Commonmarker::Node.to_html
|
343
|
+
5.092 (±19.6%) i/s - 25.000 in 5.072220s
|
344
|
+
Kramdown::Document#to_html
|
345
|
+
0.379 (± 0.0%) i/s - 2.000 in 5.277770s
|
346
|
+
|
347
|
+
Comparison:
|
348
|
+
Markly::Node#to_html: 15.7 i/s
|
349
|
+
Markly.render_html: 15.6 i/s - same-ish: difference falls within error
|
350
|
+
Commonmarker::Node.to_html: 5.1 i/s - 3.08x slower
|
351
|
+
Commonmarker.to_html: 4.5 i/s - 3.50x slower
|
352
|
+
Kramdown::Document#to_html: 0.4 i/s - 41.40x slower
|
288
353
|
```
|
@@ -0,0 +1,20 @@
|
|
1
|
+
[package]
|
2
|
+
name = "commonmarker"
|
3
|
+
version = "1.0.0"
|
4
|
+
edition = "2021"
|
5
|
+
rust-version = "1.75.0"
|
6
|
+
publish = false
|
7
|
+
|
8
|
+
[dependencies]
|
9
|
+
magnus = { version = "0.7", features = ["rb-sys"] }
|
10
|
+
rb-sys = { version = "*", default-features = false, features = [
|
11
|
+
"stable-api-compiled-fallback",
|
12
|
+
] }
|
13
|
+
comrak = { version = "0.35", features = ["shortcodes"] }
|
14
|
+
syntect = { version = "5.2", features = ["plist-load"] }
|
15
|
+
typed-arena = "2.0"
|
16
|
+
rctree = "0.6"
|
17
|
+
|
18
|
+
[lib]
|
19
|
+
name = "commonmarker"
|
20
|
+
crate-type = ["cdylib"]
|
data/ext/commonmarker/extconf.rb
CHANGED
@@ -0,0 +1,103 @@
|
|
1
|
+
extern crate core;
|
2
|
+
|
3
|
+
use comrak::{markdown_to_html_with_plugins, parse_document, ComrakOptions};
|
4
|
+
use magnus::{define_module, function, r_hash::ForEach, scan_args, Error, RHash, Symbol, Value};
|
5
|
+
use node::CommonmarkerNode;
|
6
|
+
use plugins::syntax_highlighting::construct_syntax_highlighter_from_plugin;
|
7
|
+
|
8
|
+
mod options;
|
9
|
+
use options::iterate_options_hash;
|
10
|
+
|
11
|
+
mod plugins;
|
12
|
+
|
13
|
+
use typed_arena::Arena;
|
14
|
+
|
15
|
+
mod node;
|
16
|
+
mod utils;
|
17
|
+
|
18
|
+
pub const EMPTY_STR: &str = "";
|
19
|
+
|
20
|
+
fn commonmark_parse(args: &[Value]) -> Result<CommonmarkerNode, magnus::Error> {
|
21
|
+
let args = scan_args::scan_args::<_, (), (), (), _, ()>(args)?;
|
22
|
+
let (rb_commonmark,): (String,) = args.required;
|
23
|
+
|
24
|
+
let kwargs =
|
25
|
+
scan_args::get_kwargs::<_, (), (Option<RHash>,), ()>(args.keywords, &[], &["options"])?;
|
26
|
+
let (rb_options,) = kwargs.optional;
|
27
|
+
|
28
|
+
let mut comrak_options = ComrakOptions::default();
|
29
|
+
|
30
|
+
if let Some(rb_options) = rb_options {
|
31
|
+
rb_options.foreach(|key: Symbol, value: RHash| {
|
32
|
+
iterate_options_hash(&mut comrak_options, key, value)?;
|
33
|
+
Ok(ForEach::Continue)
|
34
|
+
})?;
|
35
|
+
}
|
36
|
+
|
37
|
+
let arena = Arena::new();
|
38
|
+
let root = parse_document(&arena, &rb_commonmark, &comrak_options);
|
39
|
+
|
40
|
+
CommonmarkerNode::new_from_comrak_node(root)
|
41
|
+
}
|
42
|
+
|
43
|
+
fn commonmark_to_html(args: &[Value]) -> Result<String, magnus::Error> {
|
44
|
+
let args = scan_args::scan_args::<_, (), (), (), _, ()>(args)?;
|
45
|
+
let (rb_commonmark,): (String,) = args.required;
|
46
|
+
|
47
|
+
let kwargs = scan_args::get_kwargs::<_, (), (Option<RHash>, Option<RHash>), ()>(
|
48
|
+
args.keywords,
|
49
|
+
&[],
|
50
|
+
&["options", "plugins"],
|
51
|
+
)?;
|
52
|
+
let (rb_options, rb_plugins) = kwargs.optional;
|
53
|
+
|
54
|
+
let comrak_options = match format_options(rb_options) {
|
55
|
+
Ok(options) => options,
|
56
|
+
Err(err) => return Err(err),
|
57
|
+
};
|
58
|
+
|
59
|
+
let mut comrak_plugins = comrak::Plugins::default();
|
60
|
+
|
61
|
+
let syntect_adapter = match construct_syntax_highlighter_from_plugin(rb_plugins) {
|
62
|
+
Ok(Some(adapter)) => Some(adapter),
|
63
|
+
Ok(None) => None,
|
64
|
+
Err(err) => return Err(err),
|
65
|
+
};
|
66
|
+
|
67
|
+
match syntect_adapter {
|
68
|
+
Some(ref adapter) => comrak_plugins.render.codefence_syntax_highlighter = Some(adapter),
|
69
|
+
None => comrak_plugins.render.codefence_syntax_highlighter = None,
|
70
|
+
}
|
71
|
+
|
72
|
+
Ok(markdown_to_html_with_plugins(
|
73
|
+
&rb_commonmark,
|
74
|
+
&comrak_options,
|
75
|
+
&comrak_plugins,
|
76
|
+
))
|
77
|
+
}
|
78
|
+
|
79
|
+
fn format_options<'c>(rb_options: Option<RHash>) -> Result<comrak::Options<'c>, magnus::Error> {
|
80
|
+
let mut comrak_options = ComrakOptions::default();
|
81
|
+
|
82
|
+
if let Some(rb_options) = rb_options {
|
83
|
+
rb_options.foreach(|key: Symbol, value: RHash| {
|
84
|
+
iterate_options_hash(&mut comrak_options, key, value)?;
|
85
|
+
Ok(ForEach::Continue)
|
86
|
+
})?;
|
87
|
+
}
|
88
|
+
|
89
|
+
Ok(comrak_options)
|
90
|
+
}
|
91
|
+
|
92
|
+
#[magnus::init]
|
93
|
+
fn init() -> Result<(), Error> {
|
94
|
+
let m_commonmarker = define_module("Commonmarker")?;
|
95
|
+
|
96
|
+
m_commonmarker.define_module_function("commonmark_parse", function!(commonmark_parse, -1))?;
|
97
|
+
m_commonmarker
|
98
|
+
.define_module_function("commonmark_to_html", function!(commonmark_to_html, -1))?;
|
99
|
+
|
100
|
+
node::init(m_commonmarker).expect("cannot define Commonmarker::Node class");
|
101
|
+
|
102
|
+
Ok(())
|
103
|
+
}
|