html-to-markdown 2.24.6 → 2.25.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (231) hide show
  1. checksums.yaml +4 -4
  2. data/Gemfile.lock +2 -2
  3. data/README.md +1 -1
  4. data/ext/html-to-markdown-rb/native/Cargo.lock +9 -32
  5. data/ext/html-to-markdown-rb/native/Cargo.toml +1 -1
  6. data/lib/html_to_markdown/version.rb +1 -1
  7. data/rust-vendor/html-to-markdown-rs/Cargo.toml +0 -1
  8. data/rust-vendor/html-to-markdown-rs/src/converter/main_helpers.rs +1 -1
  9. data/rust-vendor/html-to-markdown-rs/src/hocr/converter/hierarchy.rs +20 -5
  10. data/rust-vendor/html-to-markdown-rs/src/lib.rs +1 -0
  11. data/rust-vendor/{markup5ever_rcdom/lib.rs → html-to-markdown-rs/src/rcdom.rs} +56 -91
  12. data/rust-vendor/html-to-markdown-rs/tests/hocr_compliance_test.rs +157 -0
  13. data/rust-vendor/memmap2/.cargo-checksum.json +1 -1
  14. data/rust-vendor/memmap2/.cargo_vcs_info.json +1 -1
  15. data/rust-vendor/memmap2/CHANGELOG.md +8 -0
  16. data/rust-vendor/memmap2/Cargo.lock +1 -1
  17. data/rust-vendor/memmap2/Cargo.toml +2 -1
  18. data/rust-vendor/memmap2/Cargo.toml.orig +2 -1
  19. data/rust-vendor/memmap2/src/lib.rs +25 -1
  20. data/rust-vendor/memmap2/src/stub.rs +1 -4
  21. data/rust-vendor/memmap2/src/unix.rs +14 -1
  22. data/rust-vendor/png/.cargo-checksum.json +1 -1
  23. data/rust-vendor/png/.cargo_vcs_info.json +1 -1
  24. data/rust-vendor/png/CHANGES.md +44 -0
  25. data/rust-vendor/png/Cargo.lock +124 -171
  26. data/rust-vendor/png/Cargo.toml +1 -1
  27. data/rust-vendor/png/Cargo.toml.orig +1 -1
  28. data/rust-vendor/png/benches/expand_paletted.rs +5 -5
  29. data/rust-vendor/png/benches/unfilter.rs +3 -3
  30. data/rust-vendor/png/src/adam7.rs +17 -10
  31. data/rust-vendor/png/src/common.rs +8 -8
  32. data/rust-vendor/png/src/decoder/mod.rs +53 -20
  33. data/rust-vendor/png/src/decoder/stream.rs +263 -78
  34. data/rust-vendor/png/src/decoder/unfiltering_buffer.rs +210 -53
  35. data/rust-vendor/png/src/decoder/zlib.rs +130 -90
  36. data/rust-vendor/png/src/encoder.rs +4 -2
  37. data/rust-vendor/png/src/{filter.rs → filter/mod.rs} +100 -367
  38. data/rust-vendor/png/src/filter/optimization-notes.md +104 -0
  39. data/rust-vendor/png/src/filter/paeth.rs +398 -0
  40. data/rust-vendor/png/src/filter/simd.rs +308 -0
  41. data/rust-vendor/png/src/lib.rs +1 -0
  42. data/rust-vendor/syn/.cargo-checksum.json +1 -1
  43. data/rust-vendor/syn/.cargo_vcs_info.json +1 -1
  44. data/rust-vendor/syn/Cargo.lock +40 -41
  45. data/rust-vendor/syn/Cargo.toml +1 -1
  46. data/rust-vendor/syn/Cargo.toml.orig +1 -1
  47. data/rust-vendor/syn/src/item.rs +61 -40
  48. data/rust-vendor/syn/src/lib.rs +2 -1
  49. data/rust-vendor/syn/tests/test_item.rs +54 -0
  50. data/rust-vendor/unicode-ident/.cargo-checksum.json +1 -1
  51. data/rust-vendor/unicode-ident/.cargo_vcs_info.json +1 -1
  52. data/rust-vendor/unicode-ident/Cargo.lock +21 -21
  53. data/rust-vendor/unicode-ident/Cargo.toml +1 -1
  54. data/rust-vendor/unicode-ident/Cargo.toml.orig +1 -1
  55. data/rust-vendor/unicode-ident/src/lib.rs +1 -1
  56. data/rust-vendor/unicode-ident/src/tables.rs +87 -97
  57. data/rust-vendor/unicode-ident/tests/static_size.rs +1 -1
  58. metadata +7 -177
  59. data/rust-vendor/markup5ever_rcdom/.cargo-checksum.json +0 -1
  60. data/rust-vendor/markup5ever_rcdom/.cargo_vcs_info.json +0 -7
  61. data/rust-vendor/markup5ever_rcdom/Cargo.lock +0 -658
  62. data/rust-vendor/markup5ever_rcdom/Cargo.toml +0 -109
  63. data/rust-vendor/markup5ever_rcdom/Cargo.toml.orig +0 -42
  64. data/rust-vendor/markup5ever_rcdom/LICENSE-APACHE +0 -201
  65. data/rust-vendor/markup5ever_rcdom/LICENSE-MIT +0 -25
  66. data/rust-vendor/markup5ever_rcdom/README.md +0 -7
  67. data/rust-vendor/markup5ever_rcdom/custom-html5lib-tokenizer-tests/regression.test +0 -69
  68. data/rust-vendor/markup5ever_rcdom/data/test/ignore +0 -1
  69. data/rust-vendor/markup5ever_rcdom/examples/hello_xml.rs +0 -39
  70. data/rust-vendor/markup5ever_rcdom/examples/html2html.rs +0 -51
  71. data/rust-vendor/markup5ever_rcdom/examples/print-rcdom.rs +0 -78
  72. data/rust-vendor/markup5ever_rcdom/examples/xml_tree_printer.rs +0 -67
  73. data/rust-vendor/markup5ever_rcdom/html5lib-tests/.gitattributes +0 -2
  74. data/rust-vendor/markup5ever_rcdom/html5lib-tests/.github/workflows/downstream.yml +0 -76
  75. data/rust-vendor/markup5ever_rcdom/html5lib-tests/.github/workflows/lint.yml +0 -25
  76. data/rust-vendor/markup5ever_rcdom/html5lib-tests/.gitignore +0 -79
  77. data/rust-vendor/markup5ever_rcdom/html5lib-tests/AUTHORS.rst +0 -34
  78. data/rust-vendor/markup5ever_rcdom/html5lib-tests/LICENSE +0 -21
  79. data/rust-vendor/markup5ever_rcdom/html5lib-tests/encoding/chardet/test_big5.txt +0 -51
  80. data/rust-vendor/markup5ever_rcdom/html5lib-tests/encoding/scripted/tests1.dat +0 -5
  81. data/rust-vendor/markup5ever_rcdom/html5lib-tests/encoding/test-yahoo-jp.dat +0 -10
  82. data/rust-vendor/markup5ever_rcdom/html5lib-tests/encoding/tests1.dat +0 -388
  83. data/rust-vendor/markup5ever_rcdom/html5lib-tests/encoding/tests2.dat +0 -115
  84. data/rust-vendor/markup5ever_rcdom/html5lib-tests/lint +0 -6
  85. data/rust-vendor/markup5ever_rcdom/html5lib-tests/lint_lib/__init__.py +0 -0
  86. data/rust-vendor/markup5ever_rcdom/html5lib-tests/lint_lib/_vendor/__init__.py +0 -0
  87. data/rust-vendor/markup5ever_rcdom/html5lib-tests/lint_lib/_vendor/funcparserlib/LICENSE +0 -18
  88. data/rust-vendor/markup5ever_rcdom/html5lib-tests/lint_lib/_vendor/funcparserlib/__init__.py +0 -0
  89. data/rust-vendor/markup5ever_rcdom/html5lib-tests/lint_lib/_vendor/funcparserlib/lexer.py +0 -211
  90. data/rust-vendor/markup5ever_rcdom/html5lib-tests/lint_lib/_vendor/funcparserlib/lexer.pyi +0 -34
  91. data/rust-vendor/markup5ever_rcdom/html5lib-tests/lint_lib/_vendor/funcparserlib/parser.py +0 -872
  92. data/rust-vendor/markup5ever_rcdom/html5lib-tests/lint_lib/_vendor/funcparserlib/parser.pyi +0 -83
  93. data/rust-vendor/markup5ever_rcdom/html5lib-tests/lint_lib/_vendor/funcparserlib/py.typed +0 -0
  94. data/rust-vendor/markup5ever_rcdom/html5lib-tests/lint_lib/_vendor/funcparserlib/util.py +0 -72
  95. data/rust-vendor/markup5ever_rcdom/html5lib-tests/lint_lib/_vendor/funcparserlib/util.pyi +0 -7
  96. data/rust-vendor/markup5ever_rcdom/html5lib-tests/lint_lib/_vendor/vendor.txt +0 -1
  97. data/rust-vendor/markup5ever_rcdom/html5lib-tests/lint_lib/_vendor-patches/funcparserlib.patch +0 -24
  98. data/rust-vendor/markup5ever_rcdom/html5lib-tests/lint_lib/lint.py +0 -280
  99. data/rust-vendor/markup5ever_rcdom/html5lib-tests/lint_lib/parser.py +0 -177
  100. data/rust-vendor/markup5ever_rcdom/html5lib-tests/pyproject.toml +0 -7
  101. data/rust-vendor/markup5ever_rcdom/html5lib-tests/serializer/core.test +0 -125
  102. data/rust-vendor/markup5ever_rcdom/html5lib-tests/serializer/injectmeta.test +0 -66
  103. data/rust-vendor/markup5ever_rcdom/html5lib-tests/serializer/optionaltags.test +0 -965
  104. data/rust-vendor/markup5ever_rcdom/html5lib-tests/serializer/options.test +0 -60
  105. data/rust-vendor/markup5ever_rcdom/html5lib-tests/serializer/whitespace.test +0 -51
  106. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tokenizer/README.md +0 -107
  107. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tokenizer/contentModelFlags.test +0 -93
  108. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tokenizer/domjs.test +0 -335
  109. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tokenizer/entities.test +0 -542
  110. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tokenizer/escapeFlag.test +0 -36
  111. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tokenizer/namedEntities.test +0 -42422
  112. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tokenizer/numericEntities.test +0 -1677
  113. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tokenizer/pendingSpecChanges.test +0 -9
  114. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tokenizer/test1.test +0 -353
  115. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tokenizer/test2.test +0 -275
  116. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tokenizer/test3.test +0 -11233
  117. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tokenizer/test4.test +0 -532
  118. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tokenizer/unicodeChars.test +0 -1577
  119. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tokenizer/unicodeCharsProblematic.test +0 -41
  120. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tokenizer/xmlViolation.test +0 -20
  121. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/README.md +0 -108
  122. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/adoption01.dat +0 -354
  123. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/adoption02.dat +0 -39
  124. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/blocks.dat +0 -695
  125. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/comments01.dat +0 -217
  126. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/doctype01.dat +0 -474
  127. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/domjs-unsafe.dat +0 -0
  128. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/entities01.dat +0 -943
  129. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/entities02.dat +0 -309
  130. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/foreign-fragment.dat +0 -645
  131. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/html5test-com.dat +0 -301
  132. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/inbody01.dat +0 -54
  133. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/isindex.dat +0 -49
  134. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/main-element.dat +0 -46
  135. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/math.dat +0 -104
  136. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/menuitem-element.dat +0 -240
  137. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/namespace-sensitivity.dat +0 -22
  138. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/noscript01.dat +0 -237
  139. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/pending-spec-changes-plain-text-unsafe.dat +0 -0
  140. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/pending-spec-changes.dat +0 -46
  141. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/plain-text-unsafe.dat +0 -0
  142. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/quirks01.dat +0 -53
  143. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/ruby.dat +0 -302
  144. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/scriptdata01.dat +0 -372
  145. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/scripted/adoption01.dat +0 -16
  146. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/scripted/ark.dat +0 -27
  147. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/scripted/webkit01.dat +0 -30
  148. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/search-element.dat +0 -46
  149. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/svg.dat +0 -104
  150. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tables01.dat +0 -322
  151. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/template.dat +0 -1673
  152. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests1.dat +0 -1956
  153. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests10.dat +0 -849
  154. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests11.dat +0 -523
  155. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests12.dat +0 -62
  156. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests14.dat +0 -75
  157. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests15.dat +0 -216
  158. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests16.dat +0 -2602
  159. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests17.dat +0 -179
  160. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests18.dat +0 -558
  161. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests19.dat +0 -1398
  162. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests2.dat +0 -831
  163. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests20.dat +0 -842
  164. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests21.dat +0 -306
  165. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests22.dat +0 -190
  166. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests23.dat +0 -168
  167. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests24.dat +0 -79
  168. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests25.dat +0 -288
  169. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests26.dat +0 -453
  170. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests3.dat +0 -305
  171. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests4.dat +0 -74
  172. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests5.dat +0 -210
  173. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests6.dat +0 -663
  174. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests7.dat +0 -453
  175. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests8.dat +0 -165
  176. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests9.dat +0 -472
  177. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests_innerHTML_1.dat +0 -843
  178. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tricky01.dat +0 -336
  179. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/webkit01.dat +0 -785
  180. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/webkit02.dat +0 -554
  181. data/rust-vendor/markup5ever_rcdom/tests/foreach_html5lib_test/mod.rs +0 -41
  182. data/rust-vendor/markup5ever_rcdom/tests/html-driver.rs +0 -29
  183. data/rust-vendor/markup5ever_rcdom/tests/html-serializer.rs +0 -265
  184. data/rust-vendor/markup5ever_rcdom/tests/html-tokenizer.rs +0 -487
  185. data/rust-vendor/markup5ever_rcdom/tests/html-tree-builder.rs +0 -298
  186. data/rust-vendor/markup5ever_rcdom/tests/html-tree-sink.rs +0 -141
  187. data/rust-vendor/markup5ever_rcdom/tests/util/find_tests.rs +0 -34
  188. data/rust-vendor/markup5ever_rcdom/tests/util/runner.rs +0 -48
  189. data/rust-vendor/markup5ever_rcdom/tests/xml-driver.rs +0 -101
  190. data/rust-vendor/markup5ever_rcdom/tests/xml-tokenizer.rs +0 -374
  191. data/rust-vendor/markup5ever_rcdom/tests/xml-tree-builder.rs +0 -237
  192. data/rust-vendor/markup5ever_rcdom/xml5lib-tests/AUTHORS.rst +0 -9
  193. data/rust-vendor/markup5ever_rcdom/xml5lib-tests/LICENSE +0 -21
  194. data/rust-vendor/markup5ever_rcdom/xml5lib-tests/tokenizer/README.md +0 -92
  195. data/rust-vendor/markup5ever_rcdom/xml5lib-tests/tokenizer/comments.test +0 -274
  196. data/rust-vendor/markup5ever_rcdom/xml5lib-tests/tokenizer/doctype.test +0 -3232
  197. data/rust-vendor/markup5ever_rcdom/xml5lib-tests/tokenizer/entities.test +0 -283
  198. data/rust-vendor/markup5ever_rcdom/xml5lib-tests/tokenizer/eof.test +0 -113
  199. data/rust-vendor/markup5ever_rcdom/xml5lib-tests/tokenizer/namedEntities.test +0 -42210
  200. data/rust-vendor/markup5ever_rcdom/xml5lib-tests/tokenizer/numericEntities.test +0 -1349
  201. data/rust-vendor/markup5ever_rcdom/xml5lib-tests/tokenizer/test1.test +0 -162
  202. data/rust-vendor/markup5ever_rcdom/xml5lib-tests/tokenizer/test2.test +0 -64
  203. data/rust-vendor/markup5ever_rcdom/xml5lib-tests/tokenizer/unicodeChars.test +0 -1295
  204. data/rust-vendor/markup5ever_rcdom/xml5lib-tests/tree-construction/README.md +0 -104
  205. data/rust-vendor/markup5ever_rcdom/xml5lib-tests/tree-construction/namespace.dat +0 -119
  206. data/rust-vendor/markup5ever_rcdom/xml5lib-tests/tree-construction/test1.dat +0 -124
  207. data/rust-vendor/xml5ever/.cargo-checksum.json +0 -1
  208. data/rust-vendor/xml5ever/.cargo_vcs_info.json +0 -6
  209. data/rust-vendor/xml5ever/Cargo.lock +0 -752
  210. data/rust-vendor/xml5ever/Cargo.toml +0 -69
  211. data/rust-vendor/xml5ever/Cargo.toml.orig +0 -29
  212. data/rust-vendor/xml5ever/LICENSE-APACHE +0 -201
  213. data/rust-vendor/xml5ever/LICENSE-MIT +0 -25
  214. data/rust-vendor/xml5ever/README.md +0 -72
  215. data/rust-vendor/xml5ever/benches/xml5ever.rs +0 -77
  216. data/rust-vendor/xml5ever/data/bench/strong.xml +0 -1
  217. data/rust-vendor/xml5ever/examples/README.md +0 -223
  218. data/rust-vendor/xml5ever/examples/example.xml +0 -3
  219. data/rust-vendor/xml5ever/examples/simple_xml_tokenizer.rs +0 -81
  220. data/rust-vendor/xml5ever/examples/xml_tokenizer.rs +0 -115
  221. data/rust-vendor/xml5ever/src/driver.rs +0 -90
  222. data/rust-vendor/xml5ever/src/lib.rs +0 -47
  223. data/rust-vendor/xml5ever/src/macros.rs +0 -18
  224. data/rust-vendor/xml5ever/src/serialize/mod.rs +0 -216
  225. data/rust-vendor/xml5ever/src/tokenizer/char_ref/mod.rs +0 -456
  226. data/rust-vendor/xml5ever/src/tokenizer/interface.rs +0 -116
  227. data/rust-vendor/xml5ever/src/tokenizer/mod.rs +0 -1344
  228. data/rust-vendor/xml5ever/src/tokenizer/qname.rs +0 -84
  229. data/rust-vendor/xml5ever/src/tokenizer/states.rs +0 -167
  230. data/rust-vendor/xml5ever/src/tree_builder/mod.rs +0 -774
  231. data/rust-vendor/xml5ever/src/tree_builder/types.rs +0 -37
@@ -1,104 +0,0 @@
1
- Tree Construction Tests
2
- =======================
3
-
4
- Each file containing tree construction tests consists of any number of
5
- tests separated by two newlines (LF) and a single newline before the end
6
- of the file. For instance:
7
-
8
- [TEST]LF
9
- LF
10
- [TEST]LF
11
- LF
12
- [TEST]LF
13
-
14
- Where [TEST] is the following format:
15
-
16
- Each test must begin with a string "\#data" followed by a newline (LF).
17
- All subsequent lines until a line that says "\#errors" are the test data
18
- and must be passed to the system being tested unchanged, except with the
19
- final newline (on the last line) removed.
20
-
21
- Then there must be a line that says "\#errors". It must be followed by
22
- one line per parse error that a conformant checker would return. It
23
- doesn't matter what those lines are, although they can't be
24
- "\#document-fragment", "\#document", "\#script-off", "\#script-on", or
25
- empty; the only thing that matters is that there be the right number
26
- of parse errors.
27
-
28
- Then there \*may\* be a line that says "\#document-fragment", which must
29
- be followed by a newline (LF), followed by a string of characters that
30
- indicates the context element, followed by a newline (LF). If the string
31
- of characters starts with "svg ", the context element is in the SVG
32
- namespace and the substring after "svg " is the local name. If the
33
- string of characters starts with "math ", the context element is in the
34
- MathML namespace and the substring after "math " is the local name.
35
- Otherwise, the context element is in the HTML namespace and the string
36
- is the local name. If this line is present the "\#data" must be parsed
37
- using the HTML fragment parsing algorithm with the context element as
38
- context.
39
-
40
- Then there \*may\* be a line that says "\#script-off" or
41
- "\#script-on". If a line that says "\#script-off" is present, the
42
- parser must set the scripting flag to disabled. If a line that says
43
- "\#script-on" is present, it must set it to enabled. Otherwise, the
44
- test should be run in both modes.
45
-
46
- Then there must be a line that says "\#document", which must be followed
47
- by a dump of the tree of the parsed DOM. Each node must be represented
48
- by a single line. Each line must start with "| ", followed by two spaces
49
- per parent node that the node has before the root document node.
50
-
51
- - Element nodes must be represented by a "`<`" then the *tag name
52
- string* "`>`", and all the attributes must be given, sorted
53
- lexicographically by UTF-16 code unit according to their *attribute
54
- name string*, on subsequent lines, as if they were children of the
55
- element node.
56
- - Attribute nodes must have the *attribute name string*, then an "="
57
- sign, then the attribute value in double quotes (").
58
- - Text nodes must be the string, in double quotes. Newlines aren't
59
- escaped.
60
- - Comments must be "`<`" then "`!-- `" then the data then "` -->`".
61
- - DOCTYPEs must be "`<!DOCTYPE `" then the name then if either of the
62
- system id or public id is non-empty a space, public id in
63
- double-quotes, another space and the system id in double-quotes, and
64
- then in any case "`>`".
65
- - Processing instructions must be "`<?`", then the target, then a
66
- space, then the data and then "`>`". (The HTML parser cannot emit
67
- processing instructions, but scripts can, and the WebVTT to DOM
68
- rules can emit them.)
69
- - Template contents are represented by the string "content" with the
70
- children below it.
71
-
72
- The *tag name string* is the local name prefixed by a namespace
73
- designator. For the HTML namespace, the namespace designator is the
74
- empty string, i.e. there's no prefix. For the SVG namespace, the
75
- namespace designator is "svg ". For the MathML namespace, the namespace
76
- designator is "math ".
77
-
78
- The *attribute name string* is the local name prefixed by a namespace
79
- designator. For no namespace, the namespace designator is the empty
80
- string, i.e. there's no prefix. For the XLink namespace, the namespace
81
- designator is "xlink ". For the XML namespace, the namespace designator
82
- is "xml ". For the XMLNS namespace, the namespace designator is "xmlns
83
- ". Note the difference between "xlink:href" which is an attribute in no
84
- namespace with the local name "xlink:href" and "xlink href" which is an
85
- attribute in the xlink namespace with the local name "href".
86
-
87
- If there is also a "\#document-fragment" the bit following "\#document"
88
- must be a representation of the HTML fragment serialization for the
89
- context element given by "\#document-fragment".
90
-
91
- For example:
92
-
93
- #data
94
- <p>One<p>Two
95
- #errors
96
- 3: Missing document type declaration
97
- #document
98
- | <html>
99
- | <head>
100
- | <body>
101
- | <p>
102
- | "One"
103
- | <p>
104
- | "Two"
@@ -1,119 +0,0 @@
1
- #data
2
- <a xmlns = "www.example.org"></a>
3
- #document
4
- | <{www.example.org}a>
5
-
6
- #data
7
- <a xmlns:xml = "www.example.org"></a>
8
- #document
9
- | <a>
10
-
11
- #data
12
- <a xmlns:n1="www.example.org/n1"><n1:a/></a>
13
- #document
14
- | <a>
15
- | <{www.example.org/n1}n1:a>
16
-
17
- #data
18
- <a><b xmlns:n1="www.example.org/n1"><n1:c></a>
19
- #document
20
- | <a>
21
- | <b>
22
- | <{www.example.org/n1}n1:c>
23
-
24
- #data
25
- <a><b xmlns:n1="www.example.org/n1"/><n1:c></a>
26
- #document
27
- | <a>
28
- | <b>
29
- | <n1:c>
30
-
31
- #data
32
- <a><b xmlns:n1="www.example.org/n1"><x/></b><n1:c></a>
33
- #document
34
- | <a>
35
- | <b>
36
- | <x>
37
- | <n1:c>
38
-
39
- #data
40
- <a><b xmlns:n1="www.example.org/n1"><n1:x><n1:b/></n1:x></b><n1:c></a>
41
- #document
42
- | <a>
43
- | <b>
44
- | <{www.example.org/n1}n1:x>
45
- | <{www.example.org/n1}n1:b>
46
- | <n1:c>
47
-
48
- #data
49
- <a><b xmlns:n1="www.example.org/n1"><n1:x xmlns:n1="www.example.org/n_1"><n1:b/></n1:x></b><n1:c></a>
50
- #document
51
- | <a>
52
- | <b>
53
- | <{www.example.org/n_1}n1:x>
54
- | <{www.example.org/n_1}n1:b>
55
- | <n1:c>
56
-
57
- #data
58
- <a><b xmlns:n1="x"><n1:x xmlns:n1=""><n1:b><n1:b2 xmlns:n1="y"/></n1:b></n1:x><n1:c><n1:c2/></n1:c></b></a>
59
- #document
60
- | <a>
61
- | <b>
62
- | <n1:x>
63
- | <n1:b>
64
- | <{y}n1:b2>
65
- | <{x}n1:c>
66
- | <{x}n1:c2>
67
-
68
- #data
69
- <a xmlns="student" id="3"><b name="No NS"></a>
70
- #document
71
- | <{student}a>
72
- | id="3"
73
- | <{student}b>
74
- | name="No NS"
75
-
76
- #data
77
- <a xmlns:n1="www.example.org" n1:x="val" />
78
- #document
79
- | <a>
80
- | {www.example.org}n1:x="val"
81
-
82
- #data
83
- <a xmlns:n1="www.example.org" xmlns:n2="www.example.org" n1:x="val" n2:x="dupl"/>
84
- #document
85
- | <a>
86
- | {www.example.org}n1:x="val"
87
-
88
- #data
89
- <a xmlns:n1="www.example.org" xmlns:n2="www.example.org"><bad a="1" a= "2"/><bad n1:a="1" n2:a="2"/></a>
90
- #document
91
- | <a>
92
- | <bad>
93
- | a="1"
94
- | <bad>
95
- | {www.example.org}n1:a="1"
96
-
97
- #data
98
- <a xmlns:n1="www.example.org" xmlns="www.example.org"><ok a="1" b="2"/><ok a="1" n1:a="2"/></a>
99
- #document
100
- | <{www.example.org}a>
101
- | <{www.example.org}ok>
102
- | a="1"
103
- | b="2"
104
- | <{www.example.org}ok>
105
- | a="1"
106
- | {www.example.org}n1:a="2"
107
-
108
- #data
109
- <a xmlns="www.example.org"><h><ok a="1"/></h><m><v n="v1"></v><v n="v2"></v></m></a>
110
- #document
111
- | <{www.example.org}a>
112
- | <{www.example.org}h>
113
- | <{www.example.org}ok>
114
- | a="1"
115
- | <{www.example.org}m>
116
- | <{www.example.org}v>
117
- | n="v1"
118
- | <{www.example.org}v>
119
- | n="v2"
@@ -1,124 +0,0 @@
1
- #data
2
- <a></a>
3
- #document
4
- | <a>
5
-
6
- #data
7
- <!DOCTYPE xhtml><a>
8
- #document
9
- | <!DOCTYPE xhtml>
10
- | <a>
11
-
12
- #data
13
- <!DOCTYPE xhtml PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd"><a>
14
- #document
15
- | <!DOCTYPE xhtml "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
16
- | <a>
17
-
18
- #data
19
- <a><!DOCTYPE xhtml PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd"></a>
20
- #document
21
- | <a>
22
-
23
- #data
24
- <a></a><!DOCTYPE xhtml PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
25
- #document
26
- | <a>
27
-
28
- #data
29
- <!--COMMENT?--><a>
30
- #document
31
- | <!-- COMMENT? -->
32
- | <a>
33
-
34
- #data
35
- <!COMMENT?><a>
36
- #document
37
- | <!-- COMMENT? -->
38
- | <a>
39
-
40
- #data
41
- <?pix xml?><a>
42
- #document
43
- | <?pix xml?>
44
- | <a>
45
-
46
- #data
47
- <a/>
48
- #document
49
- | <a>
50
-
51
- #data
52
- <a>Text
53
- #document
54
- | <a>
55
- | "Text"
56
-
57
-
58
- #data
59
- <a><b>
60
- #document
61
- | <a>
62
- | <b>
63
-
64
- #data
65
- <a><b></b></a>
66
- #document
67
- | <a>
68
- | <b>
69
-
70
- #data
71
- <a><b/></a>
72
- #document
73
- | <a>
74
- | <b>
75
-
76
- #data
77
- <a><b/>
78
- #document
79
- | <a>
80
- | <b>
81
-
82
- #data
83
- <a><b>Text
84
- #document
85
- | <a>
86
- | <b>
87
- | "Text"
88
-
89
- #data
90
- <a><b>Text</b>
91
- #document
92
- | <a>
93
- | <b>
94
- | "Text"
95
-
96
- #data
97
- <a><!--COMMENT-->
98
- #document
99
- | <a>
100
- | <!-- COMMENT -->
101
-
102
- #data
103
- <a><?xslt dummy?>
104
- #document
105
- | <a>
106
- | <?xslt dummy?>
107
-
108
- #data
109
- <a></a><?xslt dummy?>
110
- #document
111
- | <a>
112
- | <?xslt dummy?>
113
-
114
- #data
115
- <a></a><!--COMMENT-->
116
- #document
117
- | <a>
118
- | <!-- COMMENT -->
119
-
120
- #data
121
- <a><x></x></a><b>
122
- #document
123
- | <a>
124
- | <x>
@@ -1 +0,0 @@
1
- {"files":{".cargo_vcs_info.json":"de1c3c82ac61982b9726332820b9e2902cddabf4e01d9c201ca36d224fde543d","Cargo.lock":"93e7f49c37ac19c49eb43310fd8d77e4789e7bb18520ef84644779316641a3ee","Cargo.toml":"d1a382f682bec7ae043e2e158d26e1b34a183cd8ecd1535122a98e73656fd8e2","Cargo.toml.orig":"dee9beda7fa78a98996594b52956f66d4a5d3bf842bb1fce3ae9fea49c242970","LICENSE-APACHE":"a60eea817514531668d7e00765731449fe14d059d3249e0bc93b36de45f759f2","LICENSE-MIT":"86dd7f026f916daf7511e39951ad8ea8cf55a8db67ae64060dacf829761c18f3","README.md":"76fbd1fa9c9d5b6f0b6fe99e4786a2985cf0a0bbfc82f0bde854c023fa2b2ab0","benches/xml5ever.rs":"64a6dfe6d84a4e93bf4f57e1923b6bf0ce916ca0daa478ba9b17bc6f628daaae","data/bench/strong.xml":"5adb31981cca062df929353c60dfa1c7fb91170b5a389a13c8be6555a4cf107d","examples/README.md":"75d4d950e38d72eaca75676991598a269a6f8c9b896e9dc4c74937fab2f259ec","examples/example.xml":"3db9bfaa6333a1b18fe45d460e4bcd37b73ee6b8f793fc1162c103a1f6f55d83","examples/simple_xml_tokenizer.rs":"1c5937192eee7601202ca7be8d17794377fbbc591d42178a3a8b91375ff8bf96","examples/xml_tokenizer.rs":"db8fd96f642eba0c3774f29cc3d9c554657b45dce7c6cafccd3fc838b5f4335f","src/driver.rs":"27897d32c13b1e253edadba6d49709b026b372ec272a5e64e4dc7d99d51919ff","src/lib.rs":"a46291ffd5d30e41e0284cc421640edb22d4fc07a20933ba1f208020dbbfe622","src/macros.rs":"cd9923eca89fe3650b2741867ba16c3ba93bbbe3af58c3bec2be36d828580769","src/serialize/mod.rs":"1ff05bf4fb9b43eafa2a5579cb8e8dc0d0c5465d35723321f351257c4a7ab43e","src/tokenizer/char_ref/mod.rs":"84a1d70a985944d2afb35a5aabbebe949605fe829dc2ae9ec831207db49a2341","src/tokenizer/interface.rs":"dda4a0c0990654c577733a64582a28b2f2b70fab7c2e1f71b9621aa87dd72e28","src/tokenizer/mod.rs":"e9d848faa7b2a81167e333cc57f22176911689ff21d02cb7f0ee66f4de28b561","src/tokenizer/qname.rs":"e9228f43897def8d7af3e0842226309b3a39dce3768b48a2237bb85e242f44ca","src/tokenizer/states.rs":"382afc0ec2b67ebdd59cac4b25af6c4cddae1d6ff2a5b8fe5d7f331d8c2f6747","src/tree_builder/mod.rs":"ac0a635dd88047141fca6
dc1784d168228f93b5c8183274bf6c1ccf206033bce","src/tree_builder/types.rs":"d5c3ba265a280af7932f5ba789cd9d69bdc74cde1744b581d7c9071bf4c28917"},"package":"f57dd51b88a4b9f99f9b55b136abb86210629d61c48117ddb87f567e51e66be7"}
@@ -1,6 +0,0 @@
1
- {
2
- "git": {
3
- "sha1": "34059007a855d284608f9447ed74c0c209bc0ad8"
4
- },
5
- "path_in_vcs": "xml5ever"
6
- }