html-to-markdown 2.24.6 → 2.25.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (231) hide show
  1. checksums.yaml +4 -4
  2. data/Gemfile.lock +2 -2
  3. data/README.md +1 -1
  4. data/ext/html-to-markdown-rb/native/Cargo.lock +9 -32
  5. data/ext/html-to-markdown-rb/native/Cargo.toml +1 -1
  6. data/lib/html_to_markdown/version.rb +1 -1
  7. data/rust-vendor/html-to-markdown-rs/Cargo.toml +0 -1
  8. data/rust-vendor/html-to-markdown-rs/src/converter/main_helpers.rs +1 -1
  9. data/rust-vendor/html-to-markdown-rs/src/hocr/converter/hierarchy.rs +20 -5
  10. data/rust-vendor/html-to-markdown-rs/src/lib.rs +1 -0
  11. data/rust-vendor/{markup5ever_rcdom/lib.rs → html-to-markdown-rs/src/rcdom.rs} +56 -91
  12. data/rust-vendor/html-to-markdown-rs/tests/hocr_compliance_test.rs +157 -0
  13. data/rust-vendor/memmap2/.cargo-checksum.json +1 -1
  14. data/rust-vendor/memmap2/.cargo_vcs_info.json +1 -1
  15. data/rust-vendor/memmap2/CHANGELOG.md +8 -0
  16. data/rust-vendor/memmap2/Cargo.lock +1 -1
  17. data/rust-vendor/memmap2/Cargo.toml +2 -1
  18. data/rust-vendor/memmap2/Cargo.toml.orig +2 -1
  19. data/rust-vendor/memmap2/src/lib.rs +25 -1
  20. data/rust-vendor/memmap2/src/stub.rs +1 -4
  21. data/rust-vendor/memmap2/src/unix.rs +14 -1
  22. data/rust-vendor/png/.cargo-checksum.json +1 -1
  23. data/rust-vendor/png/.cargo_vcs_info.json +1 -1
  24. data/rust-vendor/png/CHANGES.md +44 -0
  25. data/rust-vendor/png/Cargo.lock +124 -171
  26. data/rust-vendor/png/Cargo.toml +1 -1
  27. data/rust-vendor/png/Cargo.toml.orig +1 -1
  28. data/rust-vendor/png/benches/expand_paletted.rs +5 -5
  29. data/rust-vendor/png/benches/unfilter.rs +3 -3
  30. data/rust-vendor/png/src/adam7.rs +17 -10
  31. data/rust-vendor/png/src/common.rs +8 -8
  32. data/rust-vendor/png/src/decoder/mod.rs +53 -20
  33. data/rust-vendor/png/src/decoder/stream.rs +263 -78
  34. data/rust-vendor/png/src/decoder/unfiltering_buffer.rs +210 -53
  35. data/rust-vendor/png/src/decoder/zlib.rs +130 -90
  36. data/rust-vendor/png/src/encoder.rs +4 -2
  37. data/rust-vendor/png/src/{filter.rs → filter/mod.rs} +100 -367
  38. data/rust-vendor/png/src/filter/optimization-notes.md +104 -0
  39. data/rust-vendor/png/src/filter/paeth.rs +398 -0
  40. data/rust-vendor/png/src/filter/simd.rs +308 -0
  41. data/rust-vendor/png/src/lib.rs +1 -0
  42. data/rust-vendor/syn/.cargo-checksum.json +1 -1
  43. data/rust-vendor/syn/.cargo_vcs_info.json +1 -1
  44. data/rust-vendor/syn/Cargo.lock +40 -41
  45. data/rust-vendor/syn/Cargo.toml +1 -1
  46. data/rust-vendor/syn/Cargo.toml.orig +1 -1
  47. data/rust-vendor/syn/src/item.rs +61 -40
  48. data/rust-vendor/syn/src/lib.rs +2 -1
  49. data/rust-vendor/syn/tests/test_item.rs +54 -0
  50. data/rust-vendor/unicode-ident/.cargo-checksum.json +1 -1
  51. data/rust-vendor/unicode-ident/.cargo_vcs_info.json +1 -1
  52. data/rust-vendor/unicode-ident/Cargo.lock +21 -21
  53. data/rust-vendor/unicode-ident/Cargo.toml +1 -1
  54. data/rust-vendor/unicode-ident/Cargo.toml.orig +1 -1
  55. data/rust-vendor/unicode-ident/src/lib.rs +1 -1
  56. data/rust-vendor/unicode-ident/src/tables.rs +87 -97
  57. data/rust-vendor/unicode-ident/tests/static_size.rs +1 -1
  58. metadata +7 -177
  59. data/rust-vendor/markup5ever_rcdom/.cargo-checksum.json +0 -1
  60. data/rust-vendor/markup5ever_rcdom/.cargo_vcs_info.json +0 -7
  61. data/rust-vendor/markup5ever_rcdom/Cargo.lock +0 -658
  62. data/rust-vendor/markup5ever_rcdom/Cargo.toml +0 -109
  63. data/rust-vendor/markup5ever_rcdom/Cargo.toml.orig +0 -42
  64. data/rust-vendor/markup5ever_rcdom/LICENSE-APACHE +0 -201
  65. data/rust-vendor/markup5ever_rcdom/LICENSE-MIT +0 -25
  66. data/rust-vendor/markup5ever_rcdom/README.md +0 -7
  67. data/rust-vendor/markup5ever_rcdom/custom-html5lib-tokenizer-tests/regression.test +0 -69
  68. data/rust-vendor/markup5ever_rcdom/data/test/ignore +0 -1
  69. data/rust-vendor/markup5ever_rcdom/examples/hello_xml.rs +0 -39
  70. data/rust-vendor/markup5ever_rcdom/examples/html2html.rs +0 -51
  71. data/rust-vendor/markup5ever_rcdom/examples/print-rcdom.rs +0 -78
  72. data/rust-vendor/markup5ever_rcdom/examples/xml_tree_printer.rs +0 -67
  73. data/rust-vendor/markup5ever_rcdom/html5lib-tests/.gitattributes +0 -2
  74. data/rust-vendor/markup5ever_rcdom/html5lib-tests/.github/workflows/downstream.yml +0 -76
  75. data/rust-vendor/markup5ever_rcdom/html5lib-tests/.github/workflows/lint.yml +0 -25
  76. data/rust-vendor/markup5ever_rcdom/html5lib-tests/.gitignore +0 -79
  77. data/rust-vendor/markup5ever_rcdom/html5lib-tests/AUTHORS.rst +0 -34
  78. data/rust-vendor/markup5ever_rcdom/html5lib-tests/LICENSE +0 -21
  79. data/rust-vendor/markup5ever_rcdom/html5lib-tests/encoding/chardet/test_big5.txt +0 -51
  80. data/rust-vendor/markup5ever_rcdom/html5lib-tests/encoding/scripted/tests1.dat +0 -5
  81. data/rust-vendor/markup5ever_rcdom/html5lib-tests/encoding/test-yahoo-jp.dat +0 -10
  82. data/rust-vendor/markup5ever_rcdom/html5lib-tests/encoding/tests1.dat +0 -388
  83. data/rust-vendor/markup5ever_rcdom/html5lib-tests/encoding/tests2.dat +0 -115
  84. data/rust-vendor/markup5ever_rcdom/html5lib-tests/lint +0 -6
  85. data/rust-vendor/markup5ever_rcdom/html5lib-tests/lint_lib/__init__.py +0 -0
  86. data/rust-vendor/markup5ever_rcdom/html5lib-tests/lint_lib/_vendor/__init__.py +0 -0
  87. data/rust-vendor/markup5ever_rcdom/html5lib-tests/lint_lib/_vendor/funcparserlib/LICENSE +0 -18
  88. data/rust-vendor/markup5ever_rcdom/html5lib-tests/lint_lib/_vendor/funcparserlib/__init__.py +0 -0
  89. data/rust-vendor/markup5ever_rcdom/html5lib-tests/lint_lib/_vendor/funcparserlib/lexer.py +0 -211
  90. data/rust-vendor/markup5ever_rcdom/html5lib-tests/lint_lib/_vendor/funcparserlib/lexer.pyi +0 -34
  91. data/rust-vendor/markup5ever_rcdom/html5lib-tests/lint_lib/_vendor/funcparserlib/parser.py +0 -872
  92. data/rust-vendor/markup5ever_rcdom/html5lib-tests/lint_lib/_vendor/funcparserlib/parser.pyi +0 -83
  93. data/rust-vendor/markup5ever_rcdom/html5lib-tests/lint_lib/_vendor/funcparserlib/py.typed +0 -0
  94. data/rust-vendor/markup5ever_rcdom/html5lib-tests/lint_lib/_vendor/funcparserlib/util.py +0 -72
  95. data/rust-vendor/markup5ever_rcdom/html5lib-tests/lint_lib/_vendor/funcparserlib/util.pyi +0 -7
  96. data/rust-vendor/markup5ever_rcdom/html5lib-tests/lint_lib/_vendor/vendor.txt +0 -1
  97. data/rust-vendor/markup5ever_rcdom/html5lib-tests/lint_lib/_vendor-patches/funcparserlib.patch +0 -24
  98. data/rust-vendor/markup5ever_rcdom/html5lib-tests/lint_lib/lint.py +0 -280
  99. data/rust-vendor/markup5ever_rcdom/html5lib-tests/lint_lib/parser.py +0 -177
  100. data/rust-vendor/markup5ever_rcdom/html5lib-tests/pyproject.toml +0 -7
  101. data/rust-vendor/markup5ever_rcdom/html5lib-tests/serializer/core.test +0 -125
  102. data/rust-vendor/markup5ever_rcdom/html5lib-tests/serializer/injectmeta.test +0 -66
  103. data/rust-vendor/markup5ever_rcdom/html5lib-tests/serializer/optionaltags.test +0 -965
  104. data/rust-vendor/markup5ever_rcdom/html5lib-tests/serializer/options.test +0 -60
  105. data/rust-vendor/markup5ever_rcdom/html5lib-tests/serializer/whitespace.test +0 -51
  106. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tokenizer/README.md +0 -107
  107. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tokenizer/contentModelFlags.test +0 -93
  108. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tokenizer/domjs.test +0 -335
  109. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tokenizer/entities.test +0 -542
  110. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tokenizer/escapeFlag.test +0 -36
  111. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tokenizer/namedEntities.test +0 -42422
  112. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tokenizer/numericEntities.test +0 -1677
  113. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tokenizer/pendingSpecChanges.test +0 -9
  114. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tokenizer/test1.test +0 -353
  115. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tokenizer/test2.test +0 -275
  116. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tokenizer/test3.test +0 -11233
  117. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tokenizer/test4.test +0 -532
  118. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tokenizer/unicodeChars.test +0 -1577
  119. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tokenizer/unicodeCharsProblematic.test +0 -41
  120. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tokenizer/xmlViolation.test +0 -20
  121. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/README.md +0 -108
  122. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/adoption01.dat +0 -354
  123. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/adoption02.dat +0 -39
  124. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/blocks.dat +0 -695
  125. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/comments01.dat +0 -217
  126. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/doctype01.dat +0 -474
  127. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/domjs-unsafe.dat +0 -0
  128. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/entities01.dat +0 -943
  129. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/entities02.dat +0 -309
  130. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/foreign-fragment.dat +0 -645
  131. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/html5test-com.dat +0 -301
  132. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/inbody01.dat +0 -54
  133. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/isindex.dat +0 -49
  134. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/main-element.dat +0 -46
  135. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/math.dat +0 -104
  136. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/menuitem-element.dat +0 -240
  137. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/namespace-sensitivity.dat +0 -22
  138. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/noscript01.dat +0 -237
  139. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/pending-spec-changes-plain-text-unsafe.dat +0 -0
  140. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/pending-spec-changes.dat +0 -46
  141. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/plain-text-unsafe.dat +0 -0
  142. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/quirks01.dat +0 -53
  143. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/ruby.dat +0 -302
  144. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/scriptdata01.dat +0 -372
  145. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/scripted/adoption01.dat +0 -16
  146. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/scripted/ark.dat +0 -27
  147. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/scripted/webkit01.dat +0 -30
  148. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/search-element.dat +0 -46
  149. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/svg.dat +0 -104
  150. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tables01.dat +0 -322
  151. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/template.dat +0 -1673
  152. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests1.dat +0 -1956
  153. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests10.dat +0 -849
  154. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests11.dat +0 -523
  155. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests12.dat +0 -62
  156. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests14.dat +0 -75
  157. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests15.dat +0 -216
  158. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests16.dat +0 -2602
  159. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests17.dat +0 -179
  160. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests18.dat +0 -558
  161. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests19.dat +0 -1398
  162. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests2.dat +0 -831
  163. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests20.dat +0 -842
  164. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests21.dat +0 -306
  165. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests22.dat +0 -190
  166. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests23.dat +0 -168
  167. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests24.dat +0 -79
  168. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests25.dat +0 -288
  169. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests26.dat +0 -453
  170. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests3.dat +0 -305
  171. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests4.dat +0 -74
  172. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests5.dat +0 -210
  173. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests6.dat +0 -663
  174. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests7.dat +0 -453
  175. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests8.dat +0 -165
  176. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests9.dat +0 -472
  177. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests_innerHTML_1.dat +0 -843
  178. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tricky01.dat +0 -336
  179. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/webkit01.dat +0 -785
  180. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/webkit02.dat +0 -554
  181. data/rust-vendor/markup5ever_rcdom/tests/foreach_html5lib_test/mod.rs +0 -41
  182. data/rust-vendor/markup5ever_rcdom/tests/html-driver.rs +0 -29
  183. data/rust-vendor/markup5ever_rcdom/tests/html-serializer.rs +0 -265
  184. data/rust-vendor/markup5ever_rcdom/tests/html-tokenizer.rs +0 -487
  185. data/rust-vendor/markup5ever_rcdom/tests/html-tree-builder.rs +0 -298
  186. data/rust-vendor/markup5ever_rcdom/tests/html-tree-sink.rs +0 -141
  187. data/rust-vendor/markup5ever_rcdom/tests/util/find_tests.rs +0 -34
  188. data/rust-vendor/markup5ever_rcdom/tests/util/runner.rs +0 -48
  189. data/rust-vendor/markup5ever_rcdom/tests/xml-driver.rs +0 -101
  190. data/rust-vendor/markup5ever_rcdom/tests/xml-tokenizer.rs +0 -374
  191. data/rust-vendor/markup5ever_rcdom/tests/xml-tree-builder.rs +0 -237
  192. data/rust-vendor/markup5ever_rcdom/xml5lib-tests/AUTHORS.rst +0 -9
  193. data/rust-vendor/markup5ever_rcdom/xml5lib-tests/LICENSE +0 -21
  194. data/rust-vendor/markup5ever_rcdom/xml5lib-tests/tokenizer/README.md +0 -92
  195. data/rust-vendor/markup5ever_rcdom/xml5lib-tests/tokenizer/comments.test +0 -274
  196. data/rust-vendor/markup5ever_rcdom/xml5lib-tests/tokenizer/doctype.test +0 -3232
  197. data/rust-vendor/markup5ever_rcdom/xml5lib-tests/tokenizer/entities.test +0 -283
  198. data/rust-vendor/markup5ever_rcdom/xml5lib-tests/tokenizer/eof.test +0 -113
  199. data/rust-vendor/markup5ever_rcdom/xml5lib-tests/tokenizer/namedEntities.test +0 -42210
  200. data/rust-vendor/markup5ever_rcdom/xml5lib-tests/tokenizer/numericEntities.test +0 -1349
  201. data/rust-vendor/markup5ever_rcdom/xml5lib-tests/tokenizer/test1.test +0 -162
  202. data/rust-vendor/markup5ever_rcdom/xml5lib-tests/tokenizer/test2.test +0 -64
  203. data/rust-vendor/markup5ever_rcdom/xml5lib-tests/tokenizer/unicodeChars.test +0 -1295
  204. data/rust-vendor/markup5ever_rcdom/xml5lib-tests/tree-construction/README.md +0 -104
  205. data/rust-vendor/markup5ever_rcdom/xml5lib-tests/tree-construction/namespace.dat +0 -119
  206. data/rust-vendor/markup5ever_rcdom/xml5lib-tests/tree-construction/test1.dat +0 -124
  207. data/rust-vendor/xml5ever/.cargo-checksum.json +0 -1
  208. data/rust-vendor/xml5ever/.cargo_vcs_info.json +0 -6
  209. data/rust-vendor/xml5ever/Cargo.lock +0 -752
  210. data/rust-vendor/xml5ever/Cargo.toml +0 -69
  211. data/rust-vendor/xml5ever/Cargo.toml.orig +0 -29
  212. data/rust-vendor/xml5ever/LICENSE-APACHE +0 -201
  213. data/rust-vendor/xml5ever/LICENSE-MIT +0 -25
  214. data/rust-vendor/xml5ever/README.md +0 -72
  215. data/rust-vendor/xml5ever/benches/xml5ever.rs +0 -77
  216. data/rust-vendor/xml5ever/data/bench/strong.xml +0 -1
  217. data/rust-vendor/xml5ever/examples/README.md +0 -223
  218. data/rust-vendor/xml5ever/examples/example.xml +0 -3
  219. data/rust-vendor/xml5ever/examples/simple_xml_tokenizer.rs +0 -81
  220. data/rust-vendor/xml5ever/examples/xml_tokenizer.rs +0 -115
  221. data/rust-vendor/xml5ever/src/driver.rs +0 -90
  222. data/rust-vendor/xml5ever/src/lib.rs +0 -47
  223. data/rust-vendor/xml5ever/src/macros.rs +0 -18
  224. data/rust-vendor/xml5ever/src/serialize/mod.rs +0 -216
  225. data/rust-vendor/xml5ever/src/tokenizer/char_ref/mod.rs +0 -456
  226. data/rust-vendor/xml5ever/src/tokenizer/interface.rs +0 -116
  227. data/rust-vendor/xml5ever/src/tokenizer/mod.rs +0 -1344
  228. data/rust-vendor/xml5ever/src/tokenizer/qname.rs +0 -84
  229. data/rust-vendor/xml5ever/src/tokenizer/states.rs +0 -167
  230. data/rust-vendor/xml5ever/src/tree_builder/mod.rs +0 -774
  231. data/rust-vendor/xml5ever/src/tree_builder/types.rs +0 -37
@@ -1,217 +0,0 @@
1
- #data
2
- FOO<!-- BAR -->BAZ
3
- #errors
4
- (1,3): expected-doctype-but-got-chars
5
- #document
6
- | <html>
7
- | <head>
8
- | <body>
9
- | "FOO"
10
- | <!-- BAR -->
11
- | "BAZ"
12
-
13
- #data
14
- FOO<!-- BAR --!>BAZ
15
- #errors
16
- (1,3): expected-doctype-but-got-chars
17
- (1,15): unexpected-bang-after-double-dash-in-comment
18
- #new-errors
19
- (1:16) incorrectly-closed-comment
20
- #document
21
- | <html>
22
- | <head>
23
- | <body>
24
- | "FOO"
25
- | <!-- BAR -->
26
- | "BAZ"
27
-
28
- #data
29
- FOO<!-- BAR --! >BAZ
30
- #errors
31
- (1,3): expected-doctype-but-got-chars
32
- (1:21) eof-in-comment
33
- #new-errors
34
- (1:21) eof-in-comment
35
- #document
36
- | <html>
37
- | <head>
38
- | <body>
39
- | "FOO"
40
- | <!-- BAR --! >BAZ -->
41
-
42
- #data
43
- FOO<!-- BAR --!
44
- >BAZ
45
- #errors
46
- (1,3): expected-doctype-but-got-chars
47
- (2:5) eof-in-comment
48
- #new-errors
49
- (2:5) eof-in-comment
50
- #document
51
- | <html>
52
- | <head>
53
- | <body>
54
- | "FOO"
55
- | <!-- BAR --!
56
- >BAZ -->
57
-
58
- #data
59
- FOO<!-- BAR -- >BAZ
60
- #errors
61
- (1,3): expected-doctype-but-got-chars
62
- (1,21): eof-in-comment
63
- #new-errors
64
- (1:22) eof-in-comment
65
- #document
66
- | <html>
67
- | <head>
68
- | <body>
69
- | "FOO"
70
- | <!-- BAR -- >BAZ -->
71
-
72
- #data
73
- FOO<!-- BAR -- <QUX> -- MUX -->BAZ
74
- #errors
75
- (1,3): expected-doctype-but-got-chars
76
- #document
77
- | <html>
78
- | <head>
79
- | <body>
80
- | "FOO"
81
- | <!-- BAR -- <QUX> -- MUX -->
82
- | "BAZ"
83
-
84
- #data
85
- FOO<!-- BAR -- <QUX> -- MUX --!>BAZ
86
- #errors
87
- (1,3): expected-doctype-but-got-chars
88
- (1,31): unexpected-bang-after-double-dash-in-comment
89
- #new-errors
90
- (1:32) incorrectly-closed-comment
91
- #document
92
- | <html>
93
- | <head>
94
- | <body>
95
- | "FOO"
96
- | <!-- BAR -- <QUX> -- MUX -->
97
- | "BAZ"
98
-
99
- #data
100
- FOO<!-- BAR -- <QUX> -- MUX -- >BAZ
101
- #errors
102
- (1,3): expected-doctype-but-got-chars
103
- (1,35): eof-in-comment
104
- #new-errors
105
- (1:36) eof-in-comment
106
- #document
107
- | <html>
108
- | <head>
109
- | <body>
110
- | "FOO"
111
- | <!-- BAR -- <QUX> -- MUX -- >BAZ -->
112
-
113
- #data
114
- FOO<!---->BAZ
115
- #errors
116
- (1,3): expected-doctype-but-got-chars
117
- #document
118
- | <html>
119
- | <head>
120
- | <body>
121
- | "FOO"
122
- | <!-- -->
123
- | "BAZ"
124
-
125
- #data
126
- FOO<!--->BAZ
127
- #errors
128
- (1,3): expected-doctype-but-got-chars
129
- (1,9): incorrect-comment
130
- #new-errors
131
- (1:9) abrupt-closing-of-empty-comment
132
- #document
133
- | <html>
134
- | <head>
135
- | <body>
136
- | "FOO"
137
- | <!-- -->
138
- | "BAZ"
139
-
140
- #data
141
- FOO<!-->BAZ
142
- #errors
143
- (1,3): expected-doctype-but-got-chars
144
- (1,8): incorrect-comment
145
- #new-errors
146
- (1:8) abrupt-closing-of-empty-comment
147
- #document
148
- | <html>
149
- | <head>
150
- | <body>
151
- | "FOO"
152
- | <!-- -->
153
- | "BAZ"
154
-
155
- #data
156
- <?xml version="1.0">Hi
157
- #errors
158
- (1,1): expected-tag-name-but-got-question-mark
159
- (1,22): expected-doctype-but-got-chars
160
- #new-errors
161
- (1:2) unexpected-question-mark-instead-of-tag-name
162
- #document
163
- | <!-- ?xml version="1.0" -->
164
- | <html>
165
- | <head>
166
- | <body>
167
- | "Hi"
168
-
169
- #data
170
- <?xml version="1.0">
171
- #errors
172
- (1,1): expected-tag-name-but-got-question-mark
173
- (1,20): expected-doctype-but-got-eof
174
- #new-errors
175
- (1:2) unexpected-question-mark-instead-of-tag-name
176
- #document
177
- | <!-- ?xml version="1.0" -->
178
- | <html>
179
- | <head>
180
- | <body>
181
-
182
- #data
183
- <?xml version
184
- #errors
185
- (1,1): expected-tag-name-but-got-question-mark
186
- (1,13): expected-doctype-but-got-eof
187
- #new-errors
188
- (1:2) unexpected-question-mark-instead-of-tag-name
189
- #document
190
- | <!-- ?xml version -->
191
- | <html>
192
- | <head>
193
- | <body>
194
-
195
- #data
196
- FOO<!----->BAZ
197
- #errors
198
- (1,3): expected-doctype-but-got-chars
199
- #document
200
- | <html>
201
- | <head>
202
- | <body>
203
- | "FOO"
204
- | <!-- - -->
205
- | "BAZ"
206
-
207
- #data
208
- <html><!-- comment --><title>Comment before head</title>
209
- #errors
210
- (1,6): expected-doctype-but-got-start-tag
211
- #document
212
- | <html>
213
- | <!-- comment -->
214
- | <head>
215
- | <title>
216
- | "Comment before head"
217
- | <body>
@@ -1,474 +0,0 @@
1
- #data
2
- <!DOCTYPE html>Hello
3
- #errors
4
- #document
5
- | <!DOCTYPE html>
6
- | <html>
7
- | <head>
8
- | <body>
9
- | "Hello"
10
-
11
- #data
12
- <!dOctYpE HtMl>Hello
13
- #errors
14
- #document
15
- | <!DOCTYPE html>
16
- | <html>
17
- | <head>
18
- | <body>
19
- | "Hello"
20
-
21
- #data
22
- <!DOCTYPEhtml>Hello
23
- #errors
24
- (1,9): need-space-after-doctype
25
- #new-errors
26
- (1:10) missing-whitespace-before-doctype-name
27
- #document
28
- | <!DOCTYPE html>
29
- | <html>
30
- | <head>
31
- | <body>
32
- | "Hello"
33
-
34
- #data
35
- <!DOCTYPE>Hello
36
- #errors
37
- (1,10): expected-doctype-name-but-got-right-bracket
38
- (1,10): unknown-doctype
39
- #new-errors
40
- (1:10) missing-doctype-name
41
- #document
42
- | <!DOCTYPE >
43
- | <html>
44
- | <head>
45
- | <body>
46
- | "Hello"
47
-
48
- #data
49
- <!DOCTYPE >Hello
50
- #errors
51
- (1,11): expected-doctype-name-but-got-right-bracket
52
- (1,11): unknown-doctype
53
- #new-errors
54
- (1:11) missing-doctype-name
55
- #document
56
- | <!DOCTYPE >
57
- | <html>
58
- | <head>
59
- | <body>
60
- | "Hello"
61
-
62
- #data
63
- <!DOCTYPE potato>Hello
64
- #errors
65
- (1,17): unknown-doctype
66
- #document
67
- | <!DOCTYPE potato>
68
- | <html>
69
- | <head>
70
- | <body>
71
- | "Hello"
72
-
73
- #data
74
- <!DOCTYPE potato >Hello
75
- #errors
76
- (1,18): unknown-doctype
77
- #document
78
- | <!DOCTYPE potato>
79
- | <html>
80
- | <head>
81
- | <body>
82
- | "Hello"
83
-
84
- #data
85
- <!DOCTYPE potato taco>Hello
86
- #errors
87
- (1,17): expected-space-or-right-bracket-in-doctype
88
- (1,22): unknown-doctype
89
- #new-errors
90
- (1:18) invalid-character-sequence-after-doctype-name
91
- #document
92
- | <!DOCTYPE potato>
93
- | <html>
94
- | <head>
95
- | <body>
96
- | "Hello"
97
-
98
- #data
99
- <!DOCTYPE potato taco "ddd>Hello
100
- #errors
101
- (1,17): expected-space-or-right-bracket-in-doctype
102
- (1,27): unknown-doctype
103
- #new-errors
104
- (1:18) invalid-character-sequence-after-doctype-name
105
- #document
106
- | <!DOCTYPE potato>
107
- | <html>
108
- | <head>
109
- | <body>
110
- | "Hello"
111
-
112
- #data
113
- <!DOCTYPE potato sYstEM>Hello
114
- #errors
115
- (1,24): unexpected-char-in-doctype
116
- (1,24): unknown-doctype
117
- #new-errors
118
- (1:24) missing-doctype-system-identifier
119
- #document
120
- | <!DOCTYPE potato>
121
- | <html>
122
- | <head>
123
- | <body>
124
- | "Hello"
125
-
126
- #data
127
- <!DOCTYPE potato sYstEM >Hello
128
- #errors
129
- (1,28): unexpected-char-in-doctype
130
- (1,28): unknown-doctype
131
- #new-errors
132
- (1:28) missing-doctype-system-identifier
133
- #document
134
- | <!DOCTYPE potato>
135
- | <html>
136
- | <head>
137
- | <body>
138
- | "Hello"
139
-
140
- #data
141
- <!DOCTYPE potato sYstEM ggg>Hello
142
- #errors
143
- (1,34): unexpected-char-in-doctype
144
- (1,37): unknown-doctype
145
- #new-errors
146
- (1:34) missing-quote-before-doctype-system-identifier
147
- #document
148
- | <!DOCTYPE potato>
149
- | <html>
150
- | <head>
151
- | <body>
152
- | "Hello"
153
-
154
- #data
155
- <!DOCTYPE potato SYSTEM taco >Hello
156
- #errors
157
- (1,25): unexpected-char-in-doctype
158
- (1,31): unknown-doctype
159
- #new-errors
160
- (1:25) missing-quote-before-doctype-system-identifier
161
- #document
162
- | <!DOCTYPE potato>
163
- | <html>
164
- | <head>
165
- | <body>
166
- | "Hello"
167
-
168
- #data
169
- <!DOCTYPE potato SYSTEM 'taco"'>Hello
170
- #errors
171
- (1,32): unknown-doctype
172
- #document
173
- | <!DOCTYPE potato "" "taco"">
174
- | <html>
175
- | <head>
176
- | <body>
177
- | "Hello"
178
-
179
- #data
180
- <!DOCTYPE potato SYSTEM "taco">Hello
181
- #errors
182
- (1,31): unknown-doctype
183
- #document
184
- | <!DOCTYPE potato "" "taco">
185
- | <html>
186
- | <head>
187
- | <body>
188
- | "Hello"
189
-
190
- #data
191
- <!DOCTYPE potato SYSTEM "tai'co">Hello
192
- #errors
193
- (1,33): unknown-doctype
194
- #document
195
- | <!DOCTYPE potato "" "tai'co">
196
- | <html>
197
- | <head>
198
- | <body>
199
- | "Hello"
200
-
201
- #data
202
- <!DOCTYPE potato SYSTEMtaco "ddd">Hello
203
- #errors
204
- (1,24): unexpected-char-in-doctype
205
- (1,34): unknown-doctype
206
- #new-errors
207
- (1:24) missing-quote-before-doctype-system-identifier
208
- #document
209
- | <!DOCTYPE potato>
210
- | <html>
211
- | <head>
212
- | <body>
213
- | "Hello"
214
-
215
- #data
216
- <!DOCTYPE potato grass SYSTEM taco>Hello
217
- #errors
218
- (1,17): expected-space-or-right-bracket-in-doctype
219
- (1,35): unknown-doctype
220
- #new-errors
221
- (1:18) invalid-character-sequence-after-doctype-name
222
- #document
223
- | <!DOCTYPE potato>
224
- | <html>
225
- | <head>
226
- | <body>
227
- | "Hello"
228
-
229
- #data
230
- <!DOCTYPE potato pUbLIc>Hello
231
- #errors
232
- (1,24): unexpected-end-of-doctype
233
- (1,24): unknown-doctype
234
- #new-errors
235
- (1:24) missing-doctype-public-identifier
236
- #document
237
- | <!DOCTYPE potato>
238
- | <html>
239
- | <head>
240
- | <body>
241
- | "Hello"
242
-
243
- #data
244
- <!DOCTYPE potato pUbLIc >Hello
245
- #errors
246
- (1,25): unexpected-end-of-doctype
247
- (1,25): unknown-doctype
248
- #new-errors
249
- (1:25) missing-doctype-public-identifier
250
- #document
251
- | <!DOCTYPE potato>
252
- | <html>
253
- | <head>
254
- | <body>
255
- | "Hello"
256
-
257
- #data
258
- <!DOCTYPE potato pUbLIcgoof>Hello
259
- #errors
260
- (1,24): unexpected-char-in-doctype
261
- (1,28): unknown-doctype
262
- #new-errors
263
- (1:24) missing-quote-before-doctype-public-identifier
264
- #document
265
- | <!DOCTYPE potato>
266
- | <html>
267
- | <head>
268
- | <body>
269
- | "Hello"
270
-
271
- #data
272
- <!DOCTYPE potato PUBLIC goof>Hello
273
- #errors
274
- (1,25): unexpected-char-in-doctype
275
- (1,29): unknown-doctype
276
- #new-errors
277
- (1:25) missing-quote-before-doctype-public-identifier
278
- #document
279
- | <!DOCTYPE potato>
280
- | <html>
281
- | <head>
282
- | <body>
283
- | "Hello"
284
-
285
- #data
286
- <!DOCTYPE potato PUBLIC "go'of">Hello
287
- #errors
288
- (1,32): unknown-doctype
289
- #document
290
- | <!DOCTYPE potato "go'of" "">
291
- | <html>
292
- | <head>
293
- | <body>
294
- | "Hello"
295
-
296
- #data
297
- <!DOCTYPE potato PUBLIC 'go'of'>Hello
298
- #errors
299
- (1,29): unexpected-char-in-doctype
300
- (1,32): unknown-doctype
301
- #new-errors
302
- (1:29) missing-quote-before-doctype-system-identifier
303
- #document
304
- | <!DOCTYPE potato "go" "">
305
- | <html>
306
- | <head>
307
- | <body>
308
- | "Hello"
309
-
310
- #data
311
- <!DOCTYPE potato PUBLIC 'go:hh of' >Hello
312
- #errors
313
- (1,38): unknown-doctype
314
- #document
315
- | <!DOCTYPE potato "go:hh of" "">
316
- | <html>
317
- | <head>
318
- | <body>
319
- | "Hello"
320
-
321
- #data
322
- <!DOCTYPE potato PUBLIC "W3C-//dfdf" SYSTEM ggg>Hello
323
- #errors
324
- (1,38): unexpected-char-in-doctype
325
- (1,48): unknown-doctype
326
- #new-errors
327
- (1:38) missing-quote-before-doctype-system-identifier
328
- #document
329
- | <!DOCTYPE potato "W3C-//dfdf" "">
330
- | <html>
331
- | <head>
332
- | <body>
333
- | "Hello"
334
-
335
- #data
336
- <!DOCTYPE HTML PUBLIC "-//W3C//DTD HTML 4.01//EN"
337
- "http://www.w3.org/TR/html4/strict.dtd">Hello
338
- #errors
339
- (2,43): unknown-doctype
340
- #document
341
- | <!DOCTYPE html "-//W3C//DTD HTML 4.01//EN" "http://www.w3.org/TR/html4/strict.dtd">
342
- | <html>
343
- | <head>
344
- | <body>
345
- | "Hello"
346
-
347
- #data
348
- <!DOCTYPE ...>Hello
349
- #errors
350
- (1,14): unknown-doctype
351
- #document
352
- | <!DOCTYPE ...>
353
- | <html>
354
- | <head>
355
- | <body>
356
- | "Hello"
357
-
358
- #data
359
- <!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
360
- "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
361
- #errors
362
- (2,58): unknown-doctype
363
- #document
364
- | <!DOCTYPE html "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
365
- | <html>
366
- | <head>
367
- | <body>
368
-
369
- #data
370
- <!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Frameset//EN"
371
- "http://www.w3.org/TR/xhtml1/DTD/xhtml1-frameset.dtd">
372
- #errors
373
- (2,54): unknown-doctype
374
- #document
375
- | <!DOCTYPE html "-//W3C//DTD XHTML 1.0 Frameset//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-frameset.dtd">
376
- | <html>
377
- | <head>
378
- | <body>
379
-
380
- #data
381
- <!DOCTYPE root-element [SYSTEM OR PUBLIC FPI] "uri" [
382
- <!-- internal declarations -->
383
- ]>
384
- #errors
385
- (1,23): expected-space-or-right-bracket-in-doctype
386
- (2,30): unknown-doctype
387
- #new-errors
388
- (1:24) invalid-character-sequence-after-doctype-name
389
- #document
390
- | <!DOCTYPE root-element>
391
- | <html>
392
- | <head>
393
- | <body>
394
- | "]>"
395
-
396
- #data
397
- <!DOCTYPE html PUBLIC
398
- "-//WAPFORUM//DTD XHTML Mobile 1.0//EN"
399
- "http://www.wapforum.org/DTD/xhtml-mobile10.dtd">
400
- #errors
401
- (3,53): unknown-doctype
402
- #document
403
- | <!DOCTYPE html "-//WAPFORUM//DTD XHTML Mobile 1.0//EN" "http://www.wapforum.org/DTD/xhtml-mobile10.dtd">
404
- | <html>
405
- | <head>
406
- | <body>
407
-
408
- #data
409
- <!DOCTYPE HTML SYSTEM "http://www.w3.org/DTD/HTML4-strict.dtd"><body><b>Mine!</b></body>
410
- #errors
411
- (1,63): unknown-doctype
412
- #document
413
- | <!DOCTYPE html "" "http://www.w3.org/DTD/HTML4-strict.dtd">
414
- | <html>
415
- | <head>
416
- | <body>
417
- | <b>
418
- | "Mine!"
419
-
420
- #data
421
- <!DOCTYPE HTML PUBLIC "-//W3C//DTD HTML 4.01//EN""http://www.w3.org/TR/html4/strict.dtd">
422
- #errors
423
- (1,50): unexpected-char-in-doctype
424
- (1,89): unknown-doctype
425
- #new-errors
426
- (1:50) missing-whitespace-between-doctype-public-and-system-identifiers
427
- #document
428
- | <!DOCTYPE html "-//W3C//DTD HTML 4.01//EN" "http://www.w3.org/TR/html4/strict.dtd">
429
- | <html>
430
- | <head>
431
- | <body>
432
-
433
- #data
434
- <!DOCTYPE HTML PUBLIC "-//W3C//DTD HTML 4.01//EN"'http://www.w3.org/TR/html4/strict.dtd'>
435
- #errors
436
- (1,50): unexpected-char-in-doctype
437
- (1,89): unknown-doctype
438
- #new-errors
439
- (1:50) missing-whitespace-between-doctype-public-and-system-identifiers
440
- #document
441
- | <!DOCTYPE html "-//W3C//DTD HTML 4.01//EN" "http://www.w3.org/TR/html4/strict.dtd">
442
- | <html>
443
- | <head>
444
- | <body>
445
-
446
- #data
447
- <!DOCTYPE HTML PUBLIC"-//W3C//DTD HTML 4.01//EN"'http://www.w3.org/TR/html4/strict.dtd'>
448
- #errors
449
- (1,21): unexpected-char-in-doctype
450
- (1,49): unexpected-char-in-doctype
451
- (1,88): unknown-doctype
452
- #new-errors
453
- (1:22) missing-whitespace-after-doctype-public-keyword
454
- (1:49) missing-whitespace-between-doctype-public-and-system-identifiers
455
- #document
456
- | <!DOCTYPE html "-//W3C//DTD HTML 4.01//EN" "http://www.w3.org/TR/html4/strict.dtd">
457
- | <html>
458
- | <head>
459
- | <body>
460
-
461
- #data
462
- <!DOCTYPE HTML PUBLIC'-//W3C//DTD HTML 4.01//EN''http://www.w3.org/TR/html4/strict.dtd'>
463
- #errors
464
- (1,21): unexpected-char-in-doctype
465
- (1,49): unexpected-char-in-doctype
466
- (1,88): unknown-doctype
467
- #new-errors
468
- (1:22) missing-whitespace-after-doctype-public-keyword
469
- (1:49) missing-whitespace-between-doctype-public-and-system-identifiers
470
- #document
471
- | <!DOCTYPE html "-//W3C//DTD HTML 4.01//EN" "http://www.w3.org/TR/html4/strict.dtd">
472
- | <html>
473
- | <head>
474
- | <body>