html-to-markdown 2.24.6 → 2.25.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (231) hide show
  1. checksums.yaml +4 -4
  2. data/Gemfile.lock +2 -2
  3. data/README.md +1 -1
  4. data/ext/html-to-markdown-rb/native/Cargo.lock +9 -32
  5. data/ext/html-to-markdown-rb/native/Cargo.toml +1 -1
  6. data/lib/html_to_markdown/version.rb +1 -1
  7. data/rust-vendor/html-to-markdown-rs/Cargo.toml +0 -1
  8. data/rust-vendor/html-to-markdown-rs/src/converter/main_helpers.rs +1 -1
  9. data/rust-vendor/html-to-markdown-rs/src/hocr/converter/hierarchy.rs +20 -5
  10. data/rust-vendor/html-to-markdown-rs/src/lib.rs +1 -0
  11. data/rust-vendor/{markup5ever_rcdom/lib.rs → html-to-markdown-rs/src/rcdom.rs} +56 -91
  12. data/rust-vendor/html-to-markdown-rs/tests/hocr_compliance_test.rs +157 -0
  13. data/rust-vendor/memmap2/.cargo-checksum.json +1 -1
  14. data/rust-vendor/memmap2/.cargo_vcs_info.json +1 -1
  15. data/rust-vendor/memmap2/CHANGELOG.md +8 -0
  16. data/rust-vendor/memmap2/Cargo.lock +1 -1
  17. data/rust-vendor/memmap2/Cargo.toml +2 -1
  18. data/rust-vendor/memmap2/Cargo.toml.orig +2 -1
  19. data/rust-vendor/memmap2/src/lib.rs +25 -1
  20. data/rust-vendor/memmap2/src/stub.rs +1 -4
  21. data/rust-vendor/memmap2/src/unix.rs +14 -1
  22. data/rust-vendor/png/.cargo-checksum.json +1 -1
  23. data/rust-vendor/png/.cargo_vcs_info.json +1 -1
  24. data/rust-vendor/png/CHANGES.md +44 -0
  25. data/rust-vendor/png/Cargo.lock +124 -171
  26. data/rust-vendor/png/Cargo.toml +1 -1
  27. data/rust-vendor/png/Cargo.toml.orig +1 -1
  28. data/rust-vendor/png/benches/expand_paletted.rs +5 -5
  29. data/rust-vendor/png/benches/unfilter.rs +3 -3
  30. data/rust-vendor/png/src/adam7.rs +17 -10
  31. data/rust-vendor/png/src/common.rs +8 -8
  32. data/rust-vendor/png/src/decoder/mod.rs +53 -20
  33. data/rust-vendor/png/src/decoder/stream.rs +263 -78
  34. data/rust-vendor/png/src/decoder/unfiltering_buffer.rs +210 -53
  35. data/rust-vendor/png/src/decoder/zlib.rs +130 -90
  36. data/rust-vendor/png/src/encoder.rs +4 -2
  37. data/rust-vendor/png/src/{filter.rs → filter/mod.rs} +100 -367
  38. data/rust-vendor/png/src/filter/optimization-notes.md +104 -0
  39. data/rust-vendor/png/src/filter/paeth.rs +398 -0
  40. data/rust-vendor/png/src/filter/simd.rs +308 -0
  41. data/rust-vendor/png/src/lib.rs +1 -0
  42. data/rust-vendor/syn/.cargo-checksum.json +1 -1
  43. data/rust-vendor/syn/.cargo_vcs_info.json +1 -1
  44. data/rust-vendor/syn/Cargo.lock +40 -41
  45. data/rust-vendor/syn/Cargo.toml +1 -1
  46. data/rust-vendor/syn/Cargo.toml.orig +1 -1
  47. data/rust-vendor/syn/src/item.rs +61 -40
  48. data/rust-vendor/syn/src/lib.rs +2 -1
  49. data/rust-vendor/syn/tests/test_item.rs +54 -0
  50. data/rust-vendor/unicode-ident/.cargo-checksum.json +1 -1
  51. data/rust-vendor/unicode-ident/.cargo_vcs_info.json +1 -1
  52. data/rust-vendor/unicode-ident/Cargo.lock +21 -21
  53. data/rust-vendor/unicode-ident/Cargo.toml +1 -1
  54. data/rust-vendor/unicode-ident/Cargo.toml.orig +1 -1
  55. data/rust-vendor/unicode-ident/src/lib.rs +1 -1
  56. data/rust-vendor/unicode-ident/src/tables.rs +87 -97
  57. data/rust-vendor/unicode-ident/tests/static_size.rs +1 -1
  58. metadata +7 -177
  59. data/rust-vendor/markup5ever_rcdom/.cargo-checksum.json +0 -1
  60. data/rust-vendor/markup5ever_rcdom/.cargo_vcs_info.json +0 -7
  61. data/rust-vendor/markup5ever_rcdom/Cargo.lock +0 -658
  62. data/rust-vendor/markup5ever_rcdom/Cargo.toml +0 -109
  63. data/rust-vendor/markup5ever_rcdom/Cargo.toml.orig +0 -42
  64. data/rust-vendor/markup5ever_rcdom/LICENSE-APACHE +0 -201
  65. data/rust-vendor/markup5ever_rcdom/LICENSE-MIT +0 -25
  66. data/rust-vendor/markup5ever_rcdom/README.md +0 -7
  67. data/rust-vendor/markup5ever_rcdom/custom-html5lib-tokenizer-tests/regression.test +0 -69
  68. data/rust-vendor/markup5ever_rcdom/data/test/ignore +0 -1
  69. data/rust-vendor/markup5ever_rcdom/examples/hello_xml.rs +0 -39
  70. data/rust-vendor/markup5ever_rcdom/examples/html2html.rs +0 -51
  71. data/rust-vendor/markup5ever_rcdom/examples/print-rcdom.rs +0 -78
  72. data/rust-vendor/markup5ever_rcdom/examples/xml_tree_printer.rs +0 -67
  73. data/rust-vendor/markup5ever_rcdom/html5lib-tests/.gitattributes +0 -2
  74. data/rust-vendor/markup5ever_rcdom/html5lib-tests/.github/workflows/downstream.yml +0 -76
  75. data/rust-vendor/markup5ever_rcdom/html5lib-tests/.github/workflows/lint.yml +0 -25
  76. data/rust-vendor/markup5ever_rcdom/html5lib-tests/.gitignore +0 -79
  77. data/rust-vendor/markup5ever_rcdom/html5lib-tests/AUTHORS.rst +0 -34
  78. data/rust-vendor/markup5ever_rcdom/html5lib-tests/LICENSE +0 -21
  79. data/rust-vendor/markup5ever_rcdom/html5lib-tests/encoding/chardet/test_big5.txt +0 -51
  80. data/rust-vendor/markup5ever_rcdom/html5lib-tests/encoding/scripted/tests1.dat +0 -5
  81. data/rust-vendor/markup5ever_rcdom/html5lib-tests/encoding/test-yahoo-jp.dat +0 -10
  82. data/rust-vendor/markup5ever_rcdom/html5lib-tests/encoding/tests1.dat +0 -388
  83. data/rust-vendor/markup5ever_rcdom/html5lib-tests/encoding/tests2.dat +0 -115
  84. data/rust-vendor/markup5ever_rcdom/html5lib-tests/lint +0 -6
  85. data/rust-vendor/markup5ever_rcdom/html5lib-tests/lint_lib/__init__.py +0 -0
  86. data/rust-vendor/markup5ever_rcdom/html5lib-tests/lint_lib/_vendor/__init__.py +0 -0
  87. data/rust-vendor/markup5ever_rcdom/html5lib-tests/lint_lib/_vendor/funcparserlib/LICENSE +0 -18
  88. data/rust-vendor/markup5ever_rcdom/html5lib-tests/lint_lib/_vendor/funcparserlib/__init__.py +0 -0
  89. data/rust-vendor/markup5ever_rcdom/html5lib-tests/lint_lib/_vendor/funcparserlib/lexer.py +0 -211
  90. data/rust-vendor/markup5ever_rcdom/html5lib-tests/lint_lib/_vendor/funcparserlib/lexer.pyi +0 -34
  91. data/rust-vendor/markup5ever_rcdom/html5lib-tests/lint_lib/_vendor/funcparserlib/parser.py +0 -872
  92. data/rust-vendor/markup5ever_rcdom/html5lib-tests/lint_lib/_vendor/funcparserlib/parser.pyi +0 -83
  93. data/rust-vendor/markup5ever_rcdom/html5lib-tests/lint_lib/_vendor/funcparserlib/py.typed +0 -0
  94. data/rust-vendor/markup5ever_rcdom/html5lib-tests/lint_lib/_vendor/funcparserlib/util.py +0 -72
  95. data/rust-vendor/markup5ever_rcdom/html5lib-tests/lint_lib/_vendor/funcparserlib/util.pyi +0 -7
  96. data/rust-vendor/markup5ever_rcdom/html5lib-tests/lint_lib/_vendor/vendor.txt +0 -1
  97. data/rust-vendor/markup5ever_rcdom/html5lib-tests/lint_lib/_vendor-patches/funcparserlib.patch +0 -24
  98. data/rust-vendor/markup5ever_rcdom/html5lib-tests/lint_lib/lint.py +0 -280
  99. data/rust-vendor/markup5ever_rcdom/html5lib-tests/lint_lib/parser.py +0 -177
  100. data/rust-vendor/markup5ever_rcdom/html5lib-tests/pyproject.toml +0 -7
  101. data/rust-vendor/markup5ever_rcdom/html5lib-tests/serializer/core.test +0 -125
  102. data/rust-vendor/markup5ever_rcdom/html5lib-tests/serializer/injectmeta.test +0 -66
  103. data/rust-vendor/markup5ever_rcdom/html5lib-tests/serializer/optionaltags.test +0 -965
  104. data/rust-vendor/markup5ever_rcdom/html5lib-tests/serializer/options.test +0 -60
  105. data/rust-vendor/markup5ever_rcdom/html5lib-tests/serializer/whitespace.test +0 -51
  106. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tokenizer/README.md +0 -107
  107. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tokenizer/contentModelFlags.test +0 -93
  108. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tokenizer/domjs.test +0 -335
  109. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tokenizer/entities.test +0 -542
  110. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tokenizer/escapeFlag.test +0 -36
  111. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tokenizer/namedEntities.test +0 -42422
  112. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tokenizer/numericEntities.test +0 -1677
  113. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tokenizer/pendingSpecChanges.test +0 -9
  114. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tokenizer/test1.test +0 -353
  115. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tokenizer/test2.test +0 -275
  116. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tokenizer/test3.test +0 -11233
  117. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tokenizer/test4.test +0 -532
  118. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tokenizer/unicodeChars.test +0 -1577
  119. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tokenizer/unicodeCharsProblematic.test +0 -41
  120. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tokenizer/xmlViolation.test +0 -20
  121. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/README.md +0 -108
  122. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/adoption01.dat +0 -354
  123. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/adoption02.dat +0 -39
  124. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/blocks.dat +0 -695
  125. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/comments01.dat +0 -217
  126. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/doctype01.dat +0 -474
  127. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/domjs-unsafe.dat +0 -0
  128. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/entities01.dat +0 -943
  129. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/entities02.dat +0 -309
  130. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/foreign-fragment.dat +0 -645
  131. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/html5test-com.dat +0 -301
  132. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/inbody01.dat +0 -54
  133. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/isindex.dat +0 -49
  134. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/main-element.dat +0 -46
  135. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/math.dat +0 -104
  136. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/menuitem-element.dat +0 -240
  137. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/namespace-sensitivity.dat +0 -22
  138. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/noscript01.dat +0 -237
  139. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/pending-spec-changes-plain-text-unsafe.dat +0 -0
  140. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/pending-spec-changes.dat +0 -46
  141. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/plain-text-unsafe.dat +0 -0
  142. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/quirks01.dat +0 -53
  143. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/ruby.dat +0 -302
  144. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/scriptdata01.dat +0 -372
  145. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/scripted/adoption01.dat +0 -16
  146. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/scripted/ark.dat +0 -27
  147. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/scripted/webkit01.dat +0 -30
  148. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/search-element.dat +0 -46
  149. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/svg.dat +0 -104
  150. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tables01.dat +0 -322
  151. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/template.dat +0 -1673
  152. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests1.dat +0 -1956
  153. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests10.dat +0 -849
  154. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests11.dat +0 -523
  155. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests12.dat +0 -62
  156. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests14.dat +0 -75
  157. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests15.dat +0 -216
  158. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests16.dat +0 -2602
  159. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests17.dat +0 -179
  160. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests18.dat +0 -558
  161. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests19.dat +0 -1398
  162. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests2.dat +0 -831
  163. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests20.dat +0 -842
  164. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests21.dat +0 -306
  165. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests22.dat +0 -190
  166. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests23.dat +0 -168
  167. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests24.dat +0 -79
  168. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests25.dat +0 -288
  169. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests26.dat +0 -453
  170. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests3.dat +0 -305
  171. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests4.dat +0 -74
  172. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests5.dat +0 -210
  173. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests6.dat +0 -663
  174. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests7.dat +0 -453
  175. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests8.dat +0 -165
  176. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests9.dat +0 -472
  177. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tests_innerHTML_1.dat +0 -843
  178. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/tricky01.dat +0 -336
  179. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/webkit01.dat +0 -785
  180. data/rust-vendor/markup5ever_rcdom/html5lib-tests/tree-construction/webkit02.dat +0 -554
  181. data/rust-vendor/markup5ever_rcdom/tests/foreach_html5lib_test/mod.rs +0 -41
  182. data/rust-vendor/markup5ever_rcdom/tests/html-driver.rs +0 -29
  183. data/rust-vendor/markup5ever_rcdom/tests/html-serializer.rs +0 -265
  184. data/rust-vendor/markup5ever_rcdom/tests/html-tokenizer.rs +0 -487
  185. data/rust-vendor/markup5ever_rcdom/tests/html-tree-builder.rs +0 -298
  186. data/rust-vendor/markup5ever_rcdom/tests/html-tree-sink.rs +0 -141
  187. data/rust-vendor/markup5ever_rcdom/tests/util/find_tests.rs +0 -34
  188. data/rust-vendor/markup5ever_rcdom/tests/util/runner.rs +0 -48
  189. data/rust-vendor/markup5ever_rcdom/tests/xml-driver.rs +0 -101
  190. data/rust-vendor/markup5ever_rcdom/tests/xml-tokenizer.rs +0 -374
  191. data/rust-vendor/markup5ever_rcdom/tests/xml-tree-builder.rs +0 -237
  192. data/rust-vendor/markup5ever_rcdom/xml5lib-tests/AUTHORS.rst +0 -9
  193. data/rust-vendor/markup5ever_rcdom/xml5lib-tests/LICENSE +0 -21
  194. data/rust-vendor/markup5ever_rcdom/xml5lib-tests/tokenizer/README.md +0 -92
  195. data/rust-vendor/markup5ever_rcdom/xml5lib-tests/tokenizer/comments.test +0 -274
  196. data/rust-vendor/markup5ever_rcdom/xml5lib-tests/tokenizer/doctype.test +0 -3232
  197. data/rust-vendor/markup5ever_rcdom/xml5lib-tests/tokenizer/entities.test +0 -283
  198. data/rust-vendor/markup5ever_rcdom/xml5lib-tests/tokenizer/eof.test +0 -113
  199. data/rust-vendor/markup5ever_rcdom/xml5lib-tests/tokenizer/namedEntities.test +0 -42210
  200. data/rust-vendor/markup5ever_rcdom/xml5lib-tests/tokenizer/numericEntities.test +0 -1349
  201. data/rust-vendor/markup5ever_rcdom/xml5lib-tests/tokenizer/test1.test +0 -162
  202. data/rust-vendor/markup5ever_rcdom/xml5lib-tests/tokenizer/test2.test +0 -64
  203. data/rust-vendor/markup5ever_rcdom/xml5lib-tests/tokenizer/unicodeChars.test +0 -1295
  204. data/rust-vendor/markup5ever_rcdom/xml5lib-tests/tree-construction/README.md +0 -104
  205. data/rust-vendor/markup5ever_rcdom/xml5lib-tests/tree-construction/namespace.dat +0 -119
  206. data/rust-vendor/markup5ever_rcdom/xml5lib-tests/tree-construction/test1.dat +0 -124
  207. data/rust-vendor/xml5ever/.cargo-checksum.json +0 -1
  208. data/rust-vendor/xml5ever/.cargo_vcs_info.json +0 -6
  209. data/rust-vendor/xml5ever/Cargo.lock +0 -752
  210. data/rust-vendor/xml5ever/Cargo.toml +0 -69
  211. data/rust-vendor/xml5ever/Cargo.toml.orig +0 -29
  212. data/rust-vendor/xml5ever/LICENSE-APACHE +0 -201
  213. data/rust-vendor/xml5ever/LICENSE-MIT +0 -25
  214. data/rust-vendor/xml5ever/README.md +0 -72
  215. data/rust-vendor/xml5ever/benches/xml5ever.rs +0 -77
  216. data/rust-vendor/xml5ever/data/bench/strong.xml +0 -1
  217. data/rust-vendor/xml5ever/examples/README.md +0 -223
  218. data/rust-vendor/xml5ever/examples/example.xml +0 -3
  219. data/rust-vendor/xml5ever/examples/simple_xml_tokenizer.rs +0 -81
  220. data/rust-vendor/xml5ever/examples/xml_tokenizer.rs +0 -115
  221. data/rust-vendor/xml5ever/src/driver.rs +0 -90
  222. data/rust-vendor/xml5ever/src/lib.rs +0 -47
  223. data/rust-vendor/xml5ever/src/macros.rs +0 -18
  224. data/rust-vendor/xml5ever/src/serialize/mod.rs +0 -216
  225. data/rust-vendor/xml5ever/src/tokenizer/char_ref/mod.rs +0 -456
  226. data/rust-vendor/xml5ever/src/tokenizer/interface.rs +0 -116
  227. data/rust-vendor/xml5ever/src/tokenizer/mod.rs +0 -1344
  228. data/rust-vendor/xml5ever/src/tokenizer/qname.rs +0 -84
  229. data/rust-vendor/xml5ever/src/tokenizer/states.rs +0 -167
  230. data/rust-vendor/xml5ever/src/tree_builder/mod.rs +0 -774
  231. data/rust-vendor/xml5ever/src/tree_builder/types.rs +0 -37
@@ -1,943 +0,0 @@
1
- #data
2
- FOO>BAR
3
- #errors
4
- (1,3): expected-doctype-but-got-chars
5
- #document
6
- | <html>
7
- | <head>
8
- | <body>
9
- | "FOO>BAR"
10
-
11
- #data
12
- FOO&gtBAR
13
- #errors
14
- (1,3): expected-doctype-but-got-chars
15
- (1,6): named-entity-without-semicolon
16
- #new-errors
17
- (1:7) missing-semicolon-after-character-reference
18
- #document
19
- | <html>
20
- | <head>
21
- | <body>
22
- | "FOO>BAR"
23
-
24
- #data
25
- FOO&gt BAR
26
- #errors
27
- (1,3): expected-doctype-but-got-chars
28
- (1,6): named-entity-without-semicolon
29
- #new-errors
30
- (1:7) missing-semicolon-after-character-reference
31
- #document
32
- | <html>
33
- | <head>
34
- | <body>
35
- | "FOO> BAR"
36
-
37
- #data
38
- FOO&gt;;;BAR
39
- #errors
40
- (1,3): expected-doctype-but-got-chars
41
- #document
42
- | <html>
43
- | <head>
44
- | <body>
45
- | "FOO>;;BAR"
46
-
47
- #data
48
- I'm &notit; I tell you
49
- #errors
50
- (1,4): expected-doctype-but-got-chars
51
- (1,9): named-entity-without-semicolon
52
- #new-errors
53
- (1:9) missing-semicolon-after-character-reference
54
- #document
55
- | <html>
56
- | <head>
57
- | <body>
58
- | "I'm ¬it; I tell you"
59
-
60
- #data
61
- I'm &notin; I tell you
62
- #errors
63
- (1,4): expected-doctype-but-got-chars
64
- #document
65
- | <html>
66
- | <head>
67
- | <body>
68
- | "I'm ∉ I tell you"
69
-
70
- #data
71
- &ammmp;
72
- #errors
73
- (1,1): expected-doctype-but-got-chars
74
- (1,7): unknown-named-character-reference
75
- #new-errors
76
- (1:7) unknown-named-character-reference
77
- #document
78
- | <html>
79
- | <head>
80
- | <body>
81
- | "&ammmp;"
82
-
83
- #data
84
- &ammmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmp;
85
- #errors
86
- (1,1): expected-doctype-but-got-chars
87
- (1,950): unknown-named-character-reference
88
- #new-errors
89
- (1:950) unknown-named-character-reference
90
- #document
91
- | <html>
92
- | <head>
93
- | <body>
94
- | "&ammmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmmp;"
95
-
96
- #data
97
- FOO& BAR
98
- #errors
99
- (1,3): expected-doctype-but-got-chars
100
- #document
101
- | <html>
102
- | <head>
103
- | <body>
104
- | "FOO& BAR"
105
-
106
- #data
107
- FOO&<BAR>
108
- #errors
109
- (1,3): expected-doctype-but-got-chars
110
- (1,9): expected-closing-tag-but-got-eof
111
- #document
112
- | <html>
113
- | <head>
114
- | <body>
115
- | "FOO&"
116
- | <bar>
117
-
118
- #data
119
- FOO&&&&gt;BAR
120
- #errors
121
- (1,3): expected-doctype-but-got-chars
122
- #document
123
- | <html>
124
- | <head>
125
- | <body>
126
- | "FOO&&&>BAR"
127
-
128
- #data
129
- FOO&#41;BAR
130
- #errors
131
- (1,3): expected-doctype-but-got-chars
132
- #document
133
- | <html>
134
- | <head>
135
- | <body>
136
- | "FOO)BAR"
137
-
138
- #data
139
- FOO&#x41;BAR
140
- #errors
141
- (1,3): expected-doctype-but-got-chars
142
- #document
143
- | <html>
144
- | <head>
145
- | <body>
146
- | "FOOABAR"
147
-
148
- #data
149
- FOO&#X41;BAR
150
- #errors
151
- (1,3): expected-doctype-but-got-chars
152
- #document
153
- | <html>
154
- | <head>
155
- | <body>
156
- | "FOOABAR"
157
-
158
- #data
159
- FOO&#BAR
160
- #errors
161
- (1,3): expected-doctype-but-got-chars
162
- (1,5): expected-numeric-entity
163
- #new-errors
164
- (1:6) absence-of-digits-in-numeric-character-reference
165
- #document
166
- | <html>
167
- | <head>
168
- | <body>
169
- | "FOO&#BAR"
170
-
171
- #data
172
- FOO&#ZOO
173
- #errors
174
- (1,3): expected-doctype-but-got-chars
175
- (1,5): expected-numeric-entity
176
- #new-errors
177
- (1:6) absence-of-digits-in-numeric-character-reference
178
- #document
179
- | <html>
180
- | <head>
181
- | <body>
182
- | "FOO&#ZOO"
183
-
184
- #data
185
- FOO&#xBAR
186
- #errors
187
- (1,3): expected-doctype-but-got-chars
188
- (1,7): expected-numeric-entity
189
- #new-errors
190
- (1:9) missing-semicolon-after-character-reference
191
- #document
192
- | <html>
193
- | <head>
194
- | <body>
195
- | "FOOºR"
196
-
197
- #data
198
- FOO&#xZOO
199
- #errors
200
- (1,3): expected-doctype-but-got-chars
201
- (1,6): expected-numeric-entity
202
- #new-errors
203
- (1:7) absence-of-digits-in-numeric-character-reference
204
- #document
205
- | <html>
206
- | <head>
207
- | <body>
208
- | "FOO&#xZOO"
209
-
210
- #data
211
- FOO&#XZOO
212
- #errors
213
- (1,3): expected-doctype-but-got-chars
214
- (1,6): expected-numeric-entity
215
- #new-errors
216
- (1:7) absence-of-digits-in-numeric-character-reference
217
- #document
218
- | <html>
219
- | <head>
220
- | <body>
221
- | "FOO&#XZOO"
222
-
223
- #data
224
- FOO&#41BAR
225
- #errors
226
- (1,3): expected-doctype-but-got-chars
227
- (1,7): numeric-entity-without-semicolon
228
- #new-errors
229
- (1:8) missing-semicolon-after-character-reference
230
- #document
231
- | <html>
232
- | <head>
233
- | <body>
234
- | "FOO)BAR"
235
-
236
- #data
237
- FOO&#x41BAR
238
- #errors
239
- (1,3): expected-doctype-but-got-chars
240
- (1,10): numeric-entity-without-semicolon
241
- #new-errors
242
- (1:11) missing-semicolon-after-character-reference
243
- #document
244
- | <html>
245
- | <head>
246
- | <body>
247
- | "FOO䆺R"
248
-
249
- #data
250
- FOO&#x41ZOO
251
- #errors
252
- (1,3): expected-doctype-but-got-chars
253
- (1,8): numeric-entity-without-semicolon
254
- #new-errors
255
- (1:9) missing-semicolon-after-character-reference
256
- #document
257
- | <html>
258
- | <head>
259
- | <body>
260
- | "FOOAZOO"
261
-
262
- #data
263
- FOO&#x0000;ZOO
264
- #errors
265
- (1,3): expected-doctype-but-got-chars
266
- (1,11): illegal-codepoint-for-numeric-entity
267
- #new-errors
268
- (1:12) null-character-reference
269
- #document
270
- | <html>
271
- | <head>
272
- | <body>
273
- | "FOO�ZOO"
274
-
275
- #data
276
- FOO&#x0078;ZOO
277
- #errors
278
- (1,3): expected-doctype-but-got-chars
279
- #document
280
- | <html>
281
- | <head>
282
- | <body>
283
- | "FOOxZOO"
284
-
285
- #data
286
- FOO&#x0079;ZOO
287
- #errors
288
- (1,3): expected-doctype-but-got-chars
289
- #document
290
- | <html>
291
- | <head>
292
- | <body>
293
- | "FOOyZOO"
294
-
295
- #data
296
- FOO&#x0080;ZOO
297
- #errors
298
- (1,3): expected-doctype-but-got-chars
299
- (1,11): illegal-codepoint-for-numeric-entity
300
- #new-errors
301
- (1:12) control-character-reference
302
- #document
303
- | <html>
304
- | <head>
305
- | <body>
306
- | "FOO€ZOO"
307
-
308
- #data
309
- FOO&#x0081;ZOO
310
- #errors
311
- (1,3): expected-doctype-but-got-chars
312
- (1,11): illegal-codepoint-for-numeric-entity
313
- #new-errors
314
- (1:12) control-character-reference
315
- #document
316
- | <html>
317
- | <head>
318
- | <body>
319
- | "FOOZOO"
320
-
321
- #data
322
- FOO&#x0082;ZOO
323
- #errors
324
- (1,3): expected-doctype-but-got-chars
325
- (1,11): illegal-codepoint-for-numeric-entity
326
- #new-errors
327
- (1:12) control-character-reference
328
- #document
329
- | <html>
330
- | <head>
331
- | <body>
332
- | "FOO‚ZOO"
333
-
334
- #data
335
- FOO&#x0083;ZOO
336
- #errors
337
- (1,3): expected-doctype-but-got-chars
338
- (1,11): illegal-codepoint-for-numeric-entity
339
- #new-errors
340
- (1:12) control-character-reference
341
- #document
342
- | <html>
343
- | <head>
344
- | <body>
345
- | "FOOƒZOO"
346
-
347
- #data
348
- FOO&#x0084;ZOO
349
- #errors
350
- (1,3): expected-doctype-but-got-chars
351
- (1,11): illegal-codepoint-for-numeric-entity
352
- #new-errors
353
- (1:12) control-character-reference
354
- #document
355
- | <html>
356
- | <head>
357
- | <body>
358
- | "FOO„ZOO"
359
-
360
- #data
361
- FOO&#x0085;ZOO
362
- #errors
363
- (1,3): expected-doctype-but-got-chars
364
- (1,11): illegal-codepoint-for-numeric-entity
365
- #new-errors
366
- (1:12) control-character-reference
367
- #document
368
- | <html>
369
- | <head>
370
- | <body>
371
- | "FOO…ZOO"
372
-
373
- #data
374
- FOO&#x0086;ZOO
375
- #errors
376
- (1,3): expected-doctype-but-got-chars
377
- (1,11): illegal-codepoint-for-numeric-entity
378
- #new-errors
379
- (1:12) control-character-reference
380
- #document
381
- | <html>
382
- | <head>
383
- | <body>
384
- | "FOO†ZOO"
385
-
386
- #data
387
- FOO&#x0087;ZOO
388
- #errors
389
- (1,3): expected-doctype-but-got-chars
390
- (1,11): illegal-codepoint-for-numeric-entity
391
- #new-errors
392
- (1:12) control-character-reference
393
- #document
394
- | <html>
395
- | <head>
396
- | <body>
397
- | "FOO‡ZOO"
398
-
399
- #data
400
- FOO&#x0088;ZOO
401
- #errors
402
- (1,3): expected-doctype-but-got-chars
403
- (1,11): illegal-codepoint-for-numeric-entity
404
- #new-errors
405
- (1:12) control-character-reference
406
- #document
407
- | <html>
408
- | <head>
409
- | <body>
410
- | "FOOˆZOO"
411
-
412
- #data
413
- FOO&#x0089;ZOO
414
- #errors
415
- (1,3): expected-doctype-but-got-chars
416
- (1,11): illegal-codepoint-for-numeric-entity
417
- #new-errors
418
- (1:12) control-character-reference
419
- #document
420
- | <html>
421
- | <head>
422
- | <body>
423
- | "FOO‰ZOO"
424
-
425
- #data
426
- FOO&#x008A;ZOO
427
- #errors
428
- (1,3): expected-doctype-but-got-chars
429
- (1,11): illegal-codepoint-for-numeric-entity
430
- #new-errors
431
- (1:12) control-character-reference
432
- #document
433
- | <html>
434
- | <head>
435
- | <body>
436
- | "FOOŠZOO"
437
-
438
- #data
439
- FOO&#x008B;ZOO
440
- #errors
441
- (1,3): expected-doctype-but-got-chars
442
- (1,11): illegal-codepoint-for-numeric-entity
443
- #new-errors
444
- (1:12) control-character-reference
445
- #document
446
- | <html>
447
- | <head>
448
- | <body>
449
- | "FOO‹ZOO"
450
-
451
- #data
452
- FOO&#x008C;ZOO
453
- #errors
454
- (1,3): expected-doctype-but-got-chars
455
- (1,11): illegal-codepoint-for-numeric-entity
456
- #new-errors
457
- (1:12) control-character-reference
458
- #document
459
- | <html>
460
- | <head>
461
- | <body>
462
- | "FOOŒZOO"
463
-
464
- #data
465
- FOO&#x008D;ZOO
466
- #errors
467
- (1,3): expected-doctype-but-got-chars
468
- (1,11): illegal-codepoint-for-numeric-entity
469
- #new-errors
470
- (1:12) control-character-reference
471
- #document
472
- | <html>
473
- | <head>
474
- | <body>
475
- | "FOOZOO"
476
-
477
- #data
478
- FOO&#x008E;ZOO
479
- #errors
480
- (1,3): expected-doctype-but-got-chars
481
- (1,11): illegal-codepoint-for-numeric-entity
482
- #new-errors
483
- (1:12) control-character-reference
484
- #document
485
- | <html>
486
- | <head>
487
- | <body>
488
- | "FOOŽZOO"
489
-
490
- #data
491
- FOO&#x008F;ZOO
492
- #errors
493
- (1,3): expected-doctype-but-got-chars
494
- (1,11): illegal-codepoint-for-numeric-entity
495
- #new-errors
496
- (1:12) control-character-reference
497
- #document
498
- | <html>
499
- | <head>
500
- | <body>
501
- | "FOOZOO"
502
-
503
- #data
504
- FOO&#x0090;ZOO
505
- #errors
506
- (1,3): expected-doctype-but-got-chars
507
- (1,11): illegal-codepoint-for-numeric-entity
508
- #new-errors
509
- (1:12) control-character-reference
510
- #document
511
- | <html>
512
- | <head>
513
- | <body>
514
- | "FOOZOO"
515
-
516
- #data
517
- FOO&#x0091;ZOO
518
- #errors
519
- (1,3): expected-doctype-but-got-chars
520
- (1,11): illegal-codepoint-for-numeric-entity
521
- #new-errors
522
- (1:12) control-character-reference
523
- #document
524
- | <html>
525
- | <head>
526
- | <body>
527
- | "FOO‘ZOO"
528
-
529
- #data
530
- FOO&#x0092;ZOO
531
- #errors
532
- (1,3): expected-doctype-but-got-chars
533
- (1,11): illegal-codepoint-for-numeric-entity
534
- #new-errors
535
- (1:12) control-character-reference
536
- #document
537
- | <html>
538
- | <head>
539
- | <body>
540
- | "FOO’ZOO"
541
-
542
- #data
543
- FOO&#x0093;ZOO
544
- #errors
545
- (1,3): expected-doctype-but-got-chars
546
- (1,11): illegal-codepoint-for-numeric-entity
547
- #new-errors
548
- (1:12) control-character-reference
549
- #document
550
- | <html>
551
- | <head>
552
- | <body>
553
- | "FOO“ZOO"
554
-
555
- #data
556
- FOO&#x0094;ZOO
557
- #errors
558
- (1,3): expected-doctype-but-got-chars
559
- (1,11): illegal-codepoint-for-numeric-entity
560
- #new-errors
561
- (1:12) control-character-reference
562
- #document
563
- | <html>
564
- | <head>
565
- | <body>
566
- | "FOO”ZOO"
567
-
568
- #data
569
- FOO&#x0095;ZOO
570
- #errors
571
- (1,3): expected-doctype-but-got-chars
572
- (1,11): illegal-codepoint-for-numeric-entity
573
- #new-errors
574
- (1:12) control-character-reference
575
- #document
576
- | <html>
577
- | <head>
578
- | <body>
579
- | "FOO•ZOO"
580
-
581
- #data
582
- FOO&#x0096;ZOO
583
- #errors
584
- (1,3): expected-doctype-but-got-chars
585
- (1,11): illegal-codepoint-for-numeric-entity
586
- #new-errors
587
- (1:12) control-character-reference
588
- #document
589
- | <html>
590
- | <head>
591
- | <body>
592
- | "FOO–ZOO"
593
-
594
- #data
595
- FOO&#x0097;ZOO
596
- #errors
597
- (1,3): expected-doctype-but-got-chars
598
- (1,11): illegal-codepoint-for-numeric-entity
599
- #new-errors
600
- (1:12) control-character-reference
601
- #document
602
- | <html>
603
- | <head>
604
- | <body>
605
- | "FOO—ZOO"
606
-
607
- #data
608
- FOO&#x0098;ZOO
609
- #errors
610
- (1,3): expected-doctype-but-got-chars
611
- (1,11): illegal-codepoint-for-numeric-entity
612
- #new-errors
613
- (1:12) control-character-reference
614
- #document
615
- | <html>
616
- | <head>
617
- | <body>
618
- | "FOO˜ZOO"
619
-
620
- #data
621
- FOO&#x0099;ZOO
622
- #errors
623
- (1,3): expected-doctype-but-got-chars
624
- (1,11): illegal-codepoint-for-numeric-entity
625
- #new-errors
626
- (1:12) control-character-reference
627
- #document
628
- | <html>
629
- | <head>
630
- | <body>
631
- | "FOO™ZOO"
632
-
633
- #data
634
- FOO&#x009A;ZOO
635
- #errors
636
- (1,3): expected-doctype-but-got-chars
637
- (1,11): illegal-codepoint-for-numeric-entity
638
- #new-errors
639
- (1:12) control-character-reference
640
- #document
641
- | <html>
642
- | <head>
643
- | <body>
644
- | "FOOšZOO"
645
-
646
- #data
647
- FOO&#x009B;ZOO
648
- #errors
649
- (1,3): expected-doctype-but-got-chars
650
- (1,11): illegal-codepoint-for-numeric-entity
651
- #new-errors
652
- (1:12) control-character-reference
653
- #document
654
- | <html>
655
- | <head>
656
- | <body>
657
- | "FOO›ZOO"
658
-
659
- #data
660
- FOO&#x009C;ZOO
661
- #errors
662
- (1,3): expected-doctype-but-got-chars
663
- (1,11): illegal-codepoint-for-numeric-entity
664
- #new-errors
665
- (1:12) control-character-reference
666
- #document
667
- | <html>
668
- | <head>
669
- | <body>
670
- | "FOOœZOO"
671
-
672
- #data
673
- FOO&#x009D;ZOO
674
- #errors
675
- (1,3): expected-doctype-but-got-chars
676
- (1,11): illegal-codepoint-for-numeric-entity
677
- #new-errors
678
- (1:12) control-character-reference
679
- #document
680
- | <html>
681
- | <head>
682
- | <body>
683
- | "FOOZOO"
684
-
685
- #data
686
- FOO&#x009E;ZOO
687
- #errors
688
- (1,3): expected-doctype-but-got-chars
689
- (1,11): illegal-codepoint-for-numeric-entity
690
- #new-errors
691
- (1:12) control-character-reference
692
- #document
693
- | <html>
694
- | <head>
695
- | <body>
696
- | "FOOžZOO"
697
-
698
- #data
699
- FOO&#x009F;ZOO
700
- #errors
701
- (1,3): expected-doctype-but-got-chars
702
- (1,11): illegal-codepoint-for-numeric-entity
703
- #new-errors
704
- (1:12) control-character-reference
705
- #document
706
- | <html>
707
- | <head>
708
- | <body>
709
- | "FOOŸZOO"
710
-
711
- #data
712
- FOO&#x00A0;ZOO
713
- #errors
714
- (1,3): expected-doctype-but-got-chars
715
- #document
716
- | <html>
717
- | <head>
718
- | <body>
719
- | "FOO ZOO"
720
-
721
- #data
722
- FOO&#xD7FF;ZOO
723
- #errors
724
- (1,3): expected-doctype-but-got-chars
725
- #document
726
- | <html>
727
- | <head>
728
- | <body>
729
- | "FOO퟿ZOO"
730
-
731
- #data
732
- FOO&#xD800;ZOO
733
- #errors
734
- (1,3): expected-doctype-but-got-chars
735
- (1,11): illegal-codepoint-for-numeric-entity
736
- #new-errors
737
- (1:12) surrogate-character-reference
738
- #document
739
- | <html>
740
- | <head>
741
- | <body>
742
- | "FOO�ZOO"
743
-
744
- #data
745
- FOO&#xD801;ZOO
746
- #errors
747
- (1,3): expected-doctype-but-got-chars
748
- (1,11): illegal-codepoint-for-numeric-entity
749
- #new-errors
750
- (1:12) surrogate-character-reference
751
- #document
752
- | <html>
753
- | <head>
754
- | <body>
755
- | "FOO�ZOO"
756
-
757
- #data
758
- FOO&#xDFFE;ZOO
759
- #errors
760
- (1,3): expected-doctype-but-got-chars
761
- (1,11): illegal-codepoint-for-numeric-entity
762
- #new-errors
763
- (1:12) surrogate-character-reference
764
- #document
765
- | <html>
766
- | <head>
767
- | <body>
768
- | "FOO�ZOO"
769
-
770
- #data
771
- FOO&#xDFFF;ZOO
772
- #errors
773
- (1,3): expected-doctype-but-got-chars
774
- (1,11): illegal-codepoint-for-numeric-entity
775
- #new-errors
776
- (1:12) surrogate-character-reference
777
- #document
778
- | <html>
779
- | <head>
780
- | <body>
781
- | "FOO�ZOO"
782
-
783
- #data
784
- FOO&#xE000;ZOO
785
- #errors
786
- (1,3): expected-doctype-but-got-chars
787
- #document
788
- | <html>
789
- | <head>
790
- | <body>
791
- | "FOOZOO"
792
-
793
- #data
794
- FOO&#x10FFFE;ZOO
795
- #errors
796
- (1,3): expected-doctype-but-got-chars
797
- (1,13): illegal-codepoint-for-numeric-entity
798
- #new-errors
799
- (1:14) noncharacter-character-reference
800
- #document
801
- | <html>
802
- | <head>
803
- | <body>
804
- | "FOO􏿾ZOO"
805
-
806
- #data
807
- FOO&#x1087D4;ZOO
808
- #errors
809
- (1,3): expected-doctype-but-got-chars
810
- #document
811
- | <html>
812
- | <head>
813
- | <body>
814
- | "FOO􈟔ZOO"
815
-
816
- #data
817
- FOO&#x10FFFF;ZOO
818
- #errors
819
- (1,3): expected-doctype-but-got-chars
820
- (1,13): illegal-codepoint-for-numeric-entity
821
- #new-errors
822
- (1:14) noncharacter-character-reference
823
- #document
824
- | <html>
825
- | <head>
826
- | <body>
827
- | "FOO􏿿ZOO"
828
-
829
- #data
830
- FOO&#x110000;ZOO
831
- #errors
832
- (1,3): expected-doctype-but-got-chars
833
- (1,13): illegal-codepoint-for-numeric-entity
834
- #new-errors
835
- (1:14) character-reference-outside-unicode-range
836
- #document
837
- | <html>
838
- | <head>
839
- | <body>
840
- | "FOO�ZOO"
841
-
842
- #data
843
- FOO&#xFFFFFF;ZOO
844
- #errors
845
- (1,3): expected-doctype-but-got-chars
846
- (1,13): illegal-codepoint-for-numeric-entity
847
- #new-errors
848
- (1:14) character-reference-outside-unicode-range
849
- #document
850
- | <html>
851
- | <head>
852
- | <body>
853
- | "FOO�ZOO"
854
-
855
- #data
856
- FOO&#11111111111
857
- #errors
858
- (1,3): expected-doctype-but-got-chars
859
- (1,13): illegal-codepoint-for-numeric-entity
860
- (1,13): eof-in-numeric-entity
861
- #new-errors
862
- (1:17) missing-semicolon-after-character-reference
863
- (1:17) character-reference-outside-unicode-range
864
- #document
865
- | <html>
866
- | <head>
867
- | <body>
868
- | "FOO�"
869
-
870
- #data
871
- FOO&#1111111111
872
- #errors
873
- (1,3): expected-doctype-but-got-chars
874
- (1,13): illegal-codepoint-for-numeric-entity
875
- (1,13): eof-in-numeric-entity
876
- #new-errors
877
- (1:16) missing-semicolon-after-character-reference
878
- (1:16) character-reference-outside-unicode-range
879
- #document
880
- | <html>
881
- | <head>
882
- | <body>
883
- | "FOO�"
884
-
885
- #data
886
- FOO&#111111111111
887
- #errors
888
- (1,3): expected-doctype-but-got-chars
889
- (1,13): illegal-codepoint-for-numeric-entity
890
- (1,13): eof-in-numeric-entity
891
- #new-errors
892
- (1:18) missing-semicolon-after-character-reference
893
- (1:18) character-reference-outside-unicode-range
894
- #document
895
- | <html>
896
- | <head>
897
- | <body>
898
- | "FOO�"
899
-
900
- #data
901
- FOO&#11111111111ZOO
902
- #errors
903
- (1,3): expected-doctype-but-got-chars
904
- (1,16): numeric-entity-without-semicolon
905
- (1,16): illegal-codepoint-for-numeric-entity
906
- #new-errors
907
- (1:17) missing-semicolon-after-character-reference
908
- (1:17) character-reference-outside-unicode-range
909
- #document
910
- | <html>
911
- | <head>
912
- | <body>
913
- | "FOO�ZOO"
914
-
915
- #data
916
- FOO&#1111111111ZOO
917
- #errors
918
- (1,3): expected-doctype-but-got-chars
919
- (1,15): numeric-entity-without-semicolon
920
- (1,15): illegal-codepoint-for-numeric-entity
921
- #new-errors
922
- (1:16) missing-semicolon-after-character-reference
923
- (1:16) character-reference-outside-unicode-range
924
- #document
925
- | <html>
926
- | <head>
927
- | <body>
928
- | "FOO�ZOO"
929
-
930
- #data
931
- FOO&#111111111111ZOO
932
- #errors
933
- (1,3): expected-doctype-but-got-chars
934
- (1,17): numeric-entity-without-semicolon
935
- (1,17): illegal-codepoint-for-numeric-entity
936
- #new-errors
937
- (1:18) missing-semicolon-after-character-reference
938
- (1:18) character-reference-outside-unicode-range
939
- #document
940
- | <html>
941
- | <head>
942
- | <body>
943
- | "FOO�ZOO"