nokogiri 1.6.0 → 1.13.2

Sign up to get free protection for your applications and to get access to all the features.

Potentially problematic release.


This version of nokogiri might be problematic. Click here for more details.

Files changed (340) hide show
  1. checksums.yaml +7 -0
  2. data/Gemfile +3 -19
  3. data/LICENSE-DEPENDENCIES.md +1903 -0
  4. data/LICENSE.md +9 -0
  5. data/README.md +280 -0
  6. data/bin/nokogiri +84 -31
  7. data/dependencies.yml +23 -4
  8. data/ext/nokogiri/depend +38 -358
  9. data/ext/nokogiri/extconf.rb +952 -132
  10. data/ext/nokogiri/gumbo.c +584 -0
  11. data/ext/nokogiri/html4_document.c +166 -0
  12. data/ext/nokogiri/html4_element_description.c +294 -0
  13. data/ext/nokogiri/html4_entity_lookup.c +37 -0
  14. data/ext/nokogiri/html4_sax_parser_context.c +120 -0
  15. data/ext/nokogiri/html4_sax_push_parser.c +95 -0
  16. data/ext/nokogiri/libxml2_backwards_compat.c +121 -0
  17. data/ext/nokogiri/nokogiri.c +231 -96
  18. data/ext/nokogiri/nokogiri.h +188 -129
  19. data/ext/nokogiri/test_global_handlers.c +40 -0
  20. data/ext/nokogiri/xml_attr.c +49 -40
  21. data/ext/nokogiri/xml_attribute_decl.c +18 -18
  22. data/ext/nokogiri/xml_cdata.c +24 -23
  23. data/ext/nokogiri/xml_comment.c +29 -21
  24. data/ext/nokogiri/xml_document.c +327 -223
  25. data/ext/nokogiri/xml_document_fragment.c +12 -16
  26. data/ext/nokogiri/xml_dtd.c +56 -50
  27. data/ext/nokogiri/xml_element_content.c +31 -26
  28. data/ext/nokogiri/xml_element_decl.c +22 -22
  29. data/ext/nokogiri/xml_encoding_handler.c +45 -20
  30. data/ext/nokogiri/xml_entity_decl.c +32 -30
  31. data/ext/nokogiri/xml_entity_reference.c +16 -18
  32. data/ext/nokogiri/xml_namespace.c +74 -32
  33. data/ext/nokogiri/xml_node.c +1290 -680
  34. data/ext/nokogiri/xml_node_set.c +239 -208
  35. data/ext/nokogiri/xml_processing_instruction.c +17 -19
  36. data/ext/nokogiri/xml_reader.c +227 -189
  37. data/ext/nokogiri/xml_relax_ng.c +52 -28
  38. data/ext/nokogiri/xml_sax_parser.c +123 -125
  39. data/ext/nokogiri/xml_sax_parser_context.c +138 -79
  40. data/ext/nokogiri/xml_sax_push_parser.c +88 -35
  41. data/ext/nokogiri/xml_schema.c +112 -33
  42. data/ext/nokogiri/xml_syntax_error.c +50 -23
  43. data/ext/nokogiri/xml_text.c +14 -18
  44. data/ext/nokogiri/xml_xpath_context.c +227 -140
  45. data/ext/nokogiri/xslt_stylesheet.c +269 -177
  46. data/gumbo-parser/CHANGES.md +63 -0
  47. data/gumbo-parser/Makefile +101 -0
  48. data/gumbo-parser/THANKS +27 -0
  49. data/gumbo-parser/src/Makefile +34 -0
  50. data/gumbo-parser/src/README.md +41 -0
  51. data/gumbo-parser/src/ascii.c +75 -0
  52. data/gumbo-parser/src/ascii.h +115 -0
  53. data/gumbo-parser/src/attribute.c +42 -0
  54. data/gumbo-parser/src/attribute.h +17 -0
  55. data/gumbo-parser/src/char_ref.c +22225 -0
  56. data/gumbo-parser/src/char_ref.h +29 -0
  57. data/gumbo-parser/src/char_ref.rl +2154 -0
  58. data/gumbo-parser/src/error.c +626 -0
  59. data/gumbo-parser/src/error.h +148 -0
  60. data/gumbo-parser/src/foreign_attrs.c +104 -0
  61. data/gumbo-parser/src/foreign_attrs.gperf +27 -0
  62. data/gumbo-parser/src/gumbo.h +943 -0
  63. data/gumbo-parser/src/insertion_mode.h +33 -0
  64. data/gumbo-parser/src/macros.h +91 -0
  65. data/gumbo-parser/src/parser.c +4875 -0
  66. data/gumbo-parser/src/parser.h +41 -0
  67. data/gumbo-parser/src/replacement.h +33 -0
  68. data/gumbo-parser/src/string_buffer.c +103 -0
  69. data/gumbo-parser/src/string_buffer.h +68 -0
  70. data/gumbo-parser/src/string_piece.c +48 -0
  71. data/gumbo-parser/src/svg_attrs.c +174 -0
  72. data/gumbo-parser/src/svg_attrs.gperf +77 -0
  73. data/gumbo-parser/src/svg_tags.c +137 -0
  74. data/gumbo-parser/src/svg_tags.gperf +55 -0
  75. data/gumbo-parser/src/tag.c +222 -0
  76. data/gumbo-parser/src/tag_lookup.c +382 -0
  77. data/gumbo-parser/src/tag_lookup.gperf +169 -0
  78. data/gumbo-parser/src/tag_lookup.h +13 -0
  79. data/gumbo-parser/src/token_buffer.c +79 -0
  80. data/gumbo-parser/src/token_buffer.h +71 -0
  81. data/gumbo-parser/src/token_type.h +17 -0
  82. data/gumbo-parser/src/tokenizer.c +3463 -0
  83. data/gumbo-parser/src/tokenizer.h +112 -0
  84. data/gumbo-parser/src/tokenizer_states.h +339 -0
  85. data/gumbo-parser/src/utf8.c +245 -0
  86. data/gumbo-parser/src/utf8.h +164 -0
  87. data/gumbo-parser/src/util.c +68 -0
  88. data/gumbo-parser/src/util.h +30 -0
  89. data/gumbo-parser/src/vector.c +111 -0
  90. data/gumbo-parser/src/vector.h +45 -0
  91. data/lib/nokogiri/class_resolver.rb +67 -0
  92. data/lib/nokogiri/css/node.rb +10 -58
  93. data/lib/nokogiri/css/parser.rb +407 -357
  94. data/lib/nokogiri/css/parser.y +265 -246
  95. data/lib/nokogiri/css/parser_extras.rb +52 -49
  96. data/lib/nokogiri/css/syntax_error.rb +3 -1
  97. data/lib/nokogiri/css/tokenizer.rb +107 -104
  98. data/lib/nokogiri/css/tokenizer.rex +8 -7
  99. data/lib/nokogiri/css/xpath_visitor.rb +266 -80
  100. data/lib/nokogiri/css.rb +50 -17
  101. data/lib/nokogiri/decorators/slop.rb +17 -8
  102. data/lib/nokogiri/extension.rb +31 -0
  103. data/lib/nokogiri/gumbo.rb +15 -0
  104. data/lib/nokogiri/html.rb +38 -27
  105. data/lib/nokogiri/{html → html4}/builder.rb +4 -2
  106. data/lib/nokogiri/html4/document.rb +331 -0
  107. data/lib/nokogiri/html4/document_fragment.rb +54 -0
  108. data/lib/nokogiri/{html → html4}/element_description.rb +3 -1
  109. data/lib/nokogiri/html4/element_description_defaults.rb +578 -0
  110. data/lib/nokogiri/{html → html4}/entity_lookup.rb +4 -2
  111. data/lib/nokogiri/{html → html4}/sax/parser.rb +24 -15
  112. data/lib/nokogiri/html4/sax/parser_context.rb +20 -0
  113. data/lib/nokogiri/html4/sax/push_parser.rb +37 -0
  114. data/lib/nokogiri/html4.rb +46 -0
  115. data/lib/nokogiri/html5/document.rb +88 -0
  116. data/lib/nokogiri/html5/document_fragment.rb +83 -0
  117. data/lib/nokogiri/html5/node.rb +96 -0
  118. data/lib/nokogiri/html5.rb +477 -0
  119. data/lib/nokogiri/jruby/dependencies.rb +21 -0
  120. data/lib/nokogiri/syntax_error.rb +2 -0
  121. data/lib/nokogiri/version/constant.rb +6 -0
  122. data/lib/nokogiri/version/info.rb +221 -0
  123. data/lib/nokogiri/version.rb +3 -105
  124. data/lib/nokogiri/xml/attr.rb +6 -3
  125. data/lib/nokogiri/xml/attribute_decl.rb +3 -1
  126. data/lib/nokogiri/xml/builder.rb +96 -54
  127. data/lib/nokogiri/xml/cdata.rb +3 -1
  128. data/lib/nokogiri/xml/character_data.rb +2 -0
  129. data/lib/nokogiri/xml/document.rb +234 -95
  130. data/lib/nokogiri/xml/document_fragment.rb +86 -36
  131. data/lib/nokogiri/xml/dtd.rb +16 -4
  132. data/lib/nokogiri/xml/element_content.rb +2 -0
  133. data/lib/nokogiri/xml/element_decl.rb +3 -1
  134. data/lib/nokogiri/xml/entity_decl.rb +4 -2
  135. data/lib/nokogiri/xml/entity_reference.rb +20 -0
  136. data/lib/nokogiri/xml/namespace.rb +3 -0
  137. data/lib/nokogiri/xml/node/save_options.rb +8 -4
  138. data/lib/nokogiri/xml/node.rb +947 -502
  139. data/lib/nokogiri/xml/node_set.rb +168 -159
  140. data/lib/nokogiri/xml/notation.rb +13 -0
  141. data/lib/nokogiri/xml/parse_options.rb +40 -5
  142. data/lib/nokogiri/xml/pp/character_data.rb +9 -6
  143. data/lib/nokogiri/xml/pp/node.rb +25 -26
  144. data/lib/nokogiri/xml/pp.rb +4 -2
  145. data/lib/nokogiri/xml/processing_instruction.rb +3 -1
  146. data/lib/nokogiri/xml/reader.rb +23 -28
  147. data/lib/nokogiri/xml/relax_ng.rb +8 -2
  148. data/lib/nokogiri/xml/sax/document.rb +45 -49
  149. data/lib/nokogiri/xml/sax/parser.rb +43 -41
  150. data/lib/nokogiri/xml/sax/parser_context.rb +8 -3
  151. data/lib/nokogiri/xml/sax/push_parser.rb +6 -5
  152. data/lib/nokogiri/xml/sax.rb +6 -4
  153. data/lib/nokogiri/xml/schema.rb +19 -9
  154. data/lib/nokogiri/xml/searchable.rb +270 -0
  155. data/lib/nokogiri/xml/syntax_error.rb +25 -1
  156. data/lib/nokogiri/xml/text.rb +2 -0
  157. data/lib/nokogiri/xml/xpath/syntax_error.rb +4 -2
  158. data/lib/nokogiri/xml/xpath.rb +15 -4
  159. data/lib/nokogiri/xml/xpath_context.rb +3 -3
  160. data/lib/nokogiri/xml.rb +38 -36
  161. data/lib/nokogiri/xslt/stylesheet.rb +3 -1
  162. data/lib/nokogiri/xslt.rb +29 -20
  163. data/lib/nokogiri.rb +69 -69
  164. data/lib/xsd/xmlparser/nokogiri.rb +26 -24
  165. data/patches/libxml2/0001-Remove-script-macro-support.patch +40 -0
  166. data/patches/libxml2/0002-Update-entities-to-remove-handling-of-ssi.patch +44 -0
  167. data/patches/libxml2/0003-libxml2.la-is-in-top_builddir.patch +25 -0
  168. data/patches/libxml2/0004-use-glibc-strlen.patch +53 -0
  169. data/patches/libxml2/0005-avoid-isnan-isinf.patch +81 -0
  170. data/patches/libxml2/0006-update-automake-files-for-arm64.patch +3040 -0
  171. data/patches/libxml2/0008-htmlParseComment-handle-abruptly-closed-comments.patch +61 -0
  172. data/patches/libxml2/0009-allow-wildcard-namespaces.patch +77 -0
  173. data/patches/libxslt/0001-update-automake-files-for-arm64.patch +3037 -0
  174. data/ports/archives/libxml2-2.9.13.tar.xz +0 -0
  175. data/ports/archives/libxslt-1.1.35.tar.xz +0 -0
  176. metadata +278 -362
  177. data/.autotest +0 -26
  178. data/.gemtest +0 -0
  179. data/.travis.yml +0 -27
  180. data/CHANGELOG.ja.rdoc +0 -819
  181. data/CHANGELOG.rdoc +0 -819
  182. data/C_CODING_STYLE.rdoc +0 -33
  183. data/Manifest.txt +0 -315
  184. data/README.ja.rdoc +0 -106
  185. data/README.rdoc +0 -175
  186. data/ROADMAP.md +0 -90
  187. data/Rakefile +0 -246
  188. data/STANDARD_RESPONSES.md +0 -47
  189. data/Y_U_NO_GEMSPEC.md +0 -155
  190. data/build_all +0 -105
  191. data/ext/nokogiri/html_document.c +0 -170
  192. data/ext/nokogiri/html_document.h +0 -10
  193. data/ext/nokogiri/html_element_description.c +0 -279
  194. data/ext/nokogiri/html_element_description.h +0 -10
  195. data/ext/nokogiri/html_entity_lookup.c +0 -32
  196. data/ext/nokogiri/html_entity_lookup.h +0 -8
  197. data/ext/nokogiri/html_sax_parser_context.c +0 -116
  198. data/ext/nokogiri/html_sax_parser_context.h +0 -11
  199. data/ext/nokogiri/html_sax_push_parser.c +0 -87
  200. data/ext/nokogiri/html_sax_push_parser.h +0 -9
  201. data/ext/nokogiri/xml_attr.h +0 -9
  202. data/ext/nokogiri/xml_attribute_decl.h +0 -9
  203. data/ext/nokogiri/xml_cdata.h +0 -9
  204. data/ext/nokogiri/xml_comment.h +0 -9
  205. data/ext/nokogiri/xml_document.h +0 -23
  206. data/ext/nokogiri/xml_document_fragment.h +0 -10
  207. data/ext/nokogiri/xml_dtd.h +0 -10
  208. data/ext/nokogiri/xml_element_content.h +0 -10
  209. data/ext/nokogiri/xml_element_decl.h +0 -9
  210. data/ext/nokogiri/xml_encoding_handler.h +0 -8
  211. data/ext/nokogiri/xml_entity_decl.h +0 -10
  212. data/ext/nokogiri/xml_entity_reference.h +0 -9
  213. data/ext/nokogiri/xml_io.c +0 -56
  214. data/ext/nokogiri/xml_io.h +0 -11
  215. data/ext/nokogiri/xml_libxml2_hacks.c +0 -112
  216. data/ext/nokogiri/xml_libxml2_hacks.h +0 -12
  217. data/ext/nokogiri/xml_namespace.h +0 -13
  218. data/ext/nokogiri/xml_node.h +0 -13
  219. data/ext/nokogiri/xml_node_set.h +0 -14
  220. data/ext/nokogiri/xml_processing_instruction.h +0 -9
  221. data/ext/nokogiri/xml_reader.h +0 -10
  222. data/ext/nokogiri/xml_relax_ng.h +0 -9
  223. data/ext/nokogiri/xml_sax_parser.h +0 -39
  224. data/ext/nokogiri/xml_sax_parser_context.h +0 -10
  225. data/ext/nokogiri/xml_sax_push_parser.h +0 -9
  226. data/ext/nokogiri/xml_schema.h +0 -9
  227. data/ext/nokogiri/xml_syntax_error.h +0 -13
  228. data/ext/nokogiri/xml_text.h +0 -9
  229. data/ext/nokogiri/xml_xpath_context.h +0 -10
  230. data/ext/nokogiri/xslt_stylesheet.h +0 -14
  231. data/lib/nokogiri/html/document.rb +0 -254
  232. data/lib/nokogiri/html/document_fragment.rb +0 -41
  233. data/lib/nokogiri/html/element_description_defaults.rb +0 -671
  234. data/lib/nokogiri/html/sax/parser_context.rb +0 -16
  235. data/lib/nokogiri/html/sax/push_parser.rb +0 -16
  236. data/ports/archives/libxml2-2.8.0.tar.gz +0 -0
  237. data/ports/archives/libxslt-1.1.26.tar.gz +0 -0
  238. data/tasks/cross_compile.rb +0 -132
  239. data/tasks/nokogiri.org.rb +0 -24
  240. data/tasks/test.rb +0 -95
  241. data/test/css/test_nthiness.rb +0 -159
  242. data/test/css/test_parser.rb +0 -341
  243. data/test/css/test_tokenizer.rb +0 -198
  244. data/test/css/test_xpath_visitor.rb +0 -91
  245. data/test/decorators/test_slop.rb +0 -16
  246. data/test/files/2ch.html +0 -108
  247. data/test/files/address_book.rlx +0 -12
  248. data/test/files/address_book.xml +0 -10
  249. data/test/files/bar/bar.xsd +0 -4
  250. data/test/files/bogus.xml +0 -0
  251. data/test/files/dont_hurt_em_why.xml +0 -422
  252. data/test/files/encoding.html +0 -82
  253. data/test/files/encoding.xhtml +0 -84
  254. data/test/files/exslt.xml +0 -8
  255. data/test/files/exslt.xslt +0 -35
  256. data/test/files/foo/foo.xsd +0 -4
  257. data/test/files/metacharset.html +0 -10
  258. data/test/files/noencoding.html +0 -47
  259. data/test/files/po.xml +0 -32
  260. data/test/files/po.xsd +0 -66
  261. data/test/files/saml/saml20assertion_schema.xsd +0 -283
  262. data/test/files/saml/saml20protocol_schema.xsd +0 -302
  263. data/test/files/saml/xenc_schema.xsd +0 -146
  264. data/test/files/saml/xmldsig_schema.xsd +0 -318
  265. data/test/files/shift_jis.html +0 -10
  266. data/test/files/shift_jis.xml +0 -5
  267. data/test/files/snuggles.xml +0 -3
  268. data/test/files/staff.dtd +0 -10
  269. data/test/files/staff.xml +0 -59
  270. data/test/files/staff.xslt +0 -32
  271. data/test/files/test_document_url/bar.xml +0 -2
  272. data/test/files/test_document_url/document.dtd +0 -4
  273. data/test/files/test_document_url/document.xml +0 -6
  274. data/test/files/tlm.html +0 -850
  275. data/test/files/to_be_xincluded.xml +0 -2
  276. data/test/files/valid_bar.xml +0 -2
  277. data/test/files/xinclude.xml +0 -4
  278. data/test/helper.rb +0 -154
  279. data/test/html/sax/test_parser.rb +0 -141
  280. data/test/html/sax/test_parser_context.rb +0 -46
  281. data/test/html/test_builder.rb +0 -164
  282. data/test/html/test_document.rb +0 -552
  283. data/test/html/test_document_encoding.rb +0 -138
  284. data/test/html/test_document_fragment.rb +0 -261
  285. data/test/html/test_element_description.rb +0 -105
  286. data/test/html/test_named_characters.rb +0 -14
  287. data/test/html/test_node.rb +0 -196
  288. data/test/html/test_node_encoding.rb +0 -27
  289. data/test/namespaces/test_additional_namespaces_in_builder_doc.rb +0 -14
  290. data/test/namespaces/test_namespaces_in_builder_doc.rb +0 -75
  291. data/test/namespaces/test_namespaces_in_created_doc.rb +0 -75
  292. data/test/namespaces/test_namespaces_in_parsed_doc.rb +0 -66
  293. data/test/test_convert_xpath.rb +0 -135
  294. data/test/test_css_cache.rb +0 -45
  295. data/test/test_encoding_handler.rb +0 -46
  296. data/test/test_memory_leak.rb +0 -156
  297. data/test/test_nokogiri.rb +0 -132
  298. data/test/test_reader.rb +0 -555
  299. data/test/test_soap4r_sax.rb +0 -52
  300. data/test/test_xslt_transforms.rb +0 -254
  301. data/test/xml/node/test_save_options.rb +0 -28
  302. data/test/xml/node/test_subclass.rb +0 -44
  303. data/test/xml/sax/test_parser.rb +0 -366
  304. data/test/xml/sax/test_parser_context.rb +0 -106
  305. data/test/xml/sax/test_push_parser.rb +0 -157
  306. data/test/xml/test_attr.rb +0 -64
  307. data/test/xml/test_attribute_decl.rb +0 -86
  308. data/test/xml/test_builder.rb +0 -306
  309. data/test/xml/test_c14n.rb +0 -151
  310. data/test/xml/test_cdata.rb +0 -48
  311. data/test/xml/test_comment.rb +0 -29
  312. data/test/xml/test_document.rb +0 -828
  313. data/test/xml/test_document_encoding.rb +0 -28
  314. data/test/xml/test_document_fragment.rb +0 -223
  315. data/test/xml/test_dtd.rb +0 -103
  316. data/test/xml/test_dtd_encoding.rb +0 -33
  317. data/test/xml/test_element_content.rb +0 -56
  318. data/test/xml/test_element_decl.rb +0 -73
  319. data/test/xml/test_entity_decl.rb +0 -122
  320. data/test/xml/test_entity_reference.rb +0 -245
  321. data/test/xml/test_namespace.rb +0 -95
  322. data/test/xml/test_node.rb +0 -1137
  323. data/test/xml/test_node_attributes.rb +0 -96
  324. data/test/xml/test_node_encoding.rb +0 -107
  325. data/test/xml/test_node_inheritance.rb +0 -32
  326. data/test/xml/test_node_reparenting.rb +0 -374
  327. data/test/xml/test_node_set.rb +0 -755
  328. data/test/xml/test_parse_options.rb +0 -64
  329. data/test/xml/test_processing_instruction.rb +0 -30
  330. data/test/xml/test_reader_encoding.rb +0 -142
  331. data/test/xml/test_relax_ng.rb +0 -60
  332. data/test/xml/test_schema.rb +0 -103
  333. data/test/xml/test_syntax_error.rb +0 -12
  334. data/test/xml/test_text.rb +0 -45
  335. data/test/xml/test_unparented_node.rb +0 -422
  336. data/test/xml/test_xinclude.rb +0 -83
  337. data/test/xml/test_xpath.rb +0 -295
  338. data/test/xslt/test_custom_functions.rb +0 -133
  339. data/test/xslt/test_exception_handling.rb +0 -37
  340. data/test_all +0 -81
@@ -1,245 +0,0 @@
1
- require "helper"
2
-
3
- module Nokogiri
4
- module XML
5
- class TestEntityReference < Nokogiri::TestCase
6
- def setup
7
- super
8
- @xml = Nokogiri::XML(File.open(XML_FILE), XML_FILE)
9
- end
10
-
11
- def test_new
12
- assert ref = EntityReference.new(@xml, 'ent4')
13
- assert_instance_of EntityReference, ref
14
- end
15
-
16
- def test_many_references
17
- 100.times { EntityReference.new(@xml, 'foo') }
18
- end
19
-
20
- def test_newline_node
21
- # issue 719
22
- xml = <<EOF
23
- <?xml version="1.0" ?>
24
- <item></item>
25
- EOF
26
- doc = Nokogiri::XML xml
27
- lf_node = Nokogiri::XML::EntityReference.new(doc, "#xa")
28
- doc.xpath('/item').first.add_child(lf_node)
29
- assert_match /&#xa;/, doc.to_xml
30
- end
31
- end
32
-
33
- module Common
34
- PATH = 'test/files/test_document_url/'
35
-
36
- attr_accessor :path, :parser
37
-
38
- def xml_document
39
- File.join path, 'document.xml'
40
- end
41
-
42
- def self.included base
43
- def base.test_relative_and_absolute_path method_name, &block
44
- test_relative_path method_name, &block
45
- test_absolute_path method_name, &block
46
- end
47
-
48
- def base.test_absolute_path method_name, &block
49
- define_method "#{method_name}_with_absolute_path" do
50
- self.path = "#{File.expand_path PATH}/"
51
- instance_eval(&block)
52
- end
53
- end
54
-
55
- def base.test_relative_path method_name, &block
56
- define_method method_name do
57
- self.path = PATH
58
- instance_eval(&block)
59
- end
60
- end
61
- end
62
- end
63
-
64
- class TestDOMEntityReference < Nokogiri::TestCase
65
- include Common
66
-
67
- def setup
68
- super
69
- @parser = Nokogiri::XML::Document
70
- end
71
-
72
- test_relative_and_absolute_path :test_dom_entity_reference_with_dtdloda do
73
- # Make sure that we can parse entity references and include them in the document
74
- html = File.read xml_document
75
- doc = @parser.parse html, path do |cfg|
76
- cfg.default_xml
77
- cfg.dtdload
78
- cfg.noent
79
- end
80
- assert_equal [], doc.errors
81
- assert_equal "foobar", doc.xpath('//blah').text
82
- end
83
-
84
- test_relative_and_absolute_path :test_dom_entity_reference_with_dtdvalid do
85
- # Make sure that we can parse entity references and include them in the document
86
- html = File.read xml_document
87
- doc = @parser.parse html, path do |cfg|
88
- cfg.default_xml
89
- cfg.dtdvalid
90
- cfg.noent
91
- end
92
- assert_equal [], doc.errors
93
- assert_equal "foobar", doc.xpath('//blah').text
94
- end
95
-
96
- test_absolute_path :test_dom_dtd_loading_with_absolute_path do
97
- # Make sure that we can parse entity references and include them in the document
98
- html = %Q[<?xml version="1.0" encoding="UTF-8" ?>
99
- <!DOCTYPE document SYSTEM "#{path}/document.dtd">
100
- <document>
101
- <body>&bar;</body>
102
- </document>
103
- ]
104
- doc = @parser.parse html, xml_document do |cfg|
105
- cfg.default_xml
106
- cfg.dtdvalid
107
- cfg.noent
108
- end
109
- assert_equal [], doc.errors
110
- assert_equal "foobar", doc.xpath('//blah').text
111
- end
112
-
113
- test_relative_and_absolute_path :test_dom_entity_reference_with_io do
114
- # Make sure that we can parse entity references and include them in the document
115
- html = File.open xml_document
116
- doc = @parser.parse html, nil do |cfg|
117
- cfg.default_xml
118
- cfg.dtdload
119
- cfg.noent
120
- end
121
- assert_equal [], doc.errors
122
- assert_equal "foobar", doc.xpath('//blah').text
123
- end
124
-
125
- test_relative_and_absolute_path :test_dom_entity_reference_without_noent do
126
- # Make sure that we don't include entity references unless NOENT is set to true
127
- html = File.read xml_document
128
- doc = @parser.parse html, path do |cfg|
129
- cfg.default_xml
130
- cfg.dtdload
131
- end
132
- assert_equal [], doc.errors
133
- assert_kind_of Nokogiri::XML::EntityReference, doc.xpath('//body').first.children.first
134
- end
135
-
136
- test_relative_and_absolute_path :test_dom_entity_reference_without_dtdload do
137
- # Make sure that we don't include entity references unless NOENT is set to true
138
- html = File.read xml_document
139
- doc = @parser.parse html, path do |cfg|
140
- cfg.default_xml
141
- end
142
- assert_kind_of Nokogiri::XML::EntityReference, doc.xpath('//body').first.children.first
143
- if Nokogiri.uses_libxml?
144
- assert_equal ["Entity 'bar' not defined"], doc.errors.map(&:to_s)
145
- end
146
- end
147
-
148
- test_relative_and_absolute_path :test_document_dtd_loading_with_nonet do
149
- # Make sure that we don't include remote entities unless NOENT is set to true
150
- html = %Q[<?xml version="1.0" encoding="UTF-8" ?>
151
- <!DOCTYPE document SYSTEM "http://foo.bar.com/">
152
- <document>
153
- <body>&bar;</body>
154
- </document>
155
- ]
156
- doc = @parser.parse html, path do |cfg|
157
- cfg.default_xml
158
- cfg.dtdload
159
- end
160
- assert_kind_of Nokogiri::XML::EntityReference, doc.xpath('//body').first.children.first
161
- if Nokogiri.uses_libxml?
162
- assert_equal ["Attempt to load network entity http://foo.bar.com/", "Entity 'bar' not defined"], doc.errors.map(&:to_s)
163
- else
164
- assert_equal ["Attempt to load network entity http://foo.bar.com/"], doc.errors.map(&:to_s)
165
- end
166
- end
167
- # TODO: can we retreive a resource pointing to localhost when NONET is set to true ?
168
- end
169
-
170
- class TestSaxEntityReference < Nokogiri::SAX::TestCase
171
- include Common
172
-
173
- def setup
174
- super
175
- @parser = XML::SAX::Parser.new(Doc.new) do |ctx|
176
- ctx.replace_entities = true
177
- end
178
- end
179
-
180
- test_relative_and_absolute_path :test_sax_entity_reference do
181
- # Make sure that we can parse entity references and include them in the document
182
- html = File.read xml_document
183
- @parser.parse html
184
- refute_nil @parser.document.errors
185
- assert_equal ["Entity 'bar' not defined"], @parser.document.errors.map(&:to_s).map(&:strip)
186
- end
187
-
188
- test_relative_and_absolute_path :test_more_sax_entity_reference do
189
- # Make sure that we don't include entity references unless NOENT is set to true
190
- html = %Q[<?xml version="1.0" encoding="UTF-8" ?>
191
- <!DOCTYPE document SYSTEM "http://foo.bar.com/">
192
- <document>
193
- <body>&bar;</body>
194
- </document>
195
- ]
196
- @parser.parse html
197
- refute_nil @parser.document.errors
198
- assert_equal ["Entity 'bar' not defined"], @parser.document.errors.map(&:to_s).map(&:strip)
199
- end
200
- end
201
-
202
- class TestReaderEntityReference < Nokogiri::TestCase
203
- include Common
204
-
205
- def setup
206
- super
207
- end
208
-
209
- test_relative_and_absolute_path :test_reader_entity_reference do
210
- # Make sure that we can parse entity references and include them in the document
211
- html = File.read xml_document
212
- reader = Nokogiri::XML::Reader html, path do |cfg|
213
- cfg.default_xml
214
- cfg.dtdload
215
- cfg.noent
216
- end
217
- nodes = []
218
- reader.each { |n| nodes << n.value }
219
- assert_equal ['foobar'], nodes.compact.map(&:strip).reject(&:empty?)
220
- end
221
-
222
- test_relative_and_absolute_path :test_reader_entity_reference_without_noent do
223
- # Make sure that we can parse entity references and include them in the document
224
- html = File.read xml_document
225
- reader = Nokogiri::XML::Reader html, path do |cfg|
226
- cfg.default_xml
227
- cfg.dtdload
228
- end
229
- nodes = []
230
- reader.each { |n| nodes << n.value }
231
- assert_equal [], nodes.compact.map(&:strip).reject(&:empty?)
232
- end
233
-
234
- test_relative_and_absolute_path :test_reader_entity_reference_without_dtdload do
235
- html = File.read xml_document
236
- assert_raises(Nokogiri::XML::SyntaxError) do
237
- reader = Nokogiri::XML::Reader html, path do |cfg|
238
- cfg.default_xml
239
- end
240
- reader.each { |n| n }
241
- end
242
- end
243
- end
244
- end
245
- end
@@ -1,95 +0,0 @@
1
- require "helper"
2
-
3
- module Nokogiri
4
- module XML
5
- class TestNamespace < Nokogiri::TestCase
6
- def setup
7
- super
8
- @xml = Nokogiri::XML <<-eoxml
9
- <root xmlns="http://tenderlovemaking.com/" xmlns:foo="bar">
10
- <awesome/>
11
- </root>
12
- eoxml
13
- end
14
-
15
- if Nokogiri.uses_libxml?
16
- def test_namespace_is_in_node_cache
17
- node = @xml.root.namespace
18
- assert @xml.instance_variable_get(:@node_cache).include?(node)
19
- end
20
- end
21
-
22
- def test_built_nodes_keep_namespace_decls
23
- doc = Document.new
24
- e = Node.new 'element', doc
25
- c = Node.new 'child', doc
26
- c.default_namespace = 'woop:de:doo'
27
-
28
- assert c.namespace, 'has a namespace'
29
- e.add_child c
30
- assert c.namespace, 'has a namespace'
31
-
32
- doc.add_child e
33
- assert c.namespace, 'has a namespace'
34
- end
35
-
36
- def test_inspect
37
- ns = @xml.root.namespace
38
- assert_equal "#<#{ns.class.name}:#{sprintf("0x%x", ns.object_id)} href=#{ns.href.inspect}>", ns.inspect
39
- end
40
-
41
- def test_namespace_node_prefix
42
- namespaces = @xml.root.namespace_definitions
43
- assert_equal [nil, 'foo'], namespaces.map { |x| x.prefix }
44
- end
45
-
46
- def test_namespace_node_href
47
- namespaces = @xml.root.namespace_definitions
48
- assert_equal [
49
- 'http://tenderlovemaking.com/',
50
- 'bar'
51
- ], namespaces.map { |x| x.href }
52
- end
53
-
54
- def test_equality
55
- namespaces = @xml.root.namespace_definitions
56
- assert_equal namespaces, @xml.root.namespace_definitions
57
- end
58
-
59
- def test_add_definition
60
- @xml.root.add_namespace_definition('baz', 'bar')
61
- assert_equal 3, @xml.root.namespace_definitions.length
62
- end
63
-
64
- def test_add_definition_return
65
- ns = @xml.root.add_namespace_definition('baz', 'bar')
66
- assert_equal 'baz', ns.prefix
67
- end
68
-
69
- def test_remove_entity_namespace
70
- s = %q{<?xml version='1.0'?><!DOCTYPE schema PUBLIC "-//W3C//DTD XMLSCHEMA 200102//EN" "XMLSchema.dtd" [<!ENTITY % p ''>]>}
71
- Nokogiri::XML(s).remove_namespaces!
72
- end
73
-
74
- def test_maintain_element_namespaces
75
- doc = Document.new
76
- subject = Nokogiri::XML::Node.new 'foo', doc
77
- subject << '<foobar xmlns="barfoo"/>'
78
- child = subject.children.first
79
- assert_equal 'foobar', child.name
80
- assert_equal 'barfoo', child.namespace.href
81
- assert_empty child.attributes
82
- end
83
-
84
- def test_maintain_element_namespaces_in_urn
85
- doc = Document.new
86
- subject = Nokogiri::XML::Node.new 'foo', doc
87
- subject << '<foobar xmlns="urn:xmpp:foospec:barfoo"/>'
88
- child = subject.children.first
89
- assert_equal 'foobar', child.name
90
- assert_equal 'urn:xmpp:foospec:barfoo', child.namespace.href
91
- assert_empty child.attributes
92
- end
93
- end
94
- end
95
- end