nokogiri 1.8.5 → 1.9.1

Sign up to get free protection for your applications and to get access to all the features.

Potentially problematic release.


This version of nokogiri might be problematic. Click here for more details.

Files changed (147) hide show
  1. checksums.yaml +4 -4
  2. data/README.md +0 -1
  3. data/ext/nokogiri/extconf.rb +10 -6
  4. data/ext/nokogiri/xml_attr.c +26 -21
  5. data/ext/nokogiri/xml_document.c +4 -1
  6. data/ext/nokogiri/xml_namespace.c +3 -3
  7. data/ext/nokogiri/xml_namespace.h +1 -2
  8. data/ext/nokogiri/xml_node.c +55 -15
  9. data/lib/nokogiri/css/parser.rb +61 -61
  10. data/lib/nokogiri/version.rb +1 -1
  11. data/lib/nokogiri/xml/document_fragment.rb +11 -0
  12. data/lib/nokogiri/xml/node.rb +12 -0
  13. data/lib/nokogiri/xml/node_set.rb +4 -8
  14. metadata +17 -153
  15. data/.autotest +0 -22
  16. data/.cross_rubies +0 -8
  17. data/.editorconfig +0 -17
  18. data/.gemtest +0 -0
  19. data/.travis.yml +0 -63
  20. data/CHANGELOG.md +0 -1368
  21. data/CONTRIBUTING.md +0 -42
  22. data/C_CODING_STYLE.rdoc +0 -33
  23. data/Gemfile +0 -23
  24. data/Gemfile-libxml-ruby +0 -3
  25. data/Manifest.txt +0 -370
  26. data/ROADMAP.md +0 -111
  27. data/Rakefile +0 -348
  28. data/SECURITY.md +0 -19
  29. data/STANDARD_RESPONSES.md +0 -47
  30. data/Y_U_NO_GEMSPEC.md +0 -155
  31. data/appveyor.yml +0 -29
  32. data/build_all +0 -44
  33. data/patches/sort-patches-by-date +0 -25
  34. data/suppressions/README.txt +0 -1
  35. data/suppressions/nokogiri_ruby-2.supp +0 -10
  36. data/tasks/test.rb +0 -100
  37. data/test/css/test_nthiness.rb +0 -226
  38. data/test/css/test_parser.rb +0 -386
  39. data/test/css/test_tokenizer.rb +0 -215
  40. data/test/css/test_xpath_visitor.rb +0 -96
  41. data/test/decorators/test_slop.rb +0 -23
  42. data/test/files/2ch.html +0 -108
  43. data/test/files/GH_1042.html +0 -18
  44. data/test/files/address_book.rlx +0 -12
  45. data/test/files/address_book.xml +0 -10
  46. data/test/files/atom.xml +0 -344
  47. data/test/files/bar/bar.xsd +0 -4
  48. data/test/files/bogus.xml +0 -0
  49. data/test/files/dont_hurt_em_why.xml +0 -422
  50. data/test/files/encoding.html +0 -82
  51. data/test/files/encoding.xhtml +0 -84
  52. data/test/files/exslt.xml +0 -8
  53. data/test/files/exslt.xslt +0 -35
  54. data/test/files/foo/foo.xsd +0 -4
  55. data/test/files/metacharset.html +0 -10
  56. data/test/files/namespace_pressure_test.xml +0 -1684
  57. data/test/files/noencoding.html +0 -47
  58. data/test/files/po.xml +0 -32
  59. data/test/files/po.xsd +0 -66
  60. data/test/files/saml/saml20assertion_schema.xsd +0 -283
  61. data/test/files/saml/saml20protocol_schema.xsd +0 -302
  62. data/test/files/saml/xenc_schema.xsd +0 -146
  63. data/test/files/saml/xmldsig_schema.xsd +0 -318
  64. data/test/files/shift_jis.html +0 -10
  65. data/test/files/shift_jis.xml +0 -5
  66. data/test/files/shift_jis_no_charset.html +0 -9
  67. data/test/files/slow-xpath.xml +0 -25509
  68. data/test/files/snuggles.xml +0 -3
  69. data/test/files/staff.dtd +0 -10
  70. data/test/files/staff.xml +0 -59
  71. data/test/files/staff.xslt +0 -32
  72. data/test/files/test_document_url/bar.xml +0 -2
  73. data/test/files/test_document_url/document.dtd +0 -4
  74. data/test/files/test_document_url/document.xml +0 -6
  75. data/test/files/tlm.html +0 -851
  76. data/test/files/to_be_xincluded.xml +0 -2
  77. data/test/files/valid_bar.xml +0 -2
  78. data/test/files/xinclude.xml +0 -4
  79. data/test/helper.rb +0 -271
  80. data/test/html/sax/test_parser.rb +0 -168
  81. data/test/html/sax/test_parser_context.rb +0 -46
  82. data/test/html/sax/test_parser_text.rb +0 -163
  83. data/test/html/sax/test_push_parser.rb +0 -87
  84. data/test/html/test_attributes.rb +0 -85
  85. data/test/html/test_builder.rb +0 -164
  86. data/test/html/test_document.rb +0 -712
  87. data/test/html/test_document_encoding.rb +0 -143
  88. data/test/html/test_document_fragment.rb +0 -310
  89. data/test/html/test_element_description.rb +0 -105
  90. data/test/html/test_named_characters.rb +0 -14
  91. data/test/html/test_node.rb +0 -212
  92. data/test/html/test_node_encoding.rb +0 -91
  93. data/test/namespaces/test_additional_namespaces_in_builder_doc.rb +0 -14
  94. data/test/namespaces/test_namespaces_aliased_default.rb +0 -24
  95. data/test/namespaces/test_namespaces_in_builder_doc.rb +0 -75
  96. data/test/namespaces/test_namespaces_in_cloned_doc.rb +0 -31
  97. data/test/namespaces/test_namespaces_in_created_doc.rb +0 -75
  98. data/test/namespaces/test_namespaces_in_parsed_doc.rb +0 -80
  99. data/test/namespaces/test_namespaces_preservation.rb +0 -31
  100. data/test/test_convert_xpath.rb +0 -135
  101. data/test/test_css_cache.rb +0 -47
  102. data/test/test_encoding_handler.rb +0 -48
  103. data/test/test_memory_leak.rb +0 -156
  104. data/test/test_nokogiri.rb +0 -138
  105. data/test/test_soap4r_sax.rb +0 -52
  106. data/test/test_xslt_transforms.rb +0 -314
  107. data/test/xml/node/test_save_options.rb +0 -28
  108. data/test/xml/node/test_subclass.rb +0 -44
  109. data/test/xml/sax/test_parser.rb +0 -402
  110. data/test/xml/sax/test_parser_context.rb +0 -115
  111. data/test/xml/sax/test_parser_text.rb +0 -202
  112. data/test/xml/sax/test_push_parser.rb +0 -265
  113. data/test/xml/test_attr.rb +0 -74
  114. data/test/xml/test_attribute_decl.rb +0 -86
  115. data/test/xml/test_builder.rb +0 -341
  116. data/test/xml/test_c14n.rb +0 -180
  117. data/test/xml/test_cdata.rb +0 -54
  118. data/test/xml/test_comment.rb +0 -40
  119. data/test/xml/test_document.rb +0 -982
  120. data/test/xml/test_document_encoding.rb +0 -31
  121. data/test/xml/test_document_fragment.rb +0 -298
  122. data/test/xml/test_dtd.rb +0 -187
  123. data/test/xml/test_dtd_encoding.rb +0 -31
  124. data/test/xml/test_element_content.rb +0 -56
  125. data/test/xml/test_element_decl.rb +0 -73
  126. data/test/xml/test_entity_decl.rb +0 -122
  127. data/test/xml/test_entity_reference.rb +0 -262
  128. data/test/xml/test_namespace.rb +0 -96
  129. data/test/xml/test_node.rb +0 -1325
  130. data/test/xml/test_node_attributes.rb +0 -115
  131. data/test/xml/test_node_encoding.rb +0 -75
  132. data/test/xml/test_node_inheritance.rb +0 -32
  133. data/test/xml/test_node_reparenting.rb +0 -592
  134. data/test/xml/test_node_set.rb +0 -809
  135. data/test/xml/test_parse_options.rb +0 -64
  136. data/test/xml/test_processing_instruction.rb +0 -30
  137. data/test/xml/test_reader.rb +0 -620
  138. data/test/xml/test_reader_encoding.rb +0 -134
  139. data/test/xml/test_relax_ng.rb +0 -60
  140. data/test/xml/test_schema.rb +0 -142
  141. data/test/xml/test_syntax_error.rb +0 -36
  142. data/test/xml/test_text.rb +0 -60
  143. data/test/xml/test_unparented_node.rb +0 -483
  144. data/test/xml/test_xinclude.rb +0 -83
  145. data/test/xml/test_xpath.rb +0 -470
  146. data/test/xslt/test_custom_functions.rb +0 -133
  147. data/test/xslt/test_exception_handling.rb +0 -37
@@ -1,87 +0,0 @@
1
- # -*- coding: utf-8 -*-
2
-
3
- require "helper"
4
-
5
- module Nokogiri
6
- module HTML
7
- module SAX
8
- class TestPushParser < Nokogiri::SAX::TestCase
9
- def setup
10
- super
11
- @parser = HTML::SAX::PushParser.new(Doc.new)
12
- end
13
-
14
- def test_end_document_called
15
- @parser.<<(<<-eoxml)
16
- <p id="asdfasdf">
17
- <!-- This is a comment -->
18
- Paragraph 1
19
- </p>
20
- eoxml
21
- assert ! @parser.document.end_document_called
22
- @parser.finish
23
- assert @parser.document.end_document_called
24
- end
25
-
26
- def test_start_element
27
- @parser.<<(<<-eoxml)
28
- <!DOCTYPE html PUBLIC "-//W3C//DTD HTML 4.0 Transitional//EN" "http://www.w3.org/TR/REC-html40/loose.dtd">
29
- <html><head><body><p id="asdfasdf">
30
- eoxml
31
-
32
- assert_equal [["html", []], ["head", []], ["body", []], ["p", [["id", "asdfasdf"]]]],
33
- @parser.document.start_elements
34
-
35
- @parser.<<(<<-eoxml)
36
- <!-- This is a comment -->
37
- Paragraph 1
38
- </p></body></html>
39
- eoxml
40
- assert_equal [' This is a comment '], @parser.document.comments
41
- @parser.finish
42
- end
43
-
44
-
45
- def test_chevron_partial_html
46
- @parser.<<(<<-eoxml)
47
- <p id="asdfasdf">
48
- eoxml
49
-
50
- @parser.<<(<<-eoxml)
51
- <!-- This is a comment -->
52
- Paragraph 1
53
- </p>
54
- eoxml
55
- assert_equal [' This is a comment '], @parser.document.comments
56
- @parser.finish
57
- end
58
-
59
- def test_chevron
60
- @parser.<<(<<-eoxml)
61
- <p id="asdfasdf">
62
- <!-- This is a comment -->
63
- Paragraph 1
64
- </p>
65
- eoxml
66
- @parser.finish
67
- assert_equal [' This is a comment '], @parser.document.comments
68
- end
69
-
70
- def test_default_options
71
- assert_equal 0, @parser.options
72
- end
73
-
74
- def test_broken_encoding
75
- skip("ultra hard to fix for pure Java version") if Nokogiri.jruby?
76
- @parser.options |= XML::ParseOptions::RECOVER
77
- # This is ISO_8859-1:
78
- @parser.<< "<?xml version='1.0' encoding='UTF-8'?><r>Gau\337</r>"
79
- @parser.finish
80
- assert(@parser.document.errors.size >= 1)
81
- assert_equal "Gau\337", @parser.document.data.join
82
- assert_equal [["r"], ["body"], ["html"]], @parser.document.end_elements
83
- end
84
- end
85
- end
86
- end
87
- end
@@ -1,85 +0,0 @@
1
- require "helper"
2
-
3
- module Nokogiri
4
- module HTML
5
- class TestAttr < Nokogiri::TestCase
6
- unless Nokogiri::VersionInfo.instance.libxml2? && Nokogiri::VersionInfo.instance.libxml2_using_system?
7
- #
8
- # libxml2 >= 2.9.2 fails to escape comments within some attributes. It
9
- # wants to ensure these comments can be treated as "server-side includes",
10
- # but as a result fails to ensure that serialization is well-formed,
11
- # resulting in an opportunity for XSS injection of code into a final
12
- # re-parsed document (presumably in a browser).
13
- #
14
- # the offending commit is:
15
- #
16
- # https://github.com/GNOME/libxml2/commit/960f0e2
17
- #
18
- # we'll test this by parsing the HTML, serializing it, then
19
- # re-parsing it to ensure there isn't any ambiguity in the output
20
- # that might allow code injection into a browser consuming
21
- # "sanitized" output.
22
- #
23
- # complaints have been made upstream about this behavior, notably at
24
- #
25
- # https://bugzilla.gnome.org/show_bug.cgi?id=769760
26
- #
27
- # and multiple CVEs have been declared and fixed in downstream
28
- # libraries as a result, a list is being kept up to date here:
29
- #
30
- # https://github.com/flavorjones/loofah/issues/144
31
- #
32
- [
33
- #
34
- # these tags and attributes are determined by the code at:
35
- #
36
- # https://git.gnome.org/browse/libxml2/tree/HTMLtree.c?h=v2.9.2#n714
37
- #
38
- {tag: "a", attr: "href"},
39
- {tag: "div", attr: "href"},
40
- {tag: "a", attr: "action"},
41
- {tag: "div", attr: "action"},
42
- {tag: "a", attr: "src"},
43
- {tag: "div", attr: "src"},
44
- {tag: "a", attr: "name"},
45
- #
46
- # note that div+name is _not_ affected by the libxml2 issue.
47
- # but we test it anyway to ensure our logic isn't modifying
48
- # attributes that don't need modifying.
49
- #
50
- {tag: "div", attr: "name", unescaped: true},
51
- ].each do |config|
52
-
53
- define_method "test_uri_escaping_of_#{config[:attr]}_attr_in_#{config[:tag]}_tag" do
54
- html = %{<#{config[:tag]} #{config[:attr]}='examp<!--" unsafeattr=unsafevalue()>-->le.com'>test</#{config[:tag]}>}
55
-
56
- reparsed = HTML.fragment(HTML.fragment(html).to_html)
57
- attributes = reparsed.at_css(config[:tag]).attribute_nodes
58
-
59
- assert_equal [config[:attr]], attributes.collect(&:name)
60
- if Nokogiri::VersionInfo.instance.libxml2?
61
- if config[:unescaped]
62
- #
63
- # this attribute was emitted wrapped in single-quotes, so a double quote is A-OK.
64
- # assert that this attribute's serialization is unaffected.
65
- #
66
- assert_equal %{examp<!--" unsafeattr=unsafevalue()>-->le.com}, attributes.first.value
67
- else
68
- #
69
- # let's match the behavior in libxml < 2.9.2.
70
- # test that this attribute's serialization is well-formed and sanitized.
71
- #
72
- assert_equal %{examp<!--%22%20unsafeattr=unsafevalue()>-->le.com}, attributes.first.value
73
- end
74
- else
75
- #
76
- # yay for consistency in javaland. move along, nothing to see here.
77
- #
78
- assert_equal %{examp<!--%22 unsafeattr=unsafevalue()>-->le.com}, attributes.first.value
79
- end
80
- end
81
- end
82
- end
83
- end
84
- end
85
- end
@@ -1,164 +0,0 @@
1
- require "helper"
2
-
3
- module Nokogiri
4
- module HTML
5
- class TestBuilder < Nokogiri::TestCase
6
- def test_top_level_function_builds
7
- foo = nil
8
- Nokogiri() { |xml| foo = xml }
9
- assert_instance_of Nokogiri::HTML::Builder, foo
10
- end
11
-
12
- def test_builder_with_explicit_tags
13
- html_doc = Nokogiri::HTML::Builder.new {
14
- div.slide(:class => 'another_class') {
15
- node = Nokogiri::XML::Node.new("id", doc)
16
- node.content = "hello"
17
- insert(node)
18
- }
19
- }.doc
20
- assert_equal 1, html_doc.css('div.slide > id').length
21
- assert_equal 'hello', html_doc.at('div.slide > id').content
22
- end
23
-
24
- def test_hash_as_attributes_for_attribute_method
25
- html = Nokogiri::HTML::Builder.new { ||
26
- div.slide(:class => 'another_class') {
27
- span 'Slide 1'
28
- }
29
- }.to_html
30
- assert_match 'class="slide another_class"', html
31
- end
32
-
33
- def test_hash_as_attributes
34
- builder = Nokogiri::HTML::Builder.new do
35
- div(:id => 'awesome') {
36
- h1 "america"
37
- }
38
- end
39
- assert_equal('<div id="awesome"><h1>america</h1></div>',
40
- builder.doc.root.to_html.gsub(/\n/, '').gsub(/>\s*</, '><'))
41
- end
42
-
43
- def test_href_with_attributes
44
- uri = 'http://tenderlovemaking.com/'
45
- built = Nokogiri::XML::Builder.new {
46
- div {
47
- a('King Khan & The Shrines', :href => uri)
48
- }
49
- }
50
- assert_equal 'http://tenderlovemaking.com/',
51
- built.doc.at('a')[:href]
52
- end
53
-
54
- def test_tag_nesting
55
- builder = Nokogiri::HTML::Builder.new do
56
- body {
57
- span.left ''
58
- span.middle {
59
- div.icon ''
60
- }
61
- span.right ''
62
- }
63
- end
64
- assert node = builder.doc.css('span.right').first
65
- assert_equal 'middle', node.previous_sibling['class']
66
- end
67
-
68
- def test_has_ampersand
69
- builder = Nokogiri::HTML::Builder.new do
70
- div.rad.thing! {
71
- text "<awe&some>"
72
- b "hello & world"
73
- }
74
- end
75
- assert_equal(
76
- '<div class="rad" id="thing">&lt;awe&amp;some&gt;<b>hello &amp; world</b></div>',
77
- builder.doc.root.to_html.gsub(/\n/, ''))
78
- end
79
-
80
- def test_multi_tags
81
- builder = Nokogiri::HTML::Builder.new do
82
- div.rad.thing! {
83
- text "<awesome>"
84
- b "hello"
85
- }
86
- end
87
- assert_equal(
88
- '<div class="rad" id="thing">&lt;awesome&gt;<b>hello</b></div>',
89
- builder.doc.root.to_html.gsub(/\n/, ''))
90
- end
91
-
92
- def test_attributes_plus_block
93
- builder = Nokogiri::HTML::Builder.new do
94
- div.rad.thing! {
95
- text "<awesome>"
96
- }
97
- end
98
- assert_equal('<div class="rad" id="thing">&lt;awesome&gt;</div>',
99
- builder.doc.root.to_html.chomp)
100
- end
101
-
102
- def test_builder_adds_attributes
103
- builder = Nokogiri::HTML::Builder.new do
104
- div.rad.thing! "tender div"
105
- end
106
- assert_equal('<div class="rad" id="thing">tender div</div>',
107
- builder.doc.root.to_html.chomp)
108
- end
109
-
110
- def test_bold_tag
111
- builder = Nokogiri::HTML::Builder.new do
112
- b "bold tag"
113
- end
114
- assert_equal('<b>bold tag</b>', builder.doc.root.to_html.chomp)
115
- end
116
-
117
- def test_html_then_body_tag
118
- builder = Nokogiri::HTML::Builder.new do
119
- html {
120
- body {
121
- b "bold tag"
122
- }
123
- }
124
- end
125
- assert_equal('<html><body><b>bold tag</b></body></html>',
126
- builder.doc.root.to_html.chomp.gsub(/>\s*</, '><'))
127
- end
128
-
129
- def test_instance_eval_with_delegation_to_block_context
130
- class << self
131
- def foo
132
- "foo!"
133
- end
134
- end
135
-
136
- builder = Nokogiri::HTML::Builder.new { text foo }
137
- assert builder.to_html.include?("foo!")
138
- end
139
-
140
- def test_builder_with_param
141
- doc = Nokogiri::HTML::Builder.new { |html|
142
- html.body {
143
- html.p "hello world"
144
- }
145
- }.doc
146
-
147
- assert node = doc.xpath('//body/p').first
148
- assert_equal 'hello world', node.content
149
- end
150
-
151
- def test_builder_with_id
152
- text = "hello world"
153
- doc = Nokogiri::HTML::Builder.new { |html|
154
- html.body {
155
- html.id_ text
156
- }
157
- }.doc
158
-
159
- assert node = doc.xpath('//body/id').first
160
- assert_equal text, node.content
161
- end
162
- end
163
- end
164
- end