nokogiri 1.11.0.rc2-x86-linux → 1.11.2-x86-linux
Sign up to get free protection for your applications and to get access to all the features.
Potentially problematic release.
This version of nokogiri might be problematic. Click here for more details.
- checksums.yaml +4 -4
- data/Gemfile +3 -0
- data/LICENSE-DEPENDENCIES.md +1015 -947
- data/LICENSE.md +1 -1
- data/README.md +171 -94
- data/ext/nokogiri/depend +37 -358
- data/ext/nokogiri/extconf.rb +581 -374
- data/ext/nokogiri/html_document.c +78 -82
- data/ext/nokogiri/html_element_description.c +84 -71
- data/ext/nokogiri/html_entity_lookup.c +21 -16
- data/ext/nokogiri/html_sax_parser_context.c +69 -66
- data/ext/nokogiri/html_sax_push_parser.c +42 -34
- data/ext/nokogiri/include/libexslt/exslt.h +102 -0
- data/ext/nokogiri/include/libexslt/exsltconfig.h +70 -0
- data/ext/nokogiri/include/libexslt/exsltexports.h +140 -0
- data/ext/nokogiri/include/libxml2/libxml/DOCBparser.h +96 -0
- data/ext/nokogiri/include/libxml2/libxml/HTMLparser.h +306 -0
- data/ext/nokogiri/include/libxml2/libxml/HTMLtree.h +147 -0
- data/ext/nokogiri/include/libxml2/libxml/SAX.h +173 -0
- data/ext/nokogiri/include/libxml2/libxml/SAX2.h +178 -0
- data/ext/nokogiri/include/libxml2/libxml/c14n.h +126 -0
- data/ext/nokogiri/include/libxml2/libxml/catalog.h +182 -0
- data/ext/nokogiri/include/libxml2/libxml/chvalid.h +230 -0
- data/ext/nokogiri/include/libxml2/libxml/debugXML.h +217 -0
- data/ext/nokogiri/include/libxml2/libxml/dict.h +79 -0
- data/ext/nokogiri/include/libxml2/libxml/encoding.h +245 -0
- data/ext/nokogiri/include/libxml2/libxml/entities.h +151 -0
- data/ext/nokogiri/include/libxml2/libxml/globals.h +508 -0
- data/ext/nokogiri/include/libxml2/libxml/hash.h +236 -0
- data/ext/nokogiri/include/libxml2/libxml/list.h +137 -0
- data/ext/nokogiri/include/libxml2/libxml/nanoftp.h +163 -0
- data/ext/nokogiri/include/libxml2/libxml/nanohttp.h +81 -0
- data/ext/nokogiri/include/libxml2/libxml/parser.h +1241 -0
- data/ext/nokogiri/include/libxml2/libxml/parserInternals.h +644 -0
- data/ext/nokogiri/include/libxml2/libxml/pattern.h +100 -0
- data/ext/nokogiri/include/libxml2/libxml/relaxng.h +217 -0
- data/ext/nokogiri/include/libxml2/libxml/schemasInternals.h +958 -0
- data/ext/nokogiri/include/libxml2/libxml/schematron.h +142 -0
- data/ext/nokogiri/include/libxml2/libxml/threads.h +89 -0
- data/ext/nokogiri/include/libxml2/libxml/tree.h +1311 -0
- data/ext/nokogiri/include/libxml2/libxml/uri.h +94 -0
- data/ext/nokogiri/include/libxml2/libxml/valid.h +458 -0
- data/ext/nokogiri/include/libxml2/libxml/xinclude.h +129 -0
- data/ext/nokogiri/include/libxml2/libxml/xlink.h +189 -0
- data/ext/nokogiri/include/libxml2/libxml/xmlIO.h +366 -0
- data/ext/nokogiri/include/libxml2/libxml/xmlautomata.h +146 -0
- data/ext/nokogiri/include/libxml2/libxml/xmlerror.h +945 -0
- data/ext/nokogiri/include/libxml2/libxml/xmlexports.h +153 -0
- data/ext/nokogiri/include/libxml2/libxml/xmlmemory.h +224 -0
- data/ext/nokogiri/include/libxml2/libxml/xmlmodule.h +57 -0
- data/ext/nokogiri/include/libxml2/libxml/xmlreader.h +428 -0
- data/ext/nokogiri/include/libxml2/libxml/xmlregexp.h +222 -0
- data/ext/nokogiri/include/libxml2/libxml/xmlsave.h +88 -0
- data/ext/nokogiri/include/libxml2/libxml/xmlschemas.h +246 -0
- data/ext/nokogiri/include/libxml2/libxml/xmlschemastypes.h +151 -0
- data/ext/nokogiri/include/libxml2/libxml/xmlstring.h +140 -0
- data/ext/nokogiri/include/libxml2/libxml/xmlunicode.h +202 -0
- data/ext/nokogiri/include/libxml2/libxml/xmlversion.h +485 -0
- data/ext/nokogiri/include/libxml2/libxml/xmlwriter.h +488 -0
- data/ext/nokogiri/include/libxml2/libxml/xpath.h +566 -0
- data/ext/nokogiri/include/libxml2/libxml/xpathInternals.h +632 -0
- data/ext/nokogiri/include/libxml2/libxml/xpointer.h +114 -0
- data/ext/nokogiri/include/libxslt/attributes.h +38 -0
- data/ext/nokogiri/include/libxslt/documents.h +93 -0
- data/ext/nokogiri/include/libxslt/extensions.h +262 -0
- data/ext/nokogiri/include/libxslt/extra.h +72 -0
- data/ext/nokogiri/include/libxslt/functions.h +78 -0
- data/ext/nokogiri/include/libxslt/imports.h +75 -0
- data/ext/nokogiri/include/libxslt/keys.h +53 -0
- data/ext/nokogiri/include/libxslt/namespaces.h +68 -0
- data/ext/nokogiri/include/libxslt/numbersInternals.h +73 -0
- data/ext/nokogiri/include/libxslt/pattern.h +84 -0
- data/ext/nokogiri/include/libxslt/preproc.h +43 -0
- data/ext/nokogiri/include/libxslt/security.h +104 -0
- data/ext/nokogiri/include/libxslt/templates.h +77 -0
- data/ext/nokogiri/include/libxslt/transform.h +207 -0
- data/ext/nokogiri/include/libxslt/variables.h +118 -0
- data/ext/nokogiri/include/libxslt/xslt.h +110 -0
- data/ext/nokogiri/include/libxslt/xsltInternals.h +1978 -0
- data/ext/nokogiri/include/libxslt/xsltconfig.h +180 -0
- data/ext/nokogiri/include/libxslt/xsltexports.h +142 -0
- data/ext/nokogiri/include/libxslt/xsltlocale.h +76 -0
- data/ext/nokogiri/include/libxslt/xsltutils.h +313 -0
- data/ext/nokogiri/libxml2_backwards_compat.c +121 -0
- data/ext/nokogiri/nokogiri.c +192 -93
- data/ext/nokogiri/nokogiri.h +177 -98
- data/ext/nokogiri/test_global_handlers.c +40 -0
- data/ext/nokogiri/xml_attr.c +15 -15
- data/ext/nokogiri/xml_attribute_decl.c +18 -18
- data/ext/nokogiri/xml_cdata.c +13 -18
- data/ext/nokogiri/xml_comment.c +19 -26
- data/ext/nokogiri/xml_document.c +225 -163
- data/ext/nokogiri/xml_document_fragment.c +13 -15
- data/ext/nokogiri/xml_dtd.c +54 -48
- data/ext/nokogiri/xml_element_content.c +30 -27
- data/ext/nokogiri/xml_element_decl.c +22 -22
- data/ext/nokogiri/xml_encoding_handler.c +17 -11
- data/ext/nokogiri/xml_entity_decl.c +32 -30
- data/ext/nokogiri/xml_entity_reference.c +16 -18
- data/ext/nokogiri/xml_namespace.c +56 -49
- data/ext/nokogiri/xml_node.c +338 -286
- data/ext/nokogiri/xml_node_set.c +168 -156
- data/ext/nokogiri/xml_processing_instruction.c +17 -19
- data/ext/nokogiri/xml_reader.c +191 -157
- data/ext/nokogiri/xml_relax_ng.c +52 -28
- data/ext/nokogiri/xml_sax_parser.c +118 -118
- data/ext/nokogiri/xml_sax_parser_context.c +103 -86
- data/ext/nokogiri/xml_sax_push_parser.c +36 -27
- data/ext/nokogiri/xml_schema.c +95 -47
- data/ext/nokogiri/xml_syntax_error.c +42 -21
- data/ext/nokogiri/xml_text.c +13 -17
- data/ext/nokogiri/xml_xpath_context.c +206 -123
- data/ext/nokogiri/xslt_stylesheet.c +158 -161
- data/lib/nokogiri.rb +4 -8
- data/lib/nokogiri/2.5/nokogiri.so +0 -0
- data/lib/nokogiri/2.6/nokogiri.so +0 -0
- data/lib/nokogiri/2.7/nokogiri.so +0 -0
- data/lib/nokogiri/3.0/nokogiri.so +0 -0
- data/lib/nokogiri/css/parser.rb +62 -62
- data/lib/nokogiri/css/parser.y +2 -2
- data/lib/nokogiri/css/xpath_visitor.rb +70 -42
- data/lib/nokogiri/extension.rb +26 -0
- data/lib/nokogiri/html/document.rb +12 -26
- data/lib/nokogiri/html/document_fragment.rb +15 -15
- data/lib/nokogiri/version.rb +2 -148
- data/lib/nokogiri/version/constant.rb +5 -0
- data/lib/nokogiri/version/info.rb +205 -0
- data/lib/nokogiri/xml/builder.rb +2 -2
- data/lib/nokogiri/xml/document.rb +48 -18
- data/lib/nokogiri/xml/document_fragment.rb +4 -6
- data/lib/nokogiri/xml/node.rb +88 -69
- data/lib/nokogiri/xml/parse_options.rb +6 -0
- data/lib/nokogiri/xml/reader.rb +2 -9
- data/lib/nokogiri/xml/relax_ng.rb +6 -2
- data/lib/nokogiri/xml/schema.rb +12 -4
- data/lib/nokogiri/xml/searchable.rb +3 -1
- data/lib/nokogiri/xml/xpath.rb +1 -3
- data/lib/nokogiri/xml/xpath/syntax_error.rb +1 -1
- metadata +151 -158
- data/ext/nokogiri/html_document.h +0 -10
- data/ext/nokogiri/html_element_description.h +0 -10
- data/ext/nokogiri/html_entity_lookup.h +0 -8
- data/ext/nokogiri/html_sax_parser_context.h +0 -11
- data/ext/nokogiri/html_sax_push_parser.h +0 -9
- data/ext/nokogiri/xml_attr.h +0 -9
- data/ext/nokogiri/xml_attribute_decl.h +0 -9
- data/ext/nokogiri/xml_cdata.h +0 -9
- data/ext/nokogiri/xml_comment.h +0 -9
- data/ext/nokogiri/xml_document.h +0 -23
- data/ext/nokogiri/xml_document_fragment.h +0 -10
- data/ext/nokogiri/xml_dtd.h +0 -10
- data/ext/nokogiri/xml_element_content.h +0 -10
- data/ext/nokogiri/xml_element_decl.h +0 -9
- data/ext/nokogiri/xml_encoding_handler.h +0 -8
- data/ext/nokogiri/xml_entity_decl.h +0 -10
- data/ext/nokogiri/xml_entity_reference.h +0 -9
- data/ext/nokogiri/xml_io.c +0 -61
- data/ext/nokogiri/xml_io.h +0 -11
- data/ext/nokogiri/xml_libxml2_hacks.c +0 -112
- data/ext/nokogiri/xml_libxml2_hacks.h +0 -12
- data/ext/nokogiri/xml_namespace.h +0 -14
- data/ext/nokogiri/xml_node.h +0 -13
- data/ext/nokogiri/xml_node_set.h +0 -12
- data/ext/nokogiri/xml_processing_instruction.h +0 -9
- data/ext/nokogiri/xml_reader.h +0 -10
- data/ext/nokogiri/xml_relax_ng.h +0 -9
- data/ext/nokogiri/xml_sax_parser.h +0 -39
- data/ext/nokogiri/xml_sax_parser_context.h +0 -10
- data/ext/nokogiri/xml_sax_push_parser.h +0 -9
- data/ext/nokogiri/xml_schema.h +0 -9
- data/ext/nokogiri/xml_syntax_error.h +0 -13
- data/ext/nokogiri/xml_text.h +0 -9
- data/ext/nokogiri/xml_xpath_context.h +0 -10
- data/ext/nokogiri/xslt_stylesheet.h +0 -14
- data/lib/nokogiri/2.4/nokogiri.so +0 -0
data/lib/nokogiri/css/parser.y
CHANGED
@@ -88,7 +88,7 @@ rule
|
|
88
88
|
)
|
89
89
|
}
|
90
90
|
| LSQUARE NUMBER RSQUARE {
|
91
|
-
#
|
91
|
+
# non-standard, from hpricot
|
92
92
|
result = Node.new(:PSEUDO_CLASS,
|
93
93
|
[Node.new(:FUNCTION, ['nth-child(', val[1]])]
|
94
94
|
)
|
@@ -139,7 +139,7 @@ rule
|
|
139
139
|
when 'n'
|
140
140
|
result = Node.new(:NTH, ['1','n','+','0'])
|
141
141
|
else
|
142
|
-
#
|
142
|
+
# non-standard to support custom functions:
|
143
143
|
# assert_xpath("//a[foo(., @href)]", @parser.parse('a:foo(@href)'))
|
144
144
|
# assert_xpath("//a[foo(., @a, b)]", @parser.parse('a:foo(@a, b)'))
|
145
145
|
# assert_xpath("//a[foo(., a, 10)]", @parser.parse('a:foo(a, 10)'))
|
data/lib/nokogiri/css/xpath_visitor.rb
CHANGED
@@ -3,7 +3,6 @@ module Nokogiri
|
|
3
3
|
module CSS
|
4
4
|
class XPathVisitor # :nodoc:
|
5
5
|
def visit_function node
|
6
|
-
|
7
6
|
msg = :"visit_function_#{node.value.first.gsub(/[(]/, '')}"
|
8
7
|
return self.send(msg, node) if self.respond_to?(msg)
|
9
8
|
|
@@ -13,50 +12,51 @@ module Nokogiri
|
|
13
12
|
when /^self\(/
|
14
13
|
"self::#{node.value[1]}"
|
15
14
|
when /^eq\(/
|
16
|
-
"position()
|
15
|
+
"position()=#{node.value[1]}"
|
17
16
|
when /^(nth|nth-of-type)\(/
|
18
17
|
if node.value[1].is_a?(Nokogiri::CSS::Node) and node.value[1].type == :NTH
|
19
18
|
nth(node.value[1])
|
20
19
|
else
|
21
|
-
"position()
|
20
|
+
"position()=#{node.value[1]}"
|
22
21
|
end
|
23
22
|
when /^nth-child\(/
|
24
23
|
if node.value[1].is_a?(Nokogiri::CSS::Node) and node.value[1].type == :NTH
|
25
24
|
nth(node.value[1], :child => true)
|
26
25
|
else
|
27
|
-
"count(preceding-sibling::*)
|
26
|
+
"count(preceding-sibling::*)=#{node.value[1].to_i-1}"
|
28
27
|
end
|
29
28
|
when /^nth-last-of-type\(/
|
30
29
|
if node.value[1].is_a?(Nokogiri::CSS::Node) and node.value[1].type == :NTH
|
31
30
|
nth(node.value[1], :last => true)
|
32
31
|
else
|
33
32
|
index = node.value[1].to_i - 1
|
34
|
-
index == 0 ? "position()
|
33
|
+
index == 0 ? "position()=last()" : "position()=last()-#{index}"
|
35
34
|
end
|
36
35
|
when /^nth-last-child\(/
|
37
36
|
if node.value[1].is_a?(Nokogiri::CSS::Node) and node.value[1].type == :NTH
|
38
37
|
nth(node.value[1], :last => true, :child => true)
|
39
38
|
else
|
40
|
-
"count(following-sibling::*)
|
39
|
+
"count(following-sibling::*)=#{node.value[1].to_i-1}"
|
41
40
|
end
|
42
41
|
when /^(first|first-of-type)\(/
|
43
|
-
"position()
|
42
|
+
"position()=1"
|
44
43
|
when /^(last|last-of-type)\(/
|
45
|
-
"position()
|
44
|
+
"position()=last()"
|
46
45
|
when /^contains\(/
|
47
|
-
"contains(
|
46
|
+
"contains(.,#{node.value[1]})"
|
48
47
|
when /^gt\(/
|
49
|
-
"position()
|
48
|
+
"position()>#{node.value[1]}"
|
50
49
|
when /^only-child\(/
|
51
|
-
"last()
|
50
|
+
"last()=1"
|
52
51
|
when /^comment\(/
|
53
52
|
"comment()"
|
54
53
|
when /^has\(/
|
55
54
|
is_direct = node.value[1].value[0].nil? # e.g. "has(> a)", "has(~ a)", "has(+ a)"
|
56
55
|
".#{"//" if !is_direct}#{node.value[1].accept(self)}"
|
57
56
|
else
|
57
|
+
# non-standard. this looks like a function call.
|
58
58
|
args = ['.'] + node.value[1..-1]
|
59
|
-
"#{node.value.first}#{args.join(',
|
59
|
+
"#{node.value.first}#{args.join(',')})"
|
60
60
|
end
|
61
61
|
end
|
62
62
|
|
@@ -71,18 +71,18 @@ module Nokogiri
|
|
71
71
|
|
72
72
|
def visit_id node
|
73
73
|
node.value.first =~ /^#(.*)$/
|
74
|
-
"@id
|
74
|
+
"@id='#{$1}'"
|
75
75
|
end
|
76
76
|
|
77
77
|
def visit_attribute_condition node
|
78
|
-
|
79
|
-
|
80
|
-
|
81
|
-
|
82
|
-
|
78
|
+
attribute = if (node.value.first.type == :FUNCTION) or (node.value.first.value.first =~ /::/)
|
79
|
+
''
|
80
|
+
else
|
81
|
+
'@'
|
82
|
+
end
|
83
83
|
attribute += node.value.first.accept(self)
|
84
84
|
|
85
|
-
#
|
85
|
+
# non-standard. attributes starting with '@'
|
86
86
|
attribute.gsub!(/^@@/, '@')
|
87
87
|
|
88
88
|
return attribute unless node.value.length == 3
|
@@ -90,29 +90,30 @@ module Nokogiri
|
|
90
90
|
value = node.value.last
|
91
91
|
value = "'#{value}'" if value !~ /^['"]/
|
92
92
|
|
93
|
+
# quoted values - see test_attribute_value_with_quotes in test/css/test_parser.rb
|
93
94
|
if (value[0]==value[-1]) && %q{"'}.include?(value[0])
|
94
95
|
str_value = value[1..-2]
|
95
96
|
if str_value.include?(value[0])
|
96
|
-
value = 'concat("' + str_value.split('"', -1).join(%q{",
|
97
|
+
value = 'concat("' + str_value.split('"', -1).join(%q{",'"',"}) + '","")'
|
97
98
|
end
|
98
99
|
end
|
99
100
|
|
100
101
|
case node.value[1]
|
101
102
|
when :equal
|
102
|
-
attribute + "
|
103
|
+
attribute + "=" + "#{value}"
|
103
104
|
when :not_equal
|
104
|
-
attribute + "
|
105
|
+
attribute + "!=" + "#{value}"
|
105
106
|
when :substring_match
|
106
|
-
"contains(#{attribute}
|
107
|
+
"contains(#{attribute},#{value})"
|
107
108
|
when :prefix_match
|
108
|
-
"starts-with(#{attribute}
|
109
|
+
"starts-with(#{attribute},#{value})"
|
109
110
|
when :dash_match
|
110
|
-
"#{attribute}
|
111
|
+
"#{attribute}=#{value} or starts-with(#{attribute},concat(#{value},'-'))"
|
111
112
|
when :includes
|
112
|
-
|
113
|
+
value = value[1..-2] # strip quotes
|
114
|
+
css_class(attribute, value)
|
113
115
|
when :suffix_match
|
114
|
-
"substring(#{attribute},
|
115
|
-
"string-length(#{value}) + 1, string-length(#{value})) = #{value}"
|
116
|
+
"substring(#{attribute},string-length(#{attribute})-string-length(#{value})+1,string-length(#{value}))=#{value}"
|
116
117
|
else
|
117
118
|
attribute + " #{node.value[1]} " + "#{value}"
|
118
119
|
end
|
@@ -126,14 +127,14 @@ module Nokogiri
|
|
126
127
|
return self.send(msg, node) if self.respond_to?(msg)
|
127
128
|
|
128
129
|
case node.value.first
|
129
|
-
when "first" then "position()
|
130
|
-
when "first-child" then "count(preceding-sibling::*)
|
131
|
-
when "last" then "position()
|
132
|
-
when "last-child" then "count(following-sibling::*)
|
133
|
-
when "first-of-type" then "position()
|
134
|
-
when "last-of-type" then "position()
|
135
|
-
when "only-child" then "count(preceding-sibling::*)
|
136
|
-
when "only-of-type" then "last()
|
130
|
+
when "first" then "position()=1"
|
131
|
+
when "first-child" then "count(preceding-sibling::*)=0"
|
132
|
+
when "last" then "position()=last()"
|
133
|
+
when "last-child" then "count(following-sibling::*)=0"
|
134
|
+
when "first-of-type" then "position()=1"
|
135
|
+
when "last-of-type" then "position()=last()"
|
136
|
+
when "only-child" then "count(preceding-sibling::*)=0 and count(following-sibling::*)=0"
|
137
|
+
when "only-of-type" then "last()=1"
|
137
138
|
when "empty" then "not(node())"
|
138
139
|
when "parent" then "node()"
|
139
140
|
when "root" then "not(parent::*)"
|
@@ -144,7 +145,7 @@ module Nokogiri
|
|
144
145
|
end
|
145
146
|
|
146
147
|
def visit_class_condition node
|
147
|
-
"
|
148
|
+
css_class("@class", node.value.first)
|
148
149
|
end
|
149
150
|
|
150
151
|
def visit_combinator node
|
@@ -181,25 +182,26 @@ module Nokogiri
|
|
181
182
|
node.accept(self)
|
182
183
|
end
|
183
184
|
|
184
|
-
|
185
|
+
private
|
186
|
+
|
185
187
|
def nth node, options={}
|
186
188
|
raise ArgumentError, "expected an+b node to contain 4 tokens, but is #{node.value.inspect}" unless node.value.size == 4
|
187
189
|
|
188
190
|
a, b = read_a_and_positive_b node.value
|
189
191
|
position = if options[:child]
|
190
|
-
options[:last] ? "(count(following-sibling::*)
|
192
|
+
options[:last] ? "(count(following-sibling::*)+1)" : "(count(preceding-sibling::*)+1)"
|
191
193
|
else
|
192
194
|
options[:last] ? "(last()-position()+1)" : "position()"
|
193
195
|
end
|
194
196
|
|
195
197
|
if b.zero?
|
196
|
-
"(#{position} mod #{a})
|
198
|
+
"(#{position} mod #{a})=0"
|
197
199
|
else
|
198
200
|
compare = a < 0 ? "<=" : ">="
|
199
201
|
if a.abs == 1
|
200
|
-
"#{position}
|
202
|
+
"#{position}#{compare}#{b}"
|
201
203
|
else
|
202
|
-
"(#{position}
|
204
|
+
"(#{position}#{compare}#{b}) and (((#{position}-#{b}) mod #{a.abs})=0)"
|
203
205
|
end
|
204
206
|
end
|
205
207
|
end
|
@@ -227,6 +229,32 @@ module Nokogiri
|
|
227
229
|
end =~ /(nth|first|last|only)-of-type(\()?/
|
228
230
|
end
|
229
231
|
end
|
232
|
+
|
233
|
+
# use only ordinary xpath functions
|
234
|
+
def css_class_standard(hay, needle)
|
235
|
+
"contains(concat(' ',normalize-space(#{hay}),' '),' #{needle} ')"
|
236
|
+
end
|
237
|
+
|
238
|
+
# use the builtin implementation
|
239
|
+
def css_class_builtin(hay, needle)
|
240
|
+
"nokogiri-builtin:css-class(#{hay},'#{needle}')"
|
241
|
+
end
|
242
|
+
|
243
|
+
alias_method :css_class, :css_class_standard
|
244
|
+
end
|
245
|
+
|
246
|
+
class XPathVisitorAlwaysUseBuiltins < XPathVisitor # :nodoc:
|
247
|
+
private
|
248
|
+
alias_method :css_class, :css_class_builtin
|
249
|
+
end
|
250
|
+
|
251
|
+
class XPathVisitorOptimallyUseBuiltins < XPathVisitor # :nodoc:
|
252
|
+
private
|
253
|
+
if Nokogiri.uses_libxml?
|
254
|
+
alias_method :css_class, :css_class_builtin
|
255
|
+
else
|
256
|
+
alias_method :css_class, :css_class_standard
|
257
|
+
end
|
230
258
|
end
|
231
259
|
end
|
232
260
|
end
|
data/lib/nokogiri/extension.rb
ADDED
@@ -0,0 +1,26 @@
|
|
1
|
+
# frozen_string_literal: true
|
2
|
+
|
3
|
+
# load the C or Java extension
|
4
|
+
begin
|
5
|
+
::RUBY_VERSION =~ /(\d+\.\d+)/
|
6
|
+
require "nokogiri/#{Regexp.last_match(1)}/nokogiri"
|
7
|
+
rescue LoadError => e
|
8
|
+
if e.message =~ /GLIBC/
|
9
|
+
warn(<<~EOM)
|
10
|
+
|
11
|
+
ERROR: It looks like you're trying to use Nokogiri as a precompiled native gem on a system with glibc < 2.17:
|
12
|
+
|
13
|
+
#{e.message}
|
14
|
+
|
15
|
+
If that's the case, then please install Nokogiri via the `ruby` platform gem:
|
16
|
+
gem install nokogiri --platform=ruby
|
17
|
+
or:
|
18
|
+
bundle config set force_ruby_platform true
|
19
|
+
|
20
|
+
Please visit https://nokogiri.org/tutorials/installing_nokogiri.html for more help.
|
21
|
+
|
22
|
+
EOM
|
23
|
+
raise e
|
24
|
+
end
|
25
|
+
require 'nokogiri/nokogiri'
|
26
|
+
end
|
data/lib/nokogiri/html/document.rb
CHANGED
@@ -1,4 +1,7 @@
|
|
1
1
|
# frozen_string_literal: true
|
2
|
+
|
3
|
+
require 'pathname'
|
4
|
+
|
2
5
|
module Nokogiri
|
3
6
|
module HTML
|
4
7
|
class Document < Nokogiri::XML::Document
|
@@ -161,11 +164,12 @@ module Nokogiri
|
|
161
164
|
# Nokogiri::XML::ParseOptions::RECOVER. See the constants in
|
162
165
|
# Nokogiri::XML::ParseOptions.
|
163
166
|
def parse string_or_io, url = nil, encoding = nil, options = XML::ParseOptions::DEFAULT_HTML
|
164
|
-
|
165
167
|
options = Nokogiri::XML::ParseOptions.new(options) if Integer === options
|
166
|
-
|
168
|
+
|
167
169
|
yield options if block_given?
|
168
170
|
|
171
|
+
url ||= string_or_io.respond_to?(:path) ? string_or_io.path : nil
|
172
|
+
|
169
173
|
if string_or_io.respond_to?(:encoding)
|
170
174
|
unless string_or_io.encoding.name == "ASCII-8BIT"
|
171
175
|
encoding ||= string_or_io.encoding.name
|
@@ -173,7 +177,12 @@ module Nokogiri
|
|
173
177
|
end
|
174
178
|
|
175
179
|
if string_or_io.respond_to?(:read)
|
176
|
-
|
180
|
+
if string_or_io.is_a?(Pathname)
|
181
|
+
# resolve the Pathname to the file and open it as an IO object, see #2110
|
182
|
+
string_or_io = string_or_io.expand_path.open
|
183
|
+
url ||= string_or_io.path
|
184
|
+
end
|
185
|
+
|
177
186
|
unless encoding
|
178
187
|
# Libxml2's parser has poor support for encoding
|
179
188
|
# detection. First, it does not recognize the HTML5
|
@@ -252,9 +261,6 @@ module Nokogiri
|
|
252
261
|
end
|
253
262
|
|
254
263
|
def self.detect_encoding(chunk)
|
255
|
-
if Nokogiri.jruby? && EncodingReader.is_jruby_without_fix?
|
256
|
-
return EncodingReader.detect_encoding_for_jruby_without_fix(chunk)
|
257
|
-
end
|
258
264
|
m = chunk.match(/\A(<\?xml[ \t\r\n]+[^>]*>)/) and
|
259
265
|
return Nokogiri.XML(m[1]).encoding
|
260
266
|
|
@@ -273,26 +279,6 @@ module Nokogiri
|
|
273
279
|
end
|
274
280
|
end
|
275
281
|
|
276
|
-
def self.is_jruby_without_fix?
|
277
|
-
JRUBY_VERSION.split('.').join.to_i < 165
|
278
|
-
end
|
279
|
-
|
280
|
-
def self.detect_encoding_for_jruby_without_fix(chunk)
|
281
|
-
m = chunk.match(/\A(<\?xml[ \t\r\n]+[^>]*>)/) and
|
282
|
-
return Nokogiri.XML(m[1]).encoding
|
283
|
-
|
284
|
-
m = chunk.match(/(<meta\s)(.*)(charset\s*=\s*([\w-]+))(.*)/i) and
|
285
|
-
return m[4]
|
286
|
-
|
287
|
-
catch(:encoding_found) {
|
288
|
-
Nokogiri::HTML::SAX::Parser.new(JumpSAXHandler.new(:encoding_found.to_s)).parse(chunk)
|
289
|
-
nil
|
290
|
-
}
|
291
|
-
rescue Nokogiri::SyntaxError, RuntimeError
|
292
|
-
# Ignore parser errors that nokogiri may raise
|
293
|
-
nil
|
294
|
-
end
|
295
|
-
|
296
282
|
def initialize(io)
|
297
283
|
@io = io
|
298
284
|
@firstchunk = nil
|
data/lib/nokogiri/html/document_fragment.rb
CHANGED
@@ -4,26 +4,26 @@ module Nokogiri
|
|
4
4
|
class DocumentFragment < Nokogiri::XML::DocumentFragment
|
5
5
|
####
|
6
6
|
# Create a Nokogiri::XML::DocumentFragment from +tags+, using +encoding+
|
7
|
-
def self.parse
|
7
|
+
def self.parse(tags, encoding = nil)
|
8
8
|
doc = HTML::Document.new
|
9
9
|
|
10
10
|
encoding ||= if tags.respond_to?(:encoding)
|
11
|
-
|
12
|
-
|
13
|
-
|
14
|
-
|
15
|
-
|
16
|
-
|
17
|
-
|
18
|
-
|
19
|
-
|
11
|
+
encoding = tags.encoding
|
12
|
+
if encoding == ::Encoding::ASCII_8BIT
|
13
|
+
'UTF-8'
|
14
|
+
else
|
15
|
+
encoding.name
|
16
|
+
end
|
17
|
+
else
|
18
|
+
'UTF-8'
|
19
|
+
end
|
20
20
|
|
21
21
|
doc.encoding = encoding
|
22
22
|
|
23
23
|
new(doc, tags)
|
24
24
|
end
|
25
25
|
|
26
|
-
def initialize
|
26
|
+
def initialize(document, tags = nil, ctx = nil)
|
27
27
|
return self unless tags
|
28
28
|
|
29
29
|
if ctx
|
@@ -33,13 +33,13 @@ module Nokogiri
|
|
33
33
|
self.errors = document.errors - preexisting_errors
|
34
34
|
else
|
35
35
|
# This is a horrible hack, but I don't care
|
36
|
-
|
37
|
-
|
36
|
+
path = if /^\s*?<body/i.match?(tags)
|
37
|
+
"/html/body"
|
38
38
|
else
|
39
|
-
|
39
|
+
"/html/body/node()"
|
40
40
|
end
|
41
41
|
|
42
|
-
temp_doc = HTML::Document.parse
|
42
|
+
temp_doc = HTML::Document.parse("<html><body>#{tags}", nil, document.encoding)
|
43
43
|
temp_doc.xpath(path).each { |child| child.parent = self }
|
44
44
|
self.errors = temp_doc.errors
|
45
45
|
end
|
data/lib/nokogiri/version.rb
CHANGED
@@ -1,149 +1,3 @@
|
|
1
1
|
# frozen_string_literal: true
|
2
|
-
|
3
|
-
|
4
|
-
VERSION = "1.11.0.rc2"
|
5
|
-
|
6
|
-
class VersionInfo # :nodoc:
|
7
|
-
def jruby?
|
8
|
-
::JRUBY_VERSION if RUBY_PLATFORM == "java"
|
9
|
-
end
|
10
|
-
|
11
|
-
def engine
|
12
|
-
defined?(RUBY_ENGINE) ? RUBY_ENGINE : "mri"
|
13
|
-
end
|
14
|
-
|
15
|
-
def loaded_libxml_version
|
16
|
-
Gem::Version.new(LIBXML_LOADED_VERSION.
|
17
|
-
scan(/^(\d+)(\d\d)(\d\d)(?!\d)/).first.
|
18
|
-
collect(&:to_i).
|
19
|
-
join("."))
|
20
|
-
end
|
21
|
-
|
22
|
-
def compiled_libxml_version
|
23
|
-
Gem::Version.new LIBXML_COMPILED_VERSION
|
24
|
-
end
|
25
|
-
|
26
|
-
def loaded_libxslt_version
|
27
|
-
Gem::Version.new(LIBXSLT_LOADED_VERSION.
|
28
|
-
scan(/^(\d+)(\d\d)(\d\d)(?!\d)/).first.
|
29
|
-
collect(&:to_i).
|
30
|
-
join("."))
|
31
|
-
end
|
32
|
-
|
33
|
-
def compiled_libxslt_version
|
34
|
-
Gem::Version.new LIBXSLT_COMPILED_VERSION
|
35
|
-
end
|
36
|
-
|
37
|
-
def libxml2?
|
38
|
-
defined?(LIBXML_COMPILED_VERSION)
|
39
|
-
end
|
40
|
-
|
41
|
-
def libxml2_using_system?
|
42
|
-
!libxml2_using_packaged?
|
43
|
-
end
|
44
|
-
|
45
|
-
def libxml2_using_packaged?
|
46
|
-
NOKOGIRI_USE_PACKAGED_LIBRARIES
|
47
|
-
end
|
48
|
-
|
49
|
-
def warnings
|
50
|
-
warnings = []
|
51
|
-
|
52
|
-
if libxml2?
|
53
|
-
if compiled_libxml_version != loaded_libxml_version
|
54
|
-
warnings << "Nokogiri was built against libxml version #{compiled_libxml_version}, but has dynamically loaded #{loaded_libxml_version}"
|
55
|
-
end
|
56
|
-
|
57
|
-
if compiled_libxslt_version != loaded_libxslt_version
|
58
|
-
warnings << "Nokogiri was built against libxslt version #{compiled_libxslt_version}, but has dynamically loaded #{loaded_libxslt_version}"
|
59
|
-
end
|
60
|
-
end
|
61
|
-
|
62
|
-
warnings
|
63
|
-
end
|
64
|
-
|
65
|
-
def to_hash
|
66
|
-
{}.tap do |vi|
|
67
|
-
vi["warnings"] = []
|
68
|
-
vi["nokogiri"] = Nokogiri::VERSION
|
69
|
-
vi["ruby"] = {}.tap do |ruby|
|
70
|
-
ruby["version"] = ::RUBY_VERSION
|
71
|
-
ruby["platform"] = ::RUBY_PLATFORM
|
72
|
-
ruby["description"] = ::RUBY_DESCRIPTION
|
73
|
-
ruby["engine"] = engine
|
74
|
-
ruby["jruby"] = jruby? if jruby?
|
75
|
-
end
|
76
|
-
|
77
|
-
if libxml2?
|
78
|
-
vi["libxml"] = {}.tap do |libxml|
|
79
|
-
if libxml2_using_packaged?
|
80
|
-
libxml["source"] = "packaged"
|
81
|
-
libxml["patches"] = NOKOGIRI_LIBXML2_PATCHES
|
82
|
-
else
|
83
|
-
libxml["source"] = "system"
|
84
|
-
end
|
85
|
-
libxml["compiled"] = compiled_libxml_version.to_s
|
86
|
-
libxml["loaded"] = loaded_libxml_version.to_s
|
87
|
-
end
|
88
|
-
|
89
|
-
vi["libxslt"] = {}.tap do |libxslt|
|
90
|
-
if libxml2_using_packaged?
|
91
|
-
libxslt["source"] = "packaged"
|
92
|
-
libxslt["patches"] = NOKOGIRI_LIBXSLT_PATCHES
|
93
|
-
else
|
94
|
-
libxslt["source"] = "system"
|
95
|
-
end
|
96
|
-
libxslt["compiled"] = compiled_libxslt_version.to_s
|
97
|
-
libxslt["loaded"] = loaded_libxslt_version.to_s
|
98
|
-
end
|
99
|
-
|
100
|
-
vi["warnings"] = warnings
|
101
|
-
elsif jruby?
|
102
|
-
vi["xerces"] = Nokogiri::XERCES_VERSION
|
103
|
-
vi["nekohtml"] = Nokogiri::NEKO_VERSION
|
104
|
-
end
|
105
|
-
end
|
106
|
-
end
|
107
|
-
|
108
|
-
def to_markdown
|
109
|
-
begin
|
110
|
-
require "psych"
|
111
|
-
rescue LoadError
|
112
|
-
end
|
113
|
-
require "yaml"
|
114
|
-
"# Nokogiri (#{Nokogiri::VERSION})\n" +
|
115
|
-
YAML.dump(to_hash).each_line.map { |line| " #{line}" }.join
|
116
|
-
end
|
117
|
-
|
118
|
-
# FIXME: maybe switch to singleton?
|
119
|
-
@@instance = new
|
120
|
-
@@instance.warnings.each do |warning|
|
121
|
-
warn "WARNING: #{warning}"
|
122
|
-
end
|
123
|
-
def self.instance; @@instance; end
|
124
|
-
end
|
125
|
-
|
126
|
-
def self.uses_libxml?(requirement = nil) # :nodoc:
|
127
|
-
return false unless VersionInfo.instance.libxml2?
|
128
|
-
return true unless requirement
|
129
|
-
return Gem::Requirement.new(requirement).satisfied_by?(VersionInfo.instance.loaded_libxml_version)
|
130
|
-
end
|
131
|
-
|
132
|
-
def self.jruby? # :nodoc:
|
133
|
-
VersionInfo.instance.jruby?
|
134
|
-
end
|
135
|
-
|
136
|
-
# Ensure constants used in this file are loaded - see #1896
|
137
|
-
if Nokogiri.jruby?
|
138
|
-
require "nokogiri/jruby/dependencies"
|
139
|
-
end
|
140
|
-
begin
|
141
|
-
RUBY_VERSION =~ /(\d+\.\d+)/
|
142
|
-
require "nokogiri/#{$1}/nokogiri"
|
143
|
-
rescue LoadError
|
144
|
-
require "nokogiri/nokogiri"
|
145
|
-
end
|
146
|
-
|
147
|
-
# More complete version information about libxml
|
148
|
-
VERSION_INFO = VersionInfo.instance.to_hash
|
149
|
-
end
|
2
|
+
require_relative "version/constant"
|
3
|
+
require_relative "version/info"
|