nokogiri 1.8.5 → 1.9.1
Sign up to get free protection for your applications and to get access to all the features.
Potentially problematic release.
This version of nokogiri might be problematic. Click here for more details.
- checksums.yaml +4 -4
- data/README.md +0 -1
- data/ext/nokogiri/extconf.rb +10 -6
- data/ext/nokogiri/xml_attr.c +26 -21
- data/ext/nokogiri/xml_document.c +4 -1
- data/ext/nokogiri/xml_namespace.c +3 -3
- data/ext/nokogiri/xml_namespace.h +1 -2
- data/ext/nokogiri/xml_node.c +55 -15
- data/lib/nokogiri/css/parser.rb +61 -61
- data/lib/nokogiri/version.rb +1 -1
- data/lib/nokogiri/xml/document_fragment.rb +11 -0
- data/lib/nokogiri/xml/node.rb +12 -0
- data/lib/nokogiri/xml/node_set.rb +4 -8
- metadata +17 -153
- data/.autotest +0 -22
- data/.cross_rubies +0 -8
- data/.editorconfig +0 -17
- data/.gemtest +0 -0
- data/.travis.yml +0 -63
- data/CHANGELOG.md +0 -1368
- data/CONTRIBUTING.md +0 -42
- data/C_CODING_STYLE.rdoc +0 -33
- data/Gemfile +0 -23
- data/Gemfile-libxml-ruby +0 -3
- data/Manifest.txt +0 -370
- data/ROADMAP.md +0 -111
- data/Rakefile +0 -348
- data/SECURITY.md +0 -19
- data/STANDARD_RESPONSES.md +0 -47
- data/Y_U_NO_GEMSPEC.md +0 -155
- data/appveyor.yml +0 -29
- data/build_all +0 -44
- data/patches/sort-patches-by-date +0 -25
- data/suppressions/README.txt +0 -1
- data/suppressions/nokogiri_ruby-2.supp +0 -10
- data/tasks/test.rb +0 -100
- data/test/css/test_nthiness.rb +0 -226
- data/test/css/test_parser.rb +0 -386
- data/test/css/test_tokenizer.rb +0 -215
- data/test/css/test_xpath_visitor.rb +0 -96
- data/test/decorators/test_slop.rb +0 -23
- data/test/files/2ch.html +0 -108
- data/test/files/GH_1042.html +0 -18
- data/test/files/address_book.rlx +0 -12
- data/test/files/address_book.xml +0 -10
- data/test/files/atom.xml +0 -344
- data/test/files/bar/bar.xsd +0 -4
- data/test/files/bogus.xml +0 -0
- data/test/files/dont_hurt_em_why.xml +0 -422
- data/test/files/encoding.html +0 -82
- data/test/files/encoding.xhtml +0 -84
- data/test/files/exslt.xml +0 -8
- data/test/files/exslt.xslt +0 -35
- data/test/files/foo/foo.xsd +0 -4
- data/test/files/metacharset.html +0 -10
- data/test/files/namespace_pressure_test.xml +0 -1684
- data/test/files/noencoding.html +0 -47
- data/test/files/po.xml +0 -32
- data/test/files/po.xsd +0 -66
- data/test/files/saml/saml20assertion_schema.xsd +0 -283
- data/test/files/saml/saml20protocol_schema.xsd +0 -302
- data/test/files/saml/xenc_schema.xsd +0 -146
- data/test/files/saml/xmldsig_schema.xsd +0 -318
- data/test/files/shift_jis.html +0 -10
- data/test/files/shift_jis.xml +0 -5
- data/test/files/shift_jis_no_charset.html +0 -9
- data/test/files/slow-xpath.xml +0 -25509
- data/test/files/snuggles.xml +0 -3
- data/test/files/staff.dtd +0 -10
- data/test/files/staff.xml +0 -59
- data/test/files/staff.xslt +0 -32
- data/test/files/test_document_url/bar.xml +0 -2
- data/test/files/test_document_url/document.dtd +0 -4
- data/test/files/test_document_url/document.xml +0 -6
- data/test/files/tlm.html +0 -851
- data/test/files/to_be_xincluded.xml +0 -2
- data/test/files/valid_bar.xml +0 -2
- data/test/files/xinclude.xml +0 -4
- data/test/helper.rb +0 -271
- data/test/html/sax/test_parser.rb +0 -168
- data/test/html/sax/test_parser_context.rb +0 -46
- data/test/html/sax/test_parser_text.rb +0 -163
- data/test/html/sax/test_push_parser.rb +0 -87
- data/test/html/test_attributes.rb +0 -85
- data/test/html/test_builder.rb +0 -164
- data/test/html/test_document.rb +0 -712
- data/test/html/test_document_encoding.rb +0 -143
- data/test/html/test_document_fragment.rb +0 -310
- data/test/html/test_element_description.rb +0 -105
- data/test/html/test_named_characters.rb +0 -14
- data/test/html/test_node.rb +0 -212
- data/test/html/test_node_encoding.rb +0 -91
- data/test/namespaces/test_additional_namespaces_in_builder_doc.rb +0 -14
- data/test/namespaces/test_namespaces_aliased_default.rb +0 -24
- data/test/namespaces/test_namespaces_in_builder_doc.rb +0 -75
- data/test/namespaces/test_namespaces_in_cloned_doc.rb +0 -31
- data/test/namespaces/test_namespaces_in_created_doc.rb +0 -75
- data/test/namespaces/test_namespaces_in_parsed_doc.rb +0 -80
- data/test/namespaces/test_namespaces_preservation.rb +0 -31
- data/test/test_convert_xpath.rb +0 -135
- data/test/test_css_cache.rb +0 -47
- data/test/test_encoding_handler.rb +0 -48
- data/test/test_memory_leak.rb +0 -156
- data/test/test_nokogiri.rb +0 -138
- data/test/test_soap4r_sax.rb +0 -52
- data/test/test_xslt_transforms.rb +0 -314
- data/test/xml/node/test_save_options.rb +0 -28
- data/test/xml/node/test_subclass.rb +0 -44
- data/test/xml/sax/test_parser.rb +0 -402
- data/test/xml/sax/test_parser_context.rb +0 -115
- data/test/xml/sax/test_parser_text.rb +0 -202
- data/test/xml/sax/test_push_parser.rb +0 -265
- data/test/xml/test_attr.rb +0 -74
- data/test/xml/test_attribute_decl.rb +0 -86
- data/test/xml/test_builder.rb +0 -341
- data/test/xml/test_c14n.rb +0 -180
- data/test/xml/test_cdata.rb +0 -54
- data/test/xml/test_comment.rb +0 -40
- data/test/xml/test_document.rb +0 -982
- data/test/xml/test_document_encoding.rb +0 -31
- data/test/xml/test_document_fragment.rb +0 -298
- data/test/xml/test_dtd.rb +0 -187
- data/test/xml/test_dtd_encoding.rb +0 -31
- data/test/xml/test_element_content.rb +0 -56
- data/test/xml/test_element_decl.rb +0 -73
- data/test/xml/test_entity_decl.rb +0 -122
- data/test/xml/test_entity_reference.rb +0 -262
- data/test/xml/test_namespace.rb +0 -96
- data/test/xml/test_node.rb +0 -1325
- data/test/xml/test_node_attributes.rb +0 -115
- data/test/xml/test_node_encoding.rb +0 -75
- data/test/xml/test_node_inheritance.rb +0 -32
- data/test/xml/test_node_reparenting.rb +0 -592
- data/test/xml/test_node_set.rb +0 -809
- data/test/xml/test_parse_options.rb +0 -64
- data/test/xml/test_processing_instruction.rb +0 -30
- data/test/xml/test_reader.rb +0 -620
- data/test/xml/test_reader_encoding.rb +0 -134
- data/test/xml/test_relax_ng.rb +0 -60
- data/test/xml/test_schema.rb +0 -142
- data/test/xml/test_syntax_error.rb +0 -36
- data/test/xml/test_text.rb +0 -60
- data/test/xml/test_unparented_node.rb +0 -483
- data/test/xml/test_xinclude.rb +0 -83
- data/test/xml/test_xpath.rb +0 -470
- data/test/xslt/test_custom_functions.rb +0 -133
- data/test/xslt/test_exception_handling.rb +0 -37
data/test/xml/sax/test_parser.rb
DELETED
@@ -1,402 +0,0 @@
|
|
1
|
-
# -*- coding: utf-8 -*-
|
2
|
-
|
3
|
-
require "helper"
|
4
|
-
|
5
|
-
module Nokogiri
|
6
|
-
module XML
|
7
|
-
module SAX
|
8
|
-
class TestParser < Nokogiri::SAX::TestCase
|
9
|
-
def setup
|
10
|
-
super
|
11
|
-
@parser = XML::SAX::Parser.new(Doc.new)
|
12
|
-
end
|
13
|
-
|
14
|
-
def test_parser_context_yielded_io
|
15
|
-
doc = Doc.new
|
16
|
-
parser = XML::SAX::Parser.new doc
|
17
|
-
xml = "<foo a='&b'/>"
|
18
|
-
|
19
|
-
block_called = false
|
20
|
-
parser.parse(StringIO.new(xml)) { |ctx|
|
21
|
-
block_called = true
|
22
|
-
ctx.replace_entities = true
|
23
|
-
}
|
24
|
-
|
25
|
-
assert block_called
|
26
|
-
|
27
|
-
assert_equal [['foo', [['a', '&b']]]], doc.start_elements
|
28
|
-
end
|
29
|
-
|
30
|
-
def test_parser_context_yielded_in_memory
|
31
|
-
doc = Doc.new
|
32
|
-
parser = XML::SAX::Parser.new doc
|
33
|
-
xml = "<foo a='&b'/>"
|
34
|
-
|
35
|
-
block_called = false
|
36
|
-
parser.parse(xml) { |ctx|
|
37
|
-
block_called = true
|
38
|
-
ctx.replace_entities = true
|
39
|
-
}
|
40
|
-
|
41
|
-
assert block_called
|
42
|
-
|
43
|
-
assert_equal [['foo', [['a', '&b']]]], doc.start_elements
|
44
|
-
end
|
45
|
-
|
46
|
-
def test_empty_decl
|
47
|
-
parser = XML::SAX::Parser.new(Doc.new)
|
48
|
-
|
49
|
-
xml = "<root />"
|
50
|
-
parser.parse xml
|
51
|
-
assert parser.document.start_document_called, xml
|
52
|
-
assert_nil parser.document.xmldecls, xml
|
53
|
-
end
|
54
|
-
|
55
|
-
def test_xml_decl
|
56
|
-
[
|
57
|
-
['<?xml version="1.0" ?>',
|
58
|
-
['1.0']],
|
59
|
-
['<?xml version="1.0" encoding="UTF-8" ?>',
|
60
|
-
['1.0', 'UTF-8']],
|
61
|
-
['<?xml version="1.0" standalone="yes"?>',
|
62
|
-
['1.0', 'yes']],
|
63
|
-
['<?xml version="1.0" standalone="no"?>',
|
64
|
-
['1.0', 'no']],
|
65
|
-
['<?xml version="1.0" encoding="UTF-8" standalone="no"?>',
|
66
|
-
['1.0', "UTF-8", 'no']],
|
67
|
-
['<?xml version="1.0" encoding="ISO-8859-1" standalone="yes"?>',
|
68
|
-
['1.0', "ISO-8859-1", 'yes']]
|
69
|
-
].each do |decl, value|
|
70
|
-
parser = XML::SAX::Parser.new(Doc.new)
|
71
|
-
|
72
|
-
xml = "#{decl}\n<root />"
|
73
|
-
parser.parse xml
|
74
|
-
assert parser.document.start_document_called, xml
|
75
|
-
assert_equal value, parser.document.xmldecls, xml
|
76
|
-
end
|
77
|
-
end
|
78
|
-
|
79
|
-
def test_parse_empty
|
80
|
-
assert_raises RuntimeError do
|
81
|
-
@parser.parse('')
|
82
|
-
end
|
83
|
-
end
|
84
|
-
|
85
|
-
def test_namespace_declaration_order_is_saved
|
86
|
-
@parser.parse <<-eoxml
|
87
|
-
<root xmlns:foo='http://foo.example.com/' xmlns='http://example.com/'>
|
88
|
-
<a foo:bar='hello' />
|
89
|
-
</root>
|
90
|
-
eoxml
|
91
|
-
assert_equal 2, @parser.document.start_elements_namespace.length
|
92
|
-
el = @parser.document.start_elements_namespace.first
|
93
|
-
namespaces = el.last
|
94
|
-
assert_equal ['foo', 'http://foo.example.com/'], namespaces.first
|
95
|
-
assert_equal [nil, 'http://example.com/'], namespaces.last
|
96
|
-
end
|
97
|
-
|
98
|
-
def test_bad_document_calls_error_handler
|
99
|
-
@parser.parse('<foo><bar></foo>')
|
100
|
-
assert @parser.document.errors
|
101
|
-
assert @parser.document.errors.length > 0
|
102
|
-
end
|
103
|
-
|
104
|
-
def test_namespace_are_super_fun_to_parse
|
105
|
-
@parser.parse <<-eoxml
|
106
|
-
<root xmlns:foo='http://foo.example.com/'>
|
107
|
-
<a foo:bar='hello' />
|
108
|
-
<b xmlns:foo='http://bar.example.com/'>
|
109
|
-
<a foo:bar='hello' />
|
110
|
-
</b>
|
111
|
-
<foo:bar>hello world</foo:bar>
|
112
|
-
</root>
|
113
|
-
eoxml
|
114
|
-
|
115
|
-
assert @parser.document.start_elements_namespace.length > 0
|
116
|
-
el = @parser.document.start_elements_namespace[1]
|
117
|
-
assert_equal 'a', el.first
|
118
|
-
assert_equal 1, el[1].length
|
119
|
-
|
120
|
-
attribute = el[1].first
|
121
|
-
assert_equal 'bar', attribute.localname
|
122
|
-
assert_equal 'foo', attribute.prefix
|
123
|
-
assert_equal 'hello', attribute.value
|
124
|
-
assert_equal 'http://foo.example.com/', attribute.uri
|
125
|
-
end
|
126
|
-
|
127
|
-
def test_sax_v1_namespace_attribute_declarations
|
128
|
-
@parser.parse <<-eoxml
|
129
|
-
<root xmlns:foo='http://foo.example.com/' xmlns='http://example.com/'>
|
130
|
-
<a foo:bar='hello' />
|
131
|
-
<b xmlns:foo='http://bar.example.com/'>
|
132
|
-
<a foo:bar='hello' />
|
133
|
-
</b>
|
134
|
-
<foo:bar>hello world</foo:bar>
|
135
|
-
</root>
|
136
|
-
eoxml
|
137
|
-
assert @parser.document.start_elements.length > 0
|
138
|
-
elm = @parser.document.start_elements.first
|
139
|
-
assert_equal 'root', elm.first
|
140
|
-
assert elm[1].include?(['xmlns:foo', 'http://foo.example.com/'])
|
141
|
-
assert elm[1].include?(['xmlns', 'http://example.com/'])
|
142
|
-
end
|
143
|
-
|
144
|
-
def test_sax_v1_namespace_nodes
|
145
|
-
@parser.parse <<-eoxml
|
146
|
-
<root xmlns:foo='http://foo.example.com/' xmlns='http://example.com/'>
|
147
|
-
<a foo:bar='hello' />
|
148
|
-
<b xmlns:foo='http://bar.example.com/'>
|
149
|
-
<a foo:bar='hello' />
|
150
|
-
</b>
|
151
|
-
<foo:bar>hello world</foo:bar>
|
152
|
-
</root>
|
153
|
-
eoxml
|
154
|
-
assert_equal 5, @parser.document.start_elements.length
|
155
|
-
assert @parser.document.start_elements.map(&:first).include?('foo:bar')
|
156
|
-
assert @parser.document.end_elements.map(&:first).include?('foo:bar')
|
157
|
-
end
|
158
|
-
|
159
|
-
def test_start_is_called_without_namespace
|
160
|
-
@parser.parse(<<-eoxml)
|
161
|
-
<root xmlns:foo='http://foo.example.com/' xmlns='http://example.com/'>
|
162
|
-
<foo:f><bar></foo:f>
|
163
|
-
</root>
|
164
|
-
eoxml
|
165
|
-
assert_equal ['root', 'foo:f', 'bar'],
|
166
|
-
@parser.document.start_elements.map(&:first)
|
167
|
-
end
|
168
|
-
|
169
|
-
def test_parser_sets_encoding
|
170
|
-
parser = XML::SAX::Parser.new(Doc.new, 'UTF-8')
|
171
|
-
assert_equal 'UTF-8', parser.encoding
|
172
|
-
end
|
173
|
-
|
174
|
-
def test_errors_set_after_parsing_bad_dom
|
175
|
-
doc = Nokogiri::XML('<foo><bar></foo>')
|
176
|
-
assert doc.errors
|
177
|
-
|
178
|
-
@parser.parse('<foo><bar></foo>')
|
179
|
-
assert @parser.document.errors
|
180
|
-
assert @parser.document.errors.length > 0
|
181
|
-
|
182
|
-
doc.errors.each do |error|
|
183
|
-
assert_equal 'UTF-8', error.message.encoding.name
|
184
|
-
end
|
185
|
-
|
186
|
-
# when using JRuby Nokogiri, more errors will be generated as the DOM
|
187
|
-
# parser continue to parse an ill formed document, while the sax parser
|
188
|
-
# will stop at the first error
|
189
|
-
unless Nokogiri.jruby?
|
190
|
-
assert_equal doc.errors.length, @parser.document.errors.length
|
191
|
-
end
|
192
|
-
end
|
193
|
-
|
194
|
-
def test_parse_with_memory_argument
|
195
|
-
@parser.parse(File.read(XML_FILE))
|
196
|
-
assert(@parser.document.cdata_blocks.length > 0)
|
197
|
-
end
|
198
|
-
|
199
|
-
def test_parse_with_io_argument
|
200
|
-
File.open(XML_FILE, 'rb') { |f|
|
201
|
-
@parser.parse(f)
|
202
|
-
}
|
203
|
-
assert(@parser.document.cdata_blocks.length > 0)
|
204
|
-
end
|
205
|
-
|
206
|
-
def test_parse_io
|
207
|
-
call_parse_io_with_encoding 'UTF-8'
|
208
|
-
end
|
209
|
-
|
210
|
-
# issue #828
|
211
|
-
def test_parse_io_lower_case_encoding
|
212
|
-
call_parse_io_with_encoding 'utf-8'
|
213
|
-
end
|
214
|
-
|
215
|
-
def call_parse_io_with_encoding encoding
|
216
|
-
File.open(XML_FILE, 'rb') { |f|
|
217
|
-
@parser.parse_io(f, encoding)
|
218
|
-
}
|
219
|
-
assert(@parser.document.cdata_blocks.length > 0)
|
220
|
-
|
221
|
-
called = false
|
222
|
-
@parser.document.start_elements.flatten.each do |thing|
|
223
|
-
assert_equal 'UTF-8', thing.encoding.name
|
224
|
-
called = true
|
225
|
-
end
|
226
|
-
assert called
|
227
|
-
|
228
|
-
called = false
|
229
|
-
@parser.document.end_elements.flatten.each do |thing|
|
230
|
-
assert_equal 'UTF-8', thing.encoding.name
|
231
|
-
called = true
|
232
|
-
end
|
233
|
-
assert called
|
234
|
-
|
235
|
-
called = false
|
236
|
-
@parser.document.data.each do |thing|
|
237
|
-
assert_equal 'UTF-8', thing.encoding.name
|
238
|
-
called = true
|
239
|
-
end
|
240
|
-
assert called
|
241
|
-
|
242
|
-
called = false
|
243
|
-
@parser.document.comments.flatten.each do |thing|
|
244
|
-
assert_equal 'UTF-8', thing.encoding.name
|
245
|
-
called = true
|
246
|
-
end
|
247
|
-
assert called
|
248
|
-
|
249
|
-
called = false
|
250
|
-
@parser.document.cdata_blocks.flatten.each do |thing|
|
251
|
-
assert_equal 'UTF-8', thing.encoding.name
|
252
|
-
called = true
|
253
|
-
end
|
254
|
-
assert called
|
255
|
-
end
|
256
|
-
|
257
|
-
def test_parse_file
|
258
|
-
@parser.parse_file(XML_FILE)
|
259
|
-
|
260
|
-
assert_raises(ArgumentError) {
|
261
|
-
@parser.parse_file(nil)
|
262
|
-
}
|
263
|
-
|
264
|
-
assert_raises(Errno::ENOENT) {
|
265
|
-
@parser.parse_file('')
|
266
|
-
}
|
267
|
-
assert_raises(Errno::EISDIR) {
|
268
|
-
@parser.parse_file(File.expand_path(File.dirname(__FILE__)))
|
269
|
-
}
|
270
|
-
end
|
271
|
-
|
272
|
-
def test_render_parse_nil_param
|
273
|
-
assert_raises(ArgumentError) { @parser.parse_memory(nil) }
|
274
|
-
end
|
275
|
-
|
276
|
-
def test_bad_encoding_args
|
277
|
-
assert_raises(ArgumentError) { XML::SAX::Parser.new(Doc.new, 'not an encoding') }
|
278
|
-
assert_raises(ArgumentError) { @parser.parse_io(StringIO.new('<root/>'), 'not an encoding')}
|
279
|
-
end
|
280
|
-
|
281
|
-
def test_ctag
|
282
|
-
@parser.parse_memory(<<-eoxml)
|
283
|
-
<p id="asdfasdf">
|
284
|
-
<![CDATA[ This is a comment ]]>
|
285
|
-
Paragraph 1
|
286
|
-
</p>
|
287
|
-
eoxml
|
288
|
-
assert_equal [' This is a comment '], @parser.document.cdata_blocks
|
289
|
-
end
|
290
|
-
|
291
|
-
def test_comment
|
292
|
-
@parser.parse_memory(<<-eoxml)
|
293
|
-
<p id="asdfasdf">
|
294
|
-
<!-- This is a comment -->
|
295
|
-
Paragraph 1
|
296
|
-
</p>
|
297
|
-
eoxml
|
298
|
-
assert_equal [' This is a comment '], @parser.document.comments
|
299
|
-
end
|
300
|
-
|
301
|
-
def test_characters
|
302
|
-
@parser.parse_memory(<<-eoxml)
|
303
|
-
<p id="asdfasdf">Paragraph 1</p>
|
304
|
-
eoxml
|
305
|
-
assert_equal ['Paragraph 1'], @parser.document.data
|
306
|
-
end
|
307
|
-
|
308
|
-
def test_end_document
|
309
|
-
@parser.parse_memory(<<-eoxml)
|
310
|
-
<p id="asdfasdf">Paragraph 1</p>
|
311
|
-
eoxml
|
312
|
-
assert @parser.document.end_document_called
|
313
|
-
end
|
314
|
-
|
315
|
-
def test_end_element
|
316
|
-
@parser.parse_memory(<<-eoxml)
|
317
|
-
<p id="asdfasdf">Paragraph 1</p>
|
318
|
-
eoxml
|
319
|
-
assert_equal [["p"]],
|
320
|
-
@parser.document.end_elements
|
321
|
-
end
|
322
|
-
|
323
|
-
def test_start_element_attrs
|
324
|
-
@parser.parse_memory(<<-eoxml)
|
325
|
-
<p id="asdfasdf">Paragraph 1</p>
|
326
|
-
eoxml
|
327
|
-
assert_equal [["p", [["id", "asdfasdf"]]]],
|
328
|
-
@parser.document.start_elements
|
329
|
-
end
|
330
|
-
|
331
|
-
def test_start_element_attrs_include_namespaces
|
332
|
-
@parser.parse_memory(<<-eoxml)
|
333
|
-
<p xmlns:foo='http://foo.example.com/'>Paragraph 1</p>
|
334
|
-
eoxml
|
335
|
-
assert_equal [["p", [['xmlns:foo', 'http://foo.example.com/']]]],
|
336
|
-
@parser.document.start_elements
|
337
|
-
end
|
338
|
-
|
339
|
-
def test_processing_instruction
|
340
|
-
@parser.parse_memory(<<-eoxml)
|
341
|
-
<?xml-stylesheet href="a.xsl" type="text/xsl"?>
|
342
|
-
<?xml version="1.0"?>
|
343
|
-
eoxml
|
344
|
-
assert_equal [['xml-stylesheet', 'href="a.xsl" type="text/xsl"']],
|
345
|
-
@parser.document.processing_instructions
|
346
|
-
end
|
347
|
-
|
348
|
-
if Nokogiri.uses_libxml? # JRuby SAXParser only parses well-formed XML documents
|
349
|
-
def test_parse_document
|
350
|
-
@parser.parse_memory(<<-eoxml)
|
351
|
-
<p>Paragraph 1</p>
|
352
|
-
<p>Paragraph 2</p>
|
353
|
-
eoxml
|
354
|
-
end
|
355
|
-
end
|
356
|
-
|
357
|
-
def test_parser_attributes
|
358
|
-
xml = <<-eoxml
|
359
|
-
<?xml version="1.0" ?><root><foo a="&b" c=">d" /></root>
|
360
|
-
eoxml
|
361
|
-
|
362
|
-
block_called = false
|
363
|
-
@parser.parse(xml) { |ctx|
|
364
|
-
block_called = true
|
365
|
-
ctx.replace_entities = true
|
366
|
-
}
|
367
|
-
|
368
|
-
assert block_called
|
369
|
-
|
370
|
-
assert_equal [['root', []], ['foo', [['a', '&b'], ['c', '>d']]]], @parser.document.start_elements
|
371
|
-
end
|
372
|
-
|
373
|
-
def test_recovery_from_incorrect_xml
|
374
|
-
xml = <<-eoxml
|
375
|
-
<?xml version="1.0" ?><Root><Data><?xml version='1.0'?><Item>hey</Item></Data><Data><Item>hey yourself</Item></Data></Root>
|
376
|
-
eoxml
|
377
|
-
|
378
|
-
block_called = false
|
379
|
-
@parser.parse(xml) { |ctx|
|
380
|
-
block_called = true
|
381
|
-
ctx.recovery = true
|
382
|
-
}
|
383
|
-
|
384
|
-
assert block_called
|
385
|
-
|
386
|
-
assert_equal [['Root', []], ['Data', []], ['Item', []], ['Data', []], ['Item', []]], @parser.document.start_elements
|
387
|
-
end
|
388
|
-
|
389
|
-
def test_square_bracket_in_text # issue 1261
|
390
|
-
xml = <<-eoxml
|
391
|
-
<tu tuid="87dea04cf60af103ff09d1dba36ae820" segtype="block">
|
392
|
-
<prop type="x-smartling-string-variant">en:#:home_page:#:stories:#:[6]:#:name</prop>
|
393
|
-
<tuv xml:lang="en-US"><seg>Sandy S.</seg></tuv>
|
394
|
-
</tu>
|
395
|
-
eoxml
|
396
|
-
@parser.parse(xml)
|
397
|
-
assert @parser.document.data.must_include "en:#:home_page:#:stories:#:[6]:#:name"
|
398
|
-
end
|
399
|
-
end
|
400
|
-
end
|
401
|
-
end
|
402
|
-
end
|
@@ -1,115 +0,0 @@
|
|
1
|
-
# -*- coding: utf-8 -*-
|
2
|
-
|
3
|
-
require "helper"
|
4
|
-
|
5
|
-
module Nokogiri
|
6
|
-
module XML
|
7
|
-
module SAX
|
8
|
-
class TestParserContext < Nokogiri::SAX::TestCase
|
9
|
-
def setup
|
10
|
-
@xml = '<hello>
|
11
|
-
|
12
|
-
world
|
13
|
-
<inter>
|
14
|
-
<net>
|
15
|
-
</net>
|
16
|
-
</inter>
|
17
|
-
|
18
|
-
</hello>'
|
19
|
-
end
|
20
|
-
|
21
|
-
class Counter < Nokogiri::XML::SAX::Document
|
22
|
-
attr_accessor :context, :lines, :columns
|
23
|
-
def initialize
|
24
|
-
@context = nil
|
25
|
-
@lines = []
|
26
|
-
@columns = []
|
27
|
-
end
|
28
|
-
|
29
|
-
def start_element name, attrs = []
|
30
|
-
@lines << [name, context.line]
|
31
|
-
@columns << [name, context.column]
|
32
|
-
end
|
33
|
-
end
|
34
|
-
|
35
|
-
def test_line_numbers
|
36
|
-
sax_handler = Counter.new
|
37
|
-
|
38
|
-
parser = Nokogiri::XML::SAX::Parser.new(sax_handler)
|
39
|
-
parser.parse(@xml) do |ctx|
|
40
|
-
sax_handler.context = ctx
|
41
|
-
end
|
42
|
-
|
43
|
-
assert_equal [["hello", 1], ["inter", 4], ["net", 5]],
|
44
|
-
sax_handler.lines
|
45
|
-
end
|
46
|
-
|
47
|
-
def test_column_numbers
|
48
|
-
sax_handler = Counter.new
|
49
|
-
|
50
|
-
parser = Nokogiri::XML::SAX::Parser.new(sax_handler)
|
51
|
-
parser.parse(@xml) do |ctx|
|
52
|
-
sax_handler.context = ctx
|
53
|
-
end
|
54
|
-
|
55
|
-
assert_equal [["hello", 7], ["inter", 7], ["net", 9]],
|
56
|
-
sax_handler.columns
|
57
|
-
end
|
58
|
-
|
59
|
-
def test_replace_entities
|
60
|
-
pc = ParserContext.new StringIO.new('<root />'), 'UTF-8'
|
61
|
-
pc.replace_entities = false
|
62
|
-
assert_equal false, pc.replace_entities
|
63
|
-
|
64
|
-
pc.replace_entities = true
|
65
|
-
assert_equal true, pc.replace_entities
|
66
|
-
end
|
67
|
-
|
68
|
-
def test_recovery
|
69
|
-
pc = ParserContext.new StringIO.new('<root />'), 'UTF-8'
|
70
|
-
pc.recovery = false
|
71
|
-
assert_equal false, pc.recovery
|
72
|
-
|
73
|
-
pc.recovery = true
|
74
|
-
assert_equal true, pc.recovery
|
75
|
-
end
|
76
|
-
|
77
|
-
def test_from_io
|
78
|
-
ctx = ParserContext.new StringIO.new('fo'), 'UTF-8'
|
79
|
-
assert ctx
|
80
|
-
end
|
81
|
-
|
82
|
-
def test_from_string
|
83
|
-
assert ParserContext.new 'blah blah'
|
84
|
-
end
|
85
|
-
|
86
|
-
def test_parse_with
|
87
|
-
ctx = ParserContext.new 'blah'
|
88
|
-
assert_raises ArgumentError do
|
89
|
-
ctx.parse_with nil
|
90
|
-
end
|
91
|
-
end
|
92
|
-
|
93
|
-
def test_parse_with_sax_parser
|
94
|
-
xml = "<root />"
|
95
|
-
ctx = ParserContext.new xml
|
96
|
-
parser = Parser.new Doc.new
|
97
|
-
assert_nil ctx.parse_with parser
|
98
|
-
end
|
99
|
-
|
100
|
-
def test_from_file
|
101
|
-
ctx = ParserContext.file XML_FILE
|
102
|
-
parser = Parser.new Doc.new
|
103
|
-
assert_nil ctx.parse_with parser
|
104
|
-
end
|
105
|
-
|
106
|
-
def test_parse_with_returns_nil
|
107
|
-
xml = "<root />"
|
108
|
-
ctx = ParserContext.new xml
|
109
|
-
parser = Parser.new Doc.new
|
110
|
-
assert_nil ctx.parse_with(parser)
|
111
|
-
end
|
112
|
-
end
|
113
|
-
end
|
114
|
-
end
|
115
|
-
end
|