rubyjedi-nokogiri_java 1.4.0.20100513161003-java
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- data/.autotest +26 -0
- data/CHANGELOG.ja.rdoc +330 -0
- data/CHANGELOG.rdoc +341 -0
- data/Manifest.txt +277 -0
- data/README.ja.rdoc +105 -0
- data/README.rdoc +125 -0
- data/Rakefile +307 -0
- data/bin/nokogiri +49 -0
- data/deps.rip +5 -0
- data/ext/nokogiri/extconf.rb +149 -0
- data/ext/nokogiri/html_document.c +145 -0
- data/ext/nokogiri/html_document.h +10 -0
- data/ext/nokogiri/html_element_description.c +272 -0
- data/ext/nokogiri/html_element_description.h +10 -0
- data/ext/nokogiri/html_entity_lookup.c +32 -0
- data/ext/nokogiri/html_entity_lookup.h +8 -0
- data/ext/nokogiri/html_sax_parser_context.c +92 -0
- data/ext/nokogiri/html_sax_parser_context.h +11 -0
- data/ext/nokogiri/nokogiri.c +96 -0
- data/ext/nokogiri/nokogiri.h +148 -0
- data/ext/nokogiri/xml_attr.c +92 -0
- data/ext/nokogiri/xml_attr.h +9 -0
- data/ext/nokogiri/xml_attribute_decl.c +67 -0
- data/ext/nokogiri/xml_attribute_decl.h +9 -0
- data/ext/nokogiri/xml_cdata.c +54 -0
- data/ext/nokogiri/xml_cdata.h +9 -0
- data/ext/nokogiri/xml_comment.c +52 -0
- data/ext/nokogiri/xml_comment.h +9 -0
- data/ext/nokogiri/xml_document.c +386 -0
- data/ext/nokogiri/xml_document.h +24 -0
- data/ext/nokogiri/xml_document_fragment.c +46 -0
- data/ext/nokogiri/xml_document_fragment.h +10 -0
- data/ext/nokogiri/xml_dtd.c +192 -0
- data/ext/nokogiri/xml_dtd.h +10 -0
- data/ext/nokogiri/xml_element_content.c +123 -0
- data/ext/nokogiri/xml_element_content.h +10 -0
- data/ext/nokogiri/xml_element_decl.c +69 -0
- data/ext/nokogiri/xml_element_decl.h +9 -0
- data/ext/nokogiri/xml_encoding_handler.c +79 -0
- data/ext/nokogiri/xml_encoding_handler.h +8 -0
- data/ext/nokogiri/xml_entity_decl.c +97 -0
- data/ext/nokogiri/xml_entity_decl.h +10 -0
- data/ext/nokogiri/xml_entity_reference.c +50 -0
- data/ext/nokogiri/xml_entity_reference.h +9 -0
- data/ext/nokogiri/xml_io.c +31 -0
- data/ext/nokogiri/xml_io.h +11 -0
- data/ext/nokogiri/xml_namespace.c +82 -0
- data/ext/nokogiri/xml_namespace.h +13 -0
- data/ext/nokogiri/xml_node.c +1080 -0
- data/ext/nokogiri/xml_node.h +13 -0
- data/ext/nokogiri/xml_node_set.c +405 -0
- data/ext/nokogiri/xml_node_set.h +9 -0
- data/ext/nokogiri/xml_processing_instruction.c +54 -0
- data/ext/nokogiri/xml_processing_instruction.h +9 -0
- data/ext/nokogiri/xml_reader.c +593 -0
- data/ext/nokogiri/xml_reader.h +10 -0
- data/ext/nokogiri/xml_relax_ng.c +159 -0
- data/ext/nokogiri/xml_relax_ng.h +9 -0
- data/ext/nokogiri/xml_sax_parser.c +283 -0
- data/ext/nokogiri/xml_sax_parser.h +43 -0
- data/ext/nokogiri/xml_sax_parser_context.c +157 -0
- data/ext/nokogiri/xml_sax_parser_context.h +10 -0
- data/ext/nokogiri/xml_sax_push_parser.c +114 -0
- data/ext/nokogiri/xml_sax_push_parser.h +9 -0
- data/ext/nokogiri/xml_schema.c +156 -0
- data/ext/nokogiri/xml_schema.h +9 -0
- data/ext/nokogiri/xml_syntax_error.c +52 -0
- data/ext/nokogiri/xml_syntax_error.h +13 -0
- data/ext/nokogiri/xml_text.c +48 -0
- data/ext/nokogiri/xml_text.h +9 -0
- data/ext/nokogiri/xml_xpath.c +53 -0
- data/ext/nokogiri/xml_xpath.h +11 -0
- data/ext/nokogiri/xml_xpath_context.c +239 -0
- data/ext/nokogiri/xml_xpath_context.h +9 -0
- data/ext/nokogiri/xslt_stylesheet.c +131 -0
- data/ext/nokogiri/xslt_stylesheet.h +9 -0
- data/lib/isorelax.jar +0 -0
- data/lib/jing.jar +0 -0
- data/lib/nekodtd.jar +0 -0
- data/lib/nekohtml.jar +0 -0
- data/lib/nokogiri.rb +123 -0
- data/lib/nokogiri/css.rb +25 -0
- data/lib/nokogiri/css/generated_parser.rb +659 -0
- data/lib/nokogiri/css/generated_tokenizer.rb +145 -0
- data/lib/nokogiri/css/node.rb +99 -0
- data/lib/nokogiri/css/parser.rb +82 -0
- data/lib/nokogiri/css/parser.y +230 -0
- data/lib/nokogiri/css/syntax_error.rb +7 -0
- data/lib/nokogiri/css/tokenizer.rb +7 -0
- data/lib/nokogiri/css/tokenizer.rex +55 -0
- data/lib/nokogiri/css/xpath_visitor.rb +164 -0
- data/lib/nokogiri/decorators/slop.rb +33 -0
- data/lib/nokogiri/ffi/encoding_handler.rb +42 -0
- data/lib/nokogiri/ffi/html/document.rb +28 -0
- data/lib/nokogiri/ffi/html/element_description.rb +81 -0
- data/lib/nokogiri/ffi/html/entity_lookup.rb +16 -0
- data/lib/nokogiri/ffi/html/sax/parser_context.rb +38 -0
- data/lib/nokogiri/ffi/io_callbacks.rb +42 -0
- data/lib/nokogiri/ffi/libxml.rb +372 -0
- data/lib/nokogiri/ffi/structs/common_node.rb +26 -0
- data/lib/nokogiri/ffi/structs/html_elem_desc.rb +24 -0
- data/lib/nokogiri/ffi/structs/html_entity_desc.rb +13 -0
- data/lib/nokogiri/ffi/structs/xml_alloc.rb +16 -0
- data/lib/nokogiri/ffi/structs/xml_attr.rb +19 -0
- data/lib/nokogiri/ffi/structs/xml_attribute.rb +27 -0
- data/lib/nokogiri/ffi/structs/xml_buffer.rb +16 -0
- data/lib/nokogiri/ffi/structs/xml_char_encoding_handler.rb +11 -0
- data/lib/nokogiri/ffi/structs/xml_document.rb +108 -0
- data/lib/nokogiri/ffi/structs/xml_dtd.rb +28 -0
- data/lib/nokogiri/ffi/structs/xml_element.rb +26 -0
- data/lib/nokogiri/ffi/structs/xml_element_content.rb +17 -0
- data/lib/nokogiri/ffi/structs/xml_entity.rb +32 -0
- data/lib/nokogiri/ffi/structs/xml_enumeration.rb +12 -0
- data/lib/nokogiri/ffi/structs/xml_node.rb +28 -0
- data/lib/nokogiri/ffi/structs/xml_node_set.rb +53 -0
- data/lib/nokogiri/ffi/structs/xml_notation.rb +11 -0
- data/lib/nokogiri/ffi/structs/xml_ns.rb +15 -0
- data/lib/nokogiri/ffi/structs/xml_parser_context.rb +19 -0
- data/lib/nokogiri/ffi/structs/xml_relax_ng.rb +14 -0
- data/lib/nokogiri/ffi/structs/xml_sax_handler.rb +51 -0
- data/lib/nokogiri/ffi/structs/xml_sax_push_parser_context.rb +124 -0
- data/lib/nokogiri/ffi/structs/xml_schema.rb +13 -0
- data/lib/nokogiri/ffi/structs/xml_syntax_error.rb +31 -0
- data/lib/nokogiri/ffi/structs/xml_text_reader.rb +12 -0
- data/lib/nokogiri/ffi/structs/xml_xpath_context.rb +37 -0
- data/lib/nokogiri/ffi/structs/xml_xpath_object.rb +35 -0
- data/lib/nokogiri/ffi/structs/xml_xpath_parser_context.rb +20 -0
- data/lib/nokogiri/ffi/structs/xslt_stylesheet.rb +13 -0
- data/lib/nokogiri/ffi/xml/attr.rb +41 -0
- data/lib/nokogiri/ffi/xml/attribute_decl.rb +27 -0
- data/lib/nokogiri/ffi/xml/cdata.rb +19 -0
- data/lib/nokogiri/ffi/xml/comment.rb +18 -0
- data/lib/nokogiri/ffi/xml/document.rb +135 -0
- data/lib/nokogiri/ffi/xml/document_fragment.rb +21 -0
- data/lib/nokogiri/ffi/xml/dtd.rb +67 -0
- data/lib/nokogiri/ffi/xml/element_content.rb +43 -0
- data/lib/nokogiri/ffi/xml/element_decl.rb +19 -0
- data/lib/nokogiri/ffi/xml/entity_decl.rb +27 -0
- data/lib/nokogiri/ffi/xml/entity_reference.rb +19 -0
- data/lib/nokogiri/ffi/xml/namespace.rb +44 -0
- data/lib/nokogiri/ffi/xml/node.rb +465 -0
- data/lib/nokogiri/ffi/xml/node_set.rb +146 -0
- data/lib/nokogiri/ffi/xml/processing_instruction.rb +20 -0
- data/lib/nokogiri/ffi/xml/reader.rb +227 -0
- data/lib/nokogiri/ffi/xml/relax_ng.rb +85 -0
- data/lib/nokogiri/ffi/xml/sax/parser.rb +135 -0
- data/lib/nokogiri/ffi/xml/sax/parser_context.rb +67 -0
- data/lib/nokogiri/ffi/xml/sax/push_parser.rb +55 -0
- data/lib/nokogiri/ffi/xml/schema.rb +92 -0
- data/lib/nokogiri/ffi/xml/syntax_error.rb +98 -0
- data/lib/nokogiri/ffi/xml/text.rb +18 -0
- data/lib/nokogiri/ffi/xml/xpath.rb +19 -0
- data/lib/nokogiri/ffi/xml/xpath_context.rb +135 -0
- data/lib/nokogiri/ffi/xslt/stylesheet.rb +50 -0
- data/lib/nokogiri/html.rb +36 -0
- data/lib/nokogiri/html/builder.rb +35 -0
- data/lib/nokogiri/html/document.rb +88 -0
- data/lib/nokogiri/html/document_fragment.rb +15 -0
- data/lib/nokogiri/html/element_description.rb +23 -0
- data/lib/nokogiri/html/element_description_defaults.rb +671 -0
- data/lib/nokogiri/html/entity_lookup.rb +13 -0
- data/lib/nokogiri/html/sax/parser.rb +48 -0
- data/lib/nokogiri/html/sax/parser_context.rb +16 -0
- data/lib/nokogiri/nokogiri.jar +0 -0
- data/lib/nokogiri/syntax_error.rb +4 -0
- data/lib/nokogiri/version.rb +33 -0
- data/lib/nokogiri/version_warning.rb +11 -0
- data/lib/nokogiri/xml.rb +67 -0
- data/lib/nokogiri/xml/attr.rb +14 -0
- data/lib/nokogiri/xml/attribute_decl.rb +18 -0
- data/lib/nokogiri/xml/builder.rb +405 -0
- data/lib/nokogiri/xml/cdata.rb +11 -0
- data/lib/nokogiri/xml/character_data.rb +7 -0
- data/lib/nokogiri/xml/document.rb +163 -0
- data/lib/nokogiri/xml/document_fragment.rb +73 -0
- data/lib/nokogiri/xml/dtd.rb +11 -0
- data/lib/nokogiri/xml/element_content.rb +36 -0
- data/lib/nokogiri/xml/element_decl.rb +13 -0
- data/lib/nokogiri/xml/entity_decl.rb +15 -0
- data/lib/nokogiri/xml/fragment_handler.rb +73 -0
- data/lib/nokogiri/xml/namespace.rb +13 -0
- data/lib/nokogiri/xml/node.rb +730 -0
- data/lib/nokogiri/xml/node/save_options.rb +42 -0
- data/lib/nokogiri/xml/node_set.rb +318 -0
- data/lib/nokogiri/xml/notation.rb +6 -0
- data/lib/nokogiri/xml/parse_options.rb +85 -0
- data/lib/nokogiri/xml/pp.rb +2 -0
- data/lib/nokogiri/xml/pp/character_data.rb +18 -0
- data/lib/nokogiri/xml/pp/node.rb +56 -0
- data/lib/nokogiri/xml/processing_instruction.rb +8 -0
- data/lib/nokogiri/xml/reader.rb +74 -0
- data/lib/nokogiri/xml/relax_ng.rb +32 -0
- data/lib/nokogiri/xml/sax.rb +4 -0
- data/lib/nokogiri/xml/sax/document.rb +160 -0
- data/lib/nokogiri/xml/sax/parser.rb +115 -0
- data/lib/nokogiri/xml/sax/parser_context.rb +16 -0
- data/lib/nokogiri/xml/sax/push_parser.rb +60 -0
- data/lib/nokogiri/xml/schema.rb +61 -0
- data/lib/nokogiri/xml/syntax_error.rb +43 -0
- data/lib/nokogiri/xml/xpath.rb +10 -0
- data/lib/nokogiri/xml/xpath/syntax_error.rb +8 -0
- data/lib/nokogiri/xml/xpath_context.rb +16 -0
- data/lib/nokogiri/xslt.rb +48 -0
- data/lib/nokogiri/xslt/stylesheet.rb +25 -0
- data/lib/xercesImpl.jar +0 -0
- data/lib/xsd/xmlparser/nokogiri.rb +90 -0
- data/tasks/test.rb +100 -0
- data/test/css/test_nthiness.rb +159 -0
- data/test/css/test_parser.rb +282 -0
- data/test/css/test_tokenizer.rb +190 -0
- data/test/css/test_xpath_visitor.rb +76 -0
- data/test/ffi/test_document.rb +35 -0
- data/test/files/2ch.html +108 -0
- data/test/files/address_book.rlx +12 -0
- data/test/files/address_book.xml +10 -0
- data/test/files/bar/bar.xsd +4 -0
- data/test/files/dont_hurt_em_why.xml +422 -0
- data/test/files/exslt.xml +8 -0
- data/test/files/exslt.xslt +35 -0
- data/test/files/foo/foo.xsd +4 -0
- data/test/files/po.xml +32 -0
- data/test/files/po.xsd +66 -0
- data/test/files/shift_jis.html +10 -0
- data/test/files/shift_jis.xml +5 -0
- data/test/files/snuggles.xml +3 -0
- data/test/files/staff.dtd +10 -0
- data/test/files/staff.xml +59 -0
- data/test/files/staff.xslt +32 -0
- data/test/files/tlm.html +850 -0
- data/test/files/valid_bar.xml +2 -0
- data/test/helper.rb +137 -0
- data/test/html/sax/test_parser.rb +83 -0
- data/test/html/sax/test_parser_context.rb +48 -0
- data/test/html/test_builder.rb +164 -0
- data/test/html/test_document.rb +385 -0
- data/test/html/test_document_encoding.rb +77 -0
- data/test/html/test_document_fragment.rb +157 -0
- data/test/html/test_element_description.rb +98 -0
- data/test/html/test_named_characters.rb +14 -0
- data/test/html/test_node.rb +242 -0
- data/test/html/test_node_encoding.rb +27 -0
- data/test/test_convert_xpath.rb +135 -0
- data/test/test_css_cache.rb +45 -0
- data/test/test_encoding_handler.rb +46 -0
- data/test/test_jruby.rb +40 -0
- data/test/test_memory_leak.rb +87 -0
- data/test/test_nokogiri.rb +140 -0
- data/test/test_reader.rb +358 -0
- data/test/test_soap4r_sax.rb +52 -0
- data/test/test_xslt_transforms.rb +150 -0
- data/test/xml/node/test_save_options.rb +20 -0
- data/test/xml/node/test_subclass.rb +44 -0
- data/test/xml/sax/test_parser.rb +314 -0
- data/test/xml/sax/test_parser_context.rb +63 -0
- data/test/xml/sax/test_push_parser.rb +135 -0
- data/test/xml/test_attr.rb +38 -0
- data/test/xml/test_attribute_decl.rb +90 -0
- data/test/xml/test_builder.rb +167 -0
- data/test/xml/test_cdata.rb +38 -0
- data/test/xml/test_comment.rb +29 -0
- data/test/xml/test_document.rb +638 -0
- data/test/xml/test_document_encoding.rb +26 -0
- data/test/xml/test_document_fragment.rb +149 -0
- data/test/xml/test_dtd.rb +92 -0
- data/test/xml/test_dtd_encoding.rb +33 -0
- data/test/xml/test_element_content.rb +56 -0
- data/test/xml/test_element_decl.rb +73 -0
- data/test/xml/test_entity_decl.rb +83 -0
- data/test/xml/test_entity_reference.rb +21 -0
- data/test/xml/test_namespace.rb +70 -0
- data/test/xml/test_node.rb +740 -0
- data/test/xml/test_node_attributes.rb +34 -0
- data/test/xml/test_node_encoding.rb +107 -0
- data/test/xml/test_node_reparenting.rb +279 -0
- data/test/xml/test_node_set.rb +577 -0
- data/test/xml/test_parse_options.rb +52 -0
- data/test/xml/test_processing_instruction.rb +30 -0
- data/test/xml/test_reader_encoding.rb +126 -0
- data/test/xml/test_relax_ng.rb +60 -0
- data/test/xml/test_schema.rb +89 -0
- data/test/xml/test_syntax_error.rb +12 -0
- data/test/xml/test_text.rb +30 -0
- data/test/xml/test_unparented_node.rb +381 -0
- data/test/xml/test_xpath.rb +169 -0
- metadata +477 -0
@@ -0,0 +1,27 @@
|
|
1
|
+
# -*- coding: utf-8 -*-
|
2
|
+
require "helper"
|
3
|
+
|
4
|
+
module Nokogiri
|
5
|
+
module HTML
|
6
|
+
if RUBY_VERSION =~ /^1\.9/
|
7
|
+
class TestNodeEncoding < Nokogiri::TestCase
|
8
|
+
def test_inner_html
|
9
|
+
doc = Nokogiri::HTML File.open(SHIFT_JIS_HTML, 'rb')
|
10
|
+
|
11
|
+
hello = "こんにちは"
|
12
|
+
|
13
|
+
contents = doc.at('h2').inner_html
|
14
|
+
assert_equal doc.encoding, contents.encoding.name
|
15
|
+
assert_match hello.encode('Shift_JIS'), contents
|
16
|
+
|
17
|
+
contents = doc.at('h2').inner_html(:encoding => 'UTF-8')
|
18
|
+
assert_match hello, contents
|
19
|
+
|
20
|
+
doc.encoding = 'UTF-8'
|
21
|
+
contents = doc.at('h2').inner_html
|
22
|
+
assert_match hello, contents
|
23
|
+
end
|
24
|
+
end
|
25
|
+
end
|
26
|
+
end
|
27
|
+
end
|
@@ -0,0 +1,135 @@
|
|
1
|
+
require "helper"
|
2
|
+
|
3
|
+
class TestConvertXPath < Nokogiri::TestCase
|
4
|
+
|
5
|
+
def setup
|
6
|
+
super
|
7
|
+
@N = Nokogiri(File.read(HTML_FILE))
|
8
|
+
end
|
9
|
+
|
10
|
+
def assert_syntactical_equivalence(hpath, xpath, match, &blk)
|
11
|
+
blk ||= lambda {|j| j.first}
|
12
|
+
assert_equal match, blk.call(@N.search(xpath)), "xpath result did not match"
|
13
|
+
end
|
14
|
+
|
15
|
+
def test_child_tag
|
16
|
+
assert_syntactical_equivalence("h1[a]", ".//h1[child::a]", "Tender Lovemaking") do |j|
|
17
|
+
j.inner_text
|
18
|
+
end
|
19
|
+
end
|
20
|
+
|
21
|
+
def test_child_tag_equals
|
22
|
+
assert_syntactical_equivalence("h1[a='Tender Lovemaking']", ".//h1[child::a = 'Tender Lovemaking']", "Tender Lovemaking") do |j|
|
23
|
+
j.inner_text
|
24
|
+
end
|
25
|
+
end
|
26
|
+
|
27
|
+
def test_filter_contains
|
28
|
+
assert_syntactical_equivalence("title:contains('Tender')", ".//title[contains(., 'Tender')]",
|
29
|
+
"Tender Lovemaking ") do |j|
|
30
|
+
j.inner_text
|
31
|
+
end
|
32
|
+
end
|
33
|
+
|
34
|
+
def test_filter_comment
|
35
|
+
assert_syntactical_equivalence("div comment()[2]", ".//div//comment()[position() = 2]", "<!-- end of header -->") do |j|
|
36
|
+
j.first.to_s
|
37
|
+
end
|
38
|
+
end
|
39
|
+
|
40
|
+
def test_filter_text
|
41
|
+
assert_syntactical_equivalence("a[text()]", ".//a[normalize-space(child::text())]", "<a href=\"http://tenderlovemaking.com\">Tender Lovemaking</a>") do |j|
|
42
|
+
j.first.to_s
|
43
|
+
end
|
44
|
+
assert_syntactical_equivalence("a[text()='Tender Lovemaking']", ".//a[normalize-space(child::text()) = 'Tender Lovemaking']", "<a href=\"http://tenderlovemaking.com\">Tender Lovemaking</a>") do |j|
|
45
|
+
j.first.to_s
|
46
|
+
end
|
47
|
+
assert_syntactical_equivalence("a/text()", ".//a/child::text()", "Tender Lovemaking") do |j|
|
48
|
+
j.first.to_s
|
49
|
+
end
|
50
|
+
assert_syntactical_equivalence("h2//a[text()!='Back Home!']", ".//h2//a[normalize-space(child::text()) != 'Back Home!']", "Meow meow meow meow meow") do |j|
|
51
|
+
j.first.inner_text
|
52
|
+
end
|
53
|
+
end
|
54
|
+
|
55
|
+
def test_filter_by_attr
|
56
|
+
assert_syntactical_equivalence("a[@href='http://blog.geminigeek.com/wordpress-theme']",
|
57
|
+
".//a[@href = 'http://blog.geminigeek.com/wordpress-theme']",
|
58
|
+
"http://blog.geminigeek.com/wordpress-theme") do |j|
|
59
|
+
j.first["href"]
|
60
|
+
end
|
61
|
+
end
|
62
|
+
|
63
|
+
def test_css_id
|
64
|
+
assert_syntactical_equivalence("#linkcat-7", ".//*[@id = 'linkcat-7']", "linkcat-7") do |j|
|
65
|
+
j.first["id"]
|
66
|
+
end
|
67
|
+
assert_syntactical_equivalence("li#linkcat-7", ".//li[@id = 'linkcat-7']", "linkcat-7") do |j|
|
68
|
+
j.first["id"]
|
69
|
+
end
|
70
|
+
end
|
71
|
+
|
72
|
+
def test_css_class
|
73
|
+
assert_syntactical_equivalence(".cat-item-15", ".//*[contains(concat(' ', @class, ' '), ' cat-item-15 ')]",
|
74
|
+
"cat-item cat-item-15") do |j|
|
75
|
+
j.first["class"]
|
76
|
+
end
|
77
|
+
assert_syntactical_equivalence("li.cat-item-15", ".//li[contains(concat(' ', @class, ' '), ' cat-item-15 ')]",
|
78
|
+
"cat-item cat-item-15") do |j|
|
79
|
+
j.first["class"]
|
80
|
+
end
|
81
|
+
end
|
82
|
+
|
83
|
+
def test_css_tags
|
84
|
+
assert_syntactical_equivalence("div li a", ".//div//li//a", "http://brobinius.org/") do |j|
|
85
|
+
j.first.inner_text
|
86
|
+
end
|
87
|
+
assert_syntactical_equivalence("div li > a", ".//div//li/a", "http://brobinius.org/") do |j|
|
88
|
+
j.first.inner_text
|
89
|
+
end
|
90
|
+
assert_syntactical_equivalence("h1 ~ small", ".//small[preceding-sibling::h1]", "The act of making love, tenderly.") do |j|
|
91
|
+
j.first.inner_text
|
92
|
+
end
|
93
|
+
assert_syntactical_equivalence("h1 ~ small", ".//small[preceding-sibling::h1]", "The act of making love, tenderly.") do |j|
|
94
|
+
j.first.inner_text
|
95
|
+
end
|
96
|
+
end
|
97
|
+
|
98
|
+
def test_positional
|
99
|
+
assert_syntactical_equivalence("div/div:first()", ".//div/div[position() = 1]", "\r\nTender Lovemaking\r\nThe act of making love, tenderly.\r\n".gsub(/[\r\n]/, '')) do |j|
|
100
|
+
j.first.inner_text.gsub(/[\r\n]/, '')
|
101
|
+
end
|
102
|
+
assert_syntactical_equivalence("div/div:first", ".//div/div[position() = 1]", "\r\nTender Lovemaking\r\nThe act of making love, tenderly.\r\n".gsub(/[\r\n]/, '')) do |j|
|
103
|
+
j.first.inner_text.gsub(/[\r\n]/, '')
|
104
|
+
end
|
105
|
+
assert_syntactical_equivalence("div//a:last()", ".//div//a[position() = last()]", "Wordpress") do |j|
|
106
|
+
j.last.inner_text
|
107
|
+
end
|
108
|
+
assert_syntactical_equivalence("div//a:last", ".//div//a[position() = last()]", "Wordpress") do |j|
|
109
|
+
j.last.inner_text
|
110
|
+
end
|
111
|
+
end
|
112
|
+
|
113
|
+
def test_multiple_filters
|
114
|
+
assert_syntactical_equivalence("a[@rel='bookmark'][1]", ".//a[@rel = 'bookmark' and position() = 1]", "Back Home!") do |j|
|
115
|
+
j.first.inner_text
|
116
|
+
end
|
117
|
+
end
|
118
|
+
|
119
|
+
# TODO:
|
120
|
+
# doc/'title ~ link' -> links that are siblings of title
|
121
|
+
# doc/'p[@class~="final"]' -> class includes string (whitespacy)
|
122
|
+
# doc/'p[text()*="final"]' -> class includes string (index) (broken: always returns true?)
|
123
|
+
# doc/'p[text()$="final"]' -> /final$/
|
124
|
+
# doc/'p[text()|="final"]' -> /^final$/
|
125
|
+
# doc/'p[text()^="final"]' -> string starts with 'final
|
126
|
+
# nth_first
|
127
|
+
# nth_last
|
128
|
+
# even
|
129
|
+
# odd
|
130
|
+
# first-child, nth-child, last-child, nth-last-child, nth-last-of-type
|
131
|
+
# only-of-type, only-child
|
132
|
+
# parent
|
133
|
+
# empty
|
134
|
+
# root
|
135
|
+
end
|
@@ -0,0 +1,45 @@
|
|
1
|
+
require "helper"
|
2
|
+
|
3
|
+
class TestCssCache < Nokogiri::TestCase
|
4
|
+
|
5
|
+
def setup
|
6
|
+
super
|
7
|
+
@css = "a1 > b2 > c3"
|
8
|
+
@parse_result = Nokogiri::CSS.parse(@css)
|
9
|
+
@to_xpath_result = @parse_result.map {|ast| ast.to_xpath}
|
10
|
+
Nokogiri::CSS::Parser.class_eval do
|
11
|
+
class << @cache
|
12
|
+
alias :old_bracket :[]
|
13
|
+
attr_reader :count
|
14
|
+
def [](key)
|
15
|
+
@count ||= 0
|
16
|
+
@count += 1
|
17
|
+
old_bracket(key)
|
18
|
+
end
|
19
|
+
end
|
20
|
+
end
|
21
|
+
assert Nokogiri::CSS::Parser.cache_on?
|
22
|
+
end
|
23
|
+
|
24
|
+
def teardown
|
25
|
+
Nokogiri::CSS::Parser.clear_cache
|
26
|
+
Nokogiri::CSS::Parser.set_cache true
|
27
|
+
end
|
28
|
+
|
29
|
+
[ false, true ].each do |cache_setting|
|
30
|
+
define_method "test_css_cache_#{cache_setting ? "true" : "false"}" do
|
31
|
+
times = cache_setting ? 4 : nil
|
32
|
+
|
33
|
+
Nokogiri::CSS::Parser.set_cache cache_setting
|
34
|
+
|
35
|
+
Nokogiri::CSS.xpath_for(@css)
|
36
|
+
Nokogiri::CSS.xpath_for(@css)
|
37
|
+
Nokogiri::CSS::Parser.new.xpath_for(@css)
|
38
|
+
Nokogiri::CSS::Parser.new.xpath_for(@css)
|
39
|
+
|
40
|
+
assert_equal(times, Nokogiri::CSS::Parser.class_eval { @cache.count })
|
41
|
+
end
|
42
|
+
end
|
43
|
+
|
44
|
+
|
45
|
+
end
|
@@ -0,0 +1,46 @@
|
|
1
|
+
# -*- coding: utf-8 -*-
|
2
|
+
|
3
|
+
require "helper"
|
4
|
+
|
5
|
+
class TestEncodingHandler < Nokogiri::TestCase
|
6
|
+
def teardown
|
7
|
+
Nokogiri::EncodingHandler.clear_aliases!
|
8
|
+
end
|
9
|
+
|
10
|
+
def test_get
|
11
|
+
assert_not_nil Nokogiri::EncodingHandler['UTF-8']
|
12
|
+
assert_nil Nokogiri::EncodingHandler['alsdkjfhaldskjfh']
|
13
|
+
end
|
14
|
+
|
15
|
+
def test_name
|
16
|
+
eh = Nokogiri::EncodingHandler['UTF-8']
|
17
|
+
assert_equal "UTF-8", eh.name
|
18
|
+
end
|
19
|
+
|
20
|
+
def test_alias
|
21
|
+
Nokogiri::EncodingHandler.alias('UTF-8', 'UTF-18')
|
22
|
+
assert_equal 'UTF-8', Nokogiri::EncodingHandler['UTF-18'].name
|
23
|
+
end
|
24
|
+
|
25
|
+
def test_cleanup_aliases
|
26
|
+
assert_nil Nokogiri::EncodingHandler['UTF-9']
|
27
|
+
Nokogiri::EncodingHandler.alias('UTF-8', 'UTF-9')
|
28
|
+
assert_not_nil Nokogiri::EncodingHandler['UTF-9']
|
29
|
+
|
30
|
+
Nokogiri::EncodingHandler.clear_aliases!
|
31
|
+
assert_nil Nokogiri::EncodingHandler['UTF-9']
|
32
|
+
end
|
33
|
+
|
34
|
+
def test_delete
|
35
|
+
assert_nil Nokogiri::EncodingHandler['UTF-9']
|
36
|
+
Nokogiri::EncodingHandler.alias('UTF-8', 'UTF-9')
|
37
|
+
assert_not_nil Nokogiri::EncodingHandler['UTF-9']
|
38
|
+
|
39
|
+
Nokogiri::EncodingHandler.delete 'UTF-9'
|
40
|
+
assert_nil Nokogiri::EncodingHandler['UTF-9']
|
41
|
+
end
|
42
|
+
|
43
|
+
def test_delete_non_existent
|
44
|
+
assert_nil Nokogiri::EncodingHandler.delete('UTF-9')
|
45
|
+
end
|
46
|
+
end
|
data/test/test_jruby.rb
ADDED
@@ -0,0 +1,40 @@
|
|
1
|
+
FAILURES = 14
|
2
|
+
ERRORS = 27
|
3
|
+
ROOT_DIR = File.dirname(__FILE__)
|
4
|
+
$LOAD_PATH << ROOT_DIR
|
5
|
+
$LOAD_PATH << File.join(ROOT_DIR, '..', 'lib')
|
6
|
+
#require File.join(ROOT_DIR, 'helper')
|
7
|
+
XML_DIR = File.join(ROOT_DIR,'xml')
|
8
|
+
HTML_DIR = File.join(ROOT_DIR, 'html')
|
9
|
+
HTML_SAX_DIR = File.join(HTML_DIR, 'sax')
|
10
|
+
load File.join(ROOT_DIR, 'test_reader.rb')
|
11
|
+
load File.join(ROOT_DIR, 'test_xslt_transforms.rb')
|
12
|
+
load File.join(XML_DIR, 'test_namespace.rb')
|
13
|
+
load File.join(XML_DIR, 'test_node.rb')
|
14
|
+
load File.join(XML_DIR, 'test_node_attributes.rb')
|
15
|
+
load File.join(XML_DIR, 'test_node_set.rb')
|
16
|
+
load File.join(XML_DIR, 'test_attr.rb')
|
17
|
+
load File.join(XML_DIR, 'test_cdata.rb')
|
18
|
+
load File.join(XML_DIR, 'test_comment.rb')
|
19
|
+
load File.join(XML_DIR, 'test_document.rb')
|
20
|
+
load File.join(HTML_DIR, 'test_document.rb')
|
21
|
+
load File.join(HTML_DIR, 'test_document_fragment.rb')
|
22
|
+
load File.join(XML_DIR, 'test_text.rb')
|
23
|
+
load File.join(XML_DIR, 'test_xpath.rb')
|
24
|
+
load File.join(XML_DIR, 'test_schema.rb')
|
25
|
+
load File.join(XML_DIR, 'test_relax_ng.rb')
|
26
|
+
load File.join(HTML_SAX_DIR, 'test_parser.rb')
|
27
|
+
|
28
|
+
#suite = TestSuite.new "JRuby test"
|
29
|
+
#suite << TestReader
|
30
|
+
#suite << Nokogiri::XML::TestNamespace
|
31
|
+
#suite << Nokogiri::XML::TestNodeAttributes
|
32
|
+
|
33
|
+
# Failures and errors related to:
|
34
|
+
# · XPath
|
35
|
+
# · HTML
|
36
|
+
# · Things I don't know if I'm going to implement
|
37
|
+
#
|
38
|
+
# does not count.
|
39
|
+
# Que lo sepas.
|
40
|
+
puts '#{FAILURES} failures, #{ERRORS} errors'
|
@@ -0,0 +1,87 @@
|
|
1
|
+
require "helper"
|
2
|
+
|
3
|
+
class TestMemoryLeak < Nokogiri::TestCase
|
4
|
+
|
5
|
+
if ENV['NOKOGIRI_GC'] # turning these off by default for now
|
6
|
+
|
7
|
+
def test_dont_hurt_em_why
|
8
|
+
content = File.open("#{File.dirname(__FILE__)}/files/dont_hurt_em_why.xml").read
|
9
|
+
ndoc = Nokogiri::XML(content)
|
10
|
+
2.times do
|
11
|
+
info = ndoc.search('status text').first.inner_text
|
12
|
+
url = ndoc.search('user name').first.inner_text
|
13
|
+
GC.start
|
14
|
+
end
|
15
|
+
end
|
16
|
+
|
17
|
+
def test_for_memory_leak
|
18
|
+
begin
|
19
|
+
# we don't use Dike in any tests, but requiring it has side effects
|
20
|
+
# that can create memory leaks, and that's what we're testing for.
|
21
|
+
require 'rubygems'
|
22
|
+
require 'dike' # do not remove!
|
23
|
+
|
24
|
+
count_start = count_object_space_documents
|
25
|
+
xml_data = <<-EOS
|
26
|
+
<test>
|
27
|
+
<items>
|
28
|
+
<item>abc</item>
|
29
|
+
<item>1234</item>
|
30
|
+
<item>Zzz</item>
|
31
|
+
<items>
|
32
|
+
</test>
|
33
|
+
EOS
|
34
|
+
20.times do
|
35
|
+
doc = Nokogiri::XML(xml_data)
|
36
|
+
doc.xpath("//item")
|
37
|
+
end
|
38
|
+
2.times { GC.start }
|
39
|
+
count_end = count_object_space_documents
|
40
|
+
assert((count_end - count_start) <= 2, "memory leak detected")
|
41
|
+
rescue LoadError
|
42
|
+
puts "\ndike is not installed, skipping memory leak test"
|
43
|
+
end
|
44
|
+
end
|
45
|
+
|
46
|
+
if Nokogiri.ffi?
|
47
|
+
[ ['Node', 'p', nil],
|
48
|
+
['CDATA', nil, 'content'],
|
49
|
+
['Comment', nil, 'content'],
|
50
|
+
['DocumentFragment', nil],
|
51
|
+
['EntityReference', nil, 'p'],
|
52
|
+
['ProcessingInstruction', nil, 'p', 'content'] ].each do |klass, *args|
|
53
|
+
|
54
|
+
define_method "test_for_leaked_#{klass}_nodes" do
|
55
|
+
Nokogiri::LibXML.expects(:xmlAddChild).at_least(1) # more than once shows we're GCing properly
|
56
|
+
10.times {
|
57
|
+
xml = Nokogiri::XML("<root></root>")
|
58
|
+
2.times { Nokogiri::XML.const_get(klass).new(*(args.collect{|arg| arg || xml})) }
|
59
|
+
GC.start
|
60
|
+
}
|
61
|
+
GC.start
|
62
|
+
end
|
63
|
+
|
64
|
+
end
|
65
|
+
|
66
|
+
def test_for_leaked_attr_nodes
|
67
|
+
Nokogiri::LibXML.expects(:xmlFreePropList).at_least(1) # more than once shows we're GCing properly
|
68
|
+
10.times {
|
69
|
+
xml = Nokogiri::XML("<root></root>")
|
70
|
+
2.times { Nokogiri::XML::Attr.new(xml, "p") }
|
71
|
+
GC.start
|
72
|
+
}
|
73
|
+
GC.start
|
74
|
+
end
|
75
|
+
|
76
|
+
end # if ffi
|
77
|
+
|
78
|
+
end # if NOKOGIRI_GC
|
79
|
+
|
80
|
+
private
|
81
|
+
|
82
|
+
def count_object_space_documents
|
83
|
+
count = 0
|
84
|
+
ObjectSpace.each_object {|j| count += 1 if j.is_a?(Nokogiri::XML::Document) }
|
85
|
+
count
|
86
|
+
end
|
87
|
+
end
|
@@ -0,0 +1,140 @@
|
|
1
|
+
require "helper"
|
2
|
+
|
3
|
+
class TestNokogiri < Nokogiri::TestCase
|
4
|
+
def test_versions
|
5
|
+
version_match = /\d+\.\d+\.\d+/
|
6
|
+
assert_match version_match, Nokogiri::VERSION
|
7
|
+
assert_match version_match, Nokogiri::LIBXML_VERSION if Nokogiri.uses_libxml?
|
8
|
+
|
9
|
+
if defined?(FFI) && defined?(Nokogiri::LibXML)
|
10
|
+
assert_equal 'ffi', Nokogiri::VERSION_INFO['libxml']['binding']
|
11
|
+
if RUBY_PLATFORM =~ /java/
|
12
|
+
assert_equal 'jruby', Nokogiri::VERSION_INFO['libxml']['platform']
|
13
|
+
else
|
14
|
+
assert_equal 'ruby', Nokogiri::VERSION_INFO['libxml']['platform']
|
15
|
+
end
|
16
|
+
assert Nokogiri.ffi?
|
17
|
+
elsif Nokogiri.uses_libxml?
|
18
|
+
assert_equal 'extension', Nokogiri::VERSION_INFO['libxml']['binding']
|
19
|
+
|
20
|
+
assert_match version_match, Nokogiri::VERSION_INFO['libxml']['compiled']
|
21
|
+
assert_equal Nokogiri::LIBXML_VERSION, Nokogiri::VERSION_INFO['libxml']['compiled']
|
22
|
+
assert ! Nokogiri.ffi?
|
23
|
+
end
|
24
|
+
|
25
|
+
if Nokogiri.uses_libxml?
|
26
|
+
assert_match version_match, Nokogiri::VERSION_INFO['libxml']['loaded']
|
27
|
+
Nokogiri::LIBXML_PARSER_VERSION =~ /(\d)(\d{2})(\d{2})/
|
28
|
+
major = $1.to_i
|
29
|
+
minor = $2.to_i
|
30
|
+
bug = $3.to_i
|
31
|
+
assert_equal "#{major}.#{minor}.#{bug}", Nokogiri::VERSION_INFO['libxml']['loaded']
|
32
|
+
end
|
33
|
+
end
|
34
|
+
|
35
|
+
def test_libxml_iconv
|
36
|
+
assert Nokogiri.const_defined?(:LIBXML_ICONV_ENABLED) if Nokogiri.uses_libxml?
|
37
|
+
end
|
38
|
+
|
39
|
+
def test_parse_with_io
|
40
|
+
doc = Nokogiri.parse(
|
41
|
+
StringIO.new("<html><head><title></title><body></body></html>")
|
42
|
+
)
|
43
|
+
assert_instance_of Nokogiri::HTML::Document, doc
|
44
|
+
end
|
45
|
+
|
46
|
+
def test_xml?
|
47
|
+
doc = Nokogiri.parse(File.read(XML_FILE))
|
48
|
+
assert doc.xml?
|
49
|
+
assert !doc.html?
|
50
|
+
end
|
51
|
+
|
52
|
+
def test_html?
|
53
|
+
doc = Nokogiri.parse(File.read(HTML_FILE))
|
54
|
+
assert !doc.xml?
|
55
|
+
assert doc.html?
|
56
|
+
end
|
57
|
+
|
58
|
+
def test_nokogiri_method_with_html
|
59
|
+
doc1 = Nokogiri(File.read(HTML_FILE))
|
60
|
+
doc2 = Nokogiri.parse(File.read(HTML_FILE))
|
61
|
+
assert_equal doc1.serialize, doc2.serialize
|
62
|
+
end
|
63
|
+
|
64
|
+
def test_nokogiri_method_with_block
|
65
|
+
doc = Nokogiri { b "bold tag" }
|
66
|
+
assert_equal('<b>bold tag</b>', doc.to_html.chomp)
|
67
|
+
end
|
68
|
+
|
69
|
+
def test_make_with_html
|
70
|
+
doc = Nokogiri.make("<b>bold tag</b>")
|
71
|
+
assert_equal('<b>bold tag</b>', doc.to_html.chomp)
|
72
|
+
end
|
73
|
+
|
74
|
+
def test_make_with_block
|
75
|
+
doc = Nokogiri.make { b "bold tag" }
|
76
|
+
assert_equal('<b>bold tag</b>', doc.to_html.chomp)
|
77
|
+
end
|
78
|
+
|
79
|
+
SLOP_HTML = <<-END
|
80
|
+
<html>
|
81
|
+
<body>
|
82
|
+
<ul>
|
83
|
+
<li class='red'>one</li>
|
84
|
+
<li class='blue'>two</li>
|
85
|
+
</ul>
|
86
|
+
<div>
|
87
|
+
one
|
88
|
+
<div>div two</div>
|
89
|
+
</div>
|
90
|
+
</body>
|
91
|
+
</html>
|
92
|
+
END
|
93
|
+
|
94
|
+
def test_slop_css
|
95
|
+
doc = Nokogiri::Slop(<<-eohtml)
|
96
|
+
<html>
|
97
|
+
<body>
|
98
|
+
<div>
|
99
|
+
one
|
100
|
+
<div class='foo'>
|
101
|
+
div two
|
102
|
+
<div class='foo'>
|
103
|
+
div three
|
104
|
+
</div>
|
105
|
+
</div>
|
106
|
+
</div>
|
107
|
+
</body>
|
108
|
+
</html>
|
109
|
+
eohtml
|
110
|
+
assert_equal "div", doc.html.body.div.div('.foo').name
|
111
|
+
end
|
112
|
+
|
113
|
+
def test_slop
|
114
|
+
doc = Nokogiri::Slop(SLOP_HTML)
|
115
|
+
|
116
|
+
assert_equal "one", doc.html.body.ul.li.first.text
|
117
|
+
assert_equal "two", doc.html.body.ul.li(".blue").text
|
118
|
+
assert_equal "div two", doc.html.body.div.div.text
|
119
|
+
|
120
|
+
assert_equal "two", doc.html.body.ul.li(:css => ".blue").text
|
121
|
+
|
122
|
+
assert_equal "two", doc.html.body.ul.li(:xpath => "position()=2").text
|
123
|
+
assert_equal "one", doc.html.body.ul.li(:xpath => ["contains(text(),'o')"]).first.text
|
124
|
+
assert_equal "two", doc.html.body.ul.li(:xpath => ["contains(text(),'o')","contains(text(),'t')"]).text
|
125
|
+
|
126
|
+
assert_raise(NoMethodError) { doc.nonexistent }
|
127
|
+
end
|
128
|
+
|
129
|
+
def test_slop_decorator
|
130
|
+
doc = Nokogiri(SLOP_HTML)
|
131
|
+
assert !doc.decorators(Nokogiri::XML::Node).include?(Nokogiri::Decorators::Slop)
|
132
|
+
|
133
|
+
doc.slop!
|
134
|
+
assert doc.decorators(Nokogiri::XML::Node).include?(Nokogiri::Decorators::Slop)
|
135
|
+
|
136
|
+
doc.slop!
|
137
|
+
assert_equal 1, doc.decorators(Nokogiri::XML::Node).select { |d| d == Nokogiri::Decorators::Slop }.size
|
138
|
+
end
|
139
|
+
|
140
|
+
end
|