glebm-nokogiri 1.4.2.1
Sign up to get free protection for your applications and to get access to all the features.
- data/.autotest +26 -0
- data/CHANGELOG.ja.rdoc +411 -0
- data/CHANGELOG.rdoc +397 -0
- data/Manifest.txt +276 -0
- data/README.ja.rdoc +106 -0
- data/README.rdoc +132 -0
- data/Rakefile +183 -0
- data/bin/nokogiri +49 -0
- data/deps.rip +5 -0
- data/ext/nokogiri/extconf.rb +97 -0
- data/ext/nokogiri/html_document.c +154 -0
- data/ext/nokogiri/html_document.h +10 -0
- data/ext/nokogiri/html_element_description.c +276 -0
- data/ext/nokogiri/html_element_description.h +10 -0
- data/ext/nokogiri/html_entity_lookup.c +32 -0
- data/ext/nokogiri/html_entity_lookup.h +8 -0
- data/ext/nokogiri/html_sax_parser_context.c +94 -0
- data/ext/nokogiri/html_sax_parser_context.h +11 -0
- data/ext/nokogiri/nokogiri.c +95 -0
- data/ext/nokogiri/nokogiri.h +153 -0
- data/ext/nokogiri/xml_attr.c +94 -0
- data/ext/nokogiri/xml_attr.h +9 -0
- data/ext/nokogiri/xml_attribute_decl.c +70 -0
- data/ext/nokogiri/xml_attribute_decl.h +9 -0
- data/ext/nokogiri/xml_cdata.c +56 -0
- data/ext/nokogiri/xml_cdata.h +9 -0
- data/ext/nokogiri/xml_comment.c +54 -0
- data/ext/nokogiri/xml_comment.h +9 -0
- data/ext/nokogiri/xml_document.c +464 -0
- data/ext/nokogiri/xml_document.h +23 -0
- data/ext/nokogiri/xml_document_fragment.c +48 -0
- data/ext/nokogiri/xml_document_fragment.h +10 -0
- data/ext/nokogiri/xml_dtd.c +202 -0
- data/ext/nokogiri/xml_dtd.h +10 -0
- data/ext/nokogiri/xml_element_content.c +123 -0
- data/ext/nokogiri/xml_element_content.h +10 -0
- data/ext/nokogiri/xml_element_decl.c +69 -0
- data/ext/nokogiri/xml_element_decl.h +9 -0
- data/ext/nokogiri/xml_encoding_handler.c +79 -0
- data/ext/nokogiri/xml_encoding_handler.h +8 -0
- data/ext/nokogiri/xml_entity_decl.c +110 -0
- data/ext/nokogiri/xml_entity_decl.h +10 -0
- data/ext/nokogiri/xml_entity_reference.c +52 -0
- data/ext/nokogiri/xml_entity_reference.h +9 -0
- data/ext/nokogiri/xml_io.c +31 -0
- data/ext/nokogiri/xml_io.h +11 -0
- data/ext/nokogiri/xml_namespace.c +84 -0
- data/ext/nokogiri/xml_namespace.h +13 -0
- data/ext/nokogiri/xml_node.c +1347 -0
- data/ext/nokogiri/xml_node.h +13 -0
- data/ext/nokogiri/xml_node_set.c +418 -0
- data/ext/nokogiri/xml_node_set.h +9 -0
- data/ext/nokogiri/xml_processing_instruction.c +56 -0
- data/ext/nokogiri/xml_processing_instruction.h +9 -0
- data/ext/nokogiri/xml_reader.c +665 -0
- data/ext/nokogiri/xml_reader.h +10 -0
- data/ext/nokogiri/xml_relax_ng.c +168 -0
- data/ext/nokogiri/xml_relax_ng.h +9 -0
- data/ext/nokogiri/xml_sax_parser.c +286 -0
- data/ext/nokogiri/xml_sax_parser.h +39 -0
- data/ext/nokogiri/xml_sax_parser_context.c +159 -0
- data/ext/nokogiri/xml_sax_parser_context.h +10 -0
- data/ext/nokogiri/xml_sax_push_parser.c +115 -0
- data/ext/nokogiri/xml_sax_push_parser.h +9 -0
- data/ext/nokogiri/xml_schema.c +205 -0
- data/ext/nokogiri/xml_schema.h +9 -0
- data/ext/nokogiri/xml_syntax_error.c +58 -0
- data/ext/nokogiri/xml_syntax_error.h +13 -0
- data/ext/nokogiri/xml_text.c +50 -0
- data/ext/nokogiri/xml_text.h +9 -0
- data/ext/nokogiri/xml_xpath_context.c +276 -0
- data/ext/nokogiri/xml_xpath_context.h +9 -0
- data/ext/nokogiri/xslt_stylesheet.c +142 -0
- data/ext/nokogiri/xslt_stylesheet.h +9 -0
- data/lib/nokogiri.rb +133 -0
- data/lib/nokogiri/css.rb +25 -0
- data/lib/nokogiri/css/generated_parser.rb +669 -0
- data/lib/nokogiri/css/generated_tokenizer.rb +145 -0
- data/lib/nokogiri/css/node.rb +99 -0
- data/lib/nokogiri/css/parser.rb +82 -0
- data/lib/nokogiri/css/parser.y +232 -0
- data/lib/nokogiri/css/syntax_error.rb +7 -0
- data/lib/nokogiri/css/tokenizer.rb +7 -0
- data/lib/nokogiri/css/tokenizer.rex +55 -0
- data/lib/nokogiri/css/xpath_visitor.rb +169 -0
- data/lib/nokogiri/decorators/slop.rb +33 -0
- data/lib/nokogiri/ffi/encoding_handler.rb +42 -0
- data/lib/nokogiri/ffi/html/document.rb +28 -0
- data/lib/nokogiri/ffi/html/element_description.rb +81 -0
- data/lib/nokogiri/ffi/html/entity_lookup.rb +16 -0
- data/lib/nokogiri/ffi/html/sax/parser_context.rb +38 -0
- data/lib/nokogiri/ffi/io_callbacks.rb +42 -0
- data/lib/nokogiri/ffi/libxml.rb +386 -0
- data/lib/nokogiri/ffi/structs/common_node.rb +38 -0
- data/lib/nokogiri/ffi/structs/html_elem_desc.rb +24 -0
- data/lib/nokogiri/ffi/structs/html_entity_desc.rb +13 -0
- data/lib/nokogiri/ffi/structs/xml_alloc.rb +16 -0
- data/lib/nokogiri/ffi/structs/xml_attr.rb +19 -0
- data/lib/nokogiri/ffi/structs/xml_attribute.rb +27 -0
- data/lib/nokogiri/ffi/structs/xml_buffer.rb +16 -0
- data/lib/nokogiri/ffi/structs/xml_char_encoding_handler.rb +11 -0
- data/lib/nokogiri/ffi/structs/xml_document.rb +117 -0
- data/lib/nokogiri/ffi/structs/xml_dtd.rb +28 -0
- data/lib/nokogiri/ffi/structs/xml_element.rb +26 -0
- data/lib/nokogiri/ffi/structs/xml_element_content.rb +17 -0
- data/lib/nokogiri/ffi/structs/xml_entity.rb +32 -0
- data/lib/nokogiri/ffi/structs/xml_enumeration.rb +12 -0
- data/lib/nokogiri/ffi/structs/xml_node.rb +28 -0
- data/lib/nokogiri/ffi/structs/xml_node_set.rb +53 -0
- data/lib/nokogiri/ffi/structs/xml_notation.rb +11 -0
- data/lib/nokogiri/ffi/structs/xml_ns.rb +15 -0
- data/lib/nokogiri/ffi/structs/xml_parser_context.rb +19 -0
- data/lib/nokogiri/ffi/structs/xml_relax_ng.rb +14 -0
- data/lib/nokogiri/ffi/structs/xml_sax_handler.rb +51 -0
- data/lib/nokogiri/ffi/structs/xml_sax_push_parser_context.rb +124 -0
- data/lib/nokogiri/ffi/structs/xml_schema.rb +13 -0
- data/lib/nokogiri/ffi/structs/xml_syntax_error.rb +31 -0
- data/lib/nokogiri/ffi/structs/xml_text_reader.rb +12 -0
- data/lib/nokogiri/ffi/structs/xml_xpath_context.rb +38 -0
- data/lib/nokogiri/ffi/structs/xml_xpath_object.rb +35 -0
- data/lib/nokogiri/ffi/structs/xml_xpath_parser_context.rb +20 -0
- data/lib/nokogiri/ffi/structs/xslt_stylesheet.rb +13 -0
- data/lib/nokogiri/ffi/weak_bucket.rb +40 -0
- data/lib/nokogiri/ffi/xml/attr.rb +41 -0
- data/lib/nokogiri/ffi/xml/attribute_decl.rb +27 -0
- data/lib/nokogiri/ffi/xml/cdata.rb +19 -0
- data/lib/nokogiri/ffi/xml/comment.rb +18 -0
- data/lib/nokogiri/ffi/xml/document.rb +162 -0
- data/lib/nokogiri/ffi/xml/document_fragment.rb +21 -0
- data/lib/nokogiri/ffi/xml/dtd.rb +67 -0
- data/lib/nokogiri/ffi/xml/element_content.rb +43 -0
- data/lib/nokogiri/ffi/xml/element_decl.rb +19 -0
- data/lib/nokogiri/ffi/xml/entity_decl.rb +36 -0
- data/lib/nokogiri/ffi/xml/entity_reference.rb +19 -0
- data/lib/nokogiri/ffi/xml/namespace.rb +44 -0
- data/lib/nokogiri/ffi/xml/node.rb +556 -0
- data/lib/nokogiri/ffi/xml/node_set.rb +149 -0
- data/lib/nokogiri/ffi/xml/processing_instruction.rb +20 -0
- data/lib/nokogiri/ffi/xml/reader.rb +232 -0
- data/lib/nokogiri/ffi/xml/relax_ng.rb +85 -0
- data/lib/nokogiri/ffi/xml/sax/parser.rb +135 -0
- data/lib/nokogiri/ffi/xml/sax/parser_context.rb +67 -0
- data/lib/nokogiri/ffi/xml/sax/push_parser.rb +51 -0
- data/lib/nokogiri/ffi/xml/schema.rb +109 -0
- data/lib/nokogiri/ffi/xml/syntax_error.rb +98 -0
- data/lib/nokogiri/ffi/xml/text.rb +18 -0
- data/lib/nokogiri/ffi/xml/xpath.rb +9 -0
- data/lib/nokogiri/ffi/xml/xpath_context.rb +148 -0
- data/lib/nokogiri/ffi/xslt/stylesheet.rb +53 -0
- data/lib/nokogiri/html.rb +35 -0
- data/lib/nokogiri/html/builder.rb +35 -0
- data/lib/nokogiri/html/document.rb +90 -0
- data/lib/nokogiri/html/document_fragment.rb +36 -0
- data/lib/nokogiri/html/element_description.rb +23 -0
- data/lib/nokogiri/html/entity_lookup.rb +13 -0
- data/lib/nokogiri/html/sax/parser.rb +48 -0
- data/lib/nokogiri/html/sax/parser_context.rb +16 -0
- data/lib/nokogiri/syntax_error.rb +4 -0
- data/lib/nokogiri/version.rb +37 -0
- data/lib/nokogiri/version_warning.rb +14 -0
- data/lib/nokogiri/xml.rb +67 -0
- data/lib/nokogiri/xml/attr.rb +14 -0
- data/lib/nokogiri/xml/attribute_decl.rb +18 -0
- data/lib/nokogiri/xml/builder.rb +418 -0
- data/lib/nokogiri/xml/cdata.rb +11 -0
- data/lib/nokogiri/xml/character_data.rb +7 -0
- data/lib/nokogiri/xml/document.rb +194 -0
- data/lib/nokogiri/xml/document_fragment.rb +77 -0
- data/lib/nokogiri/xml/dtd.rb +11 -0
- data/lib/nokogiri/xml/element_content.rb +36 -0
- data/lib/nokogiri/xml/element_decl.rb +13 -0
- data/lib/nokogiri/xml/entity_decl.rb +19 -0
- data/lib/nokogiri/xml/namespace.rb +13 -0
- data/lib/nokogiri/xml/node.rb +793 -0
- data/lib/nokogiri/xml/node/save_options.rb +42 -0
- data/lib/nokogiri/xml/node_set.rb +325 -0
- data/lib/nokogiri/xml/notation.rb +6 -0
- data/lib/nokogiri/xml/parse_options.rb +85 -0
- data/lib/nokogiri/xml/pp.rb +2 -0
- data/lib/nokogiri/xml/pp/character_data.rb +18 -0
- data/lib/nokogiri/xml/pp/node.rb +56 -0
- data/lib/nokogiri/xml/processing_instruction.rb +8 -0
- data/lib/nokogiri/xml/reader.rb +74 -0
- data/lib/nokogiri/xml/relax_ng.rb +32 -0
- data/lib/nokogiri/xml/sax.rb +4 -0
- data/lib/nokogiri/xml/sax/document.rb +160 -0
- data/lib/nokogiri/xml/sax/parser.rb +115 -0
- data/lib/nokogiri/xml/sax/parser_context.rb +16 -0
- data/lib/nokogiri/xml/sax/push_parser.rb +60 -0
- data/lib/nokogiri/xml/schema.rb +57 -0
- data/lib/nokogiri/xml/syntax_error.rb +47 -0
- data/lib/nokogiri/xml/text.rb +9 -0
- data/lib/nokogiri/xml/xpath.rb +10 -0
- data/lib/nokogiri/xml/xpath/syntax_error.rb +11 -0
- data/lib/nokogiri/xml/xpath_context.rb +16 -0
- data/lib/nokogiri/xslt.rb +48 -0
- data/lib/nokogiri/xslt/stylesheet.rb +25 -0
- data/lib/xsd/xmlparser/nokogiri.rb +90 -0
- data/tasks/cross_compile.rb +158 -0
- data/tasks/test.rb +94 -0
- data/test/css/test_nthiness.rb +159 -0
- data/test/css/test_parser.rb +282 -0
- data/test/css/test_tokenizer.rb +190 -0
- data/test/css/test_xpath_visitor.rb +85 -0
- data/test/ffi/test_document.rb +35 -0
- data/test/files/2ch.html +108 -0
- data/test/files/address_book.rlx +12 -0
- data/test/files/address_book.xml +10 -0
- data/test/files/bar/bar.xsd +4 -0
- data/test/files/dont_hurt_em_why.xml +422 -0
- data/test/files/exslt.xml +8 -0
- data/test/files/exslt.xslt +35 -0
- data/test/files/foo/foo.xsd +4 -0
- data/test/files/po.xml +32 -0
- data/test/files/po.xsd +66 -0
- data/test/files/shift_jis.html +10 -0
- data/test/files/shift_jis.xml +5 -0
- data/test/files/snuggles.xml +3 -0
- data/test/files/staff.dtd +10 -0
- data/test/files/staff.xml +59 -0
- data/test/files/staff.xslt +32 -0
- data/test/files/tlm.html +850 -0
- data/test/files/valid_bar.xml +2 -0
- data/test/helper.rb +169 -0
- data/test/html/sax/test_parser.rb +74 -0
- data/test/html/sax/test_parser_context.rb +48 -0
- data/test/html/test_builder.rb +164 -0
- data/test/html/test_document.rb +398 -0
- data/test/html/test_document_encoding.rb +77 -0
- data/test/html/test_document_fragment.rb +182 -0
- data/test/html/test_element_description.rb +98 -0
- data/test/html/test_named_characters.rb +14 -0
- data/test/html/test_node.rb +181 -0
- data/test/html/test_node_encoding.rb +27 -0
- data/test/test_convert_xpath.rb +135 -0
- data/test/test_css_cache.rb +45 -0
- data/test/test_encoding_handler.rb +46 -0
- data/test/test_memory_leak.rb +87 -0
- data/test/test_nokogiri.rb +138 -0
- data/test/test_reader.rb +386 -0
- data/test/test_soap4r_sax.rb +52 -0
- data/test/test_xslt_transforms.rb +188 -0
- data/test/xml/node/test_save_options.rb +20 -0
- data/test/xml/node/test_subclass.rb +44 -0
- data/test/xml/sax/test_parser.rb +307 -0
- data/test/xml/sax/test_parser_context.rb +63 -0
- data/test/xml/sax/test_push_parser.rb +139 -0
- data/test/xml/test_attr.rb +38 -0
- data/test/xml/test_attribute_decl.rb +82 -0
- data/test/xml/test_builder.rb +210 -0
- data/test/xml/test_cdata.rb +50 -0
- data/test/xml/test_comment.rb +29 -0
- data/test/xml/test_document.rb +668 -0
- data/test/xml/test_document_encoding.rb +26 -0
- data/test/xml/test_document_fragment.rb +180 -0
- data/test/xml/test_dtd.rb +82 -0
- data/test/xml/test_dtd_encoding.rb +33 -0
- data/test/xml/test_element_content.rb +56 -0
- data/test/xml/test_element_decl.rb +73 -0
- data/test/xml/test_entity_decl.rb +120 -0
- data/test/xml/test_entity_reference.rb +21 -0
- data/test/xml/test_namespace.rb +68 -0
- data/test/xml/test_node.rb +865 -0
- data/test/xml/test_node_attributes.rb +34 -0
- data/test/xml/test_node_encoding.rb +107 -0
- data/test/xml/test_node_reparenting.rb +293 -0
- data/test/xml/test_node_set.rb +649 -0
- data/test/xml/test_parse_options.rb +52 -0
- data/test/xml/test_processing_instruction.rb +30 -0
- data/test/xml/test_reader_encoding.rb +126 -0
- data/test/xml/test_relax_ng.rb +60 -0
- data/test/xml/test_schema.rb +89 -0
- data/test/xml/test_syntax_error.rb +12 -0
- data/test/xml/test_text.rb +38 -0
- data/test/xml/test_unparented_node.rb +381 -0
- data/test/xml/test_xpath.rb +138 -0
- metadata +533 -0
@@ -0,0 +1,48 @@
|
|
1
|
+
module Nokogiri
|
2
|
+
module HTML
|
3
|
+
###
|
4
|
+
# Nokogiri lets you write a SAX parser to process HTML but get HTML
|
5
|
+
# correction features.
|
6
|
+
#
|
7
|
+
# See Nokogiri::HTML::SAX::Parser for a basic example of using a
|
8
|
+
# SAX parser with HTML.
|
9
|
+
#
|
10
|
+
# For more information on SAX parsers, see Nokogiri::XML::SAX
|
11
|
+
module SAX
|
12
|
+
###
|
13
|
+
# This class lets you perform SAX style parsing on HTML with HTML
|
14
|
+
# error correction.
|
15
|
+
#
|
16
|
+
# Here is a basic usage example:
|
17
|
+
#
|
18
|
+
# class MyDoc < Nokogiri::XML::SAX::Document
|
19
|
+
# def start_element name, attributes = []
|
20
|
+
# puts "found a #{name}"
|
21
|
+
# end
|
22
|
+
# end
|
23
|
+
#
|
24
|
+
# parser = Nokogiri::HTML::SAX::Parser.new(MyDoc.new)
|
25
|
+
# parser.parse(File.open(ARGV[0], 'rb') { |f| f.read })
|
26
|
+
#
|
27
|
+
# For more information on SAX parsers, see Nokogiri::XML::SAX
|
28
|
+
class Parser < Nokogiri::XML::SAX::Parser
|
29
|
+
###
|
30
|
+
# Parse html stored in +data+ using +encoding+
|
31
|
+
def parse_memory(data, encoding = 'UTF-8')
  # Parses the HTML held in +data+, interpreted with +encoding+, by building
  # a ParserContext over it and running that context with this parser.
  # Raises ArgumentError when +data+ is nil or false; returns nil without
  # parsing anything when +data+ has zero length.
  raise ArgumentError if !data
  return if data.length <= 0

  context = ParserContext.memory(data, encoding)
  context.parse_with(self)
end
|
36
|
+
|
37
|
+
###
|
38
|
+
# Parse a file with +filename+
|
39
|
+
def parse_file(filename, encoding = 'UTF-8')
  # Parse the HTML file found at +filename+, using +encoding+.
  #
  # Raises ArgumentError when +filename+ is nil, Errno::ENOENT when nothing
  # exists at that path, and Errno::EISDIR when the path is a directory.
  raise ArgumentError, 'filename must not be nil' unless filename

  # File.exist? is used instead of File.exists?: the latter is a deprecated
  # alias that newer Ruby versions no longer provide.
  raise Errno::ENOENT, filename.to_s unless File.exist?(filename)
  raise Errno::EISDIR, filename.to_s if File.directory?(filename)

  ParserContext.file(filename, encoding).parse_with(self)
end
|
45
|
+
end
|
46
|
+
end
|
47
|
+
end
|
48
|
+
end
|
@@ -0,0 +1,16 @@
|
|
1
|
+
module Nokogiri
|
2
|
+
module HTML
|
3
|
+
module SAX
|
4
|
+
###
|
5
|
+
# Context for HTML SAX parsers. This class is usually not instantiated
|
6
|
+
# by the user. Instead, you should be looking at
|
7
|
+
# Nokogiri::HTML::SAX::Parser
|
8
|
+
class ParserContext < Nokogiri::XML::SAX::ParserContext
|
9
|
+
def self.new(thing, encoding = 'UTF-8')
  # Anything that answers both #read and #close is handed to the inherited
  # constructor unchanged; every other input is routed through +memory+
  # together with +encoding+.
  io_like = thing.respond_to?(:read) && thing.respond_to?(:close)
  if io_like
    super
  else
    memory(thing, encoding)
  end
end
|
13
|
+
end
|
14
|
+
end
|
15
|
+
end
|
16
|
+
end
|
@@ -0,0 +1,37 @@
|
|
1
|
+
module Nokogiri
  # The version of Nokogiri you are using
  VERSION = '1.4.2.1'

  # More complete version information about libxml
  VERSION_INFO = {}
  VERSION_INFO['warnings']              = []
  VERSION_INFO['nokogiri']              = Nokogiri::VERSION
  VERSION_INFO['ruby']                  = {}
  VERSION_INFO['ruby']['version']       = ::RUBY_VERSION
  VERSION_INFO['ruby']['platform']      = ::RUBY_PLATFORM
  VERSION_INFO['ruby']['jruby']         = ::JRUBY_VERSION if RUBY_PLATFORM == "java"
  if defined?(LIBXML_VERSION)
    VERSION_INFO['libxml']              = {}
    VERSION_INFO['libxml']['binding']   = 'extension'
    VERSION_INFO['libxml']['compiled']  = LIBXML_VERSION
    # LIBXML_PARSER_VERSION is split into three groups (the last two being
    # two characters each), converted to integers and joined with dots.
    VERSION_INFO['libxml']['loaded']    = LIBXML_PARSER_VERSION.scan(/^(.*)(..)(..)$/).first.collect{|j|j.to_i}.join(".")

    if VERSION_INFO['libxml']['compiled'] != VERSION_INFO['libxml']['loaded']
      warning = "Nokogiri was built against LibXML version #{VERSION_INFO['libxml']['compiled']}, but has dynamically loaded #{VERSION_INFO['libxml']['loaded']}"
      VERSION_INFO['warnings'] << warning
      warn "WARNING: #{warning}"
    end
  end

  # True when libxml version information has been recorded in VERSION_INFO.
  def self.uses_libxml? # :nodoc:
    !Nokogiri::VERSION_INFO['libxml'].nil?
  end

  # True when libxml is in use and its recorded binding is 'ffi'.
  def self.ffi? # :nodoc:
    uses_libxml? && Nokogiri::VERSION_INFO['libxml']['binding'] == 'ffi'
  end

  # True when the loaded libxml version is 2.6.16 or older. Returns false
  # when no loaded libxml version has been recorded.
  def self.is_2_6_16? # :nodoc:
    libxml = Nokogiri::VERSION_INFO['libxml']
    return false unless libxml && libxml['loaded']

    # Compare component by component as integers. Comparing the version
    # strings directly is lexicographic, which wrongly ranks "2.10.0" below
    # "2.6.16" and "2.6.9" above it.
    loaded = libxml['loaded'].split('.').map { |part| part.to_i }
    (loaded <=> [2, 6, 16]) <= 0
  end
end
|
@@ -0,0 +1,14 @@
|
|
1
|
+
module Nokogiri
  # Executed when this file is loaded: if the loaded libxml is reported as
  # 2.6.16 (or older), record a warning in VERSION_INFO and, unless the
  # opt-out constant has been defined, print a notice via +warn+.
  if self.is_2_6_16?
    VERSION_INFO['warnings'] << "libxml 2.6.16 is old and buggy."
    unless defined?(I_KNOW_I_AM_USING_AN_OLD_AND_BUGGY_VERSION_OF_LIBXML2)
      warn <<-eom
HI. You're using libxml2 version 2.6.16 which is over 4 years old and has
plenty of bugs. We suggest that for maximum HTML/XML parsing pleasure, you
upgrade your version of libxml2 and re-install nokogiri. If you like using
libxml2 version 2.6.16, but don't like this warning, please define the constant
I_KNOW_I_AM_USING_AN_OLD_AND_BUGGY_VERSION_OF_LIBXML2 before requiring nokogiri.
eom
    end
  end
end
|
data/lib/nokogiri/xml.rb
ADDED
@@ -0,0 +1,67 @@
|
|
1
|
+
require 'nokogiri/xml/pp'
|
2
|
+
require 'nokogiri/xml/parse_options'
|
3
|
+
require 'nokogiri/xml/sax'
|
4
|
+
require 'nokogiri/xml/node'
|
5
|
+
require 'nokogiri/xml/attribute_decl'
|
6
|
+
require 'nokogiri/xml/element_decl'
|
7
|
+
require 'nokogiri/xml/element_content'
|
8
|
+
require 'nokogiri/xml/character_data'
|
9
|
+
require 'nokogiri/xml/namespace'
|
10
|
+
require 'nokogiri/xml/attr'
|
11
|
+
require 'nokogiri/xml/dtd'
|
12
|
+
require 'nokogiri/xml/cdata'
|
13
|
+
require 'nokogiri/xml/text'
|
14
|
+
require 'nokogiri/xml/document'
|
15
|
+
require 'nokogiri/xml/document_fragment'
|
16
|
+
require 'nokogiri/xml/processing_instruction'
|
17
|
+
require 'nokogiri/xml/node_set'
|
18
|
+
require 'nokogiri/xml/syntax_error'
|
19
|
+
require 'nokogiri/xml/xpath'
|
20
|
+
require 'nokogiri/xml/xpath_context'
|
21
|
+
require 'nokogiri/xml/builder'
|
22
|
+
require 'nokogiri/xml/reader'
|
23
|
+
require 'nokogiri/xml/notation'
|
24
|
+
require 'nokogiri/xml/entity_decl'
|
25
|
+
require 'nokogiri/xml/schema'
|
26
|
+
require 'nokogiri/xml/relax_ng'
|
27
|
+
|
28
|
+
module Nokogiri
  class << self
    ###
    # Parse XML. Convenience method for Nokogiri::XML::Document.parse; all
    # arguments and the optional block are forwarded unchanged.
    def XML(thing, url = nil, encoding = nil, options = XML::ParseOptions::DEFAULT_XML, &block)
      Nokogiri::XML::Document.parse(thing, url, encoding, options, &block)
    end
  end

  module XML
    class << self
      ###
      # Parse an XML document using the Nokogiri::XML::Reader API. See
      # Nokogiri::XML::Reader for more information.
      #
      # +string_or_io+ is read through Reader.from_io when it responds to
      # +read+, otherwise through Reader.from_memory. When +options+ is an
      # Integer it is wrapped in a ParseOptions object; the options object
      # is yielded to the block, if one is given, before parsing starts.
      def Reader(string_or_io, url = nil, encoding = nil, options = ParseOptions::STRICT)
        # Integer (rather than Fixnum) keeps this working on Ruby versions
        # where the Fixnum constant no longer exists.
        options = Nokogiri::XML::ParseOptions.new(options) if Integer === options
        # Give the options to the user
        yield options if block_given?

        if string_or_io.respond_to? :read
          return Reader.from_io(string_or_io, url, encoding, options.to_i)
        end
        Reader.from_memory(string_or_io, url, encoding, options.to_i)
      end

      ###
      # Parse XML. Convenience method for Nokogiri::XML::Document.parse
      def parse(thing, url = nil, encoding = nil, options = ParseOptions::DEFAULT_XML, &block)
        Document.parse(thing, url, encoding, options, &block)
      end

      ####
      # Parse a fragment from +string+ by delegating to
      # XML::DocumentFragment.parse.
      def fragment(string)
        XML::DocumentFragment.parse(string)
      end
    end
  end
end
|
@@ -0,0 +1,18 @@
|
|
1
|
+
module Nokogiri
  module XML
    ###
    # A node representing an attribute declaration inside a DTD.
    class AttributeDecl < Nokogiri::XML::Node
      # Methods inherited from Node that are removed for this node type.
      [
        :attribute_nodes,
        :attributes,
        :content,
        :namespace,
        :namespace_definitions,
        :line
      ].each { |method_name| undef_method method_name }

      # Shows the class name, the object id in hexadecimal and the inspected
      # string form of the declaration.
      def inspect
        format('#<%s:0x%x %s>', self.class.name, object_id, to_s.inspect)
      end
    end
  end
end
|
@@ -0,0 +1,418 @@
|
|
1
|
+
module Nokogiri
|
2
|
+
module XML
|
3
|
+
###
|
4
|
+
# Nokogiri builder can be used for building XML and HTML documents.
|
5
|
+
#
|
6
|
+
# == Synopsis:
|
7
|
+
#
|
8
|
+
# builder = Nokogiri::XML::Builder.new do |xml|
|
9
|
+
# xml.root {
|
10
|
+
# xml.products {
|
11
|
+
# xml.widget {
|
12
|
+
# xml.id_ "10"
|
13
|
+
# xml.name "Awesome widget"
|
14
|
+
# }
|
15
|
+
# }
|
16
|
+
# }
|
17
|
+
# end
|
18
|
+
# puts builder.to_xml
|
19
|
+
#
|
20
|
+
# Will output:
|
21
|
+
#
|
22
|
+
# <?xml version="1.0"?>
|
23
|
+
# <root>
|
24
|
+
# <products>
|
25
|
+
# <widget>
|
26
|
+
# <id>10</id>
|
27
|
+
# <name>Awesome widget</name>
|
28
|
+
# </widget>
|
29
|
+
# </products>
|
30
|
+
# </root>
|
31
|
+
#
|
32
|
+
#
|
33
|
+
# === Builder scope
|
34
|
+
#
|
35
|
+
# The builder allows two forms. When the builder is supplied with a block
|
36
|
+
# that has a parameter, the outside scope is maintained. This means you
|
37
|
+
# can access variables that are outside your builder. If you don't need
|
38
|
+
# outside scope, you can use the builder without the "xml" prefix like
|
39
|
+
# this:
|
40
|
+
#
|
41
|
+
# builder = Nokogiri::XML::Builder.new do
|
42
|
+
# root {
|
43
|
+
# products {
|
44
|
+
# widget {
|
45
|
+
# id_ "10"
|
46
|
+
# name "Awesome widget"
|
47
|
+
# }
|
48
|
+
# }
|
49
|
+
# }
|
50
|
+
# end
|
51
|
+
#
|
52
|
+
# == Special Tags
|
53
|
+
#
|
54
|
+
# The builder works by taking advantage of method_missing. Unfortunately
|
55
|
+
# some methods are defined in ruby that are difficult or dangerous to
|
56
|
+
# remove. You may want to create tags with the name "type", "class", and
|
57
|
+
# "id" for example. In that case, you can use an underscore to
|
58
|
+
# disambiguate your tag name from the method call.
|
59
|
+
#
|
60
|
+
# Here is an example of using the underscore to disambiguate tag names from
|
61
|
+
# ruby methods:
|
62
|
+
#
|
63
|
+
# @objects = [Object.new, Object.new, Object.new]
|
64
|
+
#
|
65
|
+
# builder = Nokogiri::XML::Builder.new do |xml|
|
66
|
+
# xml.root {
|
67
|
+
# xml.objects {
|
68
|
+
# @objects.each do |o|
|
69
|
+
# xml.object {
|
70
|
+
# xml.type_ o.type
|
71
|
+
# xml.class_ o.class.name
|
72
|
+
# xml.id_ o.id
|
73
|
+
# }
|
74
|
+
# end
|
75
|
+
# }
|
76
|
+
# }
|
77
|
+
# end
|
78
|
+
# puts builder.to_xml
|
79
|
+
#
|
80
|
+
# The underscore may be used with any tag name, and the last underscore
|
81
|
+
# will just be removed. This code will output the following XML:
|
82
|
+
#
|
83
|
+
# <?xml version="1.0"?>
|
84
|
+
# <root>
|
85
|
+
# <objects>
|
86
|
+
# <object>
|
87
|
+
# <type>Object</type>
|
88
|
+
# <class>Object</class>
|
89
|
+
# <id>48390</id>
|
90
|
+
# </object>
|
91
|
+
# <object>
|
92
|
+
# <type>Object</type>
|
93
|
+
# <class>Object</class>
|
94
|
+
# <id>48380</id>
|
95
|
+
# </object>
|
96
|
+
# <object>
|
97
|
+
# <type>Object</type>
|
98
|
+
# <class>Object</class>
|
99
|
+
# <id>48370</id>
|
100
|
+
# </object>
|
101
|
+
# </objects>
|
102
|
+
# </root>
|
103
|
+
#
|
104
|
+
# == Tag Attributes
|
105
|
+
#
|
106
|
+
# Tag attributes may be supplied as method arguments. Here is our
|
107
|
+
# previous example, but using attributes rather than tags:
|
108
|
+
#
|
109
|
+
# @objects = [Object.new, Object.new, Object.new]
|
110
|
+
#
|
111
|
+
# builder = Nokogiri::XML::Builder.new do |xml|
|
112
|
+
# xml.root {
|
113
|
+
# xml.objects {
|
114
|
+
# @objects.each do |o|
|
115
|
+
# xml.object(:type => o.type, :class => o.class, :id => o.id)
|
116
|
+
# end
|
117
|
+
# }
|
118
|
+
# }
|
119
|
+
# end
|
120
|
+
# puts builder.to_xml
|
121
|
+
#
|
122
|
+
# === Tag Attribute Short Cuts
|
123
|
+
#
|
124
|
+
# A couple attribute short cuts are available when building tags. The
|
125
|
+
# short cuts are available by special method calls when building a tag.
|
126
|
+
#
|
127
|
+
# This example builds an "object" tag with the class attribute "classy"
|
128
|
+
# and the id of "thing":
|
129
|
+
#
|
130
|
+
# builder = Nokogiri::XML::Builder.new do |xml|
|
131
|
+
# xml.root {
|
132
|
+
# xml.objects {
|
133
|
+
# xml.object.classy.thing!
|
134
|
+
# }
|
135
|
+
# }
|
136
|
+
# end
|
137
|
+
# puts builder.to_xml
|
138
|
+
#
|
139
|
+
# Which will output:
|
140
|
+
#
|
141
|
+
# <?xml version="1.0"?>
|
142
|
+
# <root>
|
143
|
+
# <objects>
|
144
|
+
# <object class="classy" id="thing"/>
|
145
|
+
# </objects>
|
146
|
+
# </root>
|
147
|
+
#
|
148
|
+
# All other options are still supported with this syntax, including
|
149
|
+
# blocks and extra tag attributes.
|
150
|
+
#
|
151
|
+
# == Namespaces
|
152
|
+
#
|
153
|
+
# Namespaces are added similarly to attributes. Nokogiri::XML::Builder
|
154
|
+
# assumes that when an attribute starts with "xmlns", it is meant to be
|
155
|
+
# a namespace:
|
156
|
+
#
|
157
|
+
# builder = Nokogiri::XML::Builder.new { |xml|
|
158
|
+
# xml.root('xmlns' => 'default', 'xmlns:foo' => 'bar') do
|
159
|
+
# xml.tenderlove
|
160
|
+
# end
|
161
|
+
# }
|
162
|
+
# puts builder.to_xml
|
163
|
+
#
|
164
|
+
# Will output XML like this:
|
165
|
+
#
|
166
|
+
# <?xml version="1.0"?>
|
167
|
+
# <root xmlns:foo="bar" xmlns="default">
|
168
|
+
# <tenderlove/>
|
169
|
+
# </root>
|
170
|
+
#
|
171
|
+
# === Referencing declared namespaces
|
172
|
+
#
|
173
|
+
# Tags that reference non-default namespaces (i.e. a tag "foo:bar") can be
|
174
|
+
# built by using the Nokogiri::XML::Builder#[] method.
|
175
|
+
#
|
176
|
+
# For example:
|
177
|
+
#
|
178
|
+
# builder = Nokogiri::XML::Builder.new do |xml|
|
179
|
+
# xml.root('xmlns:foo' => 'bar') {
|
180
|
+
# xml.objects {
|
181
|
+
# xml['foo'].object.classy.thing!
|
182
|
+
# }
|
183
|
+
# }
|
184
|
+
# end
|
185
|
+
# puts builder.to_xml
|
186
|
+
#
|
187
|
+
# Will output this XML:
|
188
|
+
#
|
189
|
+
# <?xml version="1.0"?>
|
190
|
+
# <root xmlns:foo="bar">
|
191
|
+
# <objects>
|
192
|
+
# <foo:object class="classy" id="thing"/>
|
193
|
+
# </objects>
|
194
|
+
# </root>
|
195
|
+
#
|
196
|
+
# Note the "foo:object" tag.
|
197
|
+
#
|
198
|
+
# == Document Types
|
199
|
+
#
|
200
|
+
# To create a document type (DTD), use the Builder#doc method to get
|
201
|
+
# the current context document. Then call Node#create_internal_subset to
|
202
|
+
# create the DTD node.
|
203
|
+
#
|
204
|
+
# For example, this Ruby:
|
205
|
+
#
|
206
|
+
# builder = Nokogiri::XML::Builder.new do |xml|
|
207
|
+
# xml.doc.create_internal_subset(
|
208
|
+
# 'html',
|
209
|
+
# "-//W3C//DTD HTML 4.01 Transitional//EN",
|
210
|
+
# "http://www.w3.org/TR/html4/loose.dtd"
|
211
|
+
# )
|
212
|
+
# xml.root do
|
213
|
+
# xml.foo
|
214
|
+
# end
|
215
|
+
# end
|
216
|
+
#
|
217
|
+
# puts builder.to_xml
|
218
|
+
#
|
219
|
+
# Will output this xml:
|
220
|
+
#
|
221
|
+
# <?xml version="1.0"?>
|
222
|
+
# <!DOCTYPE html PUBLIC "-//W3C//DTD HTML 4.01 Transitional//EN" "http://www.w3.org/TR/html4/loose.dtd">
|
223
|
+
# <root>
|
224
|
+
# <foo/>
|
225
|
+
# </root>
|
226
|
+
#
|
227
|
+
class Builder
|
228
|
+
# The current Document object being built
|
229
|
+
attr_accessor :doc
|
230
|
+
|
231
|
+
# The parent of the current node being built
|
232
|
+
attr_accessor :parent
|
233
|
+
|
234
|
+
# A context object for use when the block has no arguments
|
235
|
+
attr_accessor :context
|
236
|
+
|
237
|
+
attr_accessor :arity # :nodoc:
|
238
|
+
|
239
|
+
###
|
240
|
+
# Create a builder with an existing root object. This is for use when
|
241
|
+
# you have an existing document that you would like to augment with
|
242
|
+
# builder methods. The builder context created will start with the
|
243
|
+
# given +root+ node.
|
244
|
+
#
|
245
|
+
# For example:
|
246
|
+
#
|
247
|
+
# doc = Nokogiri::XML(open('somedoc.xml'))
|
248
|
+
# Nokogiri::XML::Builder.with(doc.at('some_tag')) do |xml|
|
249
|
+
# # ... Use normal builder methods here ...
|
250
|
+
# xml.awesome # add the "awesome" tag below "some_tag"
|
251
|
+
# end
|
252
|
+
#
|
253
|
+
def self.with(root, &block)
  # Constructs a builder with no document options whose starting node is
  # +root+, hands +block+ to the constructor, and returns the new builder.
  new({}, root, &block)
end
|
256
|
+
|
257
|
+
###
|
258
|
+
# Create a new Builder object. +options+ are sent to the top level
|
259
|
+
# Document that is being built.
|
260
|
+
#
|
261
|
+
# Building a document with a particular encoding for example:
|
262
|
+
#
|
263
|
+
# Nokogiri::XML::Builder.new(:encoding => 'UTF-8') do |xml|
|
264
|
+
# ...
|
265
|
+
# end
|
266
|
+
def initialize(options = {}, root = nil, &block)
  # Sets up the document and starting parent, applies +options+ to the
  # document through its setters, then runs +block+ (if any) to build
  # the tree.
  #
  # options:: hash of document attributes; each key +k+ is applied by
  #           calling <tt>k=</tt> on the document.
  # root::    optional existing node to build under; its document is reused.
  if root
    @doc    = root.document
    @parent = root
  else
    # Resolve the Document class that sits beside this builder class by
    # swapping the last segment of the class name for "Document". The
    # constant is looked up with const_get rather than by eval'ing a
    # string of code.
    const_path = self.class.name.split('::')
    const_path[-1] = 'Document'
    document_class = const_path.inject(Object) { |scope, const_name| scope.const_get(const_name) }
    @doc    = document_class.new
    @parent = @doc
  end

  @context = nil
  @arity   = nil
  @ns      = nil

  options.each do |k, v|
    @doc.send(:"#{k}=", v)
  end

  return unless block_given?

  @arity = block.arity
  if @arity <= 0
    # A block without parameters is instance_eval'd on the builder, so keep
    # the block's own +self+ in @context before switching.
    @context = eval('self', block.binding)
    instance_eval(&block)
  else
    yield self
  end

  # Once the block has run, the current parent is reset to the document.
  @parent = @doc
end
|
298
|
+
|
299
|
+
###
|
300
|
+
# Create a Text Node with content of +string+
|
301
|
+
def text(string)
  # Asks the document for a text node containing +string+ and inserts it
  # through +insert+.
  text_node = @doc.create_text_node(string)
  insert(text_node)
end
|
304
|
+
|
305
|
+
###
|
306
|
+
# Create a CDATA Node with content of +string+
|
307
|
+
def cdata(string)
  # Asks the document for a CDATA node containing +string+ and inserts it
  # through +insert+.
  cdata_node = doc.create_cdata(string)
  insert(cdata_node)
end
|
310
|
+
|
311
|
+
###
|
312
|
+
# Build a tag that is associated with namespace +ns+. Raises an
|
313
|
+
# ArgumentError if +ns+ has not been defined higher in the tree.
|
314
|
+
def [](ns)
  # Selects the namespace whose prefix equals +ns+ (compared as a string)
  # and stores it in @ns. The current parent's namespace definitions are
  # searched first, then those of each ancestor, skipping the document.
  # Returns the builder itself; raises ArgumentError when no definition
  # matches.
  has_prefix = lambda { |definition| definition.prefix == ns.to_s }

  @ns = @parent.namespace_definitions.find(&has_prefix)
  return self if @ns

  @parent.ancestors.each do |ancestor|
    next if ancestor == doc
    @ns = ancestor.namespace_definitions.find(&has_prefix)
    return self if @ns
  end

  raise ArgumentError, "Namespace #{ns} has not been defined"
end
|
326
|
+
|
327
|
+
###
|
328
|
+
# Convert this Builder object to XML
|
329
|
+
def to_xml(*args)
  # Serialises by delegating to the document's own to_xml, forwarding every
  # argument untouched.
  document = @doc
  document.to_xml(*args)
end
|
332
|
+
|
333
|
+
###
|
334
|
+
# Append the given raw XML +string+ to the document
|
335
|
+
def <<(string)
  # Turns the raw +string+ into a fragment of the document and inserts each
  # of the fragment's children in turn.
  parsed = @doc.fragment(string)
  parsed.children.each do |child|
    insert(child)
  end
end
|
338
|
+
|
339
|
+
def method_missing(method, *args, &block) # :nodoc:
  # Calls the saved context understands are forwarded to it as-is.
  if @context && @context.respond_to?(method)
    return @context.send(method, *args, &block)
  end

  # Anything else becomes a new element named after the method, with one
  # trailing "_" or "!" removed from the name.
  tag_name = method.to_s.sub(/[_!]$/, '')
  node = @doc.create_element(tag_name, *args) { |element|
    # Attach the pending namespace, if any, then clear it so it is used
    # for this element only.
    if @ns
      element.namespace = @ns
      @ns = nil
    end
  }
  insert(node, &block)
end
|
353
|
+
|
354
|
+
private
|
355
|
+
###
|
356
|
+
# Insert +node+ as a child of the current Node
|
357
|
+
def insert(node, &block)
  # Attaches +node+ under the current parent. When a block is given, +node+
  # becomes the current parent while the block runs, and the previous
  # parent is restored afterwards. Returns a NodeBuilder wrapping +node+.
  node.parent = @parent
  if block_given?
    old_parent = @parent
    @parent = node
    begin
      # The arity is remembered from the first block seen: blocks taking no
      # parameters are instance_eval'd, others receive the builder.
      @arity ||= block.arity
      if @arity <= 0
        instance_eval(&block)
      else
        block.call(self)
      end
    ensure
      # Restore the parent even when the block raises, so a rescued error
      # does not leave later nodes attached under +node+.
      @parent = old_parent
    end
  end
  NodeBuilder.new(node, self)
end
|
372
|
+
|
373
|
+
class NodeBuilder # :nodoc:
  # Wraps +node+ so that further method calls on the wrapper set attributes
  # on it; +doc_builder+ is the builder whose parent is switched while a
  # nested block runs.
  def initialize(node, doc_builder)
    @node = node
    @doc_builder = doc_builder
  end

  # Set attribute +k+ of the wrapped node to +v+.
  def []=(k, v)
    @node[k] = v
  end

  # Read attribute +k+ of the wrapped node.
  def [](k)
    @node[k]
  end

  # Interprets the method name as an attribute short cut:
  #
  # * <tt>name!</tt> sets the "id" attribute to +name+
  # * <tt>name=</tt> sets the attribute +name+ to the first argument
  # * anything else is appended to the "class" attribute
  #
  # For the first and last form a first argument, if given, becomes the
  # node's content. A trailing Hash argument is treated as extra
  # attributes, each value being appended (space separated) to any existing
  # value. With a block, the block is instance_eval'd on the document
  # builder with this node as the current parent, and the block's value is
  # returned; otherwise the wrapper itself is returned.
  def method_missing(method, *args, &block)
    opts = args.last.is_a?(Hash) ? args.pop : {}
    case method.to_s
    when /^(.*)!$/
      @node['id'] = $1
      @node.content = args.first if args.first
    when /^(.*)=/
      @node[$1] = args.first
    else
      @node['class'] =
        ((@node['class'] || '').split(/\s/) + [method.to_s]).join(' ')
      @node.content = args.first if args.first
    end

    # Assign any extra options
    opts.each do |k, v|
      @node[k.to_s] = ((@node[k.to_s] || '').split(/\s/) + [v]).join(' ')
    end

    if block_given?
      old_parent = @doc_builder.parent
      @doc_builder.parent = @node
      begin
        return @doc_builder.instance_eval(&block)
      ensure
        # Put the builder's parent back even if the block raises.
        @doc_builder.parent = old_parent
      end
    end
    self
  end
end
|
416
|
+
end
|
417
|
+
end
|
418
|
+
end
|