nokogiri-maven 1.5.0-java

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (278) hide show
  1. data/CHANGELOG.ja.rdoc +544 -0
  2. data/CHANGELOG.rdoc +532 -0
  3. data/Manifest.txt +283 -0
  4. data/README.ja.rdoc +106 -0
  5. data/README.rdoc +174 -0
  6. data/Rakefile +164 -0
  7. data/bin/nokogiri +53 -0
  8. data/ext/java/nokogiri/EncodingHandler.java +124 -0
  9. data/ext/java/nokogiri/HtmlDocument.java +119 -0
  10. data/ext/java/nokogiri/HtmlElementDescription.java +145 -0
  11. data/ext/java/nokogiri/HtmlEntityLookup.java +79 -0
  12. data/ext/java/nokogiri/HtmlSaxParserContext.java +259 -0
  13. data/ext/java/nokogiri/NokogiriService.java +590 -0
  14. data/ext/java/nokogiri/XmlAttr.java +180 -0
  15. data/ext/java/nokogiri/XmlAttributeDecl.java +130 -0
  16. data/ext/java/nokogiri/XmlCdata.java +84 -0
  17. data/ext/java/nokogiri/XmlComment.java +86 -0
  18. data/ext/java/nokogiri/XmlDocument.java +519 -0
  19. data/ext/java/nokogiri/XmlDocumentFragment.java +223 -0
  20. data/ext/java/nokogiri/XmlDtd.java +469 -0
  21. data/ext/java/nokogiri/XmlElement.java +195 -0
  22. data/ext/java/nokogiri/XmlElementContent.java +382 -0
  23. data/ext/java/nokogiri/XmlElementDecl.java +152 -0
  24. data/ext/java/nokogiri/XmlEntityDecl.java +162 -0
  25. data/ext/java/nokogiri/XmlEntityReference.java +97 -0
  26. data/ext/java/nokogiri/XmlNamespace.java +183 -0
  27. data/ext/java/nokogiri/XmlNode.java +1378 -0
  28. data/ext/java/nokogiri/XmlNodeSet.java +267 -0
  29. data/ext/java/nokogiri/XmlProcessingInstruction.java +99 -0
  30. data/ext/java/nokogiri/XmlReader.java +408 -0
  31. data/ext/java/nokogiri/XmlRelaxng.java +144 -0
  32. data/ext/java/nokogiri/XmlSaxParserContext.java +367 -0
  33. data/ext/java/nokogiri/XmlSaxPushParser.java +184 -0
  34. data/ext/java/nokogiri/XmlSchema.java +324 -0
  35. data/ext/java/nokogiri/XmlSyntaxError.java +119 -0
  36. data/ext/java/nokogiri/XmlText.java +119 -0
  37. data/ext/java/nokogiri/XmlXpathContext.java +199 -0
  38. data/ext/java/nokogiri/XsltStylesheet.java +197 -0
  39. data/ext/java/nokogiri/internals/HtmlDomParserContext.java +204 -0
  40. data/ext/java/nokogiri/internals/NokogiriDocumentCache.java +73 -0
  41. data/ext/java/nokogiri/internals/NokogiriErrorHandler.java +86 -0
  42. data/ext/java/nokogiri/internals/NokogiriHandler.java +327 -0
  43. data/ext/java/nokogiri/internals/NokogiriHelpers.java +639 -0
  44. data/ext/java/nokogiri/internals/NokogiriNamespaceCache.java +167 -0
  45. data/ext/java/nokogiri/internals/NokogiriNamespaceContext.java +130 -0
  46. data/ext/java/nokogiri/internals/NokogiriNonStrictErrorHandler.java +74 -0
  47. data/ext/java/nokogiri/internals/NokogiriNonStrictErrorHandler4NekoHtml.java +121 -0
  48. data/ext/java/nokogiri/internals/NokogiriStrictErrorHandler.java +79 -0
  49. data/ext/java/nokogiri/internals/NokogiriXPathFunction.java +141 -0
  50. data/ext/java/nokogiri/internals/NokogiriXPathFunctionResolver.java +73 -0
  51. data/ext/java/nokogiri/internals/NokogiriXPathVariableResolver.java +67 -0
  52. data/ext/java/nokogiri/internals/NokogiriXsltErrorListener.java +86 -0
  53. data/ext/java/nokogiri/internals/ParserContext.java +276 -0
  54. data/ext/java/nokogiri/internals/PushInputStream.java +411 -0
  55. data/ext/java/nokogiri/internals/ReaderNode.java +531 -0
  56. data/ext/java/nokogiri/internals/SaveContextVisitor.java +567 -0
  57. data/ext/java/nokogiri/internals/SchemaErrorHandler.java +76 -0
  58. data/ext/java/nokogiri/internals/XmlDeclHandler.java +42 -0
  59. data/ext/java/nokogiri/internals/XmlDomParser.java +76 -0
  60. data/ext/java/nokogiri/internals/XmlDomParserContext.java +244 -0
  61. data/ext/java/nokogiri/internals/XmlSaxParser.java +65 -0
  62. data/ext/java/nokogiri/internals/XsltExtensionFunction.java +72 -0
  63. data/ext/nokogiri/depend +358 -0
  64. data/ext/nokogiri/extconf.rb +124 -0
  65. data/ext/nokogiri/html_document.c +154 -0
  66. data/ext/nokogiri/html_document.h +10 -0
  67. data/ext/nokogiri/html_element_description.c +276 -0
  68. data/ext/nokogiri/html_element_description.h +10 -0
  69. data/ext/nokogiri/html_entity_lookup.c +32 -0
  70. data/ext/nokogiri/html_entity_lookup.h +8 -0
  71. data/ext/nokogiri/html_sax_parser_context.c +94 -0
  72. data/ext/nokogiri/html_sax_parser_context.h +11 -0
  73. data/ext/nokogiri/nokogiri.c +115 -0
  74. data/ext/nokogiri/nokogiri.h +160 -0
  75. data/ext/nokogiri/xml_attr.c +94 -0
  76. data/ext/nokogiri/xml_attr.h +9 -0
  77. data/ext/nokogiri/xml_attribute_decl.c +70 -0
  78. data/ext/nokogiri/xml_attribute_decl.h +9 -0
  79. data/ext/nokogiri/xml_cdata.c +56 -0
  80. data/ext/nokogiri/xml_cdata.h +9 -0
  81. data/ext/nokogiri/xml_comment.c +54 -0
  82. data/ext/nokogiri/xml_comment.h +9 -0
  83. data/ext/nokogiri/xml_document.c +478 -0
  84. data/ext/nokogiri/xml_document.h +23 -0
  85. data/ext/nokogiri/xml_document_fragment.c +48 -0
  86. data/ext/nokogiri/xml_document_fragment.h +10 -0
  87. data/ext/nokogiri/xml_dtd.c +202 -0
  88. data/ext/nokogiri/xml_dtd.h +10 -0
  89. data/ext/nokogiri/xml_element_content.c +123 -0
  90. data/ext/nokogiri/xml_element_content.h +10 -0
  91. data/ext/nokogiri/xml_element_decl.c +69 -0
  92. data/ext/nokogiri/xml_element_decl.h +9 -0
  93. data/ext/nokogiri/xml_encoding_handler.c +79 -0
  94. data/ext/nokogiri/xml_encoding_handler.h +8 -0
  95. data/ext/nokogiri/xml_entity_decl.c +110 -0
  96. data/ext/nokogiri/xml_entity_decl.h +10 -0
  97. data/ext/nokogiri/xml_entity_reference.c +52 -0
  98. data/ext/nokogiri/xml_entity_reference.h +9 -0
  99. data/ext/nokogiri/xml_io.c +56 -0
  100. data/ext/nokogiri/xml_io.h +11 -0
  101. data/ext/nokogiri/xml_libxml2_hacks.c +112 -0
  102. data/ext/nokogiri/xml_libxml2_hacks.h +12 -0
  103. data/ext/nokogiri/xml_namespace.c +84 -0
  104. data/ext/nokogiri/xml_namespace.h +13 -0
  105. data/ext/nokogiri/xml_node.c +1385 -0
  106. data/ext/nokogiri/xml_node.h +13 -0
  107. data/ext/nokogiri/xml_node_set.c +418 -0
  108. data/ext/nokogiri/xml_node_set.h +9 -0
  109. data/ext/nokogiri/xml_processing_instruction.c +56 -0
  110. data/ext/nokogiri/xml_processing_instruction.h +9 -0
  111. data/ext/nokogiri/xml_reader.c +684 -0
  112. data/ext/nokogiri/xml_reader.h +10 -0
  113. data/ext/nokogiri/xml_relax_ng.c +161 -0
  114. data/ext/nokogiri/xml_relax_ng.h +9 -0
  115. data/ext/nokogiri/xml_sax_parser.c +293 -0
  116. data/ext/nokogiri/xml_sax_parser.h +39 -0
  117. data/ext/nokogiri/xml_sax_parser_context.c +199 -0
  118. data/ext/nokogiri/xml_sax_parser_context.h +10 -0
  119. data/ext/nokogiri/xml_sax_push_parser.c +115 -0
  120. data/ext/nokogiri/xml_sax_push_parser.h +9 -0
  121. data/ext/nokogiri/xml_schema.c +205 -0
  122. data/ext/nokogiri/xml_schema.h +9 -0
  123. data/ext/nokogiri/xml_syntax_error.c +58 -0
  124. data/ext/nokogiri/xml_syntax_error.h +13 -0
  125. data/ext/nokogiri/xml_text.c +50 -0
  126. data/ext/nokogiri/xml_text.h +9 -0
  127. data/ext/nokogiri/xml_xpath_context.c +309 -0
  128. data/ext/nokogiri/xml_xpath_context.h +9 -0
  129. data/ext/nokogiri/xslt_stylesheet.c +264 -0
  130. data/ext/nokogiri/xslt_stylesheet.h +9 -0
  131. data/lib/nokogiri.rb +127 -0
  132. data/lib/nokogiri/css.rb +27 -0
  133. data/lib/nokogiri/css/node.rb +99 -0
  134. data/lib/nokogiri/css/parser.rb +677 -0
  135. data/lib/nokogiri/css/parser.y +237 -0
  136. data/lib/nokogiri/css/parser_extras.rb +91 -0
  137. data/lib/nokogiri/css/syntax_error.rb +7 -0
  138. data/lib/nokogiri/css/tokenizer.rb +152 -0
  139. data/lib/nokogiri/css/tokenizer.rex +55 -0
  140. data/lib/nokogiri/css/xpath_visitor.rb +171 -0
  141. data/lib/nokogiri/decorators/slop.rb +35 -0
  142. data/lib/nokogiri/html.rb +36 -0
  143. data/lib/nokogiri/html/builder.rb +35 -0
  144. data/lib/nokogiri/html/document.rb +213 -0
  145. data/lib/nokogiri/html/document_fragment.rb +41 -0
  146. data/lib/nokogiri/html/element_description.rb +23 -0
  147. data/lib/nokogiri/html/element_description_defaults.rb +671 -0
  148. data/lib/nokogiri/html/entity_lookup.rb +13 -0
  149. data/lib/nokogiri/html/sax/parser.rb +52 -0
  150. data/lib/nokogiri/html/sax/parser_context.rb +16 -0
  151. data/lib/nokogiri/nokogiri.jar +0 -0
  152. data/lib/nokogiri/syntax_error.rb +4 -0
  153. data/lib/nokogiri/version.rb +88 -0
  154. data/lib/nokogiri/xml.rb +67 -0
  155. data/lib/nokogiri/xml/attr.rb +14 -0
  156. data/lib/nokogiri/xml/attribute_decl.rb +18 -0
  157. data/lib/nokogiri/xml/builder.rb +425 -0
  158. data/lib/nokogiri/xml/cdata.rb +11 -0
  159. data/lib/nokogiri/xml/character_data.rb +7 -0
  160. data/lib/nokogiri/xml/document.rb +234 -0
  161. data/lib/nokogiri/xml/document_fragment.rb +98 -0
  162. data/lib/nokogiri/xml/dtd.rb +22 -0
  163. data/lib/nokogiri/xml/element_content.rb +36 -0
  164. data/lib/nokogiri/xml/element_decl.rb +13 -0
  165. data/lib/nokogiri/xml/entity_decl.rb +19 -0
  166. data/lib/nokogiri/xml/namespace.rb +13 -0
  167. data/lib/nokogiri/xml/node.rb +915 -0
  168. data/lib/nokogiri/xml/node/save_options.rb +61 -0
  169. data/lib/nokogiri/xml/node_set.rb +357 -0
  170. data/lib/nokogiri/xml/notation.rb +6 -0
  171. data/lib/nokogiri/xml/parse_options.rb +93 -0
  172. data/lib/nokogiri/xml/pp.rb +2 -0
  173. data/lib/nokogiri/xml/pp/character_data.rb +18 -0
  174. data/lib/nokogiri/xml/pp/node.rb +56 -0
  175. data/lib/nokogiri/xml/processing_instruction.rb +8 -0
  176. data/lib/nokogiri/xml/reader.rb +112 -0
  177. data/lib/nokogiri/xml/relax_ng.rb +32 -0
  178. data/lib/nokogiri/xml/sax.rb +4 -0
  179. data/lib/nokogiri/xml/sax/document.rb +164 -0
  180. data/lib/nokogiri/xml/sax/parser.rb +115 -0
  181. data/lib/nokogiri/xml/sax/parser_context.rb +16 -0
  182. data/lib/nokogiri/xml/sax/push_parser.rb +60 -0
  183. data/lib/nokogiri/xml/schema.rb +63 -0
  184. data/lib/nokogiri/xml/syntax_error.rb +47 -0
  185. data/lib/nokogiri/xml/text.rb +9 -0
  186. data/lib/nokogiri/xml/xpath.rb +10 -0
  187. data/lib/nokogiri/xml/xpath/syntax_error.rb +11 -0
  188. data/lib/nokogiri/xml/xpath_context.rb +16 -0
  189. data/lib/nokogiri/xslt.rb +52 -0
  190. data/lib/nokogiri/xslt/stylesheet.rb +25 -0
  191. data/lib/xsd/xmlparser/nokogiri.rb +90 -0
  192. data/nokogiri_help_responses.md +40 -0
  193. data/tasks/cross_compile.rb +152 -0
  194. data/tasks/nokogiri.org.rb +18 -0
  195. data/tasks/test.rb +94 -0
  196. data/test/css/test_nthiness.rb +159 -0
  197. data/test/css/test_parser.rb +303 -0
  198. data/test/css/test_tokenizer.rb +198 -0
  199. data/test/css/test_xpath_visitor.rb +85 -0
  200. data/test/decorators/test_slop.rb +16 -0
  201. data/test/files/2ch.html +108 -0
  202. data/test/files/address_book.rlx +12 -0
  203. data/test/files/address_book.xml +10 -0
  204. data/test/files/bar/bar.xsd +4 -0
  205. data/test/files/dont_hurt_em_why.xml +422 -0
  206. data/test/files/encoding.html +82 -0
  207. data/test/files/encoding.xhtml +84 -0
  208. data/test/files/exslt.xml +8 -0
  209. data/test/files/exslt.xslt +35 -0
  210. data/test/files/foo/foo.xsd +4 -0
  211. data/test/files/metacharset.html +10 -0
  212. data/test/files/noencoding.html +47 -0
  213. data/test/files/po.xml +32 -0
  214. data/test/files/po.xsd +66 -0
  215. data/test/files/shift_jis.html +10 -0
  216. data/test/files/shift_jis.xml +5 -0
  217. data/test/files/snuggles.xml +3 -0
  218. data/test/files/staff.dtd +10 -0
  219. data/test/files/staff.xml +59 -0
  220. data/test/files/staff.xslt +32 -0
  221. data/test/files/tlm.html +850 -0
  222. data/test/files/valid_bar.xml +2 -0
  223. data/test/helper.rb +173 -0
  224. data/test/html/sax/test_parser.rb +136 -0
  225. data/test/html/sax/test_parser_context.rb +48 -0
  226. data/test/html/test_builder.rb +164 -0
  227. data/test/html/test_document.rb +472 -0
  228. data/test/html/test_document_encoding.rb +138 -0
  229. data/test/html/test_document_fragment.rb +255 -0
  230. data/test/html/test_element_description.rb +100 -0
  231. data/test/html/test_named_characters.rb +14 -0
  232. data/test/html/test_node.rb +190 -0
  233. data/test/html/test_node_encoding.rb +27 -0
  234. data/test/test_convert_xpath.rb +135 -0
  235. data/test/test_css_cache.rb +45 -0
  236. data/test/test_encoding_handler.rb +46 -0
  237. data/test/test_memory_leak.rb +72 -0
  238. data/test/test_nokogiri.rb +132 -0
  239. data/test/test_reader.rb +425 -0
  240. data/test/test_soap4r_sax.rb +52 -0
  241. data/test/test_xslt_transforms.rb +193 -0
  242. data/test/xml/node/test_save_options.rb +28 -0
  243. data/test/xml/node/test_subclass.rb +44 -0
  244. data/test/xml/sax/test_parser.rb +338 -0
  245. data/test/xml/sax/test_parser_context.rb +113 -0
  246. data/test/xml/sax/test_push_parser.rb +156 -0
  247. data/test/xml/test_attr.rb +65 -0
  248. data/test/xml/test_attribute_decl.rb +86 -0
  249. data/test/xml/test_builder.rb +227 -0
  250. data/test/xml/test_cdata.rb +50 -0
  251. data/test/xml/test_comment.rb +29 -0
  252. data/test/xml/test_document.rb +697 -0
  253. data/test/xml/test_document_encoding.rb +26 -0
  254. data/test/xml/test_document_fragment.rb +192 -0
  255. data/test/xml/test_dtd.rb +107 -0
  256. data/test/xml/test_dtd_encoding.rb +33 -0
  257. data/test/xml/test_element_content.rb +56 -0
  258. data/test/xml/test_element_decl.rb +73 -0
  259. data/test/xml/test_entity_decl.rb +122 -0
  260. data/test/xml/test_entity_reference.rb +21 -0
  261. data/test/xml/test_namespace.rb +70 -0
  262. data/test/xml/test_node.rb +917 -0
  263. data/test/xml/test_node_attributes.rb +34 -0
  264. data/test/xml/test_node_encoding.rb +107 -0
  265. data/test/xml/test_node_reparenting.rb +334 -0
  266. data/test/xml/test_node_set.rb +742 -0
  267. data/test/xml/test_parse_options.rb +52 -0
  268. data/test/xml/test_processing_instruction.rb +30 -0
  269. data/test/xml/test_reader_encoding.rb +126 -0
  270. data/test/xml/test_relax_ng.rb +60 -0
  271. data/test/xml/test_schema.rb +94 -0
  272. data/test/xml/test_syntax_error.rb +12 -0
  273. data/test/xml/test_text.rb +47 -0
  274. data/test/xml/test_unparented_node.rb +381 -0
  275. data/test/xml/test_xpath.rb +237 -0
  276. data/test/xslt/test_custom_functions.rb +94 -0
  277. data/test/xslt/test_exception_handling.rb +37 -0
  278. metadata +552 -0
@@ -0,0 +1,184 @@
1
+ /**
2
+ * (The MIT License)
3
+ *
4
+ * Copyright (c) 2008 - 2011:
5
+ *
6
+ * * {Aaron Patterson}[http://tenderlovemaking.com]
7
+ * * {Mike Dalessio}[http://mike.daless.io]
8
+ * * {Charles Nutter}[http://blog.headius.com]
9
+ * * {Sergio Arbeo}[http://www.serabe.com]
10
+ * * {Patrick Mahoney}[http://polycrystal.org]
11
+ * * {Yoko Harada}[http://yokolet.blogspot.com]
12
+ *
13
+ * Permission is hereby granted, free of charge, to any person obtaining
14
+ * a copy of this software and associated documentation files (the
15
+ * 'Software'), to deal in the Software without restriction, including
16
+ * without limitation the rights to use, copy, modify, merge, publish,
17
+ * distribute, sublicense, and/or sell copies of the Software, and to
18
+ * permit persons to whom the Software is furnished to do so, subject to
19
+ * the following conditions:
20
+ *
21
+ * The above copyright notice and this permission notice shall be
22
+ * included in all copies or substantial portions of the Software.
23
+ *
24
+ * THE SOFTWARE IS PROVIDED 'AS IS', WITHOUT WARRANTY OF ANY KIND,
25
+ * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
26
+ * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
27
+ * IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY
28
+ * CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
29
+ * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
30
+ * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
31
+ */
32
+
33
+ package nokogiri;
34
+
35
+ import static nokogiri.internals.NokogiriHelpers.getNokogiriClass;
36
+ import static org.jruby.javasupport.util.RuntimeHelpers.invoke;
37
+
38
+ import java.io.IOException;
39
+ import java.io.InputStream;
40
+ import java.nio.channels.ClosedChannelException;
41
+
42
+ import nokogiri.internals.ParserContext;
43
+ import nokogiri.internals.PushInputStream;
44
+
45
+ import org.jruby.Ruby;
46
+ import org.jruby.RubyClass;
47
+ import org.jruby.RubyException;
48
+ import org.jruby.RubyObject;
49
+ import org.jruby.RubyString;
50
+ import org.jruby.anno.JRubyClass;
51
+ import org.jruby.anno.JRubyMethod;
52
+ import org.jruby.exceptions.RaiseException;
53
+ import org.jruby.runtime.ThreadContext;
54
+ import org.jruby.runtime.builtin.IRubyObject;
55
+
56
+ /**
57
+ * Class for Nokogiri::XML::SAX::PushParser
58
+ *
59
+ * @author Patrick Mahoney <pat@polycrystal.org>
60
+ * @author Yoko Harada <yokolet@gmail.com>
61
+ */
62
+ @JRubyClass(name="Nokogiri::XML::SAX::PushParser")
63
+ public class XmlSaxPushParser extends RubyObject {
64
+ ParserContext.Options options;
65
+ IRubyObject optionsRuby;
66
+ PushInputStream stream;
67
+ Thread reader;
68
+ Runner runner;
69
+
70
+ public XmlSaxPushParser(Ruby ruby, RubyClass rubyClass) {
71
+ super(ruby, rubyClass);
72
+ }
73
+
74
+ @JRubyMethod
75
+ public IRubyObject initialize_native(final ThreadContext context,
76
+ IRubyObject _saxParser,
77
+ IRubyObject fileName) {
78
+ optionsRuby = invoke(context,
79
+ context.getRuntime().getClassFromPath("Nokogiri::XML::ParseOptions"),
80
+ "new");
81
+ options = new ParserContext.Options(0);
82
+ stream = new PushInputStream();
83
+
84
+ runner = new Runner(context, this, stream);
85
+ reader = new Thread(runner);
86
+ reader.start();
87
+
88
+ return this;
89
+ }
90
+
91
+ /**
92
+ * Returns an integer.
93
+ */
94
+ @JRubyMethod(name="options")
95
+ public IRubyObject getOptions(ThreadContext context) {
96
+ return invoke(context, optionsRuby, "options");
97
+ }
98
+
99
+ /**
100
+ * <code>val</code> is an integer.
101
+ */
102
+ @JRubyMethod(name="options=")
103
+ public IRubyObject setOptions(ThreadContext context, IRubyObject val) {
104
+ invoke(context, optionsRuby, "options=", val);
105
+ options =
106
+ new ParserContext.Options(val.convertToInteger().getLongValue());
107
+ return getOptions(context);
108
+ }
109
+
110
+ @JRubyMethod
111
+ public IRubyObject native_write(ThreadContext context, IRubyObject chunk,
112
+ IRubyObject isLast) {
113
+ byte[] data = null;
114
+ if (chunk instanceof RubyString || chunk.respondsTo("to_str")) {
115
+ data = chunk.convertToString().getBytes();
116
+ } else {
117
+ XmlSyntaxError xmlSyntaxError = (XmlSyntaxError) NokogiriService.XML_SYNTAXERROR_ALLOCATOR.allocate(context.getRuntime(), getNokogiriClass(context.getRuntime(), "Nokogiri::XML::SyntaxError"));
118
+ throw new RaiseException(xmlSyntaxError);
119
+ }
120
+
121
+ int errorCount0 = runner.getErrorCount();
122
+
123
+ try {
124
+ stream.writeAndWaitForRead(data);
125
+ } catch (ClosedChannelException e) {
126
+ // ignore
127
+ } catch (IOException e) {
128
+ throw context.getRuntime().newRuntimeError(e.toString());
129
+ }
130
+
131
+ if (isLast.isTrue()) {
132
+ try {
133
+ stream.close();
134
+ } catch (IOException e) {
135
+ // ignore
136
+ }
137
+
138
+ for (;;) {
139
+ try {
140
+ reader.join();
141
+ break;
142
+ } catch (InterruptedException e) {
143
+ // continue loop
144
+ }
145
+ }
146
+ }
147
+
148
+ if (!options.recover && runner.getErrorCount() > errorCount0) {
149
+ throw new RaiseException(runner.getLastError(), true);
150
+ }
151
+
152
+ return this;
153
+ }
154
+
155
+ protected static class Runner implements Runnable {
156
+ protected ThreadContext context;
157
+ protected IRubyObject handler;
158
+ protected XmlSaxParserContext parser;
159
+
160
+ public Runner(ThreadContext context,
161
+ IRubyObject handler,
162
+ InputStream stream) {
163
+ RubyClass klazz = getNokogiriClass(context.getRuntime(), "Nokogiri::XML::SAX::ParserContext");
164
+
165
+ this.context = context;
166
+ this.handler = handler;
167
+ this.parser = (XmlSaxParserContext) XmlSaxParserContext.parse_stream(context, klazz, stream);
168
+ }
169
+
170
+ public void run() {
171
+ parser.parse_with(context, handler);
172
+ }
173
+
174
+ public int getErrorCount() {
175
+ // check for null because thread may nto have started yet
176
+ if (parser.getNokogiriHandler() == null) return 0;
177
+ else return parser.getNokogiriHandler().getErrorCount();
178
+ }
179
+
180
+ public RubyException getLastError() {
181
+ return (RubyException) parser.getNokogiriHandler().getLastError();
182
+ }
183
+ }
184
+ }
@@ -0,0 +1,324 @@
1
+ /**
2
+ * (The MIT License)
3
+ *
4
+ * Copyright (c) 2008 - 2011:
5
+ *
6
+ * * {Aaron Patterson}[http://tenderlovemaking.com]
7
+ * * {Mike Dalessio}[http://mike.daless.io]
8
+ * * {Charles Nutter}[http://blog.headius.com]
9
+ * * {Sergio Arbeo}[http://www.serabe.com]
10
+ * * {Patrick Mahoney}[http://polycrystal.org]
11
+ * * {Yoko Harada}[http://yokolet.blogspot.com]
12
+ *
13
+ * Permission is hereby granted, free of charge, to any person obtaining
14
+ * a copy of this software and associated documentation files (the
15
+ * 'Software'), to deal in the Software without restriction, including
16
+ * without limitation the rights to use, copy, modify, merge, publish,
17
+ * distribute, sublicense, and/or sell copies of the Software, and to
18
+ * permit persons to whom the Software is furnished to do so, subject to
19
+ * the following conditions:
20
+ *
21
+ * The above copyright notice and this permission notice shall be
22
+ * included in all copies or substantial portions of the Software.
23
+ *
24
+ * THE SOFTWARE IS PROVIDED 'AS IS', WITHOUT WARRANTY OF ANY KIND,
25
+ * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
26
+ * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
27
+ * IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY
28
+ * CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
29
+ * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
30
+ * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
31
+ */
32
+
33
+ package nokogiri;
34
+
35
+ import static nokogiri.internals.NokogiriHelpers.getNokogiriClass;
36
+ import static nokogiri.internals.NokogiriHelpers.adjustSystemIdIfNecessary;
37
+
38
+ import java.io.IOException;
39
+ import java.io.InputStream;
40
+ import java.io.Reader;
41
+ import java.io.StringReader;
42
+
43
+ import javax.xml.XMLConstants;
44
+ import javax.xml.transform.Source;
45
+ import javax.xml.transform.dom.DOMSource;
46
+ import javax.xml.transform.stream.StreamSource;
47
+ import javax.xml.validation.Schema;
48
+ import javax.xml.validation.SchemaFactory;
49
+ import javax.xml.validation.Validator;
50
+
51
+ import nokogiri.internals.SchemaErrorHandler;
52
+ import nokogiri.internals.XmlDomParserContext;
53
+
54
+ import org.jruby.Ruby;
55
+ import org.jruby.RubyArray;
56
+ import org.jruby.RubyClass;
57
+ import org.jruby.RubyFixnum;
58
+ import org.jruby.RubyObject;
59
+ import org.jruby.anno.JRubyClass;
60
+ import org.jruby.anno.JRubyMethod;
61
+ import org.jruby.exceptions.RaiseException;
62
+ import org.jruby.runtime.ThreadContext;
63
+ import org.jruby.runtime.Visibility;
64
+ import org.jruby.runtime.builtin.IRubyObject;
65
+ import org.w3c.dom.Document;
66
+ import org.w3c.dom.ls.LSInput;
67
+ import org.w3c.dom.ls.LSResourceResolver;
68
+ import org.xml.sax.ErrorHandler;
69
+ import org.xml.sax.SAXException;
70
+
71
+ /**
72
+ * Class for Nokogiri::XML::Schema
73
+ *
74
+ * @author sergio
75
+ * @author Yoko Harada <yokolet@gmail.com>
76
+ */
77
+ @JRubyClass(name="Nokogiri::XML::Schema")
78
+ public class XmlSchema extends RubyObject {
79
+ private Validator validator;
80
+
81
+ public XmlSchema(Ruby ruby, RubyClass klazz) {
82
+ super(ruby, klazz);
83
+ }
84
+
85
+ /**
86
+ * Create and return a copy of this object.
87
+ *
88
+ * @return a clone of this object
89
+ */
90
+ @Override
91
+ public Object clone() throws CloneNotSupportedException {
92
+ return super.clone();
93
+ }
94
+
95
+ private Schema getSchema(Source source, String currentDir, String scriptFileName) throws SAXException {
96
+ SchemaFactory schemaFactory = SchemaFactory.newInstance(XMLConstants.W3C_XML_SCHEMA_NS_URI);
97
+ SchemaResourceResolver resourceResolver = new SchemaResourceResolver(currentDir, scriptFileName, null);
98
+ schemaFactory.setResourceResolver(resourceResolver);
99
+ return schemaFactory.newSchema(source);
100
+ }
101
+
102
+ private void setValidator(Validator validator) {
103
+ this.validator = validator;
104
+ }
105
+
106
+ static XmlSchema createSchemaInstance(ThreadContext context, RubyClass klazz, Source source) {
107
+ Ruby runtime = context.getRuntime();
108
+ XmlSchema xmlSchema = (XmlSchema) NokogiriService.XML_SCHEMA_ALLOCATOR.allocate(runtime, klazz);
109
+ xmlSchema.setInstanceVariable("@errors", runtime.newEmptyArray());
110
+
111
+ try {
112
+ Schema schema = xmlSchema.getSchema(source, context.getRuntime().getCurrentDirectory(), context.getRuntime().getInstanceConfig().getScriptFileName());
113
+ xmlSchema.setValidator(schema.newValidator());
114
+ return xmlSchema;
115
+ } catch (SAXException ex) {
116
+ throw context.getRuntime().newRuntimeError("Could not parse document: " + ex.getMessage());
117
+ }
118
+ }
119
+
120
+ /*
121
+ * call-seq:
122
+ * from_document(doc)
123
+ *
124
+ * Create a new Schema from the Nokogiri::XML::Document +doc+
125
+ */
126
+ @JRubyMethod(meta=true)
127
+ public static IRubyObject from_document(ThreadContext context, IRubyObject klazz, IRubyObject document) {
128
+ XmlDocument doc = ((XmlDocument) ((XmlNode) document).document(context));
129
+
130
+ RubyArray errors = (RubyArray) doc.getInstanceVariable("@errors");
131
+ if (!errors.isEmpty()) {
132
+ throw new RaiseException((XmlSyntaxError) errors.first());
133
+ }
134
+
135
+ DOMSource source = new DOMSource(doc.getDocument());
136
+
137
+ IRubyObject uri = doc.url(context);
138
+
139
+ if (!uri.isNil()) {
140
+ source.setSystemId(uri.convertToString().asJavaString());
141
+ }
142
+
143
+ return getSchema(context, (RubyClass)klazz, source);
144
+ }
145
+
146
+ private static IRubyObject getSchema(ThreadContext context, RubyClass klazz, Source source) {
147
+ String moduleName = klazz.getName();
148
+ if ("Nokogiri::XML::Schema".equals(moduleName)) {
149
+ return XmlSchema.createSchemaInstance(context, klazz, source);
150
+ } else if ("Nokogiri::XML::RelaxNG".equals(moduleName)) {
151
+ return XmlRelaxng.createSchemaInstance(context, klazz, source);
152
+ }
153
+ return context.getRuntime().getNil();
154
+ }
155
+
156
+ @JRubyMethod(meta=true)
157
+ public static IRubyObject read_memory(ThreadContext context, IRubyObject klazz, IRubyObject content) {
158
+ String data = content.convertToString().asJavaString();
159
+ return getSchema(context, (RubyClass) klazz, new StreamSource(new StringReader(data)));
160
+ }
161
+
162
+ @JRubyMethod(visibility=Visibility.PRIVATE)
163
+ public IRubyObject validate_document(ThreadContext context, IRubyObject document) {
164
+ return validate_document_or_file(context, (XmlDocument)document);
165
+ }
166
+
167
+ @JRubyMethod(visibility=Visibility.PRIVATE)
168
+ public IRubyObject validate_file(ThreadContext context, IRubyObject file) {
169
+ Ruby ruby = context.getRuntime();
170
+
171
+ XmlDomParserContext ctx = new XmlDomParserContext(ruby, RubyFixnum.newFixnum(ruby, 1L));
172
+ ctx.setInputSource(context, file, context.getRuntime().getNil());
173
+ XmlDocument xmlDocument = ctx.parse(context, getNokogiriClass(ruby, "Nokogiri::XML::Document"), ruby.getNil());
174
+ return validate_document_or_file(context, xmlDocument);
175
+ }
176
+
177
+ IRubyObject validate_document_or_file(ThreadContext context, XmlDocument xmlDocument) {
178
+ RubyArray errors = (RubyArray) this.getInstanceVariable("@errors");
179
+ ErrorHandler errorHandler = new SchemaErrorHandler(context.getRuntime(), errors);
180
+ setErrorHandler(errorHandler);
181
+
182
+ try {
183
+ validate(xmlDocument.getDocument());
184
+ } catch(SAXException ex) {
185
+ XmlSyntaxError xmlSyntaxError = (XmlSyntaxError) NokogiriService.XML_SYNTAXERROR_ALLOCATOR.allocate(context.getRuntime(), getNokogiriClass(context.getRuntime(), "Nokogiri::XML::SyntaxError"));
186
+ xmlSyntaxError.setException(ex);
187
+ errors.append(xmlSyntaxError);
188
+ } catch (IOException ex) {
189
+ throw context.getRuntime().newIOError(ex.getMessage());
190
+ }
191
+
192
+ return errors;
193
+ }
194
+
195
+ protected void setErrorHandler(ErrorHandler errorHandler) {
196
+ validator.setErrorHandler(errorHandler);
197
+ }
198
+
199
+ protected void validate(Document document) throws SAXException, IOException {
200
+ DOMSource docSource = new DOMSource(document);
201
+ validator.validate(docSource);
202
+ }
203
+
204
+ private class SchemaResourceResolver implements LSResourceResolver {
205
+ SchemaLSInput lsInput = new SchemaLSInput();
206
+ String currentDir;
207
+ String scriptFileName;
208
+ //String defaultURI;
209
+
210
+ SchemaResourceResolver(String currentDir, String scriptFileName, Object input) {
211
+ this.currentDir = currentDir;
212
+ this.scriptFileName = scriptFileName;
213
+ if (input == null) return;
214
+ if (input instanceof String) {
215
+ lsInput.setStringData((String)input);
216
+ } else if (input instanceof Reader) {
217
+ lsInput.setCharacterStream((Reader)input);
218
+ } else if (input instanceof InputStream) {
219
+ lsInput.setByteStream((InputStream)input);
220
+ }
221
+ }
222
+
223
+ @Override
224
+ public LSInput resolveResource(String type, String namespaceURI, String publicId, String systemId, String baseURI) {
225
+ String adjusted = adjustSystemIdIfNecessary(currentDir, scriptFileName, baseURI, systemId);
226
+ lsInput.setPublicId(publicId);
227
+ lsInput.setSystemId(adjusted);
228
+ lsInput.setBaseURI(baseURI);
229
+ return lsInput;
230
+ }
231
+ }
232
+
233
+ private class SchemaLSInput implements LSInput {
234
+ protected String fPublicId;
235
+ protected String fSystemId;
236
+ protected String fBaseSystemId;
237
+ protected InputStream fByteStream;
238
+ protected Reader fCharStream;
239
+ protected String fData;
240
+ protected String fEncoding;
241
+ protected boolean fCertifiedText = false;
242
+
243
+ @Override
244
+ public String getBaseURI() {
245
+ return fBaseSystemId;
246
+ }
247
+
248
+ @Override
249
+ public InputStream getByteStream() {
250
+ return fByteStream;
251
+ }
252
+
253
+ @Override
254
+ public boolean getCertifiedText() {
255
+ return fCertifiedText;
256
+ }
257
+
258
+ @Override
259
+ public Reader getCharacterStream() {
260
+ return fCharStream;
261
+ }
262
+
263
+ @Override
264
+ public String getEncoding() {
265
+ return fEncoding;
266
+ }
267
+
268
+ @Override
269
+ public String getPublicId() {
270
+ return fPublicId;
271
+ }
272
+
273
+ @Override
274
+ public String getStringData() {
275
+ return fData;
276
+ }
277
+
278
+ @Override
279
+ public String getSystemId() {
280
+ return fSystemId;
281
+ }
282
+
283
+ @Override
284
+ public void setBaseURI(String baseURI) {
285
+ fBaseSystemId = baseURI;
286
+ }
287
+
288
+ @Override
289
+ public void setByteStream(InputStream byteStream) {
290
+ fByteStream = byteStream;
291
+ }
292
+
293
+ @Override
294
+ public void setCertifiedText(boolean certified) {
295
+ fCertifiedText = certified;
296
+ }
297
+
298
+ @Override
299
+ public void setCharacterStream(Reader charStream) {
300
+ fCharStream = charStream;
301
+ }
302
+
303
+ @Override
304
+ public void setEncoding(String encoding) {
305
+ fEncoding = encoding;
306
+ }
307
+
308
+ @Override
309
+ public void setPublicId(String pubId) {
310
+ fPublicId = pubId;
311
+ }
312
+
313
+ @Override
314
+ public void setStringData(String stringData) {
315
+ fData = stringData;
316
+ }
317
+
318
+ @Override
319
+ public void setSystemId(String sysId) {
320
+ fSystemId = sysId;
321
+ }
322
+
323
+ }
324
+ }