nokogiri 1.2.3-x86-mswin32-60 → 1.4.5-x86-mswin32-60

Sign up to get free protection for your applications and to get access to all the features.

Potentially problematic release.


This version of nokogiri might be problematic. Click here for more details.

Files changed (319) hide show
  1. data/.autotest +18 -7
  2. data/.gemtest +0 -0
  3. data/CHANGELOG.ja.rdoc +297 -3
  4. data/CHANGELOG.rdoc +289 -0
  5. data/Manifest.txt +148 -37
  6. data/README.ja.rdoc +20 -20
  7. data/README.rdoc +53 -22
  8. data/Rakefile +127 -211
  9. data/bin/nokogiri +54 -0
  10. data/ext/nokogiri/depend +358 -0
  11. data/ext/nokogiri/extconf.rb +89 -54
  12. data/ext/nokogiri/html_document.c +34 -27
  13. data/ext/nokogiri/html_document.h +1 -1
  14. data/ext/nokogiri/html_element_description.c +276 -0
  15. data/ext/nokogiri/html_element_description.h +10 -0
  16. data/ext/nokogiri/html_entity_lookup.c +7 -5
  17. data/ext/nokogiri/html_entity_lookup.h +1 -1
  18. data/ext/nokogiri/html_sax_parser_context.c +94 -0
  19. data/ext/nokogiri/html_sax_parser_context.h +11 -0
  20. data/ext/nokogiri/{native.c → nokogiri.c} +31 -7
  21. data/ext/nokogiri/{native.h → nokogiri.h} +68 -41
  22. data/ext/nokogiri/xml_attr.c +20 -9
  23. data/ext/nokogiri/xml_attr.h +1 -1
  24. data/ext/nokogiri/xml_attribute_decl.c +70 -0
  25. data/ext/nokogiri/xml_attribute_decl.h +9 -0
  26. data/ext/nokogiri/xml_cdata.c +21 -9
  27. data/ext/nokogiri/xml_cdata.h +1 -1
  28. data/ext/nokogiri/xml_comment.c +18 -6
  29. data/ext/nokogiri/xml_comment.h +1 -1
  30. data/ext/nokogiri/xml_document.c +247 -68
  31. data/ext/nokogiri/xml_document.h +5 -3
  32. data/ext/nokogiri/xml_document_fragment.c +15 -7
  33. data/ext/nokogiri/xml_document_fragment.h +1 -1
  34. data/ext/nokogiri/xml_dtd.c +110 -10
  35. data/ext/nokogiri/xml_dtd.h +3 -1
  36. data/ext/nokogiri/xml_element_content.c +123 -0
  37. data/ext/nokogiri/xml_element_content.h +10 -0
  38. data/ext/nokogiri/xml_element_decl.c +69 -0
  39. data/ext/nokogiri/xml_element_decl.h +9 -0
  40. data/ext/nokogiri/xml_encoding_handler.c +79 -0
  41. data/ext/nokogiri/xml_encoding_handler.h +8 -0
  42. data/ext/nokogiri/xml_entity_decl.c +110 -0
  43. data/ext/nokogiri/xml_entity_decl.h +10 -0
  44. data/ext/nokogiri/xml_entity_reference.c +16 -5
  45. data/ext/nokogiri/xml_entity_reference.h +1 -1
  46. data/ext/nokogiri/xml_io.c +40 -8
  47. data/ext/nokogiri/xml_io.h +2 -1
  48. data/ext/nokogiri/xml_libxml2_hacks.c +112 -0
  49. data/ext/nokogiri/xml_libxml2_hacks.h +12 -0
  50. data/ext/nokogiri/xml_namespace.c +84 -0
  51. data/ext/nokogiri/xml_namespace.h +13 -0
  52. data/ext/nokogiri/xml_node.c +782 -225
  53. data/ext/nokogiri/xml_node.h +2 -4
  54. data/ext/nokogiri/xml_node_set.c +253 -34
  55. data/ext/nokogiri/xml_node_set.h +2 -2
  56. data/ext/nokogiri/xml_processing_instruction.c +17 -5
  57. data/ext/nokogiri/xml_processing_instruction.h +1 -1
  58. data/ext/nokogiri/xml_reader.c +277 -85
  59. data/ext/nokogiri/xml_reader.h +1 -1
  60. data/ext/nokogiri/xml_relax_ng.c +168 -0
  61. data/ext/nokogiri/xml_relax_ng.h +9 -0
  62. data/ext/nokogiri/xml_sax_parser.c +183 -111
  63. data/ext/nokogiri/xml_sax_parser.h +30 -1
  64. data/ext/nokogiri/xml_sax_parser_context.c +199 -0
  65. data/ext/nokogiri/xml_sax_parser_context.h +10 -0
  66. data/ext/nokogiri/xml_sax_push_parser.c +42 -12
  67. data/ext/nokogiri/xml_sax_push_parser.h +1 -1
  68. data/ext/nokogiri/xml_schema.c +205 -0
  69. data/ext/nokogiri/xml_schema.h +9 -0
  70. data/ext/nokogiri/xml_syntax_error.c +28 -173
  71. data/ext/nokogiri/xml_syntax_error.h +2 -1
  72. data/ext/nokogiri/xml_text.c +16 -6
  73. data/ext/nokogiri/xml_text.h +1 -1
  74. data/ext/nokogiri/xml_xpath_context.c +104 -47
  75. data/ext/nokogiri/xml_xpath_context.h +1 -1
  76. data/ext/nokogiri/xslt_stylesheet.c +161 -19
  77. data/ext/nokogiri/xslt_stylesheet.h +1 -1
  78. data/lib/nokogiri.rb +47 -8
  79. data/lib/nokogiri/1.8/nokogiri.so +0 -0
  80. data/lib/nokogiri/1.9/nokogiri.so +0 -0
  81. data/lib/nokogiri/css.rb +6 -3
  82. data/lib/nokogiri/css/node.rb +14 -12
  83. data/lib/nokogiri/css/parser.rb +665 -62
  84. data/lib/nokogiri/css/parser.y +20 -10
  85. data/lib/nokogiri/css/parser_extras.rb +91 -0
  86. data/lib/nokogiri/css/tokenizer.rb +148 -5
  87. data/lib/nokogiri/css/tokenizer.rex +10 -9
  88. data/lib/nokogiri/css/xpath_visitor.rb +47 -44
  89. data/lib/nokogiri/decorators/slop.rb +8 -4
  90. data/lib/nokogiri/ffi/encoding_handler.rb +42 -0
  91. data/lib/nokogiri/ffi/html/document.rb +28 -0
  92. data/lib/nokogiri/ffi/html/element_description.rb +81 -0
  93. data/lib/nokogiri/ffi/html/entity_lookup.rb +16 -0
  94. data/lib/nokogiri/ffi/html/sax/parser_context.rb +38 -0
  95. data/lib/nokogiri/ffi/io_callbacks.rb +42 -0
  96. data/lib/nokogiri/ffi/libxml.rb +420 -0
  97. data/lib/nokogiri/ffi/structs/common_node.rb +38 -0
  98. data/lib/nokogiri/ffi/structs/html_elem_desc.rb +24 -0
  99. data/lib/nokogiri/ffi/structs/html_entity_desc.rb +13 -0
  100. data/lib/nokogiri/ffi/structs/xml_alloc.rb +16 -0
  101. data/lib/nokogiri/ffi/structs/xml_attr.rb +20 -0
  102. data/lib/nokogiri/ffi/structs/xml_attribute.rb +27 -0
  103. data/lib/nokogiri/ffi/structs/xml_buffer.rb +16 -0
  104. data/lib/nokogiri/ffi/structs/xml_char_encoding_handler.rb +11 -0
  105. data/lib/nokogiri/ffi/structs/xml_document.rb +117 -0
  106. data/lib/nokogiri/ffi/structs/xml_dtd.rb +28 -0
  107. data/lib/nokogiri/ffi/structs/xml_element.rb +26 -0
  108. data/lib/nokogiri/ffi/structs/xml_element_content.rb +17 -0
  109. data/lib/nokogiri/ffi/structs/xml_entity.rb +32 -0
  110. data/lib/nokogiri/ffi/structs/xml_enumeration.rb +12 -0
  111. data/lib/nokogiri/ffi/structs/xml_node.rb +28 -0
  112. data/lib/nokogiri/ffi/structs/xml_node_set.rb +53 -0
  113. data/lib/nokogiri/ffi/structs/xml_notation.rb +11 -0
  114. data/lib/nokogiri/ffi/structs/xml_ns.rb +15 -0
  115. data/lib/nokogiri/ffi/structs/xml_parser_context.rb +20 -0
  116. data/lib/nokogiri/ffi/structs/xml_parser_input.rb +19 -0
  117. data/lib/nokogiri/ffi/structs/xml_relax_ng.rb +14 -0
  118. data/lib/nokogiri/ffi/structs/xml_sax_handler.rb +51 -0
  119. data/lib/nokogiri/ffi/structs/xml_sax_push_parser_context.rb +124 -0
  120. data/lib/nokogiri/ffi/structs/xml_schema.rb +13 -0
  121. data/lib/nokogiri/ffi/structs/xml_syntax_error.rb +31 -0
  122. data/lib/nokogiri/ffi/structs/xml_text_reader.rb +12 -0
  123. data/lib/nokogiri/ffi/structs/xml_xpath_context.rb +38 -0
  124. data/lib/nokogiri/ffi/structs/xml_xpath_object.rb +35 -0
  125. data/lib/nokogiri/ffi/structs/xml_xpath_parser_context.rb +20 -0
  126. data/lib/nokogiri/ffi/structs/xslt_stylesheet.rb +13 -0
  127. data/lib/nokogiri/ffi/weak_bucket.rb +40 -0
  128. data/lib/nokogiri/ffi/xml/attr.rb +41 -0
  129. data/lib/nokogiri/ffi/xml/attribute_decl.rb +27 -0
  130. data/lib/nokogiri/ffi/xml/cdata.rb +19 -0
  131. data/lib/nokogiri/ffi/xml/comment.rb +18 -0
  132. data/lib/nokogiri/ffi/xml/document.rb +174 -0
  133. data/lib/nokogiri/ffi/xml/document_fragment.rb +21 -0
  134. data/lib/nokogiri/ffi/xml/dtd.rb +67 -0
  135. data/lib/nokogiri/ffi/xml/element_content.rb +43 -0
  136. data/lib/nokogiri/ffi/xml/element_decl.rb +19 -0
  137. data/lib/nokogiri/ffi/xml/entity_decl.rb +36 -0
  138. data/lib/nokogiri/ffi/xml/entity_reference.rb +19 -0
  139. data/lib/nokogiri/ffi/xml/namespace.rb +44 -0
  140. data/lib/nokogiri/ffi/xml/node.rb +559 -0
  141. data/lib/nokogiri/ffi/xml/node_set.rb +150 -0
  142. data/lib/nokogiri/ffi/xml/processing_instruction.rb +20 -0
  143. data/lib/nokogiri/ffi/xml/reader.rb +236 -0
  144. data/lib/nokogiri/ffi/xml/relax_ng.rb +85 -0
  145. data/lib/nokogiri/ffi/xml/sax/parser.rb +143 -0
  146. data/lib/nokogiri/ffi/xml/sax/parser_context.rb +79 -0
  147. data/lib/nokogiri/ffi/xml/sax/push_parser.rb +51 -0
  148. data/lib/nokogiri/ffi/xml/schema.rb +109 -0
  149. data/lib/nokogiri/ffi/xml/syntax_error.rb +98 -0
  150. data/lib/nokogiri/ffi/xml/text.rb +18 -0
  151. data/lib/nokogiri/ffi/xml/xpath.rb +9 -0
  152. data/lib/nokogiri/ffi/xml/xpath_context.rb +153 -0
  153. data/lib/nokogiri/ffi/xslt/stylesheet.rb +77 -0
  154. data/lib/nokogiri/html.rb +13 -47
  155. data/lib/nokogiri/html/builder.rb +27 -1
  156. data/lib/nokogiri/html/document.rb +201 -7
  157. data/lib/nokogiri/html/document_fragment.rb +41 -0
  158. data/lib/nokogiri/html/element_description.rb +23 -0
  159. data/lib/nokogiri/html/entity_lookup.rb +2 -0
  160. data/lib/nokogiri/html/sax/parser.rb +34 -3
  161. data/lib/nokogiri/html/sax/parser_context.rb +16 -0
  162. data/lib/nokogiri/nokogiri.rb +1 -0
  163. data/lib/nokogiri/version.rb +40 -1
  164. data/lib/nokogiri/version_warning.rb +14 -0
  165. data/lib/nokogiri/xml.rb +32 -53
  166. data/lib/nokogiri/xml/attr.rb +5 -0
  167. data/lib/nokogiri/xml/attribute_decl.rb +18 -0
  168. data/lib/nokogiri/xml/builder.rb +349 -29
  169. data/lib/nokogiri/xml/cdata.rb +3 -1
  170. data/lib/nokogiri/xml/character_data.rb +7 -0
  171. data/lib/nokogiri/xml/document.rb +166 -14
  172. data/lib/nokogiri/xml/document_fragment.rb +76 -1
  173. data/lib/nokogiri/xml/dtd.rb +16 -3
  174. data/lib/nokogiri/xml/element_content.rb +36 -0
  175. data/lib/nokogiri/xml/element_decl.rb +13 -0
  176. data/lib/nokogiri/xml/entity_decl.rb +19 -0
  177. data/lib/nokogiri/xml/namespace.rb +13 -0
  178. data/lib/nokogiri/xml/node.rb +561 -166
  179. data/lib/nokogiri/xml/node/save_options.rb +22 -2
  180. data/lib/nokogiri/xml/node_set.rb +202 -40
  181. data/lib/nokogiri/xml/parse_options.rb +93 -0
  182. data/lib/nokogiri/xml/pp.rb +2 -0
  183. data/lib/nokogiri/xml/pp/character_data.rb +18 -0
  184. data/lib/nokogiri/xml/pp/node.rb +56 -0
  185. data/lib/nokogiri/xml/processing_instruction.rb +2 -0
  186. data/lib/nokogiri/xml/reader.rb +93 -8
  187. data/lib/nokogiri/xml/relax_ng.rb +32 -0
  188. data/lib/nokogiri/xml/sax.rb +1 -7
  189. data/lib/nokogiri/xml/sax/document.rb +107 -2
  190. data/lib/nokogiri/xml/sax/parser.rb +57 -7
  191. data/lib/nokogiri/xml/sax/parser_context.rb +16 -0
  192. data/lib/nokogiri/xml/sax/push_parser.rb +13 -1
  193. data/lib/nokogiri/xml/schema.rb +63 -0
  194. data/lib/nokogiri/xml/syntax_error.rb +25 -1
  195. data/lib/nokogiri/xml/text.rb +4 -1
  196. data/lib/nokogiri/xml/xpath.rb +1 -1
  197. data/lib/nokogiri/xml/xpath/syntax_error.rb +3 -0
  198. data/lib/nokogiri/xml/xpath_context.rb +2 -0
  199. data/lib/nokogiri/xslt.rb +26 -2
  200. data/lib/nokogiri/xslt/stylesheet.rb +19 -0
  201. data/lib/xsd/xmlparser/nokogiri.rb +45 -9
  202. data/tasks/cross_compile.rb +173 -0
  203. data/tasks/test.rb +25 -69
  204. data/test/css/test_nthiness.rb +3 -4
  205. data/test/css/test_parser.rb +75 -20
  206. data/test/css/test_tokenizer.rb +23 -1
  207. data/test/css/test_xpath_visitor.rb +10 -1
  208. data/test/decorators/test_slop.rb +16 -0
  209. data/test/ffi/test_document.rb +35 -0
  210. data/test/files/2ch.html +108 -0
  211. data/test/files/address_book.rlx +12 -0
  212. data/test/files/address_book.xml +10 -0
  213. data/test/files/bar/bar.xsd +4 -0
  214. data/test/files/encoding.html +82 -0
  215. data/test/files/encoding.xhtml +84 -0
  216. data/test/files/foo/foo.xsd +4 -0
  217. data/test/files/po.xml +32 -0
  218. data/test/files/po.xsd +66 -0
  219. data/test/files/shift_jis.html +10 -0
  220. data/test/files/shift_jis.xml +5 -0
  221. data/test/files/snuggles.xml +3 -0
  222. data/test/files/staff.dtd +10 -0
  223. data/test/files/valid_bar.xml +2 -0
  224. data/test/helper.rb +101 -23
  225. data/test/html/sax/test_parser.rb +81 -2
  226. data/test/html/sax/test_parser_context.rb +48 -0
  227. data/test/html/test_builder.rb +39 -8
  228. data/test/html/test_document.rb +186 -23
  229. data/test/html/test_document_encoding.rb +78 -1
  230. data/test/html/test_document_fragment.rb +253 -0
  231. data/test/html/test_element_description.rb +98 -0
  232. data/test/html/test_named_characters.rb +1 -1
  233. data/test/html/test_node.rb +124 -36
  234. data/test/html/test_node_encoding.rb +27 -0
  235. data/test/test_convert_xpath.rb +1 -52
  236. data/test/test_css_cache.rb +2 -13
  237. data/test/test_encoding_handler.rb +46 -0
  238. data/test/test_memory_leak.rb +88 -19
  239. data/test/test_nokogiri.rb +38 -5
  240. data/test/test_reader.rb +188 -6
  241. data/test/test_soap4r_sax.rb +52 -0
  242. data/test/test_xslt_transforms.rb +183 -83
  243. data/test/xml/node/test_save_options.rb +1 -1
  244. data/test/xml/node/test_subclass.rb +44 -0
  245. data/test/xml/sax/test_parser.rb +175 -4
  246. data/test/xml/sax/test_parser_context.rb +113 -0
  247. data/test/xml/sax/test_push_parser.rb +90 -2
  248. data/test/xml/test_attr.rb +35 -1
  249. data/test/xml/test_attribute_decl.rb +82 -0
  250. data/test/xml/test_builder.rb +186 -1
  251. data/test/xml/test_cdata.rb +32 -1
  252. data/test/xml/test_comment.rb +13 -1
  253. data/test/xml/test_document.rb +415 -43
  254. data/test/xml/test_document_encoding.rb +1 -1
  255. data/test/xml/test_document_fragment.rb +173 -5
  256. data/test/xml/test_dtd.rb +61 -6
  257. data/test/xml/test_dtd_encoding.rb +3 -1
  258. data/test/xml/test_element_content.rb +56 -0
  259. data/test/xml/test_element_decl.rb +73 -0
  260. data/test/xml/test_entity_decl.rb +120 -0
  261. data/test/xml/test_entity_reference.rb +5 -1
  262. data/test/xml/test_namespace.rb +68 -0
  263. data/test/xml/test_node.rb +546 -201
  264. data/test/xml/test_node_attributes.rb +34 -0
  265. data/test/xml/test_node_encoding.rb +33 -3
  266. data/test/xml/test_node_reparenting.rb +321 -0
  267. data/test/xml/test_node_set.rb +538 -2
  268. data/test/xml/test_parse_options.rb +52 -0
  269. data/test/xml/test_processing_instruction.rb +6 -1
  270. data/test/xml/test_reader_encoding.rb +1 -1
  271. data/test/xml/test_relax_ng.rb +60 -0
  272. data/test/xml/test_schema.rb +94 -0
  273. data/test/xml/test_syntax_error.rb +12 -0
  274. data/test/xml/test_text.rb +35 -1
  275. data/test/xml/test_unparented_node.rb +5 -5
  276. data/test/xml/test_xpath.rb +142 -11
  277. data/test/xslt/test_custom_functions.rb +94 -0
  278. metadata +328 -92
  279. data/ext/nokogiri/html_sax_parser.c +0 -57
  280. data/ext/nokogiri/html_sax_parser.h +0 -11
  281. data/ext/nokogiri/iconv.dll +0 -0
  282. data/ext/nokogiri/libexslt.dll +0 -0
  283. data/ext/nokogiri/libxml2.dll +0 -0
  284. data/ext/nokogiri/libxslt.dll +0 -0
  285. data/ext/nokogiri/native.so +0 -0
  286. data/ext/nokogiri/xml_xpath.c +0 -53
  287. data/ext/nokogiri/xml_xpath.h +0 -11
  288. data/ext/nokogiri/zlib1.dll +0 -0
  289. data/lib/action-nokogiri.rb +0 -30
  290. data/lib/nokogiri/css/generated_parser.rb +0 -713
  291. data/lib/nokogiri/css/generated_tokenizer.rb +0 -144
  292. data/lib/nokogiri/decorators.rb +0 -2
  293. data/lib/nokogiri/decorators/hpricot.rb +0 -3
  294. data/lib/nokogiri/decorators/hpricot/node.rb +0 -56
  295. data/lib/nokogiri/decorators/hpricot/node_set.rb +0 -54
  296. data/lib/nokogiri/decorators/hpricot/xpath_visitor.rb +0 -28
  297. data/lib/nokogiri/hpricot.rb +0 -51
  298. data/lib/nokogiri/xml/comment.rb +0 -6
  299. data/lib/nokogiri/xml/element.rb +0 -6
  300. data/lib/nokogiri/xml/entity_declaration.rb +0 -9
  301. data/lib/nokogiri/xml/fragment_handler.rb +0 -34
  302. data/test/hpricot/files/basic.xhtml +0 -17
  303. data/test/hpricot/files/boingboing.html +0 -2266
  304. data/test/hpricot/files/cy0.html +0 -3653
  305. data/test/hpricot/files/immob.html +0 -400
  306. data/test/hpricot/files/pace_application.html +0 -1320
  307. data/test/hpricot/files/tenderlove.html +0 -16
  308. data/test/hpricot/files/uswebgen.html +0 -220
  309. data/test/hpricot/files/utf8.html +0 -1054
  310. data/test/hpricot/files/week9.html +0 -1723
  311. data/test/hpricot/files/why.xml +0 -19
  312. data/test/hpricot/load_files.rb +0 -11
  313. data/test/hpricot/test_alter.rb +0 -68
  314. data/test/hpricot/test_builder.rb +0 -20
  315. data/test/hpricot/test_parser.rb +0 -426
  316. data/test/hpricot/test_paths.rb +0 -15
  317. data/test/hpricot/test_preserved.rb +0 -77
  318. data/test/hpricot/test_xml.rb +0 -30
  319. data/test/test_gc.rb +0 -15
@@ -8,15 +8,20 @@
8
8
  */
9
9
  static VALUE new(int argc, VALUE *argv, VALUE klass)
10
10
  {
11
- VALUE uri, external_id;
11
+ VALUE uri, external_id, rest, rb_doc;
12
+ htmlDocPtr doc;
12
13
 
13
- rb_scan_args(argc, argv, "02", &uri, &external_id);
14
+ rb_scan_args(argc, argv, "0*", &rest);
15
+ uri = rb_ary_entry(rest, (long)0);
16
+ external_id = rb_ary_entry(rest, (long)1);
14
17
 
15
- htmlDocPtr doc = htmlNewDoc(
18
+ doc = htmlNewDoc(
16
19
  RTEST(uri) ? (const xmlChar *)StringValuePtr(uri) : NULL,
17
20
  RTEST(external_id) ? (const xmlChar *)StringValuePtr(external_id) : NULL
18
21
  );
19
- return Nokogiri_wrap_xml_document(klass, doc);
22
+ rb_doc = Nokogiri_wrap_xml_document(klass, doc);
23
+ rb_obj_call_init(rb_doc, argc, argv);
24
+ return rb_doc ;
20
25
  }
21
26
 
22
27
  /*
@@ -32,40 +37,41 @@ static VALUE read_io( VALUE klass,
32
37
  VALUE encoding,
33
38
  VALUE options )
34
39
  {
35
- const char * c_url = (url == Qnil) ? NULL : StringValuePtr(url);
36
- const char * c_enc = (encoding == Qnil) ? NULL : StringValuePtr(encoding);
40
+ const char * c_url = NIL_P(url) ? NULL : StringValuePtr(url);
41
+ const char * c_enc = NIL_P(encoding) ? NULL : StringValuePtr(encoding);
37
42
  VALUE error_list = rb_ary_new();
43
+ VALUE document;
44
+ htmlDocPtr doc;
38
45
 
39
- xmlInitParser();
40
46
  xmlResetLastError();
41
47
  xmlSetStructuredErrorFunc((void *)error_list, Nokogiri_error_array_pusher);
42
48
 
43
- htmlDocPtr doc = htmlReadIO(
49
+ doc = htmlReadIO(
44
50
  io_read_callback,
45
51
  io_close_callback,
46
52
  (void *)io,
47
53
  c_url,
48
54
  c_enc,
49
- NUM2INT(options)
55
+ (int)NUM2INT(options)
50
56
  );
51
57
  xmlSetStructuredErrorFunc(NULL, NULL);
52
58
 
53
59
  if(doc == NULL) {
60
+ xmlErrorPtr error;
61
+
54
62
  xmlFreeDoc(doc);
55
63
 
56
- xmlErrorPtr error = xmlGetLastError();
64
+ error = xmlGetLastError();
57
65
  if(error)
58
- rb_funcall(rb_mKernel, rb_intern("raise"), 1,
59
- Nokogiri_wrap_xml_syntax_error((VALUE)NULL, error)
60
- );
66
+ rb_exc_raise(Nokogiri_wrap_xml_syntax_error((VALUE)NULL, error));
61
67
  else
62
68
  rb_raise(rb_eRuntimeError, "Could not parse document");
63
69
 
64
70
  return Qnil;
65
71
  }
66
72
 
67
- VALUE document = Nokogiri_wrap_xml_document(klass, doc);
68
- rb_funcall(document, rb_intern("errors="), 1, error_list);
73
+ document = Nokogiri_wrap_xml_document(klass, doc);
74
+ rb_iv_set(document, "@errors", error_list);
69
75
  return document;
70
76
  }
71
77
 
@@ -83,34 +89,35 @@ static VALUE read_memory( VALUE klass,
83
89
  VALUE options )
84
90
  {
85
91
  const char * c_buffer = StringValuePtr(string);
86
- const char * c_url = (url == Qnil) ? NULL : StringValuePtr(url);
87
- const char * c_enc = (encoding == Qnil) ? NULL : StringValuePtr(encoding);
88
- int len = RSTRING_LEN(string);
92
+ const char * c_url = NIL_P(url) ? NULL : StringValuePtr(url);
93
+ const char * c_enc = NIL_P(encoding) ? NULL : StringValuePtr(encoding);
94
+ int len = (int)RSTRING_LEN(string);
89
95
  VALUE error_list = rb_ary_new();
96
+ VALUE document;
97
+ htmlDocPtr doc;
90
98
 
91
- xmlInitParser();
92
99
  xmlResetLastError();
93
100
  xmlSetStructuredErrorFunc((void *)error_list, Nokogiri_error_array_pusher);
94
101
 
95
- htmlDocPtr doc = htmlReadMemory(c_buffer, len, c_url, c_enc, NUM2INT(options));
102
+ doc = htmlReadMemory(c_buffer, len, c_url, c_enc, (int)NUM2INT(options));
96
103
  xmlSetStructuredErrorFunc(NULL, NULL);
97
104
 
98
105
  if(doc == NULL) {
106
+ xmlErrorPtr error;
107
+
99
108
  xmlFreeDoc(doc);
100
109
 
101
- xmlErrorPtr error = xmlGetLastError();
110
+ error = xmlGetLastError();
102
111
  if(error)
103
- rb_funcall(rb_mKernel, rb_intern("raise"), 1,
104
- Nokogiri_wrap_xml_syntax_error((VALUE)NULL, error)
105
- );
112
+ rb_exc_raise(Nokogiri_wrap_xml_syntax_error((VALUE)NULL, error));
106
113
  else
107
114
  rb_raise(rb_eRuntimeError, "Could not parse document");
108
115
 
109
116
  return Qnil;
110
117
  }
111
118
 
112
- VALUE document = Nokogiri_wrap_xml_document(klass, doc);
113
- rb_funcall(document, rb_intern("errors="), 1, error_list);
119
+ document = Nokogiri_wrap_xml_document(klass, doc);
120
+ rb_iv_set(document, "@errors", error_list);
114
121
  return document;
115
122
  }
116
123
 
@@ -124,7 +131,7 @@ static VALUE type(VALUE self)
124
131
  {
125
132
  htmlDocPtr doc;
126
133
  Data_Get_Struct(self, xmlDoc, doc);
127
- return INT2NUM((int)doc->type);
134
+ return INT2NUM((long)doc->type);
128
135
  }
129
136
 
130
137
  VALUE cNokogiriHtmlDocument ;
@@ -1,7 +1,7 @@
1
1
  #ifndef NOKOGIRI_HTML_DOCUMENT
2
2
  #define NOKOGIRI_HTML_DOCUMENT
3
3
 
4
- #include <native.h>
4
+ #include <nokogiri.h>
5
5
 
6
6
  void init_html_document();
7
7
 
@@ -0,0 +1,276 @@
1
+ #include <html_element_description.h>
2
+
3
+ /*
4
+ * call-seq:
5
+ * required_attributes
6
+ *
7
+ * A list of required attributes for this element
8
+ */
9
+ static VALUE required_attributes(VALUE self)
10
+ {
11
+ htmlElemDesc * description;
12
+ VALUE list;
13
+ int i;
14
+
15
+ Data_Get_Struct(self, htmlElemDesc, description);
16
+
17
+ list = rb_ary_new();
18
+
19
+ if(NULL == description->attrs_req) return list;
20
+
21
+ for(i = 0; description->attrs_depr[i]; i++) {
22
+ rb_ary_push(list, NOKOGIRI_STR_NEW2(description->attrs_req[i]));
23
+ }
24
+
25
+ return list;
26
+ }
27
+
28
+ /*
29
+ * call-seq:
30
+ * deprecated_attributes
31
+ *
32
+ * A list of deprecated attributes for this element
33
+ */
34
+ static VALUE deprecated_attributes(VALUE self)
35
+ {
36
+ htmlElemDesc * description;
37
+ VALUE list;
38
+ int i;
39
+
40
+ Data_Get_Struct(self, htmlElemDesc, description);
41
+
42
+ list = rb_ary_new();
43
+
44
+ if(NULL == description->attrs_depr) return list;
45
+
46
+ for(i = 0; description->attrs_depr[i]; i++) {
47
+ rb_ary_push(list, NOKOGIRI_STR_NEW2(description->attrs_depr[i]));
48
+ }
49
+
50
+ return list;
51
+ }
52
+
53
+ /*
54
+ * call-seq:
55
+ * optional_attributes
56
+ *
57
+ * A list of optional attributes for this element
58
+ */
59
+ static VALUE optional_attributes(VALUE self)
60
+ {
61
+ htmlElemDesc * description;
62
+ VALUE list;
63
+ int i;
64
+
65
+ Data_Get_Struct(self, htmlElemDesc, description);
66
+
67
+ list = rb_ary_new();
68
+
69
+ if(NULL == description->attrs_opt) return list;
70
+
71
+ for(i = 0; description->attrs_opt[i]; i++) {
72
+ rb_ary_push(list, NOKOGIRI_STR_NEW2(description->attrs_opt[i]));
73
+ }
74
+
75
+ return list;
76
+ }
77
+
78
+ /*
79
+ * call-seq:
80
+ * default_sub_element
81
+ *
82
+ * The default sub element for this element
83
+ */
84
+ static VALUE default_sub_element(VALUE self)
85
+ {
86
+ htmlElemDesc * description;
87
+ Data_Get_Struct(self, htmlElemDesc, description);
88
+
89
+ return NOKOGIRI_STR_NEW2(description->defaultsubelt);
90
+ }
91
+
92
+ /*
93
+ * call-seq:
94
+ * sub_elements
95
+ *
96
+ * A list of allowed sub elements for this element.
97
+ */
98
+ static VALUE sub_elements(VALUE self)
99
+ {
100
+ htmlElemDesc * description;
101
+ VALUE list;
102
+ int i;
103
+
104
+ Data_Get_Struct(self, htmlElemDesc, description);
105
+
106
+ list = rb_ary_new();
107
+
108
+ if(NULL == description->subelts) return list;
109
+
110
+ for(i = 0; description->subelts[i]; i++) {
111
+ rb_ary_push(list, NOKOGIRI_STR_NEW2(description->subelts[i]));
112
+ }
113
+
114
+ return list;
115
+ }
116
+
117
+ /*
118
+ * call-seq:
119
+ * description
120
+ *
121
+ * The description for this element
122
+ */
123
+ static VALUE description(VALUE self)
124
+ {
125
+ htmlElemDesc * description;
126
+ Data_Get_Struct(self, htmlElemDesc, description);
127
+
128
+ return NOKOGIRI_STR_NEW2(description->desc);
129
+ }
130
+
131
+ /*
132
+ * call-seq:
133
+ * inline?
134
+ *
135
+ * Is this element an inline element?
136
+ */
137
+ static VALUE inline_eh(VALUE self)
138
+ {
139
+ htmlElemDesc * description;
140
+ Data_Get_Struct(self, htmlElemDesc, description);
141
+
142
+ if(description->isinline) return Qtrue;
143
+ return Qfalse;
144
+ }
145
+
146
+ /*
147
+ * call-seq:
148
+ * deprecated?
149
+ *
150
+ * Is this element deprecated?
151
+ */
152
+ static VALUE deprecated_eh(VALUE self)
153
+ {
154
+ htmlElemDesc * description;
155
+ Data_Get_Struct(self, htmlElemDesc, description);
156
+
157
+ if(description->depr) return Qtrue;
158
+ return Qfalse;
159
+ }
160
+
161
+ /*
162
+ * call-seq:
163
+ * empty?
164
+ *
165
+ * Is this an empty element?
166
+ */
167
+ static VALUE empty_eh(VALUE self)
168
+ {
169
+ htmlElemDesc * description;
170
+ Data_Get_Struct(self, htmlElemDesc, description);
171
+
172
+ if(description->empty) return Qtrue;
173
+ return Qfalse;
174
+ }
175
+
176
+ /*
177
+ * call-seq:
178
+ * save_end_tag?
179
+ *
180
+ * Should the end tag be saved?
181
+ */
182
+ static VALUE save_end_tag_eh(VALUE self)
183
+ {
184
+ htmlElemDesc * description;
185
+ Data_Get_Struct(self, htmlElemDesc, description);
186
+
187
+ if(description->saveEndTag) return Qtrue;
188
+ return Qfalse;
189
+ }
190
+
191
+ /*
192
+ * call-seq:
193
+ * implied_end_tag?
194
+ *
195
+ * Can the end tag be implied for this tag?
196
+ */
197
+ static VALUE implied_end_tag_eh(VALUE self)
198
+ {
199
+ htmlElemDesc * description;
200
+ Data_Get_Struct(self, htmlElemDesc, description);
201
+
202
+ if(description->endTag) return Qtrue;
203
+ return Qfalse;
204
+ }
205
+
206
+ /*
207
+ * call-seq:
208
+ * implied_start_tag?
209
+ *
210
+ * Can the start tag be implied for this tag?
211
+ */
212
+ static VALUE implied_start_tag_eh(VALUE self)
213
+ {
214
+ htmlElemDesc * description;
215
+ Data_Get_Struct(self, htmlElemDesc, description);
216
+
217
+ if(description->startTag) return Qtrue;
218
+ return Qfalse;
219
+ }
220
+
221
+ /*
222
+ * call-seq:
223
+ * name
224
+ *
225
+ * Get the tag name for this ElemementDescription
226
+ */
227
+ static VALUE name(VALUE self)
228
+ {
229
+ htmlElemDesc * description;
230
+ Data_Get_Struct(self, htmlElemDesc, description);
231
+
232
+ if(NULL == description->name) return Qnil;
233
+ return NOKOGIRI_STR_NEW2(description->name);
234
+ }
235
+
236
+ /*
237
+ * call-seq:
238
+ * [](tag_name)
239
+ *
240
+ * Get ElemementDescription for +tag_name+
241
+ */
242
+ static VALUE get_description(VALUE klass, VALUE tag_name)
243
+ {
244
+ const htmlElemDesc * description = htmlTagLookup(
245
+ (const xmlChar *)StringValuePtr(tag_name)
246
+ );
247
+
248
+ if(NULL == description) return Qnil;
249
+ return Data_Wrap_Struct(klass, 0, 0, (void *)description);
250
+ }
251
+
252
+ VALUE cNokogiriHtmlElementDescription ;
253
+ void init_html_element_description()
254
+ {
255
+ VALUE nokogiri = rb_define_module("Nokogiri");
256
+ VALUE html = rb_define_module_under(nokogiri, "HTML");
257
+ VALUE klass = rb_define_class_under(html, "ElementDescription",rb_cObject);
258
+
259
+ cNokogiriHtmlElementDescription = klass;
260
+
261
+ rb_define_singleton_method(klass, "[]", get_description, 1);
262
+
263
+ rb_define_method(klass, "name", name, 0);
264
+ rb_define_method(klass, "implied_start_tag?", implied_start_tag_eh, 0);
265
+ rb_define_method(klass, "implied_end_tag?", implied_end_tag_eh, 0);
266
+ rb_define_method(klass, "save_end_tag?", save_end_tag_eh, 0);
267
+ rb_define_method(klass, "empty?", empty_eh, 0);
268
+ rb_define_method(klass, "deprecated?", deprecated_eh, 0);
269
+ rb_define_method(klass, "inline?", inline_eh, 0);
270
+ rb_define_method(klass, "description", description, 0);
271
+ rb_define_method(klass, "sub_elements", sub_elements, 0);
272
+ rb_define_method(klass, "default_sub_element", default_sub_element, 0);
273
+ rb_define_method(klass, "optional_attributes", optional_attributes, 0);
274
+ rb_define_method(klass, "deprecated_attributes", deprecated_attributes, 0);
275
+ rb_define_method(klass, "required_attributes", required_attributes, 0);
276
+ }
@@ -0,0 +1,10 @@
1
+ #ifndef NOKOGIRI_HTML_ELEMENT_DESCRIPTION
2
+ #define NOKOGIRI_HTML_ELEMENT_DESCRIPTION
3
+
4
+ #include <nokogiri.h>
5
+
6
+ void init_html_element_description();
7
+
8
+ extern VALUE cNokogiriHtmlElementDescription ;
9
+
10
+ #endif
@@ -10,14 +10,16 @@ static VALUE get(VALUE self, VALUE key)
10
10
  {
11
11
  const htmlEntityDesc * desc =
12
12
  htmlEntityLookup((const xmlChar *)StringValuePtr(key));
13
+ VALUE klass, args[3];
13
14
 
14
15
  if(NULL == desc) return Qnil;
15
- VALUE klass = rb_const_get(mNokogiriHtml, rb_intern("EntityDescription"));
16
+ klass = rb_const_get(mNokogiriHtml, rb_intern("EntityDescription"));
16
17
 
17
- return rb_funcall(klass, rb_intern("new"), 3,
18
- INT2NUM((int)desc->value),
19
- NOKOGIRI_STR_NEW2(desc->name, "UTF-8"),
20
- NOKOGIRI_STR_NEW2(desc->desc, "UTF-8"));
18
+ args[0] = INT2NUM((long)desc->value);
19
+ args[1] = NOKOGIRI_STR_NEW2(desc->name);
20
+ args[2] = NOKOGIRI_STR_NEW2(desc->desc);
21
+
22
+ return rb_class_new_instance(3, args, klass);
21
23
  }
22
24
 
23
25
  void init_html_entity_lookup()