nokogiri 1.10.7 → 1.16.0

Sign up to get free protection for your applications and to get access to all the features.

Potentially problematic release.


This version of nokogiri might be problematic. Click here for more details.

Files changed (224) hide show
  1. checksums.yaml +4 -4
  2. data/Gemfile +42 -0
  3. data/LICENSE-DEPENDENCIES.md +1632 -1022
  4. data/LICENSE.md +1 -1
  5. data/README.md +188 -96
  6. data/bin/nokogiri +63 -50
  7. data/dependencies.yml +34 -66
  8. data/ext/nokogiri/depend +38 -358
  9. data/ext/nokogiri/extconf.rb +862 -421
  10. data/ext/nokogiri/gumbo.c +594 -0
  11. data/ext/nokogiri/html4_document.c +165 -0
  12. data/ext/nokogiri/html4_element_description.c +299 -0
  13. data/ext/nokogiri/html4_entity_lookup.c +37 -0
  14. data/ext/nokogiri/html4_sax_parser_context.c +108 -0
  15. data/ext/nokogiri/html4_sax_push_parser.c +95 -0
  16. data/ext/nokogiri/libxml2_backwards_compat.c +121 -0
  17. data/ext/nokogiri/nokogiri.c +251 -105
  18. data/ext/nokogiri/nokogiri.h +222 -90
  19. data/ext/nokogiri/test_global_handlers.c +40 -0
  20. data/ext/nokogiri/xml_attr.c +17 -17
  21. data/ext/nokogiri/xml_attribute_decl.c +22 -22
  22. data/ext/nokogiri/xml_cdata.c +39 -31
  23. data/ext/nokogiri/xml_comment.c +20 -27
  24. data/ext/nokogiri/xml_document.c +408 -243
  25. data/ext/nokogiri/xml_document_fragment.c +13 -17
  26. data/ext/nokogiri/xml_dtd.c +64 -58
  27. data/ext/nokogiri/xml_element_content.c +63 -55
  28. data/ext/nokogiri/xml_element_decl.c +31 -31
  29. data/ext/nokogiri/xml_encoding_handler.c +54 -21
  30. data/ext/nokogiri/xml_entity_decl.c +37 -35
  31. data/ext/nokogiri/xml_entity_reference.c +17 -19
  32. data/ext/nokogiri/xml_namespace.c +131 -61
  33. data/ext/nokogiri/xml_node.c +1343 -674
  34. data/ext/nokogiri/xml_node_set.c +246 -216
  35. data/ext/nokogiri/xml_processing_instruction.c +18 -20
  36. data/ext/nokogiri/xml_reader.c +305 -213
  37. data/ext/nokogiri/xml_relax_ng.c +87 -78
  38. data/ext/nokogiri/xml_sax_parser.c +149 -124
  39. data/ext/nokogiri/xml_sax_parser_context.c +149 -103
  40. data/ext/nokogiri/xml_sax_push_parser.c +65 -37
  41. data/ext/nokogiri/xml_schema.c +138 -82
  42. data/ext/nokogiri/xml_syntax_error.c +42 -21
  43. data/ext/nokogiri/xml_text.c +35 -26
  44. data/ext/nokogiri/xml_xpath_context.c +363 -178
  45. data/ext/nokogiri/xslt_stylesheet.c +335 -189
  46. data/gumbo-parser/CHANGES.md +63 -0
  47. data/gumbo-parser/Makefile +126 -0
  48. data/gumbo-parser/THANKS +27 -0
  49. data/gumbo-parser/src/Makefile +34 -0
  50. data/gumbo-parser/src/README.md +41 -0
  51. data/gumbo-parser/src/ascii.c +75 -0
  52. data/gumbo-parser/src/ascii.h +115 -0
  53. data/gumbo-parser/src/attribute.c +42 -0
  54. data/gumbo-parser/src/attribute.h +17 -0
  55. data/gumbo-parser/src/char_ref.c +22225 -0
  56. data/gumbo-parser/src/char_ref.h +29 -0
  57. data/gumbo-parser/src/char_ref.rl +2154 -0
  58. data/gumbo-parser/src/error.c +630 -0
  59. data/gumbo-parser/src/error.h +148 -0
  60. data/gumbo-parser/src/foreign_attrs.c +103 -0
  61. data/gumbo-parser/src/foreign_attrs.gperf +27 -0
  62. data/gumbo-parser/src/insertion_mode.h +33 -0
  63. data/gumbo-parser/src/macros.h +91 -0
  64. data/gumbo-parser/src/nokogiri_gumbo.h +944 -0
  65. data/gumbo-parser/src/parser.c +4891 -0
  66. data/gumbo-parser/src/parser.h +41 -0
  67. data/gumbo-parser/src/replacement.h +33 -0
  68. data/gumbo-parser/src/string_buffer.c +103 -0
  69. data/gumbo-parser/src/string_buffer.h +68 -0
  70. data/gumbo-parser/src/string_piece.c +48 -0
  71. data/gumbo-parser/src/svg_attrs.c +174 -0
  72. data/gumbo-parser/src/svg_attrs.gperf +77 -0
  73. data/gumbo-parser/src/svg_tags.c +137 -0
  74. data/gumbo-parser/src/svg_tags.gperf +55 -0
  75. data/gumbo-parser/src/tag.c +223 -0
  76. data/gumbo-parser/src/tag_lookup.c +382 -0
  77. data/gumbo-parser/src/tag_lookup.gperf +170 -0
  78. data/gumbo-parser/src/tag_lookup.h +13 -0
  79. data/gumbo-parser/src/token_buffer.c +79 -0
  80. data/gumbo-parser/src/token_buffer.h +71 -0
  81. data/gumbo-parser/src/token_type.h +17 -0
  82. data/gumbo-parser/src/tokenizer.c +3464 -0
  83. data/gumbo-parser/src/tokenizer.h +112 -0
  84. data/gumbo-parser/src/tokenizer_states.h +339 -0
  85. data/gumbo-parser/src/utf8.c +245 -0
  86. data/gumbo-parser/src/utf8.h +164 -0
  87. data/gumbo-parser/src/util.c +66 -0
  88. data/gumbo-parser/src/util.h +34 -0
  89. data/gumbo-parser/src/vector.c +111 -0
  90. data/gumbo-parser/src/vector.h +45 -0
  91. data/lib/nokogiri/class_resolver.rb +67 -0
  92. data/lib/nokogiri/css/node.rb +10 -8
  93. data/lib/nokogiri/css/parser.rb +397 -377
  94. data/lib/nokogiri/css/parser.y +250 -245
  95. data/lib/nokogiri/css/parser_extras.rb +54 -49
  96. data/lib/nokogiri/css/syntax_error.rb +3 -1
  97. data/lib/nokogiri/css/tokenizer.rb +5 -3
  98. data/lib/nokogiri/css/tokenizer.rex +3 -2
  99. data/lib/nokogiri/css/xpath_visitor.rb +205 -96
  100. data/lib/nokogiri/css.rb +56 -17
  101. data/lib/nokogiri/decorators/slop.rb +9 -7
  102. data/lib/nokogiri/encoding_handler.rb +57 -0
  103. data/lib/nokogiri/extension.rb +32 -0
  104. data/lib/nokogiri/gumbo.rb +15 -0
  105. data/lib/nokogiri/html.rb +38 -27
  106. data/lib/nokogiri/{html → html4}/builder.rb +4 -2
  107. data/lib/nokogiri/html4/document.rb +214 -0
  108. data/lib/nokogiri/html4/document_fragment.rb +54 -0
  109. data/lib/nokogiri/{html → html4}/element_description.rb +3 -1
  110. data/lib/nokogiri/html4/element_description_defaults.rb +2040 -0
  111. data/lib/nokogiri/html4/encoding_reader.rb +121 -0
  112. data/lib/nokogiri/{html → html4}/entity_lookup.rb +4 -2
  113. data/lib/nokogiri/{html → html4}/sax/parser.rb +17 -16
  114. data/lib/nokogiri/html4/sax/parser_context.rb +20 -0
  115. data/lib/nokogiri/{html → html4}/sax/push_parser.rb +12 -11
  116. data/lib/nokogiri/html4.rb +47 -0
  117. data/lib/nokogiri/html5/document.rb +168 -0
  118. data/lib/nokogiri/html5/document_fragment.rb +90 -0
  119. data/lib/nokogiri/html5/node.rb +103 -0
  120. data/lib/nokogiri/html5.rb +326 -0
  121. data/lib/nokogiri/jruby/dependencies.rb +3 -0
  122. data/lib/nokogiri/jruby/nokogiri_jars.rb +43 -0
  123. data/lib/nokogiri/syntax_error.rb +2 -0
  124. data/lib/nokogiri/version/constant.rb +6 -0
  125. data/lib/nokogiri/version/info.rb +224 -0
  126. data/lib/nokogiri/version.rb +3 -108
  127. data/lib/nokogiri/xml/attr.rb +55 -3
  128. data/lib/nokogiri/xml/attribute_decl.rb +6 -2
  129. data/lib/nokogiri/xml/builder.rb +75 -34
  130. data/lib/nokogiri/xml/cdata.rb +3 -1
  131. data/lib/nokogiri/xml/character_data.rb +2 -0
  132. data/lib/nokogiri/xml/document.rb +312 -127
  133. data/lib/nokogiri/xml/document_fragment.rb +93 -48
  134. data/lib/nokogiri/xml/dtd.rb +4 -2
  135. data/lib/nokogiri/xml/element_content.rb +12 -2
  136. data/lib/nokogiri/xml/element_decl.rb +6 -2
  137. data/lib/nokogiri/xml/entity_decl.rb +7 -3
  138. data/lib/nokogiri/xml/entity_reference.rb +2 -0
  139. data/lib/nokogiri/xml/namespace.rb +44 -0
  140. data/lib/nokogiri/xml/node/save_options.rb +23 -8
  141. data/lib/nokogiri/xml/node.rb +1096 -419
  142. data/lib/nokogiri/xml/node_set.rb +137 -61
  143. data/lib/nokogiri/xml/notation.rb +13 -0
  144. data/lib/nokogiri/xml/parse_options.rb +145 -52
  145. data/lib/nokogiri/xml/pp/character_data.rb +9 -6
  146. data/lib/nokogiri/xml/pp/node.rb +42 -30
  147. data/lib/nokogiri/xml/pp.rb +4 -2
  148. data/lib/nokogiri/xml/processing_instruction.rb +4 -1
  149. data/lib/nokogiri/xml/reader.rb +21 -28
  150. data/lib/nokogiri/xml/relax_ng.rb +8 -2
  151. data/lib/nokogiri/xml/sax/document.rb +45 -49
  152. data/lib/nokogiri/xml/sax/parser.rb +39 -36
  153. data/lib/nokogiri/xml/sax/parser_context.rb +8 -3
  154. data/lib/nokogiri/xml/sax/push_parser.rb +6 -5
  155. data/lib/nokogiri/xml/sax.rb +6 -4
  156. data/lib/nokogiri/xml/schema.rb +19 -9
  157. data/lib/nokogiri/xml/searchable.rb +120 -72
  158. data/lib/nokogiri/xml/syntax_error.rb +7 -5
  159. data/lib/nokogiri/xml/text.rb +2 -0
  160. data/lib/nokogiri/xml/xpath/syntax_error.rb +4 -2
  161. data/lib/nokogiri/xml/xpath.rb +15 -4
  162. data/lib/nokogiri/xml/xpath_context.rb +3 -3
  163. data/lib/nokogiri/xml.rb +39 -38
  164. data/lib/nokogiri/xslt/stylesheet.rb +3 -1
  165. data/lib/nokogiri/xslt.rb +101 -22
  166. data/lib/nokogiri.rb +59 -75
  167. data/lib/xsd/xmlparser/nokogiri.rb +29 -25
  168. data/patches/libxml2/{0004-libxml2.la-is-in-top_builddir.patch → 0003-libxml2.la-is-in-top_builddir.patch} +1 -1
  169. data/patches/libxml2/0009-allow-wildcard-namespaces.patch +77 -0
  170. data/patches/libxml2/0010-update-config.guess-and-config.sub-for-libxml2.patch +224 -0
  171. data/patches/libxml2/0011-rip-out-libxml2-s-libc_single_threaded-support.patch +30 -0
  172. data/patches/libxslt/0001-update-config.guess-and-config.sub-for-libxslt.patch +224 -0
  173. data/ports/archives/libxml2-2.12.3.tar.xz +0 -0
  174. data/ports/archives/libxslt-1.1.39.tar.xz +0 -0
  175. metadata +121 -291
  176. data/ext/nokogiri/html_document.c +0 -170
  177. data/ext/nokogiri/html_document.h +0 -10
  178. data/ext/nokogiri/html_element_description.c +0 -279
  179. data/ext/nokogiri/html_element_description.h +0 -10
  180. data/ext/nokogiri/html_entity_lookup.c +0 -32
  181. data/ext/nokogiri/html_entity_lookup.h +0 -8
  182. data/ext/nokogiri/html_sax_parser_context.c +0 -116
  183. data/ext/nokogiri/html_sax_parser_context.h +0 -11
  184. data/ext/nokogiri/html_sax_push_parser.c +0 -87
  185. data/ext/nokogiri/html_sax_push_parser.h +0 -9
  186. data/ext/nokogiri/xml_attr.h +0 -9
  187. data/ext/nokogiri/xml_attribute_decl.h +0 -9
  188. data/ext/nokogiri/xml_cdata.h +0 -9
  189. data/ext/nokogiri/xml_comment.h +0 -9
  190. data/ext/nokogiri/xml_document.h +0 -23
  191. data/ext/nokogiri/xml_document_fragment.h +0 -10
  192. data/ext/nokogiri/xml_dtd.h +0 -10
  193. data/ext/nokogiri/xml_element_content.h +0 -10
  194. data/ext/nokogiri/xml_element_decl.h +0 -9
  195. data/ext/nokogiri/xml_encoding_handler.h +0 -8
  196. data/ext/nokogiri/xml_entity_decl.h +0 -10
  197. data/ext/nokogiri/xml_entity_reference.h +0 -9
  198. data/ext/nokogiri/xml_io.c +0 -61
  199. data/ext/nokogiri/xml_io.h +0 -11
  200. data/ext/nokogiri/xml_libxml2_hacks.c +0 -112
  201. data/ext/nokogiri/xml_libxml2_hacks.h +0 -12
  202. data/ext/nokogiri/xml_namespace.h +0 -14
  203. data/ext/nokogiri/xml_node.h +0 -13
  204. data/ext/nokogiri/xml_node_set.h +0 -12
  205. data/ext/nokogiri/xml_processing_instruction.h +0 -9
  206. data/ext/nokogiri/xml_reader.h +0 -10
  207. data/ext/nokogiri/xml_relax_ng.h +0 -9
  208. data/ext/nokogiri/xml_sax_parser.h +0 -39
  209. data/ext/nokogiri/xml_sax_parser_context.h +0 -10
  210. data/ext/nokogiri/xml_sax_push_parser.h +0 -9
  211. data/ext/nokogiri/xml_schema.h +0 -9
  212. data/ext/nokogiri/xml_syntax_error.h +0 -13
  213. data/ext/nokogiri/xml_text.h +0 -9
  214. data/ext/nokogiri/xml_xpath_context.h +0 -10
  215. data/ext/nokogiri/xslt_stylesheet.h +0 -14
  216. data/lib/nokogiri/html/document.rb +0 -335
  217. data/lib/nokogiri/html/document_fragment.rb +0 -49
  218. data/lib/nokogiri/html/element_description_defaults.rb +0 -671
  219. data/lib/nokogiri/html/sax/parser_context.rb +0 -16
  220. data/patches/libxml2/0001-Revert-Do-not-URI-escape-in-server-side-includes.patch +0 -78
  221. data/ports/archives/libxml2-2.9.10.tar.gz +0 -0
  222. data/ports/archives/libxslt-1.1.34.tar.gz +0 -0
  223. /data/patches/libxml2/{0002-Remove-script-macro-support.patch → 0001-Remove-script-macro-support.patch} +0 -0
  224. /data/patches/libxml2/{0003-Update-entities-to-remove-handling-of-ssi.patch → 0002-Update-entities-to-remove-handling-of-ssi.patch} +0 -0
@@ -1,26 +1,41 @@
1
1
  #ifndef NOKOGIRI_NATIVE
2
2
  #define NOKOGIRI_NATIVE
3
3
 
4
+ #include <ruby/defines.h> // https://github.com/sparklemotion/nokogiri/issues/2696
5
+
6
+ #ifdef _MSC_VER
7
+ # ifndef WIN32_LEAN_AND_MEAN
8
+ # define WIN32_LEAN_AND_MEAN
9
+ # endif /* WIN32_LEAN_AND_MEAN */
10
+
11
+ # ifndef WIN32
12
+ # define WIN32
13
+ # endif /* WIN32 */
14
+
15
+ # include <winsock2.h>
16
+ # include <ws2tcpip.h>
17
+ # include <windows.h>
18
+ #endif
19
+
20
+ #ifdef _WIN32
21
+ # define NOKOPUBFUN __declspec(dllexport)
22
+ # define NOKOPUBVAR __declspec(dllexport) extern
23
+ #else
24
+ # define NOKOPUBFUN
25
+ # define NOKOPUBVAR extern
26
+ #endif
27
+
4
28
  #include <stdlib.h>
5
29
  #include <string.h>
6
30
  #include <assert.h>
7
31
  #include <stdarg.h>
32
+ #include <stdio.h>
8
33
 
9
- #ifdef USE_INCLUDED_VASPRINTF
10
- int vasprintf (char **strp, const char *fmt, va_list ap);
11
- #else
12
-
13
- #define _GNU_SOURCE
14
- # include <stdio.h>
15
- #undef _GNU_SOURCE
16
-
17
- #endif
18
34
 
19
35
  #include <libxml/parser.h>
36
+ #include <libxml/tree.h>
20
37
  #include <libxml/entities.h>
21
- #include <libxml/parserInternals.h>
22
38
  #include <libxml/xpath.h>
23
- #include <libxml/xpathInternals.h>
24
39
  #include <libxml/xmlreader.h>
25
40
  #include <libxml/xmlsave.h>
26
41
  #include <libxml/xmlschemas.h>
@@ -28,94 +43,211 @@ int vasprintf (char **strp, const char *fmt, va_list ap);
28
43
  #include <libxml/HTMLtree.h>
29
44
  #include <libxml/relaxng.h>
30
45
  #include <libxml/xinclude.h>
31
- #include <libxslt/extensions.h>
32
46
  #include <libxml/c14n.h>
33
- #include <ruby.h>
34
- #include <ruby/st.h>
35
- #include <ruby/encoding.h>
47
+ #include <libxml/parserInternals.h>
48
+ #include <libxml/xpathInternals.h>
36
49
 
37
- #ifndef NORETURN
38
- # if defined(__GNUC__)
39
- # define NORETURN(name) __attribute__((noreturn)) name
40
- # else
41
- # define NORETURN(name) name
42
- # endif
50
+ #include <libxslt/extensions.h>
51
+ #include <libxslt/xsltconfig.h>
52
+ #include <libxslt/xsltutils.h>
53
+ #include <libxslt/transform.h>
54
+ #include <libxslt/imports.h>
55
+ #include <libxslt/xsltInternals.h>
56
+
57
+ #include <libexslt/exslt.h>
58
+
59
+ /* libxml2_backwards_compat.c */
60
+ #ifndef HAVE_XMLFIRSTELEMENTCHILD
61
+ xmlNodePtr xmlFirstElementChild(xmlNodePtr parent);
62
+ xmlNodePtr xmlNextElementSibling(xmlNodePtr node);
63
+ xmlNodePtr xmlLastElementChild(xmlNodePtr parent);
43
64
  #endif
44
65
 
45
- #define NOKOGIRI_STR_NEW2(str) \
46
- NOKOGIRI_STR_NEW(str, strlen((const char *)(str)))
47
-
48
- #define NOKOGIRI_STR_NEW(str, len) \
49
- rb_external_str_new_with_enc((const char *)(str), (long)(len), rb_utf8_encoding())
50
-
51
- #define RBSTR_OR_QNIL(_str) \
52
- (_str ? NOKOGIRI_STR_NEW2(_str) : Qnil)
53
-
54
- #include <xml_libxml2_hacks.h>
55
-
56
- #include <xml_io.h>
57
- #include <xml_document.h>
58
- #include <html_entity_lookup.h>
59
- #include <html_document.h>
60
- #include <xml_node.h>
61
- #include <xml_text.h>
62
- #include <xml_cdata.h>
63
- #include <xml_attr.h>
64
- #include <xml_processing_instruction.h>
65
- #include <xml_entity_reference.h>
66
- #include <xml_document_fragment.h>
67
- #include <xml_comment.h>
68
- #include <xml_node_set.h>
69
- #include <xml_dtd.h>
70
- #include <xml_attribute_decl.h>
71
- #include <xml_element_decl.h>
72
- #include <xml_entity_decl.h>
73
- #include <xml_xpath_context.h>
74
- #include <xml_element_content.h>
75
- #include <xml_sax_parser_context.h>
76
- #include <xml_sax_parser.h>
77
- #include <xml_sax_push_parser.h>
78
- #include <xml_reader.h>
79
- #include <html_sax_parser_context.h>
80
- #include <html_sax_push_parser.h>
81
- #include <xslt_stylesheet.h>
82
- #include <xml_syntax_error.h>
83
- #include <xml_schema.h>
84
- #include <xml_relax_ng.h>
85
- #include <html_element_description.h>
86
- #include <xml_namespace.h>
87
- #include <xml_encoding_handler.h>
88
-
89
- extern VALUE mNokogiri ;
90
- extern VALUE mNokogiriXml ;
91
- extern VALUE mNokogiriXmlSax ;
92
- extern VALUE mNokogiriHtml ;
93
- extern VALUE mNokogiriHtmlSax ;
94
- extern VALUE mNokogiriXslt ;
95
-
96
- void nokogiri_root_node(xmlNodePtr);
97
- void nokogiri_root_nsdef(xmlNsPtr, xmlDocPtr);
98
-
99
- #ifdef DEBUG
100
-
101
- #define NOKOGIRI_DEBUG_START(p) if (getenv("NOKOGIRI_NO_FREE")) return ; if (getenv("NOKOGIRI_DEBUG")) fprintf(stderr,"nokogiri: %s:%d %p start\n", __FILE__, __LINE__, p);
102
- #define NOKOGIRI_DEBUG_END(p) if (getenv("NOKOGIRI_DEBUG")) fprintf(stderr,"nokogiri: %s:%d %p end\n", __FILE__, __LINE__, p);
103
-
104
- #else
66
+ #define XMLNS_PREFIX "xmlns"
67
+ #define XMLNS_PREFIX_LEN 6 /* including either colon or \0 */
105
68
 
106
- #define NOKOGIRI_DEBUG_START(p)
107
- #define NOKOGIRI_DEBUG_END(p)
69
+ #ifndef xmlErrorConstPtr
70
+ # if LIBXML_VERSION >= 21200
71
+ # define xmlErrorConstPtr const xmlError *
72
+ # else
73
+ # define xmlErrorConstPtr xmlError *
74
+ # endif
75
+ #endif
108
76
 
77
+ #include <ruby.h>
78
+ #include <ruby/st.h>
79
+ #include <ruby/encoding.h>
80
+ #include <ruby/util.h>
81
+ #include <ruby/version.h>
82
+
83
+ #define NOKOGIRI_STR_NEW2(str) NOKOGIRI_STR_NEW(str, strlen((const char *)(str)))
84
+ #define NOKOGIRI_STR_NEW(str, len) rb_external_str_new_with_enc((const char *)(str), (long)(len), rb_utf8_encoding())
85
+ #define RBSTR_OR_QNIL(_str) (_str ? NOKOGIRI_STR_NEW2(_str) : Qnil)
86
+
87
+ #ifndef NORETURN_DECL
88
+ # if defined(__GNUC__)
89
+ # define NORETURN_DECL __attribute__ ((noreturn))
90
+ # else
91
+ # define NORETURN_DECL
92
+ # endif
109
93
  #endif
110
94
 
111
- #ifndef __builtin_expect
112
- # if defined(__GNUC__)
113
- # define __builtin_expect(expr, c) __builtin_expect((long)(expr), (long)(c))
114
- # endif
95
+ #ifndef PRINTFLIKE_DECL
96
+ # if defined(__GNUC__)
97
+ # define PRINTFLIKE_DECL(stringidx, argidx) __attribute__ ((format(printf,stringidx,argidx)))
98
+ # else
99
+ # define PRINTFLIKE_DECL(stringidx, argidx)
100
+ # endif
115
101
  #endif
116
102
 
117
- #define XMLNS_PREFIX "xmlns"
118
- #define XMLNS_PREFIX_LEN 6 /* including either colon or \0 */
119
- #define XMLNS_BUFFER_LEN 128
103
+ #if defined(TRUFFLERUBY) && !defined(NOKOGIRI_PACKAGED_LIBRARIES)
104
+ # define TRUFFLERUBY_NOKOGIRI_SYSTEM_LIBRARIES
105
+ #endif
120
106
 
107
+ NOKOPUBVAR VALUE mNokogiri ;
108
+ NOKOPUBVAR VALUE mNokogiriGumbo ;
109
+ NOKOPUBVAR VALUE mNokogiriHtml4 ;
110
+ NOKOPUBVAR VALUE mNokogiriHtml4Sax ;
111
+ NOKOPUBVAR VALUE mNokogiriHtml5 ;
112
+ NOKOPUBVAR VALUE mNokogiriXml ;
113
+ NOKOPUBVAR VALUE mNokogiriXmlSax ;
114
+ NOKOPUBVAR VALUE mNokogiriXmlXpath ;
115
+ NOKOPUBVAR VALUE mNokogiriXslt ;
116
+
117
+ NOKOPUBVAR VALUE cNokogiriEncodingHandler;
118
+ NOKOPUBVAR VALUE cNokogiriSyntaxError;
119
+ NOKOPUBVAR VALUE cNokogiriXmlAttr;
120
+ NOKOPUBVAR VALUE cNokogiriXmlAttributeDecl;
121
+ NOKOPUBVAR VALUE cNokogiriXmlCData;
122
+ NOKOPUBVAR VALUE cNokogiriXmlCharacterData;
123
+ NOKOPUBVAR VALUE cNokogiriXmlComment;
124
+ NOKOPUBVAR VALUE cNokogiriXmlDocument ;
125
+ NOKOPUBVAR VALUE cNokogiriXmlDocumentFragment;
126
+ NOKOPUBVAR VALUE cNokogiriXmlDtd;
127
+ NOKOPUBVAR VALUE cNokogiriXmlElement ;
128
+ NOKOPUBVAR VALUE cNokogiriXmlElementContent;
129
+ NOKOPUBVAR VALUE cNokogiriXmlElementDecl;
130
+ NOKOPUBVAR VALUE cNokogiriXmlEntityDecl;
131
+ NOKOPUBVAR VALUE cNokogiriXmlEntityReference;
132
+ NOKOPUBVAR VALUE cNokogiriXmlNamespace ;
133
+ NOKOPUBVAR VALUE cNokogiriXmlNode ;
134
+ NOKOPUBVAR VALUE cNokogiriXmlNodeSet ;
135
+ NOKOPUBVAR VALUE cNokogiriXmlProcessingInstruction;
136
+ NOKOPUBVAR VALUE cNokogiriXmlReader;
137
+ NOKOPUBVAR VALUE cNokogiriXmlRelaxNG;
138
+ NOKOPUBVAR VALUE cNokogiriXmlSaxParser ;
139
+ NOKOPUBVAR VALUE cNokogiriXmlSaxParserContext;
140
+ NOKOPUBVAR VALUE cNokogiriXmlSaxPushParser ;
141
+ NOKOPUBVAR VALUE cNokogiriXmlSchema;
142
+ NOKOPUBVAR VALUE cNokogiriXmlSyntaxError;
143
+ NOKOPUBVAR VALUE cNokogiriXmlText ;
144
+ NOKOPUBVAR VALUE cNokogiriXmlXpathContext;
145
+ NOKOPUBVAR VALUE cNokogiriXmlXpathSyntaxError;
146
+ NOKOPUBVAR VALUE cNokogiriXsltStylesheet ;
147
+
148
+ NOKOPUBVAR VALUE cNokogiriHtml4Document ;
149
+ NOKOPUBVAR VALUE cNokogiriHtml4SaxPushParser ;
150
+ NOKOPUBVAR VALUE cNokogiriHtml4ElementDescription ;
151
+ NOKOPUBVAR VALUE cNokogiriHtml4SaxParserContext;
152
+ NOKOPUBVAR VALUE cNokogiriHtml5Document ;
153
+
154
+ typedef struct _nokogiriTuple {
155
+ VALUE doc;
156
+ st_table *unlinkedNodes;
157
+ VALUE node_cache;
158
+ } nokogiriTuple;
159
+ typedef nokogiriTuple *nokogiriTuplePtr;
160
+
161
+ typedef struct _nokogiriSAXTuple {
162
+ xmlParserCtxtPtr ctxt;
163
+ VALUE self;
164
+ } nokogiriSAXTuple;
165
+ typedef nokogiriSAXTuple *nokogiriSAXTuplePtr;
166
+
167
+ typedef struct _libxmlStructuredErrorHandlerState {
168
+ void *user_data;
169
+ xmlStructuredErrorFunc handler;
170
+ } libxmlStructuredErrorHandlerState ;
171
+
172
+ typedef struct _nokogiriXsltStylesheetTuple {
173
+ xsltStylesheetPtr ss;
174
+ VALUE func_instances;
175
+ } nokogiriXsltStylesheetTuple;
176
+
177
+ void noko_xml_document_pin_node(xmlNodePtr);
178
+ void noko_xml_document_pin_namespace(xmlNsPtr, xmlDocPtr);
179
+ int noko_xml_document_has_wrapped_blank_nodes_p(xmlDocPtr c_document);
180
+
181
+ int noko_io_read(void *ctx, char *buffer, int len);
182
+ int noko_io_write(void *ctx, char *buffer, int len);
183
+ int noko_io_close(void *ctx);
184
+
185
+ #define Noko_Node_Get_Struct(obj,type,sval) ((sval) = (type*)DATA_PTR(obj))
186
+ #define Noko_Namespace_Get_Struct(obj,type,sval) ((sval) = (type*)DATA_PTR(obj))
187
+
188
+ VALUE noko_xml_node_wrap(VALUE klass, xmlNodePtr node) ;
189
+ VALUE noko_xml_node_wrap_node_set_result(xmlNodePtr node, VALUE node_set) ;
190
+ VALUE noko_xml_node_attrs(xmlNodePtr node) ;
191
+
192
+ VALUE noko_xml_namespace_wrap(xmlNsPtr node, xmlDocPtr doc);
193
+ VALUE noko_xml_namespace_wrap_xpath_copy(xmlNsPtr node);
194
+
195
+ VALUE noko_xml_element_content_wrap(VALUE doc, xmlElementContentPtr element);
196
+
197
+ VALUE noko_xml_node_set_wrap(xmlNodeSetPtr node_set, VALUE document) ;
198
+ xmlNodeSetPtr noko_xml_node_set_unwrap(VALUE rb_node_set) ;
199
+
200
+ VALUE noko_xml_document_wrap_with_init_args(VALUE klass, xmlDocPtr doc, int argc, VALUE *argv);
201
+ VALUE noko_xml_document_wrap(VALUE klass, xmlDocPtr doc);
202
+ xmlDocPtr noko_xml_document_unwrap(VALUE rb_document);
203
+ NOKOPUBFUN VALUE Nokogiri_wrap_xml_document(VALUE klass,
204
+ xmlDocPtr doc); /* deprecated. use noko_xml_document_wrap() instead. */
205
+
206
+ xmlSAXHandlerPtr noko_sax_handler_unwrap(VALUE rb_sax_handler);
207
+
208
+ xmlParserCtxtPtr noko_xml_sax_push_parser_unwrap(VALUE rb_parser);
209
+
210
+ VALUE noko_xml_sax_parser_context_wrap(VALUE klass, xmlParserCtxtPtr c_context);
211
+ xmlParserCtxtPtr noko_xml_sax_parser_context_unwrap(VALUE rb_context);
212
+
213
+ #define DOC_RUBY_OBJECT_TEST(x) ((nokogiriTuplePtr)(x->_private))
214
+ #define DOC_RUBY_OBJECT(x) (((nokogiriTuplePtr)(x->_private))->doc)
215
+ #define DOC_UNLINKED_NODE_HASH(x) (((nokogiriTuplePtr)(x->_private))->unlinkedNodes)
216
+ #define DOC_NODE_CACHE(x) (((nokogiriTuplePtr)(x->_private))->node_cache)
217
+ #define NOKOGIRI_NAMESPACE_EH(node) ((node)->type == XML_NAMESPACE_DECL)
218
+
219
+ #define NOKOGIRI_SAX_SELF(_ctxt) ((nokogiriSAXTuplePtr)(_ctxt))->self
220
+ #define NOKOGIRI_SAX_CTXT(_ctxt) ((nokogiriSAXTuplePtr)(_ctxt))->ctxt
221
+ #define NOKOGIRI_SAX_TUPLE_NEW(_ctxt, _self) nokogiri_sax_tuple_new(_ctxt, _self)
222
+ #define NOKOGIRI_SAX_TUPLE_DESTROY(_tuple) ruby_xfree(_tuple)
223
+
224
+ #define DISCARD_CONST_QUAL(t, v) ((t)(uintptr_t)(v))
225
+ #define DISCARD_CONST_QUAL_XMLCHAR(v) DISCARD_CONST_QUAL(xmlChar *, v)
226
+
227
+ #if HAVE_RB_CATEGORY_WARNING
228
+ # define NOKO_WARN_DEPRECATION(message...) rb_category_warning(RB_WARN_CATEGORY_DEPRECATED, message)
229
+ #else
230
+ # define NOKO_WARN_DEPRECATION(message...) rb_warning(message)
121
231
  #endif
232
+
233
+ void Nokogiri_structured_error_func_save(libxmlStructuredErrorHandlerState *handler_state);
234
+ void Nokogiri_structured_error_func_save_and_set(libxmlStructuredErrorHandlerState *handler_state, void *user_data,
235
+ xmlStructuredErrorFunc handler);
236
+ void Nokogiri_structured_error_func_restore(libxmlStructuredErrorHandlerState *handler_state);
237
+ VALUE Nokogiri_wrap_xml_syntax_error(xmlErrorConstPtr error);
238
+ void Nokogiri_error_array_pusher(void *ctx, xmlErrorConstPtr error);
239
+ NORETURN_DECL void Nokogiri_error_raise(void *ctx, xmlErrorConstPtr error);
240
+ void Nokogiri_marshal_xpath_funcall_and_return_values(xmlXPathParserContextPtr ctx, int nargs, VALUE handler,
241
+ const char *function_name) ;
242
+
243
+ static inline
244
+ nokogiriSAXTuplePtr
245
+ nokogiri_sax_tuple_new(xmlParserCtxtPtr ctxt, VALUE self)
246
+ {
247
+ nokogiriSAXTuplePtr tuple = ruby_xmalloc(sizeof(nokogiriSAXTuple));
248
+ tuple->self = self;
249
+ tuple->ctxt = ctxt;
250
+ return tuple;
251
+ }
252
+
253
+ #endif /* NOKOGIRI_NATIVE */
@@ -0,0 +1,40 @@
1
+ #include <nokogiri.h>
2
+
3
+ static VALUE foreign_error_handler_block = Qnil;
4
+
5
+ static void
6
+ foreign_error_handler(void *user_data, xmlErrorConstPtr c_error)
7
+ {
8
+ rb_funcall(foreign_error_handler_block, rb_intern("call"), 0);
9
+ }
10
+
11
+ /*
12
+ * call-seq:
13
+ * __foreign_error_handler { ... } -> nil
14
+ *
15
+ * Override libxml2's global error handlers to call the block. This method thus has very little
16
+ * value except to test that Nokogiri is properly setting error handlers elsewhere in the code. See
17
+ * test/helper.rb for how this is being used.
18
+ */
19
+ static VALUE
20
+ rb_foreign_error_handler(VALUE klass)
21
+ {
22
+ rb_need_block();
23
+ foreign_error_handler_block = rb_block_proc();
24
+ xmlSetStructuredErrorFunc(NULL, foreign_error_handler);
25
+ return Qnil;
26
+ }
27
+
28
+ /*
29
+ * Document-module: Nokogiri::Test
30
+ *
31
+ * The Nokogiri::Test module should only be used for testing Nokogiri.
32
+ * Do NOT use this outside of the Nokogiri test suite.
33
+ */
34
+ void
35
+ noko_init_test_global_handlers(void)
36
+ {
37
+ VALUE mNokogiriTest = rb_define_module_under(mNokogiri, "Test");
38
+
39
+ rb_define_singleton_method(mNokogiriTest, "__foreign_error_handler", rb_foreign_error_handler, 0);
40
+ }
@@ -1,4 +1,6 @@
1
- #include <xml_attr.h>
1
+ #include <nokogiri.h>
2
+
3
+ VALUE cNokogiriXmlAttr;
2
4
 
3
5
  /*
4
6
  * call-seq:
@@ -7,13 +9,14 @@
7
9
  * Set the value for this Attr to +content+. Use `nil` to remove the value
8
10
  * (e.g., a HTML boolean attribute).
9
11
  */
10
- static VALUE set_value(VALUE self, VALUE content)
12
+ static VALUE
13
+ set_value(VALUE self, VALUE content)
11
14
  {
12
15
  xmlAttrPtr attr;
13
16
  xmlChar *value;
14
17
  xmlNode *cur;
15
18
 
16
- Data_Get_Struct(self, xmlAttr, attr);
19
+ Noko_Node_Get_Struct(self, xmlAttr, attr);
17
20
 
18
21
  if (attr->children) {
19
22
  xmlFreeNodeList(attr->children);
@@ -49,7 +52,8 @@ static VALUE set_value(VALUE self, VALUE content)
49
52
  *
50
53
  * Create a new Attr element on the +document+ with +name+
51
54
  */
52
- static VALUE new(int argc, VALUE *argv, VALUE klass)
55
+ static VALUE
56
+ new (int argc, VALUE *argv, VALUE klass)
53
57
  {
54
58
  xmlDocPtr xml_doc;
55
59
  VALUE document;
@@ -64,7 +68,7 @@ static VALUE new(int argc, VALUE *argv, VALUE klass)
64
68
  rb_raise(rb_eArgError, "parameter must be a Nokogiri::XML::Document");
65
69
  }
66
70
 
67
- Data_Get_Struct(document, xmlDoc, xml_doc);
71
+ xml_doc = noko_xml_document_unwrap(document);
68
72
 
69
73
  node = xmlNewDocProp(
70
74
  xml_doc,
@@ -72,9 +76,9 @@ static VALUE new(int argc, VALUE *argv, VALUE klass)
72
76
  NULL
73
77
  );
74
78
 
75
- nokogiri_root_node((xmlNodePtr)node);
79
+ noko_xml_document_pin_node((xmlNodePtr)node);
76
80
 
77
- rb_node = Nokogiri_wrap_xml_node(klass, (xmlNodePtr)node);
81
+ rb_node = noko_xml_node_wrap(klass, (xmlNodePtr)node);
78
82
  rb_obj_call_init(rb_node, argc, argv);
79
83
 
80
84
  if (rb_block_given_p()) {
@@ -84,20 +88,16 @@ static VALUE new(int argc, VALUE *argv, VALUE klass)
84
88
  return rb_node;
85
89
  }
86
90
 
87
- VALUE cNokogiriXmlAttr;
88
- void init_xml_attr()
91
+ void
92
+ noko_init_xml_attr(void)
89
93
  {
90
- VALUE nokogiri = rb_define_module("Nokogiri");
91
- VALUE xml = rb_define_module_under(nokogiri, "XML");
92
- VALUE node = rb_define_class_under(xml, "Node", rb_cObject);
93
-
94
+ assert(cNokogiriXmlNode);
94
95
  /*
95
96
  * Attr represents a Attr node in an xml document.
96
97
  */
97
- VALUE klass = rb_define_class_under(xml, "Attr", node);
98
+ cNokogiriXmlAttr = rb_define_class_under(mNokogiriXml, "Attr", cNokogiriXmlNode);
98
99
 
99
- cNokogiriXmlAttr = klass;
100
+ rb_define_singleton_method(cNokogiriXmlAttr, "new", new, -1);
100
101
 
101
- rb_define_singleton_method(klass, "new", new, -1);
102
- rb_define_method(klass, "value=", set_value, 1);
102
+ rb_define_method(cNokogiriXmlAttr, "value=", set_value, 1);
103
103
  }
@@ -1,4 +1,6 @@
1
- #include <xml_attribute_decl.h>
1
+ #include <nokogiri.h>
2
+
3
+ VALUE cNokogiriXmlAttributeDecl;
2
4
 
3
5
  /*
4
6
  * call-seq:
@@ -6,11 +8,12 @@
6
8
  *
7
9
  * The attribute_type for this AttributeDecl
8
10
  */
9
- static VALUE attribute_type(VALUE self)
11
+ static VALUE
12
+ attribute_type(VALUE self)
10
13
  {
11
14
  xmlAttributePtr node;
12
- Data_Get_Struct(self, xmlAttribute, node);
13
- return INT2NUM((long)node->atype);
15
+ Noko_Node_Get_Struct(self, xmlAttribute, node);
16
+ return INT2NUM(node->atype);
14
17
  }
15
18
 
16
19
  /*
@@ -19,12 +22,13 @@ static VALUE attribute_type(VALUE self)
19
22
  *
20
23
  * The default value
21
24
  */
22
- static VALUE default_value(VALUE self)
25
+ static VALUE
26
+ default_value(VALUE self)
23
27
  {
24
28
  xmlAttributePtr node;
25
- Data_Get_Struct(self, xmlAttribute, node);
29
+ Noko_Node_Get_Struct(self, xmlAttribute, node);
26
30
 
27
- if(node->defaultValue) return NOKOGIRI_STR_NEW2(node->defaultValue);
31
+ if (node->defaultValue) { return NOKOGIRI_STR_NEW2(node->defaultValue); }
28
32
  return Qnil;
29
33
  }
30
34
 
@@ -34,18 +38,19 @@ static VALUE default_value(VALUE self)
34
38
  *
35
39
  * An enumeration of possible values
36
40
  */
37
- static VALUE enumeration(VALUE self)
41
+ static VALUE
42
+ enumeration(VALUE self)
38
43
  {
39
44
  xmlAttributePtr node;
40
45
  xmlEnumerationPtr enm;
41
46
  VALUE list;
42
47
 
43
- Data_Get_Struct(self, xmlAttribute, node);
48
+ Noko_Node_Get_Struct(self, xmlAttribute, node);
44
49
 
45
50
  list = rb_ary_new();
46
51
  enm = node->tree;
47
52
 
48
- while(enm) {
53
+ while (enm) {
49
54
  rb_ary_push(list, NOKOGIRI_STR_NEW2(enm->name));
50
55
  enm = enm->next;
51
56
  }
@@ -53,18 +58,13 @@ static VALUE enumeration(VALUE self)
53
58
  return list;
54
59
  }
55
60
 
56
- VALUE cNokogiriXmlAttributeDecl;
57
-
58
- void init_xml_attribute_decl()
61
+ void
62
+ noko_init_xml_attribute_decl(void)
59
63
  {
60
- VALUE nokogiri = rb_define_module("Nokogiri");
61
- VALUE xml = rb_define_module_under(nokogiri, "XML");
62
- VALUE node = rb_define_class_under(xml, "Node", rb_cObject);
63
- VALUE klass = rb_define_class_under(xml, "AttributeDecl", node);
64
-
65
- cNokogiriXmlAttributeDecl = klass;
64
+ assert(cNokogiriXmlNode);
65
+ cNokogiriXmlAttributeDecl = rb_define_class_under(mNokogiriXml, "AttributeDecl", cNokogiriXmlNode);
66
66
 
67
- rb_define_method(klass, "attribute_type", attribute_type, 0);
68
- rb_define_method(klass, "default", default_value, 0);
69
- rb_define_method(klass, "enumeration", enumeration, 0);
67
+ rb_define_method(cNokogiriXmlAttributeDecl, "attribute_type", attribute_type, 0);
68
+ rb_define_method(cNokogiriXmlAttributeDecl, "default", default_value, 0);
69
+ rb_define_method(cNokogiriXmlAttributeDecl, "enumeration", enumeration, 0);
70
70
  }
@@ -1,4 +1,6 @@
1
- #include <xml_cdata.h>
1
+ #include <nokogiri.h>
2
+
3
+ VALUE cNokogiriXmlCData;
2
4
 
3
5
  /*
4
6
  * call-seq:
@@ -9,54 +11,60 @@
9
11
  * If +content+ cannot be implicitly converted to a string, this method will
10
12
  * raise a TypeError exception.
11
13
  */
12
- static VALUE new(int argc, VALUE *argv, VALUE klass)
14
+ static VALUE
15
+ rb_xml_cdata_s_new(int argc, VALUE *argv, VALUE klass)
13
16
  {
14
- xmlDocPtr xml_doc;
15
- xmlNodePtr node;
16
- VALUE doc;
17
- VALUE content;
18
- VALUE rest;
17
+ xmlDocPtr c_document;
18
+ xmlNodePtr c_node;
19
+ VALUE rb_document;
20
+ VALUE rb_content;
21
+ VALUE rb_rest;
19
22
  VALUE rb_node;
20
- xmlChar *content_str = NULL;
21
- int content_str_len = 0;
23
+ xmlChar *c_content = NULL;
24
+ int c_content_len = 0;
22
25
 
23
- rb_scan_args(argc, argv, "2*", &doc, &content, &rest);
26
+ rb_scan_args(argc, argv, "2*", &rb_document, &rb_content, &rb_rest);
24
27
 
25
- Data_Get_Struct(doc, xmlDoc, xml_doc);
28
+ if (!rb_obj_is_kind_of(rb_document, cNokogiriXmlNode)) {
29
+ rb_raise(rb_eTypeError,
30
+ "expected first parameter to be a Nokogiri::XML::Document, received %"PRIsVALUE,
31
+ rb_obj_class(rb_document));
32
+ }
33
+
34
+ if (!rb_obj_is_kind_of(rb_document, cNokogiriXmlDocument)) {
35
+ xmlNodePtr deprecated_node_type_arg;
36
+ NOKO_WARN_DEPRECATION("Passing a Node as the first parameter to CDATA.new is deprecated. Please pass a Document instead. This will become an error in Nokogiri v1.17.0."); // TODO: deprecated in v1.15.3, remove in v1.17.0
37
+ Noko_Node_Get_Struct(rb_document, xmlNode, deprecated_node_type_arg);
38
+ c_document = deprecated_node_type_arg->doc;
39
+ } else {
40
+ c_document = noko_xml_document_unwrap(rb_document);
41
+ }
26
42
 
27
- if (!NIL_P(content)) {
28
- content_str = (xmlChar *)StringValuePtr(content);
29
- content_str_len = RSTRING_LEN(content);
43
+ if (!NIL_P(rb_content)) {
44
+ c_content = (xmlChar *)StringValuePtr(rb_content);
45
+ c_content_len = RSTRING_LENINT(rb_content);
30
46
  }
31
47
 
32
- node = xmlNewCDataBlock(xml_doc->doc, content_str, content_str_len);
48
+ c_node = xmlNewCDataBlock(c_document, c_content, c_content_len);
33
49
 
34
- nokogiri_root_node(node);
50
+ noko_xml_document_pin_node(c_node);
35
51
 
36
- rb_node = Nokogiri_wrap_xml_node(klass, node);
52
+ rb_node = noko_xml_node_wrap(klass, c_node);
37
53
  rb_obj_call_init(rb_node, argc, argv);
38
54
 
39
- if(rb_block_given_p()) { rb_yield(rb_node); }
55
+ if (rb_block_given_p()) { rb_yield(rb_node); }
40
56
 
41
57
  return rb_node;
42
58
  }
43
59
 
44
- VALUE cNokogiriXmlCData;
45
- void init_xml_cdata()
60
+ void
61
+ noko_init_xml_cdata(void)
46
62
  {
47
- VALUE nokogiri = rb_define_module("Nokogiri");
48
- VALUE xml = rb_define_module_under(nokogiri, "XML");
49
- VALUE node = rb_define_class_under(xml, "Node", rb_cObject);
50
- VALUE char_data = rb_define_class_under(xml, "CharacterData", node);
51
- VALUE text = rb_define_class_under(xml, "Text", char_data);
52
-
63
+ assert(cNokogiriXmlText);
53
64
  /*
54
65
  * CData represents a CData node in an xml document.
55
66
  */
56
- VALUE klass = rb_define_class_under(xml, "CDATA", text);
57
-
58
-
59
- cNokogiriXmlCData = klass;
67
+ cNokogiriXmlCData = rb_define_class_under(mNokogiriXml, "CDATA", cNokogiriXmlText);
60
68
 
61
- rb_define_singleton_method(klass, "new", new, -1);
69
+ rb_define_singleton_method(cNokogiriXmlCData, "new", rb_xml_cdata_s_new, -1);
62
70
  }