nokogiri-maglev- 1.5.0.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (225) hide show
  1. data/.autotest +26 -0
  2. data/.gemtest +0 -0
  3. data/CHANGELOG.ja.rdoc +544 -0
  4. data/CHANGELOG.rdoc +532 -0
  5. data/Manifest.txt +283 -0
  6. data/README.ja.rdoc +106 -0
  7. data/README.rdoc +174 -0
  8. data/Rakefile +171 -0
  9. data/bin/nokogiri +53 -0
  10. data/ext/nokogiri/depend +358 -0
  11. data/ext/nokogiri/extconf.rb +124 -0
  12. data/ext/nokogiri/html_document.c +154 -0
  13. data/ext/nokogiri/html_document.h +10 -0
  14. data/ext/nokogiri/html_element_description.c +276 -0
  15. data/ext/nokogiri/html_element_description.h +10 -0
  16. data/ext/nokogiri/html_entity_lookup.c +32 -0
  17. data/ext/nokogiri/html_entity_lookup.h +8 -0
  18. data/ext/nokogiri/html_sax_parser_context.c +94 -0
  19. data/ext/nokogiri/html_sax_parser_context.h +11 -0
  20. data/ext/nokogiri/nokogiri.c +115 -0
  21. data/ext/nokogiri/nokogiri.h +160 -0
  22. data/ext/nokogiri/st.c +576 -0
  23. data/ext/nokogiri/xml_attr.c +94 -0
  24. data/ext/nokogiri/xml_attr.h +9 -0
  25. data/ext/nokogiri/xml_attribute_decl.c +70 -0
  26. data/ext/nokogiri/xml_attribute_decl.h +9 -0
  27. data/ext/nokogiri/xml_cdata.c +56 -0
  28. data/ext/nokogiri/xml_cdata.h +9 -0
  29. data/ext/nokogiri/xml_comment.c +54 -0
  30. data/ext/nokogiri/xml_comment.h +9 -0
  31. data/ext/nokogiri/xml_document.c +478 -0
  32. data/ext/nokogiri/xml_document.h +23 -0
  33. data/ext/nokogiri/xml_document_fragment.c +48 -0
  34. data/ext/nokogiri/xml_document_fragment.h +10 -0
  35. data/ext/nokogiri/xml_dtd.c +202 -0
  36. data/ext/nokogiri/xml_dtd.h +10 -0
  37. data/ext/nokogiri/xml_element_content.c +123 -0
  38. data/ext/nokogiri/xml_element_content.h +10 -0
  39. data/ext/nokogiri/xml_element_decl.c +69 -0
  40. data/ext/nokogiri/xml_element_decl.h +9 -0
  41. data/ext/nokogiri/xml_encoding_handler.c +79 -0
  42. data/ext/nokogiri/xml_encoding_handler.h +8 -0
  43. data/ext/nokogiri/xml_entity_decl.c +110 -0
  44. data/ext/nokogiri/xml_entity_decl.h +10 -0
  45. data/ext/nokogiri/xml_entity_reference.c +52 -0
  46. data/ext/nokogiri/xml_entity_reference.h +9 -0
  47. data/ext/nokogiri/xml_io.c +56 -0
  48. data/ext/nokogiri/xml_io.h +11 -0
  49. data/ext/nokogiri/xml_libxml2_hacks.c +112 -0
  50. data/ext/nokogiri/xml_libxml2_hacks.h +12 -0
  51. data/ext/nokogiri/xml_namespace.c +84 -0
  52. data/ext/nokogiri/xml_namespace.h +13 -0
  53. data/ext/nokogiri/xml_node.c +1397 -0
  54. data/ext/nokogiri/xml_node.h +13 -0
  55. data/ext/nokogiri/xml_node_set.c +418 -0
  56. data/ext/nokogiri/xml_node_set.h +9 -0
  57. data/ext/nokogiri/xml_processing_instruction.c +56 -0
  58. data/ext/nokogiri/xml_processing_instruction.h +9 -0
  59. data/ext/nokogiri/xml_reader.c +684 -0
  60. data/ext/nokogiri/xml_reader.h +10 -0
  61. data/ext/nokogiri/xml_relax_ng.c +162 -0
  62. data/ext/nokogiri/xml_relax_ng.h +9 -0
  63. data/ext/nokogiri/xml_sax_parser.c +293 -0
  64. data/ext/nokogiri/xml_sax_parser.h +39 -0
  65. data/ext/nokogiri/xml_sax_parser_context.c +199 -0
  66. data/ext/nokogiri/xml_sax_parser_context.h +10 -0
  67. data/ext/nokogiri/xml_sax_push_parser.c +115 -0
  68. data/ext/nokogiri/xml_sax_push_parser.h +9 -0
  69. data/ext/nokogiri/xml_schema.c +205 -0
  70. data/ext/nokogiri/xml_schema.h +9 -0
  71. data/ext/nokogiri/xml_syntax_error.c +58 -0
  72. data/ext/nokogiri/xml_syntax_error.h +13 -0
  73. data/ext/nokogiri/xml_text.c +50 -0
  74. data/ext/nokogiri/xml_text.h +9 -0
  75. data/ext/nokogiri/xml_xpath_context.c +315 -0
  76. data/ext/nokogiri/xml_xpath_context.h +9 -0
  77. data/ext/nokogiri/xslt_stylesheet.c +265 -0
  78. data/ext/nokogiri/xslt_stylesheet.h +9 -0
  79. data/lib/nokogiri.rb +127 -0
  80. data/lib/nokogiri/css.rb +27 -0
  81. data/lib/nokogiri/css/node.rb +99 -0
  82. data/lib/nokogiri/css/parser.rb +677 -0
  83. data/lib/nokogiri/css/parser.y +237 -0
  84. data/lib/nokogiri/css/parser_extras.rb +91 -0
  85. data/lib/nokogiri/css/syntax_error.rb +7 -0
  86. data/lib/nokogiri/css/tokenizer.rb +152 -0
  87. data/lib/nokogiri/css/tokenizer.rex +55 -0
  88. data/lib/nokogiri/css/xpath_visitor.rb +171 -0
  89. data/lib/nokogiri/decorators/slop.rb +35 -0
  90. data/lib/nokogiri/html.rb +36 -0
  91. data/lib/nokogiri/html/builder.rb +35 -0
  92. data/lib/nokogiri/html/document.rb +213 -0
  93. data/lib/nokogiri/html/document_fragment.rb +41 -0
  94. data/lib/nokogiri/html/element_description.rb +23 -0
  95. data/lib/nokogiri/html/element_description_defaults.rb +671 -0
  96. data/lib/nokogiri/html/entity_lookup.rb +13 -0
  97. data/lib/nokogiri/html/sax/parser.rb +52 -0
  98. data/lib/nokogiri/html/sax/parser_context.rb +16 -0
  99. data/lib/nokogiri/syntax_error.rb +4 -0
  100. data/lib/nokogiri/version.rb +88 -0
  101. data/lib/nokogiri/xml.rb +67 -0
  102. data/lib/nokogiri/xml/attr.rb +14 -0
  103. data/lib/nokogiri/xml/attribute_decl.rb +18 -0
  104. data/lib/nokogiri/xml/builder.rb +426 -0
  105. data/lib/nokogiri/xml/cdata.rb +11 -0
  106. data/lib/nokogiri/xml/character_data.rb +7 -0
  107. data/lib/nokogiri/xml/document.rb +234 -0
  108. data/lib/nokogiri/xml/document_fragment.rb +98 -0
  109. data/lib/nokogiri/xml/dtd.rb +22 -0
  110. data/lib/nokogiri/xml/element_content.rb +36 -0
  111. data/lib/nokogiri/xml/element_decl.rb +13 -0
  112. data/lib/nokogiri/xml/entity_decl.rb +19 -0
  113. data/lib/nokogiri/xml/namespace.rb +13 -0
  114. data/lib/nokogiri/xml/node.rb +915 -0
  115. data/lib/nokogiri/xml/node/save_options.rb +61 -0
  116. data/lib/nokogiri/xml/node_set.rb +357 -0
  117. data/lib/nokogiri/xml/notation.rb +6 -0
  118. data/lib/nokogiri/xml/parse_options.rb +93 -0
  119. data/lib/nokogiri/xml/pp.rb +2 -0
  120. data/lib/nokogiri/xml/pp/character_data.rb +18 -0
  121. data/lib/nokogiri/xml/pp/node.rb +56 -0
  122. data/lib/nokogiri/xml/processing_instruction.rb +8 -0
  123. data/lib/nokogiri/xml/reader.rb +112 -0
  124. data/lib/nokogiri/xml/relax_ng.rb +32 -0
  125. data/lib/nokogiri/xml/sax.rb +4 -0
  126. data/lib/nokogiri/xml/sax/document.rb +164 -0
  127. data/lib/nokogiri/xml/sax/parser.rb +115 -0
  128. data/lib/nokogiri/xml/sax/parser_context.rb +16 -0
  129. data/lib/nokogiri/xml/sax/push_parser.rb +60 -0
  130. data/lib/nokogiri/xml/schema.rb +63 -0
  131. data/lib/nokogiri/xml/syntax_error.rb +47 -0
  132. data/lib/nokogiri/xml/text.rb +9 -0
  133. data/lib/nokogiri/xml/xpath.rb +10 -0
  134. data/lib/nokogiri/xml/xpath/syntax_error.rb +11 -0
  135. data/lib/nokogiri/xml/xpath_context.rb +16 -0
  136. data/lib/nokogiri/xslt.rb +52 -0
  137. data/lib/nokogiri/xslt/stylesheet.rb +25 -0
  138. data/lib/xsd/xmlparser/nokogiri.rb +90 -0
  139. data/nokogiri_help_responses.md +40 -0
  140. data/tasks/cross_compile.rb +152 -0
  141. data/tasks/nokogiri.org.rb +18 -0
  142. data/tasks/test.rb +94 -0
  143. data/test/css/test_nthiness.rb +159 -0
  144. data/test/css/test_parser.rb +303 -0
  145. data/test/css/test_tokenizer.rb +198 -0
  146. data/test/css/test_xpath_visitor.rb +85 -0
  147. data/test/decorators/test_slop.rb +16 -0
  148. data/test/files/2ch.html +108 -0
  149. data/test/files/address_book.rlx +12 -0
  150. data/test/files/address_book.xml +10 -0
  151. data/test/files/bar/bar.xsd +4 -0
  152. data/test/files/dont_hurt_em_why.xml +422 -0
  153. data/test/files/encoding.html +82 -0
  154. data/test/files/encoding.xhtml +84 -0
  155. data/test/files/exslt.xml +8 -0
  156. data/test/files/exslt.xslt +35 -0
  157. data/test/files/foo/foo.xsd +4 -0
  158. data/test/files/metacharset.html +10 -0
  159. data/test/files/noencoding.html +47 -0
  160. data/test/files/po.xml +32 -0
  161. data/test/files/po.xsd +66 -0
  162. data/test/files/shift_jis.html +10 -0
  163. data/test/files/shift_jis.xml +5 -0
  164. data/test/files/snuggles.xml +3 -0
  165. data/test/files/staff.dtd +10 -0
  166. data/test/files/staff.xml +59 -0
  167. data/test/files/staff.xslt +32 -0
  168. data/test/files/tlm.html +850 -0
  169. data/test/files/valid_bar.xml +2 -0
  170. data/test/helper.rb +173 -0
  171. data/test/html/sax/test_parser.rb +139 -0
  172. data/test/html/sax/test_parser_context.rb +48 -0
  173. data/test/html/test_builder.rb +165 -0
  174. data/test/html/test_document.rb +472 -0
  175. data/test/html/test_document_encoding.rb +138 -0
  176. data/test/html/test_document_fragment.rb +255 -0
  177. data/test/html/test_element_description.rb +101 -0
  178. data/test/html/test_named_characters.rb +14 -0
  179. data/test/html/test_node.rb +193 -0
  180. data/test/html/test_node_encoding.rb +27 -0
  181. data/test/test_convert_xpath.rb +135 -0
  182. data/test/test_css_cache.rb +45 -0
  183. data/test/test_encoding_handler.rb +46 -0
  184. data/test/test_memory_leak.rb +72 -0
  185. data/test/test_nokogiri.rb +133 -0
  186. data/test/test_reader.rb +425 -0
  187. data/test/test_soap4r_sax.rb +52 -0
  188. data/test/test_xslt_transforms.rb +193 -0
  189. data/test/xml/node/test_save_options.rb +28 -0
  190. data/test/xml/node/test_subclass.rb +44 -0
  191. data/test/xml/sax/test_parser.rb +338 -0
  192. data/test/xml/sax/test_parser_context.rb +113 -0
  193. data/test/xml/sax/test_push_parser.rb +156 -0
  194. data/test/xml/test_attr.rb +65 -0
  195. data/test/xml/test_attribute_decl.rb +86 -0
  196. data/test/xml/test_builder.rb +227 -0
  197. data/test/xml/test_cdata.rb +50 -0
  198. data/test/xml/test_comment.rb +29 -0
  199. data/test/xml/test_document.rb +697 -0
  200. data/test/xml/test_document_encoding.rb +26 -0
  201. data/test/xml/test_document_fragment.rb +192 -0
  202. data/test/xml/test_dtd.rb +107 -0
  203. data/test/xml/test_dtd_encoding.rb +33 -0
  204. data/test/xml/test_element_content.rb +56 -0
  205. data/test/xml/test_element_decl.rb +73 -0
  206. data/test/xml/test_entity_decl.rb +122 -0
  207. data/test/xml/test_entity_reference.rb +21 -0
  208. data/test/xml/test_namespace.rb +70 -0
  209. data/test/xml/test_node.rb +917 -0
  210. data/test/xml/test_node_attributes.rb +34 -0
  211. data/test/xml/test_node_encoding.rb +107 -0
  212. data/test/xml/test_node_reparenting.rb +334 -0
  213. data/test/xml/test_node_set.rb +742 -0
  214. data/test/xml/test_parse_options.rb +52 -0
  215. data/test/xml/test_processing_instruction.rb +30 -0
  216. data/test/xml/test_reader_encoding.rb +126 -0
  217. data/test/xml/test_relax_ng.rb +60 -0
  218. data/test/xml/test_schema.rb +94 -0
  219. data/test/xml/test_syntax_error.rb +12 -0
  220. data/test/xml/test_text.rb +47 -0
  221. data/test/xml/test_unparented_node.rb +381 -0
  222. data/test/xml/test_xpath.rb +237 -0
  223. data/test/xslt/test_custom_functions.rb +94 -0
  224. data/test/xslt/test_exception_handling.rb +37 -0
  225. metadata +548 -0
@@ -0,0 +1,13 @@
1
+ #ifndef NOKOGIRI_XML_NODE
2
+ #define NOKOGIRI_XML_NODE
3
+
4
+ #include <nokogiri.h>
5
+
6
+ void init_xml_node();
7
+
8
+ extern VALUE cNokogiriXmlNode ;
9
+ extern VALUE cNokogiriXmlElement ;
10
+
11
+ VALUE Nokogiri_wrap_xml_node(VALUE klass, xmlNodePtr node) ;
12
+ void Nokogiri_xml_node_properties(xmlNodePtr node, VALUE attr_hash) ;
13
+ #endif
@@ -0,0 +1,418 @@
1
+ #include <xml_node_set.h>
2
+ #include <libxml/xpathInternals.h>
3
+
4
+ static ID decorate ;
5
+
6
+ /*
7
+ * call-seq:
8
+ * dup
9
+ *
10
+ * Duplicate this node set
11
+ */
12
+ static VALUE duplicate(VALUE self)
13
+ {
14
+ xmlNodeSetPtr node_set;
15
+ xmlNodeSetPtr dupl;
16
+
17
+ Data_Get_Struct(self, xmlNodeSet, node_set);
18
+
19
+ dupl = xmlXPathNodeSetMerge(NULL, node_set);
20
+
21
+ return Nokogiri_wrap_xml_node_set(dupl, rb_iv_get(self, "@document"));
22
+ }
23
+
24
+ /*
25
+ * call-seq:
26
+ * length
27
+ *
28
+ * Get the length of the node set
29
+ */
30
+ static VALUE length(VALUE self)
31
+ {
32
+ xmlNodeSetPtr node_set;
33
+ Data_Get_Struct(self, xmlNodeSet, node_set);
34
+
35
+ if(node_set)
36
+ return INT2NUM(node_set->nodeNr);
37
+
38
+ return INT2NUM(0);
39
+ }
40
+
41
+ /*
42
+ * call-seq:
43
+ * push(node)
44
+ *
45
+ * Append +node+ to the NodeSet.
46
+ */
47
+ static VALUE push(VALUE self, VALUE rb_node)
48
+ {
49
+ xmlNodeSetPtr node_set;
50
+ xmlNodePtr node;
51
+
52
+ if(!( rb_obj_is_kind_of_(rb_node, cNokogiriXmlNode) || rb_obj_is_kind_of_(rb_node, cNokogiriXmlNamespace)))
53
+ rb_raise(rb_eArgError, "node must be a Nokogiri::XML::Node or Nokogiri::XML::Namespace");
54
+
55
+ Data_Get_Struct(self, xmlNodeSet, node_set);
56
+ Data_Get_Struct(rb_node, xmlNode, node);
57
+ xmlXPathNodeSetAdd(node_set, node);
58
+ return self;
59
+ }
60
+
61
+ /*
62
+ * call-seq:
63
+ * delete(node)
64
+ *
65
+ * Delete +node+ from the Nodeset, if it is a member. Returns the deleted node
66
+ * if found, otherwise returns nil.
67
+ */
68
+ static VALUE delete(VALUE self, VALUE rb_node)
69
+ {
70
+ xmlNodeSetPtr node_set ;
71
+ xmlNodePtr node ;
72
+
73
+ if(!( rb_obj_is_kind_of_(rb_node, cNokogiriXmlNode) || rb_obj_is_kind_of_(rb_node, cNokogiriXmlNamespace)))
74
+ rb_raise(rb_eArgError, "node must be a Nokogiri::XML::Node or Nokogiri::XML::Namespace");
75
+
76
+ Data_Get_Struct(self, xmlNodeSet, node_set);
77
+ Data_Get_Struct(rb_node, xmlNode, node);
78
+
79
+ if (xmlXPathNodeSetContains(node_set, node)) {
80
+ xmlXPathNodeSetDel(node_set, node);
81
+ return rb_node ;
82
+ }
83
+
84
+ return Qnil ;
85
+ }
86
+
87
+
88
+ /*
89
+ * call-seq:
90
+ * &(node_set)
91
+ *
92
+ * Set Intersection — Returns a new NodeSet containing nodes common to the two NodeSets.
93
+ */
94
+ static VALUE intersection(VALUE self, VALUE rb_other)
95
+ {
96
+ xmlNodeSetPtr node_set;
97
+ xmlNodeSetPtr other;
98
+
99
+ if(! rb_obj_is_kind_of_(rb_other, cNokogiriXmlNodeSet))
100
+ rb_raise(rb_eArgError, "node_set must be a Nokogiri::XML::NodeSet");
101
+
102
+ Data_Get_Struct(self, xmlNodeSet, node_set);
103
+ Data_Get_Struct(rb_other, xmlNodeSet, other);
104
+
105
+ return Nokogiri_wrap_xml_node_set(xmlXPathIntersection(node_set, other), rb_iv_get(self, "@document"));
106
+ }
107
+
108
+
109
+ /*
110
+ * call-seq:
111
+ * include?(node)
112
+ *
113
+ * Returns true if any member of node set equals +node+.
114
+ */
115
+ static VALUE include_eh(VALUE self, VALUE rb_node)
116
+ {
117
+ xmlNodeSetPtr node_set;
118
+ xmlNodePtr node;
119
+
120
+ if(!( rb_obj_is_kind_of_(rb_node, cNokogiriXmlNode) || rb_obj_is_kind_of_(rb_node, cNokogiriXmlNamespace)))
121
+ rb_raise(rb_eArgError, "node must be a Nokogiri::XML::Node or Nokogiri::XML::Namespace");
122
+
123
+ Data_Get_Struct(self, xmlNodeSet, node_set);
124
+ Data_Get_Struct(rb_node, xmlNode, node);
125
+
126
+ return (xmlXPathNodeSetContains(node_set, node) ? Qtrue : Qfalse);
127
+ }
128
+
129
+
130
+ /*
131
+ * call-seq:
132
+ * |(node_set)
133
+ *
134
+ * Returns a new set built by merging the set and the elements of the given
135
+ * set.
136
+ */
137
+ static VALUE set_union(VALUE self, VALUE rb_other)
138
+ {
139
+ xmlNodeSetPtr node_set;
140
+ xmlNodeSetPtr other;
141
+ xmlNodeSetPtr new;
142
+
143
+ if(! rb_obj_is_kind_of_(rb_other, cNokogiriXmlNodeSet))
144
+ rb_raise(rb_eArgError, "node_set must be a Nokogiri::XML::NodeSet");
145
+
146
+ Data_Get_Struct(self, xmlNodeSet, node_set);
147
+ Data_Get_Struct(rb_other, xmlNodeSet, other);
148
+
149
+ new = xmlXPathNodeSetMerge(NULL, node_set);
150
+ new = xmlXPathNodeSetMerge(new, other);
151
+
152
+ return Nokogiri_wrap_xml_node_set(new, rb_iv_get(self, "@document"));
153
+ }
154
+
155
+ /*
156
+ * call-seq:
157
+ * -(node_set)
158
+ *
159
+ * Difference - returns a new NodeSet that is a copy of this NodeSet, removing
160
+ * each item that also appears in +node_set+
161
+ */
162
+ static VALUE minus(VALUE self, VALUE rb_other)
163
+ {
164
+ xmlNodeSetPtr node_set;
165
+ xmlNodeSetPtr other;
166
+ xmlNodeSetPtr new;
167
+ int j ;
168
+
169
+ if(! rb_obj_is_kind_of_(rb_other, cNokogiriXmlNodeSet))
170
+ rb_raise(rb_eArgError, "node_set must be a Nokogiri::XML::NodeSet");
171
+
172
+ Data_Get_Struct(self, xmlNodeSet, node_set);
173
+ Data_Get_Struct(rb_other, xmlNodeSet, other);
174
+
175
+ new = xmlXPathNodeSetMerge(NULL, node_set);
176
+ for (j = 0 ; j < other->nodeNr ; ++j) {
177
+ xmlXPathNodeSetDel(new, other->nodeTab[j]);
178
+ }
179
+
180
+ return Nokogiri_wrap_xml_node_set(new, rb_iv_get(self, "@document"));
181
+ }
182
+
183
+
184
+ static VALUE index_at(VALUE self, long offset)
185
+ {
186
+ xmlNodeSetPtr node_set;
187
+ Data_Get_Struct(self, xmlNodeSet, node_set);
188
+
189
+ if(offset >= node_set->nodeNr || abs((int)offset) > node_set->nodeNr) return Qnil;
190
+ if(offset < 0) offset = offset + node_set->nodeNr;
191
+
192
+ if (XML_NAMESPACE_DECL == node_set->nodeTab[offset]->type)
193
+ return Nokogiri_wrap_xml_namespace2(rb_iv_get(self, "@document"), (xmlNsPtr)(node_set->nodeTab[offset]));
194
+ return Nokogiri_wrap_xml_node(Qnil, node_set->nodeTab[offset]);
195
+ }
196
+
197
+ static VALUE subseq(VALUE self, long beg, long len)
198
+ {
199
+ long j;
200
+ xmlNodeSetPtr node_set;
201
+ xmlNodeSetPtr new_set ;
202
+
203
+ Data_Get_Struct(self, xmlNodeSet, node_set);
204
+
205
+ if (beg > node_set->nodeNr) return Qnil ;
206
+ if (beg < 0 || len < 0) return Qnil ;
207
+
208
+ if ((beg + len) > node_set->nodeNr) {
209
+ len = node_set->nodeNr - beg ;
210
+ }
211
+
212
+ new_set = xmlXPathNodeSetCreate(NULL);
213
+ for (j = beg ; j < beg+len ; ++j) {
214
+ xmlXPathNodeSetAddUnique(new_set, node_set->nodeTab[j]);
215
+ }
216
+ return Nokogiri_wrap_xml_node_set(new_set, rb_iv_get(self, "@document"));
217
+ }
218
+
219
+ /*
220
+ * call-seq:
221
+ * [index] -> Node or nil
222
+ * [start, length] -> NodeSet or nil
223
+ * [range] -> NodeSet or nil
224
+ * slice(index) -> Node or nil
225
+ * slice(start, length) -> NodeSet or nil
226
+ * slice(range) -> NodeSet or nil
227
+ *
228
+ * Element reference - returns the node at +index+, or returns a NodeSet
229
+ * containing nodes starting at +start+ and continuing for +length+ elements, or
230
+ * returns a NodeSet containing nodes specified by +range+. Negative +indices+
231
+ * count backward from the end of the +node_set+ (-1 is the last node). Returns
232
+ * nil if the +index+ (or +start+) are out of range.
233
+ */
234
+ static VALUE slice(int argc, VALUE *argv, VALUE self)
235
+ {
236
+ VALUE arg ;
237
+ long beg, len ;
238
+ xmlNodeSetPtr node_set;
239
+ Data_Get_Struct(self, xmlNodeSet, node_set);
240
+
241
+ if (argc == 2) {
242
+ beg = NUM2LONG(argv[0]);
243
+ len = NUM2LONG(argv[1]);
244
+ if (beg < 0) {
245
+ beg += node_set->nodeNr ;
246
+ }
247
+ return subseq(self, beg, len);
248
+ }
249
+
250
+ if (argc != 1) {
251
+ rb_scan_args(argc, argv, "11", NULL, NULL);
252
+ }
253
+ arg = argv[0];
254
+
255
+ if (FIXNUM_P(arg)) {
256
+ return index_at(self, FIX2LONG(arg));
257
+ }
258
+
259
+ /* if arg is Range */
260
+ switch (rb_range_beg_len(arg, &beg, &len, (long)node_set->nodeNr, 0)) {
261
+ case Qfalse:
262
+ break;
263
+ case Qnil:
264
+ return Qnil;
265
+ default:
266
+ return subseq(self, beg, len);
267
+ }
268
+
269
+ return index_at(self, NUM2LONG(arg));
270
+ }
271
+
272
+
273
+ /*
274
+ * call-seq:
275
+ * to_a
276
+ *
277
+ * Return this list as an Array
278
+ */
279
+ static VALUE to_array(VALUE self, VALUE rb_node)
280
+ {
281
+ xmlNodeSetPtr set;
282
+ VALUE *elts;
283
+ VALUE list;
284
+ int i;
285
+
286
+ Data_Get_Struct(self, xmlNodeSet, set);
287
+
288
+ elts = calloc((size_t)set->nodeNr, sizeof(VALUE *));
289
+ for(i = 0; i < set->nodeNr; i++) {
290
+ if (XML_NAMESPACE_DECL == set->nodeTab[i]->type) {
291
+ elts[i] = Nokogiri_wrap_xml_namespace2(rb_iv_get(self, "@document"), (xmlNsPtr)(set->nodeTab[i]));
292
+ } else {
293
+ xmlNodePtr node = set->nodeTab[i];
294
+
295
+ if(node->_private) {
296
+ if(node->type == XML_DOCUMENT_NODE || node->type == XML_HTML_DOCUMENT_NODE)
297
+ elts[i] = DOC_RUBY_OBJECT(node->doc);
298
+ else
299
+ elts[i] = (VALUE)node->_private;
300
+ } else {
301
+ elts[i] = Nokogiri_wrap_xml_node(Qnil, node);
302
+ }
303
+ }
304
+ }
305
+
306
+ list = rb_ary_new4((long)set->nodeNr, elts);
307
+
308
+ /*free(elts); */
309
+
310
+ return list;
311
+ }
312
+
313
+ /*
314
+ * call-seq:
315
+ * unlink
316
+ *
317
+ * Unlink this NodeSet and all Node objects it contains from their current context.
318
+ */
319
+ static VALUE unlink_nodeset(VALUE self)
320
+ {
321
+ xmlNodeSetPtr node_set;
322
+ int j, nodeNr ;
323
+
324
+ Data_Get_Struct(self, xmlNodeSet, node_set);
325
+ nodeNr = node_set->nodeNr ;
326
+ for (j = 0 ; j < nodeNr ; j++) {
327
+ if (XML_NAMESPACE_DECL != node_set->nodeTab[j]->type) {
328
+ VALUE node ;
329
+ xmlNodePtr node_ptr;
330
+ node = Nokogiri_wrap_xml_node(Qnil, node_set->nodeTab[j]);
331
+ rb_funcall(node, rb_intern("unlink"), 0); /* modifies the C struct out from under the object */
332
+ Data_Get_Struct(node, xmlNode, node_ptr);
333
+ node_set->nodeTab[j] = node_ptr ;
334
+ }
335
+ }
336
+ return self ;
337
+ }
338
+
339
+
340
+ static void deallocate(xmlNodeSetPtr node_set)
341
+ {
342
+ /*
343
+ * xmlXPathFreeNodeSet() contains an implicit assumption that it is being
344
+ * called before any of its pointed-to nodes have been free()d. this
345
+ * assumption lies in the operation where it dereferences nodeTab pointers
346
+ * while searching for namespace nodes to free.
347
+ *
348
+ * however, since Ruby's GC mechanism cannot guarantee the strict order in
349
+ * which ruby objects will be GC'd, nodes may be garbage collected before a
350
+ * nodeset containing pointers to those nodes. (this is true regardless of
351
+ * how we declare dependencies between objects with rb_gc_mark().)
352
+ *
353
+ * as a result, xmlXPathFreeNodeSet() will perform unsafe memory operations,
354
+ * and calling it would be evil.
355
+ *
356
+ * on the bright side, though, Nokogiri's API currently does not cause
357
+ * namespace nodes to be included in node sets, ever.
358
+ *
359
+ * armed with that fact, we examined xmlXPathFreeNodeSet() and related libxml
360
+ * code and determined that, within the Nokogiri abstraction, we will not
361
+ * leak memory if we simply free the node set's memory directly. that's only
362
+ * quasi-evil!
363
+ *
364
+ * there's probably a lesson in here somewhere about intermingling, within a
365
+ * single array, structs with different memory-ownership semantics. or more
366
+ * generally, a lesson about building an API in C/C++ that does not contain
367
+ * assumptions about the strict order in which memory will be released. hey,
368
+ * that sounds like a great idea for a blog post! get to it!
369
+ *
370
+ * "In Valgrind We Trust." seriously.
371
+ */
372
+ NOKOGIRI_DEBUG_START(node_set) ;
373
+ if (node_set->nodeTab != NULL)
374
+ xmlFree(node_set->nodeTab);
375
+ xmlFree(node_set);
376
+ NOKOGIRI_DEBUG_END(node_set) ;
377
+ }
378
+
379
+ static VALUE allocate(VALUE klass)
380
+ {
381
+ return Nokogiri_wrap_xml_node_set(xmlXPathNodeSetCreate(NULL), Qnil);
382
+ }
383
+
384
+ VALUE Nokogiri_wrap_xml_node_set(xmlNodeSetPtr node_set, VALUE document)
385
+ {
386
+ VALUE new_set ;
387
+ new_set = Data_Wrap_Struct(cNokogiriXmlNodeSet, 0, deallocate, node_set);
388
+ if (document != Qnil) {
389
+ rb_iv_set(new_set, "@document", document);
390
+ rb_funcall(document, decorate, 1, new_set);
391
+ }
392
+ return new_set ;
393
+ }
394
+
395
+ VALUE cNokogiriXmlNodeSet ;
396
+ void init_xml_node_set(void)
397
+ {
398
+ VALUE nokogiri = rb_define_module("Nokogiri");
399
+ VALUE xml = rb_define_module_under(nokogiri, "XML");
400
+ VALUE klass = rb_define_class_under(xml, "NodeSet", rb_cObject);
401
+ cNokogiriXmlNodeSet = klass;
402
+
403
+ rb_define_alloc_func(klass, allocate);
404
+ rb_define_method(klass, "length", length, 0);
405
+ rb_define_method(klass, "[]", slice, -1);
406
+ rb_define_method(klass, "slice", slice, -1);
407
+ rb_define_method(klass, "push", push, 1);
408
+ rb_define_method(klass, "|", set_union, 1);
409
+ rb_define_method(klass, "-", minus, 1);
410
+ rb_define_method(klass, "unlink", unlink_nodeset, 0);
411
+ rb_define_method(klass, "to_a", to_array, 0);
412
+ rb_define_method(klass, "dup", duplicate, 0);
413
+ rb_define_method(klass, "delete", delete, 1);
414
+ rb_define_method(klass, "&", intersection, 1);
415
+ rb_define_method(klass, "include?", include_eh, 1);
416
+
417
+ decorate = rb_intern("decorate");
418
+ }
@@ -0,0 +1,9 @@
1
+ #ifndef NOKOGIRI_XML_NODE_SET
2
+ #define NOKOGIRI_XML_NODE_SET
3
+
4
+ #include <nokogiri.h>
5
+ void init_xml_node_set();
6
+
7
+ extern VALUE cNokogiriXmlNodeSet ;
8
+ VALUE Nokogiri_wrap_xml_node_set(xmlNodeSetPtr node_set, VALUE document) ;
9
+ #endif
@@ -0,0 +1,56 @@
1
+ #include <xml_processing_instruction.h>
2
+
3
+ /*
4
+ * call-seq:
5
+ * new(document, name, content)
6
+ *
7
+ * Create a new ProcessingInstruction element on the +document+ with +name+
8
+ * and +content+
9
+ */
10
+ static VALUE new(int argc, VALUE *argv, VALUE klass)
11
+ {
12
+ xmlDocPtr xml_doc;
13
+ xmlNodePtr node;
14
+ VALUE document;
15
+ VALUE name;
16
+ VALUE content;
17
+ VALUE rest;
18
+ VALUE rb_node;
19
+
20
+ rb_scan_args(argc, argv, "3*", &document, &name, &content, &rest);
21
+
22
+ Data_Get_Struct(document, xmlDoc, xml_doc);
23
+
24
+ node = xmlNewDocPI(
25
+ xml_doc,
26
+ (const xmlChar *)StringValuePtr(name),
27
+ (const xmlChar *)StringValuePtr(content)
28
+ );
29
+
30
+ NOKOGIRI_ROOT_NODE(node);
31
+
32
+ rb_node = Nokogiri_wrap_xml_node(klass, node);
33
+ rb_obj_call_init(rb_node, argc, argv);
34
+
35
+ if(rb_block_given_p()) rb_yield(rb_node);
36
+
37
+ return rb_node;
38
+ }
39
+
40
+ VALUE cNokogiriXmlProcessingInstruction;
41
+ void init_xml_processing_instruction()
42
+ {
43
+ VALUE nokogiri = rb_define_module("Nokogiri");
44
+ VALUE xml = rb_define_module_under(nokogiri, "XML");
45
+ VALUE node = rb_define_class_under(xml, "Node", rb_cObject);
46
+
47
+ /*
48
+ * ProcessingInstruction represents a ProcessingInstruction node in an xml
49
+ * document.
50
+ */
51
+ VALUE klass = rb_define_class_under(xml, "ProcessingInstruction", node);
52
+
53
+ cNokogiriXmlProcessingInstruction = klass;
54
+
55
+ rb_define_singleton_method(klass, "new", new, -1);
56
+ }