libxml-ruby 3.2.2-x64-mingw-ucrt
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +7 -0
- data/HISTORY +848 -0
- data/LICENSE +21 -0
- data/MANIFEST +166 -0
- data/README.rdoc +217 -0
- data/Rakefile +99 -0
- data/ext/libxml/extconf.rb +61 -0
- data/ext/libxml/libxml.c +80 -0
- data/ext/libxml/libxml_ruby.def +35 -0
- data/ext/libxml/ruby_libxml.h +67 -0
- data/ext/libxml/ruby_xml.c +933 -0
- data/ext/libxml/ruby_xml.h +10 -0
- data/ext/libxml/ruby_xml_attr.c +333 -0
- data/ext/libxml/ruby_xml_attr.h +12 -0
- data/ext/libxml/ruby_xml_attr_decl.c +153 -0
- data/ext/libxml/ruby_xml_attr_decl.h +11 -0
- data/ext/libxml/ruby_xml_attributes.c +275 -0
- data/ext/libxml/ruby_xml_attributes.h +15 -0
- data/ext/libxml/ruby_xml_cbg.c +85 -0
- data/ext/libxml/ruby_xml_document.c +1123 -0
- data/ext/libxml/ruby_xml_document.h +11 -0
- data/ext/libxml/ruby_xml_dtd.c +248 -0
- data/ext/libxml/ruby_xml_dtd.h +9 -0
- data/ext/libxml/ruby_xml_encoding.c +250 -0
- data/ext/libxml/ruby_xml_encoding.h +16 -0
- data/ext/libxml/ruby_xml_error.c +996 -0
- data/ext/libxml/ruby_xml_error.h +12 -0
- data/ext/libxml/ruby_xml_html_parser.c +89 -0
- data/ext/libxml/ruby_xml_html_parser.h +10 -0
- data/ext/libxml/ruby_xml_html_parser_context.c +337 -0
- data/ext/libxml/ruby_xml_html_parser_context.h +10 -0
- data/ext/libxml/ruby_xml_html_parser_options.c +46 -0
- data/ext/libxml/ruby_xml_html_parser_options.h +10 -0
- data/ext/libxml/ruby_xml_input_cbg.c +191 -0
- data/ext/libxml/ruby_xml_input_cbg.h +20 -0
- data/ext/libxml/ruby_xml_io.c +47 -0
- data/ext/libxml/ruby_xml_io.h +10 -0
- data/ext/libxml/ruby_xml_namespace.c +153 -0
- data/ext/libxml/ruby_xml_namespace.h +10 -0
- data/ext/libxml/ruby_xml_namespaces.c +293 -0
- data/ext/libxml/ruby_xml_namespaces.h +9 -0
- data/ext/libxml/ruby_xml_node.c +1402 -0
- data/ext/libxml/ruby_xml_node.h +13 -0
- data/ext/libxml/ruby_xml_parser.c +91 -0
- data/ext/libxml/ruby_xml_parser.h +12 -0
- data/ext/libxml/ruby_xml_parser_context.c +999 -0
- data/ext/libxml/ruby_xml_parser_context.h +10 -0
- data/ext/libxml/ruby_xml_parser_options.c +66 -0
- data/ext/libxml/ruby_xml_parser_options.h +12 -0
- data/ext/libxml/ruby_xml_reader.c +1239 -0
- data/ext/libxml/ruby_xml_reader.h +17 -0
- data/ext/libxml/ruby_xml_relaxng.c +110 -0
- data/ext/libxml/ruby_xml_relaxng.h +10 -0
- data/ext/libxml/ruby_xml_sax2_handler.c +326 -0
- data/ext/libxml/ruby_xml_sax2_handler.h +10 -0
- data/ext/libxml/ruby_xml_sax_parser.c +116 -0
- data/ext/libxml/ruby_xml_sax_parser.h +10 -0
- data/ext/libxml/ruby_xml_schema.c +278 -0
- data/ext/libxml/ruby_xml_schema.h +809 -0
- data/ext/libxml/ruby_xml_schema_attribute.c +109 -0
- data/ext/libxml/ruby_xml_schema_attribute.h +15 -0
- data/ext/libxml/ruby_xml_schema_element.c +95 -0
- data/ext/libxml/ruby_xml_schema_element.h +14 -0
- data/ext/libxml/ruby_xml_schema_facet.c +52 -0
- data/ext/libxml/ruby_xml_schema_facet.h +13 -0
- data/ext/libxml/ruby_xml_schema_type.c +232 -0
- data/ext/libxml/ruby_xml_schema_type.h +9 -0
- data/ext/libxml/ruby_xml_version.h +9 -0
- data/ext/libxml/ruby_xml_writer.c +1133 -0
- data/ext/libxml/ruby_xml_writer.h +10 -0
- data/ext/libxml/ruby_xml_xinclude.c +16 -0
- data/ext/libxml/ruby_xml_xinclude.h +11 -0
- data/ext/libxml/ruby_xml_xpath.c +194 -0
- data/ext/libxml/ruby_xml_xpath.h +13 -0
- data/ext/libxml/ruby_xml_xpath_context.c +360 -0
- data/ext/libxml/ruby_xml_xpath_context.h +9 -0
- data/ext/libxml/ruby_xml_xpath_expression.c +81 -0
- data/ext/libxml/ruby_xml_xpath_expression.h +10 -0
- data/ext/libxml/ruby_xml_xpath_object.c +338 -0
- data/ext/libxml/ruby_xml_xpath_object.h +17 -0
- data/ext/libxml/ruby_xml_xpointer.c +99 -0
- data/ext/libxml/ruby_xml_xpointer.h +11 -0
- data/ext/vc/libxml_ruby.sln +28 -0
- data/lib/3.1/libxml_ruby.so +0 -0
- data/lib/libxml/attr.rb +123 -0
- data/lib/libxml/attr_decl.rb +80 -0
- data/lib/libxml/attributes.rb +14 -0
- data/lib/libxml/document.rb +194 -0
- data/lib/libxml/error.rb +95 -0
- data/lib/libxml/hpricot.rb +78 -0
- data/lib/libxml/html_parser.rb +96 -0
- data/lib/libxml/namespace.rb +62 -0
- data/lib/libxml/namespaces.rb +38 -0
- data/lib/libxml/node.rb +323 -0
- data/lib/libxml/parser.rb +101 -0
- data/lib/libxml/sax_callbacks.rb +180 -0
- data/lib/libxml/sax_parser.rb +41 -0
- data/lib/libxml/schema/attribute.rb +19 -0
- data/lib/libxml/schema/element.rb +19 -0
- data/lib/libxml/schema/type.rb +21 -0
- data/lib/libxml/schema.rb +48 -0
- data/lib/libxml/tree.rb +29 -0
- data/lib/libxml-ruby.rb +30 -0
- data/lib/libxml.rb +5 -0
- data/lib/xml/libxml.rb +10 -0
- data/lib/xml.rb +14 -0
- data/libxml-ruby.gemspec +48 -0
- data/script/benchmark/depixelate +634 -0
- data/script/benchmark/hamlet.xml +9055 -0
- data/script/benchmark/parsecount +170 -0
- data/script/benchmark/sock_entries.xml +507 -0
- data/script/benchmark/throughput +41 -0
- data/script/test +6 -0
- data/setup.rb +1584 -0
- data/test/c14n/given/doc.dtd +1 -0
- data/test/c14n/given/example-1.xml +14 -0
- data/test/c14n/given/example-2.xml +11 -0
- data/test/c14n/given/example-3.xml +18 -0
- data/test/c14n/given/example-4.xml +9 -0
- data/test/c14n/given/example-5.xml +12 -0
- data/test/c14n/given/example-6.xml +2 -0
- data/test/c14n/given/example-7.xml +11 -0
- data/test/c14n/given/example-8.xml +11 -0
- data/test/c14n/given/example-8.xpath +10 -0
- data/test/c14n/given/world.txt +1 -0
- data/test/c14n/result/1-1-without-comments/example-1 +4 -0
- data/test/c14n/result/1-1-without-comments/example-2 +11 -0
- data/test/c14n/result/1-1-without-comments/example-3 +14 -0
- data/test/c14n/result/1-1-without-comments/example-4 +9 -0
- data/test/c14n/result/1-1-without-comments/example-5 +3 -0
- data/test/c14n/result/1-1-without-comments/example-6 +1 -0
- data/test/c14n/result/1-1-without-comments/example-7 +1 -0
- data/test/c14n/result/1-1-without-comments/example-8 +1 -0
- data/test/c14n/result/with-comments/example-1 +6 -0
- data/test/c14n/result/with-comments/example-2 +11 -0
- data/test/c14n/result/with-comments/example-3 +14 -0
- data/test/c14n/result/with-comments/example-4 +9 -0
- data/test/c14n/result/with-comments/example-5 +4 -0
- data/test/c14n/result/with-comments/example-6 +1 -0
- data/test/c14n/result/with-comments/example-7 +1 -0
- data/test/c14n/result/without-comments/example-1 +4 -0
- data/test/c14n/result/without-comments/example-2 +11 -0
- data/test/c14n/result/without-comments/example-3 +14 -0
- data/test/c14n/result/without-comments/example-4 +9 -0
- data/test/c14n/result/without-comments/example-5 +3 -0
- data/test/c14n/result/without-comments/example-6 +1 -0
- data/test/c14n/result/without-comments/example-7 +1 -0
- data/test/model/atom.xml +13 -0
- data/test/model/bands.iso-8859-1.xml +5 -0
- data/test/model/bands.utf-8.xml +5 -0
- data/test/model/bands.xml +5 -0
- data/test/model/books.xml +154 -0
- data/test/model/cwm_1_0.xml +11336 -0
- data/test/model/merge_bug_data.xml +58 -0
- data/test/model/ruby-lang.html +238 -0
- data/test/model/rubynet.xml +79 -0
- data/test/model/rubynet_project +1 -0
- data/test/model/shiporder.rnc +28 -0
- data/test/model/shiporder.rng +86 -0
- data/test/model/shiporder.xml +23 -0
- data/test/model/shiporder.xsd +40 -0
- data/test/model/soap.xml +27 -0
- data/test/model/xinclude.xml +5 -0
- data/test/test_attr.rb +181 -0
- data/test/test_attr_decl.rb +132 -0
- data/test/test_attributes.rb +136 -0
- data/test/test_canonicalize.rb +120 -0
- data/test/test_deprecated_require.rb +12 -0
- data/test/test_document.rb +132 -0
- data/test/test_document_write.rb +146 -0
- data/test/test_dtd.rb +129 -0
- data/test/test_encoding.rb +129 -0
- data/test/test_encoding_sax.rb +115 -0
- data/test/test_error.rb +178 -0
- data/test/test_helper.rb +9 -0
- data/test/test_html_parser.rb +162 -0
- data/test/test_html_parser_context.rb +23 -0
- data/test/test_namespace.rb +60 -0
- data/test/test_namespaces.rb +200 -0
- data/test/test_node.rb +237 -0
- data/test/test_node_cdata.rb +50 -0
- data/test/test_node_comment.rb +32 -0
- data/test/test_node_copy.rb +40 -0
- data/test/test_node_edit.rb +158 -0
- data/test/test_node_pi.rb +37 -0
- data/test/test_node_text.rb +69 -0
- data/test/test_node_write.rb +97 -0
- data/test/test_node_xlink.rb +28 -0
- data/test/test_parser.rb +324 -0
- data/test/test_parser_context.rb +198 -0
- data/test/test_properties.rb +38 -0
- data/test/test_reader.rb +364 -0
- data/test/test_relaxng.rb +53 -0
- data/test/test_sax_parser.rb +326 -0
- data/test/test_schema.rb +168 -0
- data/test/test_suite.rb +48 -0
- data/test/test_traversal.rb +152 -0
- data/test/test_writer.rb +468 -0
- data/test/test_xinclude.rb +20 -0
- data/test/test_xml.rb +263 -0
- data/test/test_xpath.rb +244 -0
- data/test/test_xpath_context.rb +88 -0
- data/test/test_xpath_expression.rb +37 -0
- data/test/test_xpointer.rb +72 -0
- metadata +325 -0
@@ -0,0 +1,11 @@
|
|
1
|
+
/* Please see the LICENSE file for copyright and distribution information */
|
2
|
+
|
3
|
+
#ifndef __RXML_DOCUMENT__
|
4
|
+
#define __RXML_DOCUMENT__
|
5
|
+
|
6
|
+
extern VALUE cXMLDocument;
|
7
|
+
void rxml_init_document();
|
8
|
+
VALUE rxml_document_wrap(xmlDocPtr xnode);
|
9
|
+
|
10
|
+
typedef xmlChar * xmlCharPtr;
|
11
|
+
#endif
|
@@ -0,0 +1,248 @@
|
|
1
|
+
#include "ruby_libxml.h"
|
2
|
+
#include "ruby_xml_dtd.h"
|
3
|
+
|
4
|
+
/*
|
5
|
+
* Document-class: LibXML::XML::Dtd
|
6
|
+
*
|
7
|
+
* The XML::Dtd class is used to prepare DTD's for validation of xml
|
8
|
+
* documents.
|
9
|
+
*
|
10
|
+
* DTDs can be created from a string or a pair of public and system identifiers.
|
11
|
+
* Once a Dtd object is instantiated, an XML document can be validated by the
|
12
|
+
* XML::Document#validate method providing the XML::Dtd object as parameeter.
|
13
|
+
* The method will raise an exception if the document is
|
14
|
+
* not valid.
|
15
|
+
*
|
16
|
+
* Basic usage:
|
17
|
+
*
|
18
|
+
* # parse DTD
|
19
|
+
* dtd = XML::Dtd.new(<<EOF)
|
20
|
+
* <!ELEMENT root (item*) >
|
21
|
+
* <!ELEMENT item (#PCDATA) >
|
22
|
+
* EOF
|
23
|
+
*
|
24
|
+
* # parse xml document to be validated
|
25
|
+
* instance = XML::Document.file('instance.xml')
|
26
|
+
*
|
27
|
+
* # validate
|
28
|
+
* instance.validate(dtd)
|
29
|
+
*/
|
30
|
+
|
31
|
+
VALUE cXMLDtd;
|
32
|
+
|
33
|
+
void rxml_dtd_free(xmlDtdPtr xdtd)
|
34
|
+
{
|
35
|
+
if (xdtd->doc == NULL && xdtd->parent == NULL)
|
36
|
+
xmlFreeDtd(xdtd);
|
37
|
+
}
|
38
|
+
|
39
|
+
void rxml_dtd_mark(xmlDtdPtr xdtd)
|
40
|
+
{
|
41
|
+
if (xdtd && xdtd->doc)
|
42
|
+
{
|
43
|
+
VALUE doc = (VALUE)xdtd->doc->_private;
|
44
|
+
rb_gc_mark(doc);
|
45
|
+
}
|
46
|
+
}
|
47
|
+
|
48
|
+
static VALUE rxml_dtd_alloc(VALUE klass)
|
49
|
+
{
|
50
|
+
return Data_Wrap_Struct(klass, rxml_dtd_mark, rxml_dtd_free, NULL);
|
51
|
+
}
|
52
|
+
|
53
|
+
VALUE rxml_dtd_wrap(xmlDtdPtr xdtd)
|
54
|
+
{
|
55
|
+
return Data_Wrap_Struct(cXMLDtd, NULL, NULL, xdtd);
|
56
|
+
}
|
57
|
+
|
58
|
+
/*
|
59
|
+
* call-seq:
|
60
|
+
* dtd.external_id -> "string"
|
61
|
+
*
|
62
|
+
* Obtain this dtd's external identifer (for a PUBLIC DTD).
|
63
|
+
*/
|
64
|
+
static VALUE rxml_dtd_external_id_get(VALUE self)
|
65
|
+
{
|
66
|
+
xmlDtdPtr xdtd;
|
67
|
+
Data_Get_Struct(self, xmlDtd, xdtd);
|
68
|
+
|
69
|
+
|
70
|
+
if (xdtd->ExternalID == NULL)
|
71
|
+
return (Qnil);
|
72
|
+
else
|
73
|
+
return (rxml_new_cstr( xdtd->ExternalID, NULL));
|
74
|
+
}
|
75
|
+
|
76
|
+
/*
|
77
|
+
* call-seq:
|
78
|
+
* dtd.name -> "string"
|
79
|
+
*
|
80
|
+
* Obtain this dtd's name.
|
81
|
+
*/
|
82
|
+
static VALUE rxml_dtd_name_get(VALUE self)
|
83
|
+
{
|
84
|
+
xmlDtdPtr xdtd;
|
85
|
+
Data_Get_Struct(self, xmlDtd, xdtd);
|
86
|
+
|
87
|
+
|
88
|
+
if (xdtd->name == NULL)
|
89
|
+
return (Qnil);
|
90
|
+
else
|
91
|
+
return (rxml_new_cstr( xdtd->name, NULL));
|
92
|
+
}
|
93
|
+
|
94
|
+
|
95
|
+
/*
|
96
|
+
* call-seq:
|
97
|
+
* dtd.uri -> "string"
|
98
|
+
*
|
99
|
+
* Obtain this dtd's URI (for a SYSTEM or PUBLIC DTD).
|
100
|
+
*/
|
101
|
+
static VALUE rxml_dtd_uri_get(VALUE self)
|
102
|
+
{
|
103
|
+
xmlDtdPtr xdtd;
|
104
|
+
Data_Get_Struct(self, xmlDtd, xdtd);
|
105
|
+
|
106
|
+
if (xdtd->SystemID == NULL)
|
107
|
+
return (Qnil);
|
108
|
+
else
|
109
|
+
return (rxml_new_cstr( xdtd->SystemID, NULL));
|
110
|
+
}
|
111
|
+
|
112
|
+
/*
|
113
|
+
* call-seq:
|
114
|
+
* node.type -> num
|
115
|
+
*
|
116
|
+
* Obtain this node's type identifier.
|
117
|
+
*/
|
118
|
+
static VALUE rxml_dtd_type(VALUE self)
|
119
|
+
{
|
120
|
+
xmlDtdPtr xdtd;
|
121
|
+
Data_Get_Struct(self, xmlDtd, xdtd);
|
122
|
+
return (INT2NUM(xdtd->type));
|
123
|
+
}
|
124
|
+
|
125
|
+
/*
|
126
|
+
* call-seq:
|
127
|
+
* XML::Dtd.new("DTD string") -> dtd
|
128
|
+
* XML::Dtd.new("public", "system") -> dtd
|
129
|
+
* XML::Dtd.new("name", "public", "system", document) -> external subset dtd
|
130
|
+
* XML::Dtd.new("name", "public", "system", document, false) -> internal subset dtd
|
131
|
+
* XML::Dtd.new("name", "public", "system", document, true) -> internal subset dtd
|
132
|
+
*
|
133
|
+
* Create a new Dtd from the specified public and system
|
134
|
+
* identifiers.
|
135
|
+
*/
|
136
|
+
static VALUE rxml_dtd_initialize(int argc, VALUE *argv, VALUE self)
|
137
|
+
{
|
138
|
+
VALUE external, system, dtd_string;
|
139
|
+
xmlParserInputBufferPtr buffer;
|
140
|
+
xmlCharEncoding enc = XML_CHAR_ENCODING_NONE;
|
141
|
+
xmlChar *new_string;
|
142
|
+
xmlDtdPtr xdtd;
|
143
|
+
|
144
|
+
// 1 argument -- string --> parsujeme jako dtd
|
145
|
+
// 2 arguments -- public, system --> bude se hledat
|
146
|
+
// 3 arguments -- public, system, name --> creates an external subset (any parameter may be nil)
|
147
|
+
// 4 arguments -- public, system, name, doc --> creates an external subset (any parameter may be nil)
|
148
|
+
// 5 arguments -- public, system, name, doc, true --> creates an internal subset (all but last parameter may be nil)
|
149
|
+
switch (argc)
|
150
|
+
{
|
151
|
+
case 3:
|
152
|
+
case 4:
|
153
|
+
case 5: {
|
154
|
+
VALUE name, doc, internal;
|
155
|
+
const xmlChar *xname = NULL, *xpublic = NULL, *xsystem = NULL;
|
156
|
+
xmlDocPtr xdoc = NULL;
|
157
|
+
|
158
|
+
rb_scan_args(argc, argv, "32", &external, &system, &name, &doc, &internal);
|
159
|
+
|
160
|
+
if (external != Qnil) {
|
161
|
+
Check_Type(external, T_STRING);
|
162
|
+
xpublic = (const xmlChar*) StringValuePtr(external);
|
163
|
+
}
|
164
|
+
if (system != Qnil) {
|
165
|
+
Check_Type(system, T_STRING);
|
166
|
+
xsystem = (const xmlChar*) StringValuePtr(system);
|
167
|
+
}
|
168
|
+
if (name != Qnil) {
|
169
|
+
Check_Type(name, T_STRING);
|
170
|
+
xname = (const xmlChar*) StringValuePtr(name);
|
171
|
+
}
|
172
|
+
if (doc != Qnil) {
|
173
|
+
if (rb_obj_is_kind_of(doc, cXMLDocument) == Qfalse)
|
174
|
+
rb_raise(rb_eTypeError, "Must pass an LibXML::XML::Document object");
|
175
|
+
Data_Get_Struct(doc, xmlDoc, xdoc);
|
176
|
+
}
|
177
|
+
|
178
|
+
if (internal == Qnil || internal == Qfalse)
|
179
|
+
xdtd = xmlNewDtd(xdoc, xname, xpublic, xsystem);
|
180
|
+
else
|
181
|
+
xdtd = xmlCreateIntSubset(xdoc, xname, xpublic, xsystem);
|
182
|
+
|
183
|
+
if (xdtd == NULL)
|
184
|
+
rxml_raise(&xmlLastError);
|
185
|
+
|
186
|
+
/* Document will free this dtd now. */
|
187
|
+
RDATA(self)->dfree = NULL;
|
188
|
+
DATA_PTR(self) = xdtd;
|
189
|
+
|
190
|
+
xmlSetTreeDoc((xmlNodePtr) xdtd, xdoc);
|
191
|
+
}
|
192
|
+
break;
|
193
|
+
|
194
|
+
case 2:
|
195
|
+
rb_scan_args(argc, argv, "20", &external, &system);
|
196
|
+
|
197
|
+
Check_Type(external, T_STRING);
|
198
|
+
Check_Type(system, T_STRING);
|
199
|
+
|
200
|
+
xdtd = xmlParseDTD((xmlChar*) StringValuePtr(external),
|
201
|
+
(xmlChar*) StringValuePtr(system));
|
202
|
+
|
203
|
+
if (xdtd == NULL)
|
204
|
+
rxml_raise(&xmlLastError);
|
205
|
+
|
206
|
+
DATA_PTR(self) = xdtd;
|
207
|
+
|
208
|
+
xmlSetTreeDoc((xmlNodePtr) xdtd, NULL);
|
209
|
+
break;
|
210
|
+
|
211
|
+
case 1:
|
212
|
+
rb_scan_args(argc, argv, "10", &dtd_string);
|
213
|
+
Check_Type(dtd_string, T_STRING);
|
214
|
+
|
215
|
+
/* Note that buffer is freed by xmlParserInputBufferPush*/
|
216
|
+
buffer = xmlAllocParserInputBuffer(enc);
|
217
|
+
new_string = xmlStrdup((xmlChar*) StringValuePtr(dtd_string));
|
218
|
+
xmlParserInputBufferPush(buffer, xmlStrlen(new_string),
|
219
|
+
(const char*) new_string);
|
220
|
+
|
221
|
+
xdtd = xmlIOParseDTD(NULL, buffer, enc);
|
222
|
+
|
223
|
+
if (xdtd == NULL)
|
224
|
+
rxml_raise(&xmlLastError);
|
225
|
+
|
226
|
+
xmlFree(new_string);
|
227
|
+
|
228
|
+
DATA_PTR(self) = xdtd;
|
229
|
+
break;
|
230
|
+
|
231
|
+
default:
|
232
|
+
rb_raise(rb_eArgError, "wrong number of arguments");
|
233
|
+
}
|
234
|
+
|
235
|
+
return self;
|
236
|
+
}
|
237
|
+
|
238
|
+
void rxml_init_dtd()
|
239
|
+
{
|
240
|
+
cXMLDtd = rb_define_class_under(mXML, "Dtd", rb_cObject);
|
241
|
+
rb_define_alloc_func(cXMLDtd, rxml_dtd_alloc);
|
242
|
+
rb_define_method(cXMLDtd, "initialize", rxml_dtd_initialize, -1);
|
243
|
+
rb_define_method(cXMLDtd, "external_id", rxml_dtd_external_id_get, 0);
|
244
|
+
rb_define_method(cXMLDtd, "name", rxml_dtd_name_get, 0);
|
245
|
+
rb_define_method(cXMLDtd, "uri", rxml_dtd_uri_get, 0);
|
246
|
+
rb_define_method(cXMLDtd, "node_type", rxml_dtd_type, 0);
|
247
|
+
rb_define_alias(cXMLDtd, "system_id", "uri");
|
248
|
+
}
|
@@ -0,0 +1,250 @@
|
|
1
|
+
/* Please see the LICENSE file for copyright and distribution information */
|
2
|
+
|
3
|
+
#include <stdarg.h>
|
4
|
+
#include "ruby_libxml.h"
|
5
|
+
|
6
|
+
/*
|
7
|
+
* Document-class: LibXML::XML::Encoding
|
8
|
+
*
|
9
|
+
* The encoding class exposes the encodings that libxml
|
10
|
+
* supports via constants.
|
11
|
+
*
|
12
|
+
* LibXML converts all data sources to UTF8
|
13
|
+
* internally before processing them. By default,
|
14
|
+
* LibXML determines a data source's encoding
|
15
|
+
* using the algorithm described on its
|
16
|
+
* website[http://xmlsoft.org/encoding.html].
|
17
|
+
*
|
18
|
+
* However, you may override a data source's encoding
|
19
|
+
* by using the encoding constants defined in this
|
20
|
+
* module.
|
21
|
+
*
|
22
|
+
* Example 1:
|
23
|
+
*
|
24
|
+
* io = File.open('some_file', 'rb')
|
25
|
+
* parser = XML::Parser.io(io, :encoding => XML::Encoding::ISO_8859_1)
|
26
|
+
* doc = parser.parse
|
27
|
+
*
|
28
|
+
* Example 2:
|
29
|
+
*
|
30
|
+
* parser = XML::HTMLParser.file("some_file", :encoding => XML::Encoding::ISO_8859_1)
|
31
|
+
* doc = parser.parse
|
32
|
+
*
|
33
|
+
* Example 3:
|
34
|
+
*
|
35
|
+
* document = XML::Document.new
|
36
|
+
* document.encoding = XML::Encoding::ISO_8859_1
|
37
|
+
* doc << XML::Node.new
|
38
|
+
*/
|
39
|
+
|
40
|
+
VALUE mXMLEncoding;
|
41
|
+
|
42
|
+
/*
|
43
|
+
* call-seq:
|
44
|
+
* Encoding.from_s("UTF_8") -> XML::Encoding::UTF_8
|
45
|
+
*
|
46
|
+
* Converts an encoding string to an encoding constant
|
47
|
+
* defined on the XML::Encoding class.
|
48
|
+
*/
|
49
|
+
static VALUE rxml_encoding_from_s(VALUE klass, VALUE encoding)
|
50
|
+
{
|
51
|
+
xmlCharEncoding xencoding;
|
52
|
+
|
53
|
+
if (encoding == Qnil)
|
54
|
+
return Qnil;
|
55
|
+
|
56
|
+
xencoding = xmlParseCharEncoding(StringValuePtr(encoding));
|
57
|
+
return INT2NUM(xencoding);
|
58
|
+
}
|
59
|
+
|
60
|
+
/*
|
61
|
+
* call-seq:
|
62
|
+
* Encoding.to_s(XML::Encoding::UTF_8) -> "UTF-8"
|
63
|
+
*
|
64
|
+
* Converts an encoding constant defined on the XML::Encoding
|
65
|
+
* class to its text representation.
|
66
|
+
*/
|
67
|
+
static VALUE rxml_encoding_to_s(VALUE klass, VALUE encoding)
|
68
|
+
{
|
69
|
+
const xmlChar* xencoding = (const xmlChar*)xmlGetCharEncodingName(NUM2INT(encoding));
|
70
|
+
|
71
|
+
if (!xencoding)
|
72
|
+
return Qnil;
|
73
|
+
else
|
74
|
+
return rxml_new_cstr(xencoding, xencoding);
|
75
|
+
}
|
76
|
+
|
77
|
+
/*
|
78
|
+
* Converts an xmlCharEncoding enum value into a Ruby Encoding object (available
|
79
|
+
* on Ruby 1.9.* and higher).
|
80
|
+
*/
|
81
|
+
rb_encoding* rxml_xml_encoding_to_rb_encoding(VALUE klass, xmlCharEncoding xmlEncoding)
|
82
|
+
{
|
83
|
+
const char* encodingName;
|
84
|
+
|
85
|
+
switch (xmlEncoding)
|
86
|
+
{
|
87
|
+
case XML_CHAR_ENCODING_UTF8:
|
88
|
+
encodingName = "UTF-8";
|
89
|
+
break;
|
90
|
+
case XML_CHAR_ENCODING_UTF16LE:
|
91
|
+
encodingName = "UTF-16LE";
|
92
|
+
break;
|
93
|
+
case XML_CHAR_ENCODING_UTF16BE:
|
94
|
+
encodingName = "UTF-16BE";
|
95
|
+
break;
|
96
|
+
case XML_CHAR_ENCODING_UCS4LE:
|
97
|
+
encodingName = "UCS-4LE";
|
98
|
+
break;
|
99
|
+
case XML_CHAR_ENCODING_UCS4BE:
|
100
|
+
encodingName = "UCS-4BE";
|
101
|
+
break;
|
102
|
+
case XML_CHAR_ENCODING_UCS2:
|
103
|
+
encodingName = "UCS-2";
|
104
|
+
break;
|
105
|
+
case XML_CHAR_ENCODING_8859_1:
|
106
|
+
encodingName = "ISO8859-1";
|
107
|
+
break;
|
108
|
+
case XML_CHAR_ENCODING_8859_2:
|
109
|
+
encodingName = "ISO8859-2";
|
110
|
+
break;
|
111
|
+
case XML_CHAR_ENCODING_8859_3:
|
112
|
+
encodingName = "ISO8859-3";
|
113
|
+
break;
|
114
|
+
case XML_CHAR_ENCODING_8859_4:
|
115
|
+
encodingName = "ISO8859-4";
|
116
|
+
break;
|
117
|
+
case XML_CHAR_ENCODING_8859_5:
|
118
|
+
encodingName = "ISO8859-5";
|
119
|
+
break;
|
120
|
+
case XML_CHAR_ENCODING_8859_6:
|
121
|
+
encodingName = "ISO8859-6";
|
122
|
+
break;
|
123
|
+
case XML_CHAR_ENCODING_8859_7:
|
124
|
+
encodingName = "ISO8859-7";
|
125
|
+
break;
|
126
|
+
case XML_CHAR_ENCODING_8859_8:
|
127
|
+
encodingName = "ISO8859-8";
|
128
|
+
break;
|
129
|
+
case XML_CHAR_ENCODING_8859_9:
|
130
|
+
encodingName = "ISO8859-9";
|
131
|
+
break;
|
132
|
+
case XML_CHAR_ENCODING_2022_JP:
|
133
|
+
encodingName = "ISO-2022-JP";
|
134
|
+
break;
|
135
|
+
case XML_CHAR_ENCODING_SHIFT_JIS:
|
136
|
+
encodingName = "SHIFT-JIS";
|
137
|
+
break;
|
138
|
+
case XML_CHAR_ENCODING_EUC_JP:
|
139
|
+
encodingName = "EUC-JP";
|
140
|
+
break;
|
141
|
+
case XML_CHAR_ENCODING_ASCII:
|
142
|
+
encodingName = "US-ASCII";
|
143
|
+
break;
|
144
|
+
default:
|
145
|
+
/* Covers XML_CHAR_ENCODING_ERROR, XML_CHAR_ENCODING_NONE, XML_CHAR_ENCODING_EBCDIC */
|
146
|
+
encodingName = "ASCII-8BIT";
|
147
|
+
break;
|
148
|
+
}
|
149
|
+
|
150
|
+
return rb_enc_find(encodingName);
|
151
|
+
}
|
152
|
+
|
153
|
+
/*
|
154
|
+
* call-seq:
|
155
|
+
* Input.encoding_to_rb_encoding(Input::ENCODING) -> Encoding
|
156
|
+
*
|
157
|
+
* Converts an encoding constant defined on the XML::Encoding
|
158
|
+
* class to a Ruby encoding object (available on Ruby 1.9.* and higher).
|
159
|
+
*/
|
160
|
+
VALUE rxml_encoding_to_rb_encoding(VALUE klass, VALUE encoding)
|
161
|
+
{
|
162
|
+
xmlCharEncoding xmlEncoding = (xmlCharEncoding)NUM2INT(encoding);
|
163
|
+
rb_encoding* rbencoding = rxml_xml_encoding_to_rb_encoding(klass, xmlEncoding);
|
164
|
+
return rb_enc_from_encoding(rbencoding);
|
165
|
+
}
|
166
|
+
|
167
|
+
rb_encoding* rxml_figure_encoding(const xmlChar* xencoding)
|
168
|
+
{
|
169
|
+
rb_encoding* result;
|
170
|
+
if (xencoding)
|
171
|
+
{
|
172
|
+
xmlCharEncoding xmlEncoding = xmlParseCharEncoding((const char*)xencoding);
|
173
|
+
result = rxml_xml_encoding_to_rb_encoding(mXMLEncoding, xmlEncoding);
|
174
|
+
}
|
175
|
+
else
|
176
|
+
{
|
177
|
+
result = rb_utf8_encoding();
|
178
|
+
}
|
179
|
+
return result;
|
180
|
+
}
|
181
|
+
|
182
|
+
VALUE rxml_new_cstr(const xmlChar* xstr, const xmlChar* xencoding)
|
183
|
+
{
|
184
|
+
rb_encoding *rbencoding = rxml_figure_encoding(xencoding);
|
185
|
+
return rb_external_str_new_with_enc((const char*)xstr, strlen((const char*)xstr), rbencoding);
|
186
|
+
}
|
187
|
+
|
188
|
+
VALUE rxml_new_cstr_len(const xmlChar* xstr, const long length, const xmlChar* xencoding)
|
189
|
+
{
|
190
|
+
rb_encoding *rbencoding = rxml_figure_encoding(xencoding);
|
191
|
+
return rb_external_str_new_with_enc((const char*)xstr, length, rbencoding);
|
192
|
+
}
|
193
|
+
|
194
|
+
void rxml_init_encoding(void)
|
195
|
+
{
|
196
|
+
mXMLEncoding = rb_define_module_under(mXML, "Encoding");
|
197
|
+
rb_define_module_function(mXMLEncoding, "from_s", rxml_encoding_from_s, 1);
|
198
|
+
rb_define_module_function(mXMLEncoding, "to_s", rxml_encoding_to_s, 1);
|
199
|
+
|
200
|
+
rb_define_module_function(mXMLEncoding, "to_rb_encoding", rxml_encoding_to_rb_encoding, 2);
|
201
|
+
|
202
|
+
/* -1: No char encoding detected. */
|
203
|
+
rb_define_const(mXMLEncoding, "ERROR", INT2NUM(XML_CHAR_ENCODING_ERROR));
|
204
|
+
/* 0: No char encoding detected. */
|
205
|
+
rb_define_const(mXMLEncoding, "NONE", INT2NUM(XML_CHAR_ENCODING_NONE));
|
206
|
+
/* 1: UTF-8 */
|
207
|
+
rb_define_const(mXMLEncoding, "UTF_8", INT2NUM(XML_CHAR_ENCODING_UTF8));
|
208
|
+
/* 2: UTF-16 little endian. */
|
209
|
+
rb_define_const(mXMLEncoding, "UTF_16LE", INT2NUM(XML_CHAR_ENCODING_UTF16LE));
|
210
|
+
/* 3: UTF-16 big endian. */
|
211
|
+
rb_define_const(mXMLEncoding, "UTF_16BE", INT2NUM(XML_CHAR_ENCODING_UTF16BE));
|
212
|
+
/* 4: UCS-4 little endian. */
|
213
|
+
rb_define_const(mXMLEncoding, "UCS_4LE", INT2NUM(XML_CHAR_ENCODING_UCS4LE));
|
214
|
+
/* 5: UCS-4 big endian. */
|
215
|
+
rb_define_const(mXMLEncoding, "UCS_4BE", INT2NUM(XML_CHAR_ENCODING_UCS4BE));
|
216
|
+
/* 6: EBCDIC uh! */
|
217
|
+
rb_define_const(mXMLEncoding, "EBCDIC", INT2NUM(XML_CHAR_ENCODING_EBCDIC));
|
218
|
+
/* 7: UCS-4 unusual ordering. */
|
219
|
+
rb_define_const(mXMLEncoding, "UCS_4_2143", INT2NUM(XML_CHAR_ENCODING_UCS4_2143));
|
220
|
+
/* 8: UCS-4 unusual ordering. */
|
221
|
+
rb_define_const(mXMLEncoding, "UCS_4_3412", INT2NUM(XML_CHAR_ENCODING_UCS4_3412));
|
222
|
+
/* 9: UCS-2. */
|
223
|
+
rb_define_const(mXMLEncoding, "UCS_2", INT2NUM(XML_CHAR_ENCODING_UCS2));
|
224
|
+
/* 10: ISO-8859-1 ISO Latin 1. */
|
225
|
+
rb_define_const(mXMLEncoding, "ISO_8859_1", INT2NUM(XML_CHAR_ENCODING_8859_1));
|
226
|
+
/* 11: ISO-8859-2 ISO Latin 2. */
|
227
|
+
rb_define_const(mXMLEncoding, "ISO_8859_2", INT2NUM(XML_CHAR_ENCODING_8859_2));
|
228
|
+
/* 12: ISO-8859-3. */
|
229
|
+
rb_define_const(mXMLEncoding, "ISO_8859_3", INT2NUM(XML_CHAR_ENCODING_8859_3));
|
230
|
+
/* 13: ISO-8859-4. */
|
231
|
+
rb_define_const(mXMLEncoding, "ISO_8859_4", INT2NUM(XML_CHAR_ENCODING_8859_4));
|
232
|
+
/* 14: ISO-8859-5. */
|
233
|
+
rb_define_const(mXMLEncoding, "ISO_8859_5", INT2NUM(XML_CHAR_ENCODING_8859_5));
|
234
|
+
/* 15: ISO-8859-6. */
|
235
|
+
rb_define_const(mXMLEncoding, "ISO_8859_6", INT2NUM(XML_CHAR_ENCODING_8859_6));
|
236
|
+
/* 16: ISO-8859-7. */
|
237
|
+
rb_define_const(mXMLEncoding, "ISO_8859_7", INT2NUM(XML_CHAR_ENCODING_8859_7));
|
238
|
+
/* 17: ISO-8859-8. */
|
239
|
+
rb_define_const(mXMLEncoding, "ISO_8859_8", INT2NUM(XML_CHAR_ENCODING_8859_8));
|
240
|
+
/* 18: ISO-8859-9. */
|
241
|
+
rb_define_const(mXMLEncoding, "ISO_8859_9", INT2NUM(XML_CHAR_ENCODING_8859_9));
|
242
|
+
/* 19: ISO-2022-JP. */
|
243
|
+
rb_define_const(mXMLEncoding, "ISO_2022_JP", INT2NUM(XML_CHAR_ENCODING_2022_JP));
|
244
|
+
/* 20: Shift_JIS. */
|
245
|
+
rb_define_const(mXMLEncoding, "SHIFT_JIS", INT2NUM(XML_CHAR_ENCODING_SHIFT_JIS));
|
246
|
+
/* 21: EUC-JP. */
|
247
|
+
rb_define_const(mXMLEncoding, "EUC_JP", INT2NUM(XML_CHAR_ENCODING_EUC_JP));
|
248
|
+
/* 22: pure ASCII. */
|
249
|
+
rb_define_const(mXMLEncoding, "ASCII", INT2NUM(XML_CHAR_ENCODING_ASCII));
|
250
|
+
}
|
@@ -0,0 +1,16 @@
|
|
1
|
+
/* Please see the LICENSE file for copyright and distribution information */
|
2
|
+
|
3
|
+
#ifndef __RXML_ENCODING__
|
4
|
+
#define __RXML_ENCODING__
|
5
|
+
|
6
|
+
extern VALUE mXMLEncoding;
|
7
|
+
|
8
|
+
void rxml_init_encoding();
|
9
|
+
|
10
|
+
VALUE rxml_new_cstr(const xmlChar* xstr, const xmlChar* xencoding);
|
11
|
+
VALUE rxml_new_cstr_len(const xmlChar* xstr, const long length, const xmlChar* xencoding);
|
12
|
+
|
13
|
+
rb_encoding* rxml_xml_encoding_to_rb_encoding(VALUE klass, xmlCharEncoding xmlEncoding);
|
14
|
+
rb_encoding* rxml_figure_encoding(const xmlChar* xencoding);
|
15
|
+
|
16
|
+
#endif
|