nokogiri 1.10.10 → 1.14.3-aarch64-linux
Sign up to get free protection for your applications and to get access to all the features.
Potentially problematic release.
This version of nokogiri might be problematic. Click here for more details.
- checksums.yaml +4 -4
- data/Gemfile +44 -0
- data/LICENSE-DEPENDENCIES.md +1632 -1022
- data/LICENSE.md +1 -1
- data/README.md +185 -96
- data/bin/nokogiri +63 -50
- data/dependencies.yml +33 -66
- data/ext/nokogiri/depend +38 -358
- data/ext/nokogiri/extconf.rb +819 -421
- data/ext/nokogiri/gumbo.c +594 -0
- data/ext/nokogiri/html4_document.c +166 -0
- data/ext/nokogiri/html4_element_description.c +294 -0
- data/ext/nokogiri/html4_entity_lookup.c +37 -0
- data/ext/nokogiri/html4_sax_parser_context.c +114 -0
- data/ext/nokogiri/html4_sax_push_parser.c +95 -0
- data/ext/nokogiri/include/libexslt/exslt.h +108 -0
- data/ext/nokogiri/include/libexslt/exsltconfig.h +70 -0
- data/ext/nokogiri/include/libexslt/exsltexports.h +63 -0
- data/ext/nokogiri/include/libxml2/libxml/HTMLparser.h +306 -0
- data/ext/nokogiri/include/libxml2/libxml/HTMLtree.h +147 -0
- data/ext/nokogiri/include/libxml2/libxml/SAX.h +204 -0
- data/ext/nokogiri/include/libxml2/libxml/SAX2.h +172 -0
- data/ext/nokogiri/include/libxml2/libxml/c14n.h +128 -0
- data/ext/nokogiri/include/libxml2/libxml/catalog.h +182 -0
- data/ext/nokogiri/include/libxml2/libxml/chvalid.h +230 -0
- data/ext/nokogiri/include/libxml2/libxml/debugXML.h +217 -0
- data/ext/nokogiri/include/libxml2/libxml/dict.h +81 -0
- data/ext/nokogiri/include/libxml2/libxml/encoding.h +232 -0
- data/ext/nokogiri/include/libxml2/libxml/entities.h +153 -0
- data/ext/nokogiri/include/libxml2/libxml/globals.h +499 -0
- data/ext/nokogiri/include/libxml2/libxml/hash.h +236 -0
- data/ext/nokogiri/include/libxml2/libxml/list.h +137 -0
- data/ext/nokogiri/include/libxml2/libxml/nanoftp.h +186 -0
- data/ext/nokogiri/include/libxml2/libxml/nanohttp.h +81 -0
- data/ext/nokogiri/include/libxml2/libxml/parser.h +1244 -0
- data/ext/nokogiri/include/libxml2/libxml/parserInternals.h +656 -0
- data/ext/nokogiri/include/libxml2/libxml/pattern.h +100 -0
- data/ext/nokogiri/include/libxml2/libxml/relaxng.h +218 -0
- data/ext/nokogiri/include/libxml2/libxml/schemasInternals.h +958 -0
- data/ext/nokogiri/include/libxml2/libxml/schematron.h +142 -0
- data/ext/nokogiri/include/libxml2/libxml/threads.h +91 -0
- data/ext/nokogiri/include/libxml2/libxml/tree.h +1312 -0
- data/ext/nokogiri/include/libxml2/libxml/uri.h +94 -0
- data/ext/nokogiri/include/libxml2/libxml/valid.h +463 -0
- data/ext/nokogiri/include/libxml2/libxml/xinclude.h +129 -0
- data/ext/nokogiri/include/libxml2/libxml/xlink.h +189 -0
- data/ext/nokogiri/include/libxml2/libxml/xmlIO.h +368 -0
- data/ext/nokogiri/include/libxml2/libxml/xmlautomata.h +146 -0
- data/ext/nokogiri/include/libxml2/libxml/xmlerror.h +947 -0
- data/ext/nokogiri/include/libxml2/libxml/xmlexports.h +77 -0
- data/ext/nokogiri/include/libxml2/libxml/xmlmemory.h +226 -0
- data/ext/nokogiri/include/libxml2/libxml/xmlmodule.h +57 -0
- data/ext/nokogiri/include/libxml2/libxml/xmlreader.h +428 -0
- data/ext/nokogiri/include/libxml2/libxml/xmlregexp.h +222 -0
- data/ext/nokogiri/include/libxml2/libxml/xmlsave.h +88 -0
- data/ext/nokogiri/include/libxml2/libxml/xmlschemas.h +246 -0
- data/ext/nokogiri/include/libxml2/libxml/xmlschemastypes.h +152 -0
- data/ext/nokogiri/include/libxml2/libxml/xmlstring.h +140 -0
- data/ext/nokogiri/include/libxml2/libxml/xmlunicode.h +202 -0
- data/ext/nokogiri/include/libxml2/libxml/xmlversion.h +503 -0
- data/ext/nokogiri/include/libxml2/libxml/xmlwriter.h +488 -0
- data/ext/nokogiri/include/libxml2/libxml/xpath.h +575 -0
- data/ext/nokogiri/include/libxml2/libxml/xpathInternals.h +632 -0
- data/ext/nokogiri/include/libxml2/libxml/xpointer.h +137 -0
- data/ext/nokogiri/include/libxslt/attributes.h +38 -0
- data/ext/nokogiri/include/libxslt/documents.h +93 -0
- data/ext/nokogiri/include/libxslt/extensions.h +262 -0
- data/ext/nokogiri/include/libxslt/extra.h +72 -0
- data/ext/nokogiri/include/libxslt/functions.h +78 -0
- data/ext/nokogiri/include/libxslt/imports.h +75 -0
- data/ext/nokogiri/include/libxslt/keys.h +53 -0
- data/ext/nokogiri/include/libxslt/namespaces.h +68 -0
- data/ext/nokogiri/include/libxslt/numbersInternals.h +73 -0
- data/ext/nokogiri/include/libxslt/pattern.h +84 -0
- data/ext/nokogiri/include/libxslt/preproc.h +43 -0
- data/ext/nokogiri/include/libxslt/security.h +104 -0
- data/ext/nokogiri/include/libxslt/templates.h +77 -0
- data/ext/nokogiri/include/libxslt/transform.h +207 -0
- data/ext/nokogiri/include/libxslt/variables.h +118 -0
- data/ext/nokogiri/include/libxslt/xslt.h +110 -0
- data/ext/nokogiri/include/libxslt/xsltInternals.h +1982 -0
- data/ext/nokogiri/include/libxslt/xsltconfig.h +179 -0
- data/ext/nokogiri/include/libxslt/xsltexports.h +64 -0
- data/ext/nokogiri/include/libxslt/xsltlocale.h +76 -0
- data/ext/nokogiri/include/libxslt/xsltutils.h +310 -0
- data/ext/nokogiri/libxml2_backwards_compat.c +121 -0
- data/ext/nokogiri/nokogiri.c +228 -104
- data/ext/nokogiri/nokogiri.h +204 -90
- data/ext/nokogiri/test_global_handlers.c +40 -0
- data/ext/nokogiri/xml_attr.c +17 -17
- data/ext/nokogiri/xml_attribute_decl.c +22 -22
- data/ext/nokogiri/xml_cdata.c +15 -20
- data/ext/nokogiri/xml_comment.c +19 -26
- data/ext/nokogiri/xml_document.c +306 -225
- data/ext/nokogiri/xml_document_fragment.c +12 -16
- data/ext/nokogiri/xml_dtd.c +64 -58
- data/ext/nokogiri/xml_element_content.c +33 -28
- data/ext/nokogiri/xml_element_decl.c +26 -26
- data/ext/nokogiri/xml_encoding_handler.c +45 -20
- data/ext/nokogiri/xml_entity_decl.c +37 -35
- data/ext/nokogiri/xml_entity_reference.c +16 -18
- data/ext/nokogiri/xml_namespace.c +136 -61
- data/ext/nokogiri/xml_node.c +1344 -672
- data/ext/nokogiri/xml_node_set.c +178 -168
- data/ext/nokogiri/xml_processing_instruction.c +17 -19
- data/ext/nokogiri/xml_reader.c +316 -190
- data/ext/nokogiri/xml_relax_ng.c +52 -30
- data/ext/nokogiri/xml_sax_parser.c +130 -124
- data/ext/nokogiri/xml_sax_parser_context.c +110 -89
- data/ext/nokogiri/xml_sax_push_parser.c +36 -29
- data/ext/nokogiri/xml_schema.c +98 -50
- data/ext/nokogiri/xml_syntax_error.c +42 -21
- data/ext/nokogiri/xml_text.c +14 -18
- data/ext/nokogiri/xml_xpath_context.c +263 -148
- data/ext/nokogiri/xslt_stylesheet.c +271 -178
- data/gumbo-parser/CHANGES.md +63 -0
- data/gumbo-parser/Makefile +111 -0
- data/gumbo-parser/THANKS +27 -0
- data/lib/nokogiri/2.7/nokogiri.so +0 -0
- data/lib/nokogiri/3.0/nokogiri.so +0 -0
- data/lib/nokogiri/3.1/nokogiri.so +0 -0
- data/lib/nokogiri/3.2/nokogiri.so +0 -0
- data/lib/nokogiri/class_resolver.rb +67 -0
- data/lib/nokogiri/css/node.rb +10 -8
- data/lib/nokogiri/css/parser.rb +397 -377
- data/lib/nokogiri/css/parser.y +250 -245
- data/lib/nokogiri/css/parser_extras.rb +54 -49
- data/lib/nokogiri/css/syntax_error.rb +3 -1
- data/lib/nokogiri/css/tokenizer.rb +5 -3
- data/lib/nokogiri/css/tokenizer.rex +3 -2
- data/lib/nokogiri/css/xpath_visitor.rb +223 -94
- data/lib/nokogiri/css.rb +56 -17
- data/lib/nokogiri/decorators/slop.rb +9 -7
- data/lib/nokogiri/encoding_handler.rb +57 -0
- data/lib/nokogiri/extension.rb +32 -0
- data/lib/nokogiri/gumbo.rb +15 -0
- data/lib/nokogiri/html.rb +38 -27
- data/lib/nokogiri/{html → html4}/builder.rb +4 -2
- data/lib/nokogiri/html4/document.rb +214 -0
- data/lib/nokogiri/html4/document_fragment.rb +54 -0
- data/lib/nokogiri/{html → html4}/element_description.rb +3 -1
- data/lib/nokogiri/html4/element_description_defaults.rb +572 -0
- data/lib/nokogiri/html4/encoding_reader.rb +121 -0
- data/lib/nokogiri/{html → html4}/entity_lookup.rb +4 -2
- data/lib/nokogiri/{html → html4}/sax/parser.rb +17 -16
- data/lib/nokogiri/html4/sax/parser_context.rb +20 -0
- data/lib/nokogiri/{html → html4}/sax/push_parser.rb +12 -11
- data/lib/nokogiri/html4.rb +47 -0
- data/lib/nokogiri/html5/document.rb +168 -0
- data/lib/nokogiri/html5/document_fragment.rb +90 -0
- data/lib/nokogiri/html5/node.rb +98 -0
- data/lib/nokogiri/html5.rb +389 -0
- data/lib/nokogiri/jruby/dependencies.rb +3 -0
- data/lib/nokogiri/jruby/nokogiri_jars.rb +43 -0
- data/lib/nokogiri/syntax_error.rb +2 -0
- data/lib/nokogiri/version/constant.rb +6 -0
- data/lib/nokogiri/version/info.rb +223 -0
- data/lib/nokogiri/version.rb +3 -108
- data/lib/nokogiri/xml/attr.rb +55 -3
- data/lib/nokogiri/xml/attribute_decl.rb +3 -1
- data/lib/nokogiri/xml/builder.rb +75 -34
- data/lib/nokogiri/xml/cdata.rb +3 -1
- data/lib/nokogiri/xml/character_data.rb +2 -0
- data/lib/nokogiri/xml/document.rb +312 -126
- data/lib/nokogiri/xml/document_fragment.rb +93 -48
- data/lib/nokogiri/xml/dtd.rb +4 -2
- data/lib/nokogiri/xml/element_content.rb +2 -0
- data/lib/nokogiri/xml/element_decl.rb +3 -1
- data/lib/nokogiri/xml/entity_decl.rb +4 -2
- data/lib/nokogiri/xml/entity_reference.rb +2 -0
- data/lib/nokogiri/xml/namespace.rb +45 -0
- data/lib/nokogiri/xml/node/save_options.rb +15 -8
- data/lib/nokogiri/xml/node.rb +1067 -406
- data/lib/nokogiri/xml/node_set.rb +135 -59
- data/lib/nokogiri/xml/notation.rb +13 -0
- data/lib/nokogiri/xml/parse_options.rb +145 -52
- data/lib/nokogiri/xml/pp/character_data.rb +9 -6
- data/lib/nokogiri/xml/pp/node.rb +27 -26
- data/lib/nokogiri/xml/pp.rb +4 -2
- data/lib/nokogiri/xml/processing_instruction.rb +4 -1
- data/lib/nokogiri/xml/reader.rb +21 -28
- data/lib/nokogiri/xml/relax_ng.rb +8 -2
- data/lib/nokogiri/xml/sax/document.rb +45 -49
- data/lib/nokogiri/xml/sax/parser.rb +39 -36
- data/lib/nokogiri/xml/sax/parser_context.rb +8 -3
- data/lib/nokogiri/xml/sax/push_parser.rb +6 -5
- data/lib/nokogiri/xml/sax.rb +6 -4
- data/lib/nokogiri/xml/schema.rb +19 -9
- data/lib/nokogiri/xml/searchable.rb +112 -72
- data/lib/nokogiri/xml/syntax_error.rb +6 -4
- data/lib/nokogiri/xml/text.rb +2 -0
- data/lib/nokogiri/xml/xpath/syntax_error.rb +4 -2
- data/lib/nokogiri/xml/xpath.rb +15 -4
- data/lib/nokogiri/xml/xpath_context.rb +3 -3
- data/lib/nokogiri/xml.rb +38 -37
- data/lib/nokogiri/xslt/stylesheet.rb +3 -1
- data/lib/nokogiri/xslt.rb +29 -20
- data/lib/nokogiri.rb +48 -72
- data/lib/xsd/xmlparser/nokogiri.rb +29 -25
- metadata +146 -307
- data/ext/nokogiri/html_document.c +0 -170
- data/ext/nokogiri/html_document.h +0 -10
- data/ext/nokogiri/html_element_description.c +0 -279
- data/ext/nokogiri/html_element_description.h +0 -10
- data/ext/nokogiri/html_entity_lookup.c +0 -32
- data/ext/nokogiri/html_entity_lookup.h +0 -8
- data/ext/nokogiri/html_sax_parser_context.c +0 -116
- data/ext/nokogiri/html_sax_parser_context.h +0 -11
- data/ext/nokogiri/html_sax_push_parser.c +0 -87
- data/ext/nokogiri/html_sax_push_parser.h +0 -9
- data/ext/nokogiri/xml_attr.h +0 -9
- data/ext/nokogiri/xml_attribute_decl.h +0 -9
- data/ext/nokogiri/xml_cdata.h +0 -9
- data/ext/nokogiri/xml_comment.h +0 -9
- data/ext/nokogiri/xml_document.h +0 -23
- data/ext/nokogiri/xml_document_fragment.h +0 -10
- data/ext/nokogiri/xml_dtd.h +0 -10
- data/ext/nokogiri/xml_element_content.h +0 -10
- data/ext/nokogiri/xml_element_decl.h +0 -9
- data/ext/nokogiri/xml_encoding_handler.h +0 -8
- data/ext/nokogiri/xml_entity_decl.h +0 -10
- data/ext/nokogiri/xml_entity_reference.h +0 -9
- data/ext/nokogiri/xml_io.c +0 -61
- data/ext/nokogiri/xml_io.h +0 -11
- data/ext/nokogiri/xml_libxml2_hacks.c +0 -112
- data/ext/nokogiri/xml_libxml2_hacks.h +0 -12
- data/ext/nokogiri/xml_namespace.h +0 -14
- data/ext/nokogiri/xml_node.h +0 -13
- data/ext/nokogiri/xml_node_set.h +0 -12
- data/ext/nokogiri/xml_processing_instruction.h +0 -9
- data/ext/nokogiri/xml_reader.h +0 -10
- data/ext/nokogiri/xml_relax_ng.h +0 -9
- data/ext/nokogiri/xml_sax_parser.h +0 -39
- data/ext/nokogiri/xml_sax_parser_context.h +0 -10
- data/ext/nokogiri/xml_sax_push_parser.h +0 -9
- data/ext/nokogiri/xml_schema.h +0 -9
- data/ext/nokogiri/xml_syntax_error.h +0 -13
- data/ext/nokogiri/xml_text.h +0 -9
- data/ext/nokogiri/xml_xpath_context.h +0 -10
- data/ext/nokogiri/xslt_stylesheet.h +0 -14
- data/lib/nokogiri/html/document.rb +0 -335
- data/lib/nokogiri/html/document_fragment.rb +0 -49
- data/lib/nokogiri/html/element_description_defaults.rb +0 -671
- data/lib/nokogiri/html/sax/parser_context.rb +0 -16
- data/patches/libxml2/0001-Revert-Do-not-URI-escape-in-server-side-includes.patch +0 -78
- data/patches/libxml2/0002-Remove-script-macro-support.patch +0 -40
- data/patches/libxml2/0003-Update-entities-to-remove-handling-of-ssi.patch +0 -44
- data/patches/libxml2/0004-libxml2.la-is-in-top_builddir.patch +0 -25
- data/patches/libxml2/0005-Fix-infinite-loop-in-xmlStringLenDecodeEntities.patch +0 -32
- data/ports/archives/libxml2-2.9.10.tar.gz +0 -0
- data/ports/archives/libxslt-1.1.34.tar.gz +0 -0
data/ext/nokogiri/xml_relax_ng.c
CHANGED
@@ -1,10 +1,11 @@
|
|
1
|
-
#include <
|
1
|
+
#include <nokogiri.h>
|
2
2
|
|
3
|
-
|
3
|
+
VALUE cNokogiriXmlRelaxNG;
|
4
|
+
|
5
|
+
static void
|
6
|
+
dealloc(xmlRelaxNGPtr schema)
|
4
7
|
{
|
5
|
-
NOKOGIRI_DEBUG_START(schema);
|
6
8
|
xmlRelaxNGFree(schema);
|
7
|
-
NOKOGIRI_DEBUG_END(schema);
|
8
9
|
}
|
9
10
|
|
10
11
|
/*
|
@@ -13,7 +14,8 @@ static void dealloc(xmlRelaxNGPtr schema)
|
|
13
14
|
*
|
14
15
|
* Validate a Nokogiri::XML::Document against this RelaxNG schema.
|
15
16
|
*/
|
16
|
-
static VALUE
|
17
|
+
static VALUE
|
18
|
+
validate_document(VALUE self, VALUE document)
|
17
19
|
{
|
18
20
|
xmlDocPtr doc;
|
19
21
|
xmlRelaxNGPtr schema;
|
@@ -27,7 +29,7 @@ static VALUE validate_document(VALUE self, VALUE document)
|
|
27
29
|
|
28
30
|
valid_ctxt = xmlRelaxNGNewValidCtxt(schema);
|
29
31
|
|
30
|
-
if(NULL == valid_ctxt) {
|
32
|
+
if (NULL == valid_ctxt) {
|
31
33
|
/* we have a problem */
|
32
34
|
rb_raise(rb_eRuntimeError, "Could not create a validation context");
|
33
35
|
}
|
@@ -53,16 +55,25 @@ static VALUE validate_document(VALUE self, VALUE document)
|
|
53
55
|
*
|
54
56
|
* Create a new RelaxNG from the contents of +string+
|
55
57
|
*/
|
56
|
-
static VALUE
|
58
|
+
static VALUE
|
59
|
+
read_memory(int argc, VALUE *argv, VALUE klass)
|
57
60
|
{
|
58
|
-
|
59
|
-
|
60
|
-
|
61
|
-
);
|
61
|
+
VALUE content;
|
62
|
+
VALUE parse_options;
|
63
|
+
xmlRelaxNGParserCtxtPtr ctx;
|
62
64
|
xmlRelaxNGPtr schema;
|
63
|
-
VALUE errors
|
65
|
+
VALUE errors;
|
64
66
|
VALUE rb_schema;
|
67
|
+
int scanned_args = 0;
|
68
|
+
|
69
|
+
scanned_args = rb_scan_args(argc, argv, "11", &content, &parse_options);
|
70
|
+
if (scanned_args == 1) {
|
71
|
+
parse_options = rb_const_get_at(rb_const_get_at(mNokogiriXml, rb_intern("ParseOptions")), rb_intern("DEFAULT_SCHEMA"));
|
72
|
+
}
|
65
73
|
|
74
|
+
ctx = xmlRelaxNGNewMemParserCtxt((const char *)StringValuePtr(content), (int)RSTRING_LEN(content));
|
75
|
+
|
76
|
+
errors = rb_ary_new();
|
66
77
|
xmlSetStructuredErrorFunc((void *)errors, Nokogiri_error_array_pusher);
|
67
78
|
|
68
79
|
#ifdef HAVE_XMLRELAXNGSETPARSERSTRUCTUREDERRORS
|
@@ -78,18 +89,20 @@ static VALUE read_memory(VALUE klass, VALUE content)
|
|
78
89
|
xmlSetStructuredErrorFunc(NULL, NULL);
|
79
90
|
xmlRelaxNGFreeParserCtxt(ctx);
|
80
91
|
|
81
|
-
if(NULL == schema) {
|
92
|
+
if (NULL == schema) {
|
82
93
|
xmlErrorPtr error = xmlGetLastError();
|
83
|
-
if(error)
|
94
|
+
if (error) {
|
84
95
|
Nokogiri_error_raise(NULL, error);
|
85
|
-
else
|
96
|
+
} else {
|
86
97
|
rb_raise(rb_eRuntimeError, "Could not parse document");
|
98
|
+
}
|
87
99
|
|
88
100
|
return Qnil;
|
89
101
|
}
|
90
102
|
|
91
103
|
rb_schema = Data_Wrap_Struct(klass, 0, dealloc, schema);
|
92
104
|
rb_iv_set(rb_schema, "@errors", errors);
|
105
|
+
rb_iv_set(rb_schema, "@parse_options", parse_options);
|
93
106
|
|
94
107
|
return rb_schema;
|
95
108
|
}
|
@@ -100,18 +113,26 @@ static VALUE read_memory(VALUE klass, VALUE content)
|
|
100
113
|
*
|
101
114
|
* Create a new RelaxNG schema from the Nokogiri::XML::Document +doc+
|
102
115
|
*/
|
103
|
-
static VALUE
|
116
|
+
static VALUE
|
117
|
+
from_document(int argc, VALUE *argv, VALUE klass)
|
104
118
|
{
|
119
|
+
VALUE document;
|
120
|
+
VALUE parse_options;
|
105
121
|
xmlDocPtr doc;
|
106
122
|
xmlRelaxNGParserCtxtPtr ctx;
|
107
123
|
xmlRelaxNGPtr schema;
|
108
124
|
VALUE errors;
|
109
125
|
VALUE rb_schema;
|
126
|
+
int scanned_args = 0;
|
127
|
+
|
128
|
+
scanned_args = rb_scan_args(argc, argv, "11", &document, &parse_options);
|
110
129
|
|
111
130
|
Data_Get_Struct(document, xmlDoc, doc);
|
131
|
+
doc = doc->doc; /* In case someone passes us a node. ugh. */
|
112
132
|
|
113
|
-
|
114
|
-
|
133
|
+
if (scanned_args == 1) {
|
134
|
+
parse_options = rb_const_get_at(rb_const_get_at(mNokogiriXml, rb_intern("ParseOptions")), rb_intern("DEFAULT_SCHEMA"));
|
135
|
+
}
|
115
136
|
|
116
137
|
ctx = xmlRelaxNGNewDocParserCtxt(doc);
|
117
138
|
|
@@ -129,33 +150,34 @@ static VALUE from_document(VALUE klass, VALUE document)
|
|
129
150
|
schema = xmlRelaxNGParse(ctx);
|
130
151
|
|
131
152
|
xmlSetStructuredErrorFunc(NULL, NULL);
|
153
|
+
xmlRelaxNGFreeParserCtxt(ctx);
|
132
154
|
|
133
|
-
if(NULL == schema) {
|
155
|
+
if (NULL == schema) {
|
134
156
|
xmlErrorPtr error = xmlGetLastError();
|
135
|
-
if(error)
|
157
|
+
if (error) {
|
136
158
|
Nokogiri_error_raise(NULL, error);
|
137
|
-
else
|
159
|
+
} else {
|
138
160
|
rb_raise(rb_eRuntimeError, "Could not parse document");
|
161
|
+
}
|
139
162
|
|
140
163
|
return Qnil;
|
141
164
|
}
|
142
165
|
|
143
166
|
rb_schema = Data_Wrap_Struct(klass, 0, dealloc, schema);
|
144
167
|
rb_iv_set(rb_schema, "@errors", errors);
|
168
|
+
rb_iv_set(rb_schema, "@parse_options", parse_options);
|
145
169
|
|
146
170
|
return rb_schema;
|
147
171
|
}
|
148
172
|
|
149
|
-
|
150
|
-
void
|
173
|
+
void
|
174
|
+
noko_init_xml_relax_ng(void)
|
151
175
|
{
|
152
|
-
|
153
|
-
|
154
|
-
VALUE klass = rb_define_class_under(xml, "RelaxNG", cNokogiriXmlSchema);
|
176
|
+
assert(cNokogiriXmlSchema);
|
177
|
+
cNokogiriXmlRelaxNG = rb_define_class_under(mNokogiriXml, "RelaxNG", cNokogiriXmlSchema);
|
155
178
|
|
156
|
-
cNokogiriXmlRelaxNG
|
179
|
+
rb_define_singleton_method(cNokogiriXmlRelaxNG, "read_memory", read_memory, -1);
|
180
|
+
rb_define_singleton_method(cNokogiriXmlRelaxNG, "from_document", from_document, -1);
|
157
181
|
|
158
|
-
|
159
|
-
rb_define_singleton_method(klass, "from_document", from_document, 1);
|
160
|
-
rb_define_private_method(klass, "validate_document", validate_document, 1);
|
182
|
+
rb_define_private_method(cNokogiriXmlRelaxNG, "validate_document", validate_document, 1);
|
161
183
|
}
|
@@ -1,23 +1,23 @@
|
|
1
|
-
#include <
|
1
|
+
#include <nokogiri.h>
|
2
2
|
|
3
|
-
|
4
|
-
void vasprintf_free (void *p);
|
3
|
+
VALUE cNokogiriXmlSaxParser ;
|
5
4
|
|
6
5
|
static ID id_start_document, id_end_document, id_start_element, id_end_element;
|
7
6
|
static ID id_start_element_namespace, id_end_element_namespace;
|
8
7
|
static ID id_comment, id_characters, id_xmldecl, id_error, id_warning;
|
9
|
-
static ID id_cdata_block
|
8
|
+
static ID id_cdata_block;
|
10
9
|
static ID id_processing_instruction;
|
11
10
|
|
12
|
-
static void
|
11
|
+
static void
|
12
|
+
start_document(void *ctx)
|
13
13
|
{
|
14
14
|
VALUE self = NOKOGIRI_SAX_SELF(ctx);
|
15
15
|
VALUE doc = rb_iv_get(self, "@document");
|
16
16
|
|
17
17
|
xmlParserCtxtPtr ctxt = NOKOGIRI_SAX_CTXT(ctx);
|
18
18
|
|
19
|
-
if(NULL != ctxt && ctxt->html != 1) {
|
20
|
-
if(ctxt->standalone != -1) {
|
19
|
+
if (NULL != ctxt && ctxt->html != 1) {
|
20
|
+
if (ctxt->standalone != -1) { /* -1 means there was no declaration */
|
21
21
|
VALUE encoding = Qnil ;
|
22
22
|
VALUE standalone = Qnil;
|
23
23
|
VALUE version;
|
@@ -29,8 +29,7 @@ static void start_document(void * ctx)
|
|
29
29
|
|
30
30
|
version = ctxt->version ? NOKOGIRI_STR_NEW2(ctxt->version) : Qnil;
|
31
31
|
|
32
|
-
switch(ctxt->standalone)
|
33
|
-
{
|
32
|
+
switch (ctxt->standalone) {
|
34
33
|
case 0:
|
35
34
|
standalone = NOKOGIRI_STR_NEW2("no");
|
36
35
|
break;
|
@@ -46,138 +45,140 @@ static void start_document(void * ctx)
|
|
46
45
|
rb_funcall(doc, id_start_document, 0);
|
47
46
|
}
|
48
47
|
|
49
|
-
static void
|
48
|
+
static void
|
49
|
+
end_document(void *ctx)
|
50
50
|
{
|
51
51
|
VALUE self = NOKOGIRI_SAX_SELF(ctx);
|
52
52
|
VALUE doc = rb_iv_get(self, "@document");
|
53
53
|
rb_funcall(doc, id_end_document, 0);
|
54
54
|
}
|
55
55
|
|
56
|
-
static void
|
56
|
+
static void
|
57
|
+
start_element(void *ctx, const xmlChar *name, const xmlChar **atts)
|
57
58
|
{
|
58
59
|
VALUE self = NOKOGIRI_SAX_SELF(ctx);
|
59
60
|
VALUE doc = rb_iv_get(self, "@document");
|
60
61
|
VALUE attributes = rb_ary_new();
|
61
|
-
const xmlChar *
|
62
|
+
const xmlChar *attr;
|
62
63
|
int i = 0;
|
63
|
-
if(atts) {
|
64
|
-
while((attr = atts[i]) != NULL) {
|
65
|
-
const xmlChar *
|
64
|
+
if (atts) {
|
65
|
+
while ((attr = atts[i]) != NULL) {
|
66
|
+
const xmlChar *val = atts[i + 1];
|
66
67
|
VALUE value = val != NULL ? NOKOGIRI_STR_NEW2(val) : Qnil;
|
67
68
|
rb_ary_push(attributes, rb_ary_new3(2, NOKOGIRI_STR_NEW2(attr), value));
|
68
|
-
i+=2;
|
69
|
+
i += 2;
|
69
70
|
}
|
70
71
|
}
|
71
72
|
|
72
|
-
rb_funcall(
|
73
|
-
|
74
|
-
|
75
|
-
|
76
|
-
|
77
|
-
|
73
|
+
rb_funcall(doc,
|
74
|
+
id_start_element,
|
75
|
+
2,
|
76
|
+
NOKOGIRI_STR_NEW2(name),
|
77
|
+
attributes
|
78
|
+
);
|
78
79
|
}
|
79
80
|
|
80
|
-
static void
|
81
|
+
static void
|
82
|
+
end_element(void *ctx, const xmlChar *name)
|
81
83
|
{
|
82
84
|
VALUE self = NOKOGIRI_SAX_SELF(ctx);
|
83
85
|
VALUE doc = rb_iv_get(self, "@document");
|
84
86
|
rb_funcall(doc, id_end_element, 1, NOKOGIRI_STR_NEW2(name));
|
85
87
|
}
|
86
88
|
|
87
|
-
static VALUE
|
88
|
-
|
89
|
-
int nb_attributes,
|
90
|
-
const xmlChar ** attributes)
|
89
|
+
static VALUE
|
90
|
+
attributes_as_array(int attributes_len, const xmlChar **c_attributes)
|
91
91
|
{
|
92
|
-
VALUE
|
92
|
+
VALUE rb_array = rb_ary_new2((long)attributes_len);
|
93
|
+
VALUE cNokogiriXmlSaxParserAttribute;
|
93
94
|
|
94
|
-
|
95
|
-
if (
|
95
|
+
cNokogiriXmlSaxParserAttribute = rb_const_get_at(cNokogiriXmlSaxParser, rb_intern("Attribute"));
|
96
|
+
if (c_attributes) {
|
96
97
|
/* Each attribute is an array of [localname, prefix, URI, value, end] */
|
97
98
|
int i;
|
98
|
-
for (i = 0; i <
|
99
|
-
VALUE
|
99
|
+
for (i = 0; i < attributes_len * 5; i += 5) {
|
100
|
+
VALUE rb_constructor_args[4], rb_attribute;
|
100
101
|
|
101
|
-
|
102
|
-
|
103
|
-
|
102
|
+
rb_constructor_args[0] = RBSTR_OR_QNIL(c_attributes[i + 0]); /* localname */
|
103
|
+
rb_constructor_args[1] = RBSTR_OR_QNIL(c_attributes[i + 1]); /* prefix */
|
104
|
+
rb_constructor_args[2] = RBSTR_OR_QNIL(c_attributes[i + 2]); /* URI */
|
104
105
|
|
105
106
|
/* value */
|
106
|
-
|
107
|
-
|
107
|
+
rb_constructor_args[3] = NOKOGIRI_STR_NEW((const char *)c_attributes[i + 3],
|
108
|
+
(c_attributes[i + 4] - c_attributes[i + 3]));
|
108
109
|
|
109
|
-
|
110
|
-
rb_ary_push(
|
110
|
+
rb_attribute = rb_class_new_instance(4, rb_constructor_args, cNokogiriXmlSaxParserAttribute);
|
111
|
+
rb_ary_push(rb_array, rb_attribute);
|
111
112
|
}
|
112
113
|
}
|
113
114
|
|
114
|
-
return
|
115
|
+
return rb_array;
|
115
116
|
}
|
116
117
|
|
117
118
|
static void
|
118
|
-
start_element_ns
|
119
|
-
void *
|
120
|
-
const xmlChar *
|
121
|
-
const xmlChar *
|
122
|
-
const xmlChar *
|
119
|
+
start_element_ns(
|
120
|
+
void *ctx,
|
121
|
+
const xmlChar *localname,
|
122
|
+
const xmlChar *prefix,
|
123
|
+
const xmlChar *uri,
|
123
124
|
int nb_namespaces,
|
124
|
-
const xmlChar **
|
125
|
+
const xmlChar **namespaces,
|
125
126
|
int nb_attributes,
|
126
127
|
int nb_defaulted,
|
127
|
-
const xmlChar **
|
128
|
+
const xmlChar **attributes)
|
128
129
|
{
|
129
130
|
VALUE self = NOKOGIRI_SAX_SELF(ctx);
|
130
131
|
VALUE doc = rb_iv_get(self, "@document");
|
131
132
|
|
132
|
-
VALUE
|
133
|
+
VALUE attribute_ary = attributes_as_array(nb_attributes, attributes);
|
133
134
|
|
134
135
|
VALUE ns_list = rb_ary_new2((long)nb_namespaces);
|
135
136
|
|
136
137
|
if (namespaces) {
|
137
138
|
int i;
|
138
|
-
for (i = 0; i < nb_namespaces * 2; i += 2)
|
139
|
-
{
|
139
|
+
for (i = 0; i < nb_namespaces * 2; i += 2) {
|
140
140
|
rb_ary_push(ns_list,
|
141
|
-
|
142
|
-
|
143
|
-
|
144
|
-
|
145
|
-
|
141
|
+
rb_ary_new3((long)2,
|
142
|
+
RBSTR_OR_QNIL(namespaces[i + 0]),
|
143
|
+
RBSTR_OR_QNIL(namespaces[i + 1])
|
144
|
+
)
|
145
|
+
);
|
146
146
|
}
|
147
147
|
}
|
148
148
|
|
149
|
-
rb_funcall(
|
150
|
-
|
151
|
-
|
152
|
-
|
153
|
-
|
154
|
-
|
155
|
-
|
156
|
-
|
157
|
-
|
149
|
+
rb_funcall(doc,
|
150
|
+
id_start_element_namespace,
|
151
|
+
5,
|
152
|
+
NOKOGIRI_STR_NEW2(localname),
|
153
|
+
attribute_ary,
|
154
|
+
RBSTR_OR_QNIL(prefix),
|
155
|
+
RBSTR_OR_QNIL(uri),
|
156
|
+
ns_list
|
157
|
+
);
|
158
158
|
}
|
159
159
|
|
160
160
|
/**
|
161
161
|
* end_element_ns was borrowed heavily from libxml-ruby.
|
162
162
|
*/
|
163
163
|
static void
|
164
|
-
end_element_ns
|
165
|
-
void *
|
166
|
-
const xmlChar *
|
167
|
-
const xmlChar *
|
168
|
-
const xmlChar *
|
164
|
+
end_element_ns(
|
165
|
+
void *ctx,
|
166
|
+
const xmlChar *localname,
|
167
|
+
const xmlChar *prefix,
|
168
|
+
const xmlChar *uri)
|
169
169
|
{
|
170
170
|
VALUE self = NOKOGIRI_SAX_SELF(ctx);
|
171
171
|
VALUE doc = rb_iv_get(self, "@document");
|
172
172
|
|
173
173
|
rb_funcall(doc, id_end_element_namespace, 3,
|
174
|
-
|
175
|
-
|
176
|
-
|
177
|
-
|
174
|
+
NOKOGIRI_STR_NEW2(localname),
|
175
|
+
RBSTR_OR_QNIL(prefix),
|
176
|
+
RBSTR_OR_QNIL(uri)
|
177
|
+
);
|
178
178
|
}
|
179
179
|
|
180
|
-
static void
|
180
|
+
static void
|
181
|
+
characters_func(void *ctx, const xmlChar *ch, int len)
|
181
182
|
{
|
182
183
|
VALUE self = NOKOGIRI_SAX_SELF(ctx);
|
183
184
|
VALUE doc = rb_iv_get(self, "@document");
|
@@ -185,7 +186,8 @@ static void characters_func(void * ctx, const xmlChar * ch, int len)
|
|
185
186
|
rb_funcall(doc, id_characters, 1, str);
|
186
187
|
}
|
187
188
|
|
188
|
-
static void
|
189
|
+
static void
|
190
|
+
comment_func(void *ctx, const xmlChar *value)
|
189
191
|
{
|
190
192
|
VALUE self = NOKOGIRI_SAX_SELF(ctx);
|
191
193
|
VALUE doc = rb_iv_get(self, "@document");
|
@@ -193,41 +195,52 @@ static void comment_func(void * ctx, const xmlChar * value)
|
|
193
195
|
rb_funcall(doc, id_comment, 1, str);
|
194
196
|
}
|
195
197
|
|
196
|
-
|
198
|
+
PRINTFLIKE_DECL(2, 3)
|
199
|
+
static void
|
200
|
+
warning_func(void *ctx, const char *msg, ...)
|
197
201
|
{
|
198
202
|
VALUE self = NOKOGIRI_SAX_SELF(ctx);
|
199
203
|
VALUE doc = rb_iv_get(self, "@document");
|
200
|
-
|
201
|
-
VALUE ruby_message;
|
204
|
+
VALUE rb_message;
|
202
205
|
|
206
|
+
#ifdef TRUFFLERUBY_NOKOGIRI_SYSTEM_LIBRARIES
|
207
|
+
/* It is not currently possible to pass var args from native
|
208
|
+
functions to sulong, so we work around the issue here. */
|
209
|
+
rb_message = rb_sprintf("warning_func: %s", msg);
|
210
|
+
#else
|
203
211
|
va_list args;
|
204
212
|
va_start(args, msg);
|
205
|
-
|
213
|
+
rb_message = rb_vsprintf(msg, args);
|
206
214
|
va_end(args);
|
215
|
+
#endif
|
207
216
|
|
208
|
-
|
209
|
-
vasprintf_free(message);
|
210
|
-
rb_funcall(doc, id_warning, 1, ruby_message);
|
217
|
+
rb_funcall(doc, id_warning, 1, rb_message);
|
211
218
|
}
|
212
219
|
|
213
|
-
|
220
|
+
PRINTFLIKE_DECL(2, 3)
|
221
|
+
static void
|
222
|
+
error_func(void *ctx, const char *msg, ...)
|
214
223
|
{
|
215
224
|
VALUE self = NOKOGIRI_SAX_SELF(ctx);
|
216
225
|
VALUE doc = rb_iv_get(self, "@document");
|
217
|
-
|
218
|
-
VALUE ruby_message;
|
226
|
+
VALUE rb_message;
|
219
227
|
|
228
|
+
#ifdef TRUFFLERUBY_NOKOGIRI_SYSTEM_LIBRARIES
|
229
|
+
/* It is not currently possible to pass var args from native
|
230
|
+
functions to sulong, so we work around the issue here. */
|
231
|
+
rb_message = rb_sprintf("error_func: %s", msg);
|
232
|
+
#else
|
220
233
|
va_list args;
|
221
234
|
va_start(args, msg);
|
222
|
-
|
235
|
+
rb_message = rb_vsprintf(msg, args);
|
223
236
|
va_end(args);
|
237
|
+
#endif
|
224
238
|
|
225
|
-
|
226
|
-
vasprintf_free(message);
|
227
|
-
rb_funcall(doc, id_error, 1, ruby_message);
|
239
|
+
rb_funcall(doc, id_error, 1, rb_message);
|
228
240
|
}
|
229
241
|
|
230
|
-
static void
|
242
|
+
static void
|
243
|
+
cdata_block(void *ctx, const xmlChar *value, int len)
|
231
244
|
{
|
232
245
|
VALUE self = NOKOGIRI_SAX_SELF(ctx);
|
233
246
|
VALUE doc = rb_iv_get(self, "@document");
|
@@ -235,7 +248,8 @@ static void cdata_block(void * ctx, const xmlChar * value, int len)
|
|
235
248
|
rb_funcall(doc, id_cdata_block, 1, string);
|
236
249
|
}
|
237
250
|
|
238
|
-
static void
|
251
|
+
static void
|
252
|
+
processing_instruction(void *ctx, const xmlChar *name, const xmlChar *content)
|
239
253
|
{
|
240
254
|
VALUE rb_content;
|
241
255
|
VALUE self = NOKOGIRI_SAX_SELF(ctx);
|
@@ -243,26 +257,24 @@ static void processing_instruction(void * ctx, const xmlChar * name, const xmlCh
|
|
243
257
|
|
244
258
|
rb_content = content ? NOKOGIRI_STR_NEW2(content) : Qnil;
|
245
259
|
|
246
|
-
rb_funcall(
|
247
|
-
|
248
|
-
|
249
|
-
|
250
|
-
|
251
|
-
|
260
|
+
rb_funcall(doc,
|
261
|
+
id_processing_instruction,
|
262
|
+
2,
|
263
|
+
NOKOGIRI_STR_NEW2(name),
|
264
|
+
rb_content
|
265
|
+
);
|
252
266
|
}
|
253
267
|
|
254
|
-
static void
|
268
|
+
static void
|
269
|
+
deallocate(xmlSAXHandlerPtr handler)
|
255
270
|
{
|
256
|
-
|
257
|
-
free(handler);
|
258
|
-
NOKOGIRI_DEBUG_END(handler);
|
271
|
+
ruby_xfree(handler);
|
259
272
|
}
|
260
273
|
|
261
|
-
static VALUE
|
274
|
+
static VALUE
|
275
|
+
allocate(VALUE klass)
|
262
276
|
{
|
263
|
-
xmlSAXHandlerPtr handler =
|
264
|
-
|
265
|
-
xmlSetStructuredErrorFunc(NULL, NULL);
|
277
|
+
xmlSAXHandlerPtr handler = ruby_xcalloc((size_t)1, sizeof(xmlSAXHandler));
|
266
278
|
|
267
279
|
handler->startDocument = start_document;
|
268
280
|
handler->endDocument = end_document;
|
@@ -281,29 +293,23 @@ static VALUE allocate(VALUE klass)
|
|
281
293
|
return Data_Wrap_Struct(klass, NULL, deallocate, handler);
|
282
294
|
}
|
283
295
|
|
284
|
-
|
285
|
-
void
|
296
|
+
void
|
297
|
+
noko_init_xml_sax_parser(void)
|
286
298
|
{
|
287
|
-
|
288
|
-
VALUE xml = rb_define_module_under(nokogiri, "XML");
|
289
|
-
VALUE sax = rb_define_module_under(xml, "SAX");
|
290
|
-
VALUE klass = rb_define_class_under(sax, "Parser", rb_cObject);
|
291
|
-
|
292
|
-
cNokogiriXmlSaxParser = klass;
|
299
|
+
cNokogiriXmlSaxParser = rb_define_class_under(mNokogiriXmlSax, "Parser", rb_cObject);
|
293
300
|
|
294
|
-
rb_define_alloc_func(
|
301
|
+
rb_define_alloc_func(cNokogiriXmlSaxParser, allocate);
|
295
302
|
|
296
303
|
id_start_document = rb_intern("start_document");
|
297
|
-
id_end_document
|
298
|
-
id_start_element
|
299
|
-
id_end_element
|
300
|
-
id_comment
|
301
|
-
id_characters
|
302
|
-
id_xmldecl
|
303
|
-
id_error
|
304
|
-
id_warning
|
305
|
-
id_cdata_block
|
306
|
-
id_cAttribute = rb_intern("Attribute");
|
304
|
+
id_end_document = rb_intern("end_document");
|
305
|
+
id_start_element = rb_intern("start_element");
|
306
|
+
id_end_element = rb_intern("end_element");
|
307
|
+
id_comment = rb_intern("comment");
|
308
|
+
id_characters = rb_intern("characters");
|
309
|
+
id_xmldecl = rb_intern("xmldecl");
|
310
|
+
id_error = rb_intern("error");
|
311
|
+
id_warning = rb_intern("warning");
|
312
|
+
id_cdata_block = rb_intern("cdata_block");
|
307
313
|
id_start_element_namespace = rb_intern("start_element_namespace");
|
308
314
|
id_end_element_namespace = rb_intern("end_element_namespace");
|
309
315
|
id_processing_instruction = rb_intern("processing_instruction");
|