Nokogiri_precompiled_aarch64_dedshit 1.14.5
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +7 -0
- data/Gemfile +44 -0
- data/LICENSE-DEPENDENCIES.md +2224 -0
- data/LICENSE.md +9 -0
- data/README.md +287 -0
- data/bin/nokogiri +131 -0
- data/dependencies.yml +41 -0
- data/ext/java/nokogiri/Html4Document.java +157 -0
- data/ext/java/nokogiri/Html4ElementDescription.java +133 -0
- data/ext/java/nokogiri/Html4EntityLookup.java +63 -0
- data/ext/java/nokogiri/Html4SaxParserContext.java +289 -0
- data/ext/java/nokogiri/Html4SaxPushParser.java +213 -0
- data/ext/java/nokogiri/NokogiriService.java +613 -0
- data/ext/java/nokogiri/XmlAttr.java +154 -0
- data/ext/java/nokogiri/XmlAttributeDecl.java +119 -0
- data/ext/java/nokogiri/XmlCdata.java +60 -0
- data/ext/java/nokogiri/XmlComment.java +77 -0
- data/ext/java/nokogiri/XmlDocument.java +705 -0
- data/ext/java/nokogiri/XmlDocumentFragment.java +163 -0
- data/ext/java/nokogiri/XmlDtd.java +516 -0
- data/ext/java/nokogiri/XmlElement.java +44 -0
- data/ext/java/nokogiri/XmlElementContent.java +412 -0
- data/ext/java/nokogiri/XmlElementDecl.java +148 -0
- data/ext/java/nokogiri/XmlEntityDecl.java +151 -0
- data/ext/java/nokogiri/XmlEntityReference.java +79 -0
- data/ext/java/nokogiri/XmlNamespace.java +193 -0
- data/ext/java/nokogiri/XmlNode.java +1938 -0
- data/ext/java/nokogiri/XmlNodeSet.java +463 -0
- data/ext/java/nokogiri/XmlProcessingInstruction.java +79 -0
- data/ext/java/nokogiri/XmlReader.java +615 -0
- data/ext/java/nokogiri/XmlRelaxng.java +133 -0
- data/ext/java/nokogiri/XmlSaxParserContext.java +329 -0
- data/ext/java/nokogiri/XmlSaxPushParser.java +288 -0
- data/ext/java/nokogiri/XmlSchema.java +423 -0
- data/ext/java/nokogiri/XmlSyntaxError.java +137 -0
- data/ext/java/nokogiri/XmlText.java +90 -0
- data/ext/java/nokogiri/XmlXpathContext.java +305 -0
- data/ext/java/nokogiri/XsltStylesheet.java +368 -0
- data/ext/java/nokogiri/internals/ClosedStreamException.java +13 -0
- data/ext/java/nokogiri/internals/HtmlDomParserContext.java +252 -0
- data/ext/java/nokogiri/internals/IgnoreSchemaErrorsErrorHandler.java +27 -0
- data/ext/java/nokogiri/internals/NokogiriBlockingQueueInputStream.java +178 -0
- data/ext/java/nokogiri/internals/NokogiriDomParser.java +99 -0
- data/ext/java/nokogiri/internals/NokogiriEntityResolver.java +140 -0
- data/ext/java/nokogiri/internals/NokogiriErrorHandler.java +65 -0
- data/ext/java/nokogiri/internals/NokogiriHandler.java +339 -0
- data/ext/java/nokogiri/internals/NokogiriHelpers.java +817 -0
- data/ext/java/nokogiri/internals/NokogiriNamespaceCache.java +228 -0
- data/ext/java/nokogiri/internals/NokogiriNamespaceContext.java +110 -0
- data/ext/java/nokogiri/internals/NokogiriNonStrictErrorHandler.java +86 -0
- data/ext/java/nokogiri/internals/NokogiriNonStrictErrorHandler4NekoHtml.java +107 -0
- data/ext/java/nokogiri/internals/NokogiriStrictErrorHandler.java +62 -0
- data/ext/java/nokogiri/internals/NokogiriXPathFunction.java +165 -0
- data/ext/java/nokogiri/internals/NokogiriXPathFunctionResolver.java +50 -0
- data/ext/java/nokogiri/internals/NokogiriXPathVariableResolver.java +37 -0
- data/ext/java/nokogiri/internals/NokogiriXsltErrorListener.java +70 -0
- data/ext/java/nokogiri/internals/ParserContext.java +262 -0
- data/ext/java/nokogiri/internals/ReaderNode.java +564 -0
- data/ext/java/nokogiri/internals/SaveContextVisitor.java +865 -0
- data/ext/java/nokogiri/internals/SchemaErrorHandler.java +50 -0
- data/ext/java/nokogiri/internals/XalanDTMManagerPatch.java +174 -0
- data/ext/java/nokogiri/internals/XmlDeclHandler.java +11 -0
- data/ext/java/nokogiri/internals/XmlDomParserContext.java +265 -0
- data/ext/java/nokogiri/internals/XmlSaxParser.java +40 -0
- data/ext/java/nokogiri/internals/c14n/AttrCompare.java +122 -0
- data/ext/java/nokogiri/internals/c14n/C14nHelper.java +178 -0
- data/ext/java/nokogiri/internals/c14n/CanonicalFilter.java +43 -0
- data/ext/java/nokogiri/internals/c14n/CanonicalizationException.java +106 -0
- data/ext/java/nokogiri/internals/c14n/Canonicalizer.java +278 -0
- data/ext/java/nokogiri/internals/c14n/Canonicalizer11.java +664 -0
- data/ext/java/nokogiri/internals/c14n/Canonicalizer11_OmitComments.java +45 -0
- data/ext/java/nokogiri/internals/c14n/Canonicalizer11_WithComments.java +45 -0
- data/ext/java/nokogiri/internals/c14n/Canonicalizer20010315.java +388 -0
- data/ext/java/nokogiri/internals/c14n/Canonicalizer20010315Excl.java +308 -0
- data/ext/java/nokogiri/internals/c14n/Canonicalizer20010315ExclOmitComments.java +47 -0
- data/ext/java/nokogiri/internals/c14n/Canonicalizer20010315ExclWithComments.java +51 -0
- data/ext/java/nokogiri/internals/c14n/Canonicalizer20010315OmitComments.java +51 -0
- data/ext/java/nokogiri/internals/c14n/Canonicalizer20010315WithComments.java +50 -0
- data/ext/java/nokogiri/internals/c14n/CanonicalizerBase.java +660 -0
- data/ext/java/nokogiri/internals/c14n/CanonicalizerPhysical.java +194 -0
- data/ext/java/nokogiri/internals/c14n/CanonicalizerSpi.java +77 -0
- data/ext/java/nokogiri/internals/c14n/Constants.java +45 -0
- data/ext/java/nokogiri/internals/c14n/ElementProxy.java +325 -0
- data/ext/java/nokogiri/internals/c14n/HelperNodeList.java +106 -0
- data/ext/java/nokogiri/internals/c14n/IgnoreAllErrorHandler.java +86 -0
- data/ext/java/nokogiri/internals/c14n/InclusiveNamespaces.java +181 -0
- data/ext/java/nokogiri/internals/c14n/InvalidCanonicalizerException.java +87 -0
- data/ext/java/nokogiri/internals/c14n/NameSpaceSymbTable.java +452 -0
- data/ext/java/nokogiri/internals/c14n/NodeFilter.java +52 -0
- data/ext/java/nokogiri/internals/c14n/UtfHelpper.java +190 -0
- data/ext/java/nokogiri/internals/c14n/XMLUtils.java +540 -0
- data/ext/java/nokogiri/internals/dom2dtm/DOM2DTM.java +1712 -0
- data/ext/java/nokogiri/internals/dom2dtm/DOM2DTMdefaultNamespaceDeclarationNode.java +737 -0
- data/ext/nokogiri/depend +38 -0
- data/ext/nokogiri/extconf.rb +1086 -0
- data/ext/nokogiri/gumbo.c +594 -0
- data/ext/nokogiri/html4_document.c +167 -0
- data/ext/nokogiri/html4_element_description.c +294 -0
- data/ext/nokogiri/html4_entity_lookup.c +37 -0
- data/ext/nokogiri/html4_sax_parser_context.c +116 -0
- data/ext/nokogiri/html4_sax_push_parser.c +95 -0
- data/ext/nokogiri/libxml2_backwards_compat.c +121 -0
- data/ext/nokogiri/nokogiri.c +265 -0
- data/ext/nokogiri/nokogiri.h +235 -0
- data/ext/nokogiri/test_global_handlers.c +42 -0
- data/ext/nokogiri/xml_attr.c +103 -0
- data/ext/nokogiri/xml_attribute_decl.c +70 -0
- data/ext/nokogiri/xml_cdata.c +57 -0
- data/ext/nokogiri/xml_comment.c +62 -0
- data/ext/nokogiri/xml_document.c +689 -0
- data/ext/nokogiri/xml_document_fragment.c +44 -0
- data/ext/nokogiri/xml_dtd.c +210 -0
- data/ext/nokogiri/xml_element_content.c +128 -0
- data/ext/nokogiri/xml_element_decl.c +69 -0
- data/ext/nokogiri/xml_encoding_handler.c +104 -0
- data/ext/nokogiri/xml_entity_decl.c +112 -0
- data/ext/nokogiri/xml_entity_reference.c +50 -0
- data/ext/nokogiri/xml_namespace.c +186 -0
- data/ext/nokogiri/xml_node.c +2426 -0
- data/ext/nokogiri/xml_node_set.c +496 -0
- data/ext/nokogiri/xml_processing_instruction.c +54 -0
- data/ext/nokogiri/xml_reader.c +794 -0
- data/ext/nokogiri/xml_relax_ng.c +164 -0
- data/ext/nokogiri/xml_sax_parser.c +316 -0
- data/ext/nokogiri/xml_sax_parser_context.c +283 -0
- data/ext/nokogiri/xml_sax_push_parser.c +166 -0
- data/ext/nokogiri/xml_schema.c +260 -0
- data/ext/nokogiri/xml_syntax_error.c +85 -0
- data/ext/nokogiri/xml_text.c +48 -0
- data/ext/nokogiri/xml_xpath_context.c +415 -0
- data/ext/nokogiri/xslt_stylesheet.c +363 -0
- data/gumbo-parser/CHANGES.md +63 -0
- data/gumbo-parser/Makefile +111 -0
- data/gumbo-parser/THANKS +27 -0
- data/gumbo-parser/src/Makefile +34 -0
- data/gumbo-parser/src/README.md +41 -0
- data/gumbo-parser/src/ascii.c +75 -0
- data/gumbo-parser/src/ascii.h +115 -0
- data/gumbo-parser/src/attribute.c +42 -0
- data/gumbo-parser/src/attribute.h +17 -0
- data/gumbo-parser/src/char_ref.c +22225 -0
- data/gumbo-parser/src/char_ref.h +29 -0
- data/gumbo-parser/src/char_ref.rl +2154 -0
- data/gumbo-parser/src/error.c +626 -0
- data/gumbo-parser/src/error.h +148 -0
- data/gumbo-parser/src/foreign_attrs.c +104 -0
- data/gumbo-parser/src/foreign_attrs.gperf +27 -0
- data/gumbo-parser/src/insertion_mode.h +33 -0
- data/gumbo-parser/src/macros.h +91 -0
- data/gumbo-parser/src/nokogiri_gumbo.h +944 -0
- data/gumbo-parser/src/parser.c +4878 -0
- data/gumbo-parser/src/parser.h +41 -0
- data/gumbo-parser/src/replacement.h +33 -0
- data/gumbo-parser/src/string_buffer.c +103 -0
- data/gumbo-parser/src/string_buffer.h +68 -0
- data/gumbo-parser/src/string_piece.c +48 -0
- data/gumbo-parser/src/svg_attrs.c +174 -0
- data/gumbo-parser/src/svg_attrs.gperf +77 -0
- data/gumbo-parser/src/svg_tags.c +137 -0
- data/gumbo-parser/src/svg_tags.gperf +55 -0
- data/gumbo-parser/src/tag.c +223 -0
- data/gumbo-parser/src/tag_lookup.c +382 -0
- data/gumbo-parser/src/tag_lookup.gperf +170 -0
- data/gumbo-parser/src/tag_lookup.h +13 -0
- data/gumbo-parser/src/token_buffer.c +79 -0
- data/gumbo-parser/src/token_buffer.h +71 -0
- data/gumbo-parser/src/token_type.h +17 -0
- data/gumbo-parser/src/tokenizer.c +3463 -0
- data/gumbo-parser/src/tokenizer.h +112 -0
- data/gumbo-parser/src/tokenizer_states.h +339 -0
- data/gumbo-parser/src/utf8.c +245 -0
- data/gumbo-parser/src/utf8.h +164 -0
- data/gumbo-parser/src/util.c +66 -0
- data/gumbo-parser/src/util.h +34 -0
- data/gumbo-parser/src/vector.c +111 -0
- data/gumbo-parser/src/vector.h +45 -0
- data/lib/nokogiri/class_resolver.rb +67 -0
- data/lib/nokogiri/css/node.rb +54 -0
- data/lib/nokogiri/css/parser.rb +770 -0
- data/lib/nokogiri/css/parser.y +277 -0
- data/lib/nokogiri/css/parser_extras.rb +96 -0
- data/lib/nokogiri/css/syntax_error.rb +9 -0
- data/lib/nokogiri/css/tokenizer.rb +155 -0
- data/lib/nokogiri/css/tokenizer.rex +56 -0
- data/lib/nokogiri/css/xpath_visitor.rb +359 -0
- data/lib/nokogiri/css.rb +66 -0
- data/lib/nokogiri/decorators/slop.rb +44 -0
- data/lib/nokogiri/encoding_handler.rb +57 -0
- data/lib/nokogiri/extension.rb +32 -0
- data/lib/nokogiri/gumbo.rb +15 -0
- data/lib/nokogiri/html.rb +48 -0
- data/lib/nokogiri/html4/builder.rb +37 -0
- data/lib/nokogiri/html4/document.rb +214 -0
- data/lib/nokogiri/html4/document_fragment.rb +54 -0
- data/lib/nokogiri/html4/element_description.rb +25 -0
- data/lib/nokogiri/html4/element_description_defaults.rb +572 -0
- data/lib/nokogiri/html4/encoding_reader.rb +121 -0
- data/lib/nokogiri/html4/entity_lookup.rb +15 -0
- data/lib/nokogiri/html4/sax/parser.rb +63 -0
- data/lib/nokogiri/html4/sax/parser_context.rb +20 -0
- data/lib/nokogiri/html4/sax/push_parser.rb +37 -0
- data/lib/nokogiri/html4.rb +47 -0
- data/lib/nokogiri/html5/document.rb +168 -0
- data/lib/nokogiri/html5/document_fragment.rb +90 -0
- data/lib/nokogiri/html5/node.rb +98 -0
- data/lib/nokogiri/html5.rb +389 -0
- data/lib/nokogiri/jruby/dependencies.rb +3 -0
- data/lib/nokogiri/jruby/isorelax/isorelax/20030108/isorelax-20030108.jar +0 -0
- data/lib/nokogiri/jruby/net/sf/saxon/Saxon-HE/9.6.0-4/Saxon-HE-9.6.0-4.jar +0 -0
- data/lib/nokogiri/jruby/net/sourceforge/htmlunit/neko-htmlunit/2.63.0/neko-htmlunit-2.63.0.jar +0 -0
- data/lib/nokogiri/jruby/nokogiri_jars.rb +43 -0
- data/lib/nokogiri/jruby/nu/validator/jing/20200702VNU/jing-20200702VNU.jar +0 -0
- data/lib/nokogiri/jruby/org/nokogiri/nekodtd/0.1.11.noko2/nekodtd-0.1.11.noko2.jar +0 -0
- data/lib/nokogiri/jruby/xalan/serializer/2.7.3/serializer-2.7.3.jar +0 -0
- data/lib/nokogiri/jruby/xalan/xalan/2.7.3/xalan-2.7.3.jar +0 -0
- data/lib/nokogiri/jruby/xerces/xercesImpl/2.12.2/xercesImpl-2.12.2.jar +0 -0
- data/lib/nokogiri/jruby/xml-apis/xml-apis/1.4.01/xml-apis-1.4.01.jar +0 -0
- data/lib/nokogiri/syntax_error.rb +6 -0
- data/lib/nokogiri/version/constant.rb +6 -0
- data/lib/nokogiri/version/info.rb +223 -0
- data/lib/nokogiri/version.rb +4 -0
- data/lib/nokogiri/xml/attr.rb +66 -0
- data/lib/nokogiri/xml/attribute_decl.rb +20 -0
- data/lib/nokogiri/xml/builder.rb +487 -0
- data/lib/nokogiri/xml/cdata.rb +13 -0
- data/lib/nokogiri/xml/character_data.rb +9 -0
- data/lib/nokogiri/xml/document.rb +471 -0
- data/lib/nokogiri/xml/document_fragment.rb +205 -0
- data/lib/nokogiri/xml/dtd.rb +34 -0
- data/lib/nokogiri/xml/element_content.rb +38 -0
- data/lib/nokogiri/xml/element_decl.rb +15 -0
- data/lib/nokogiri/xml/entity_decl.rb +21 -0
- data/lib/nokogiri/xml/entity_reference.rb +20 -0
- data/lib/nokogiri/xml/namespace.rb +58 -0
- data/lib/nokogiri/xml/node/save_options.rb +68 -0
- data/lib/nokogiri/xml/node.rb +1563 -0
- data/lib/nokogiri/xml/node_set.rb +447 -0
- data/lib/nokogiri/xml/notation.rb +19 -0
- data/lib/nokogiri/xml/parse_options.rb +213 -0
- data/lib/nokogiri/xml/pp/character_data.rb +21 -0
- data/lib/nokogiri/xml/pp/node.rb +57 -0
- data/lib/nokogiri/xml/pp.rb +4 -0
- data/lib/nokogiri/xml/processing_instruction.rb +11 -0
- data/lib/nokogiri/xml/reader.rb +105 -0
- data/lib/nokogiri/xml/relax_ng.rb +38 -0
- data/lib/nokogiri/xml/sax/document.rb +167 -0
- data/lib/nokogiri/xml/sax/parser.rb +125 -0
- data/lib/nokogiri/xml/sax/parser_context.rb +21 -0
- data/lib/nokogiri/xml/sax/push_parser.rb +61 -0
- data/lib/nokogiri/xml/sax.rb +6 -0
- data/lib/nokogiri/xml/schema.rb +73 -0
- data/lib/nokogiri/xml/searchable.rb +270 -0
- data/lib/nokogiri/xml/syntax_error.rb +72 -0
- data/lib/nokogiri/xml/text.rb +11 -0
- data/lib/nokogiri/xml/xpath/syntax_error.rb +13 -0
- data/lib/nokogiri/xml/xpath.rb +21 -0
- data/lib/nokogiri/xml/xpath_context.rb +16 -0
- data/lib/nokogiri/xml.rb +76 -0
- data/lib/nokogiri/xslt/stylesheet.rb +27 -0
- data/lib/nokogiri/xslt.rb +65 -0
- data/lib/nokogiri.rb +120 -0
- data/lib/xsd/xmlparser/nokogiri.rb +106 -0
- metadata +391 -0
@@ -0,0 +1,148 @@
|
|
1
|
+
#ifndef GUMBO_ERROR_H_
|
2
|
+
#define GUMBO_ERROR_H_
|
3
|
+
|
4
|
+
#include <stdint.h>
|
5
|
+
|
6
|
+
#include "nokogiri_gumbo.h"
|
7
|
+
#include "insertion_mode.h"
|
8
|
+
#include "string_buffer.h"
|
9
|
+
#include "token_type.h"
|
10
|
+
#include "tokenizer_states.h"
|
11
|
+
|
12
|
+
#ifdef __cplusplus
|
13
|
+
extern "C" {
|
14
|
+
#endif
|
15
|
+
|
16
|
+
struct GumboInternalParser;
|
17
|
+
|
18
|
+
typedef enum {
|
19
|
+
// Defined errors.
|
20
|
+
// https://html.spec.whatwg.org/multipage/parsing.html#parse-errors
|
21
|
+
GUMBO_ERR_ABRUPT_CLOSING_OF_EMPTY_COMMENT,
|
22
|
+
GUMBO_ERR_ABRUPT_DOCTYPE_PUBLIC_IDENTIFIER,
|
23
|
+
GUMBO_ERR_ABRUPT_DOCTYPE_SYSTEM_IDENTIFIER,
|
24
|
+
GUMBO_ERR_ABSENCE_OF_DIGITS_IN_NUMERIC_CHARACTER_REFERENCE,
|
25
|
+
GUMBO_ERR_CDATA_IN_HTML_CONTENT,
|
26
|
+
GUMBO_ERR_CHARACTER_REFERENCE_OUTSIDE_UNICODE_RANGE,
|
27
|
+
GUMBO_ERR_CONTROL_CHARACTER_IN_INPUT_STREAM,
|
28
|
+
GUMBO_ERR_CONTROL_CHARACTER_REFERENCE,
|
29
|
+
GUMBO_ERR_END_TAG_WITH_ATTRIBUTES,
|
30
|
+
GUMBO_ERR_DUPLICATE_ATTRIBUTE,
|
31
|
+
GUMBO_ERR_END_TAG_WITH_TRAILING_SOLIDUS,
|
32
|
+
GUMBO_ERR_EOF_BEFORE_TAG_NAME,
|
33
|
+
GUMBO_ERR_EOF_IN_CDATA,
|
34
|
+
GUMBO_ERR_EOF_IN_COMMENT,
|
35
|
+
GUMBO_ERR_EOF_IN_DOCTYPE,
|
36
|
+
GUMBO_ERR_EOF_IN_SCRIPT_HTML_COMMENT_LIKE_TEXT,
|
37
|
+
GUMBO_ERR_EOF_IN_TAG,
|
38
|
+
GUMBO_ERR_INCORRECTLY_CLOSED_COMMENT,
|
39
|
+
GUMBO_ERR_INCORRECTLY_OPENED_COMMENT,
|
40
|
+
GUMBO_ERR_INVALID_CHARACTER_SEQUENCE_AFTER_DOCTYPE_NAME,
|
41
|
+
GUMBO_ERR_INVALID_FIRST_CHARACTER_OF_TAG_NAME,
|
42
|
+
GUMBO_ERR_MISSING_ATTRIBUTE_VALUE,
|
43
|
+
GUMBO_ERR_MISSING_DOCTYPE_NAME,
|
44
|
+
GUMBO_ERR_MISSING_DOCTYPE_PUBLIC_IDENTIFIER,
|
45
|
+
GUMBO_ERR_MISSING_DOCTYPE_SYSTEM_IDENTIFIER,
|
46
|
+
GUMBO_ERR_MISSING_END_TAG_NAME,
|
47
|
+
GUMBO_ERR_MISSING_QUOTE_BEFORE_DOCTYPE_PUBLIC_IDENTIFIER,
|
48
|
+
GUMBO_ERR_MISSING_QUOTE_BEFORE_DOCTYPE_SYSTEM_IDENTIFIER,
|
49
|
+
GUMBO_ERR_MISSING_SEMICOLON_AFTER_CHARACTER_REFERENCE,
|
50
|
+
GUMBO_ERR_MISSING_WHITESPACE_AFTER_DOCTYPE_PUBLIC_KEYWORD,
|
51
|
+
GUMBO_ERR_MISSING_WHITESPACE_AFTER_DOCTYPE_SYSTEM_KEYWORD,
|
52
|
+
GUMBO_ERR_MISSING_WHITESPACE_BEFORE_DOCTYPE_NAME,
|
53
|
+
GUMBO_ERR_MISSING_WHITESPACE_BETWEEN_ATTRIBUTES,
|
54
|
+
GUMBO_ERR_MISSING_WHITESPACE_BETWEEN_DOCTYPE_PUBLIC_AND_SYSTEM_IDENTIFIERS,
|
55
|
+
GUMBO_ERR_NESTED_COMMENT,
|
56
|
+
GUMBO_ERR_NONCHARACTER_CHARACTER_REFERENCE,
|
57
|
+
GUMBO_ERR_NONCHARACTER_IN_INPUT_STREAM,
|
58
|
+
GUMBO_ERR_NON_VOID_HTML_ELEMENT_START_TAG_WITH_TRAILING_SOLIDUS,
|
59
|
+
GUMBO_ERR_NULL_CHARACTER_REFERENCE,
|
60
|
+
GUMBO_ERR_SURROGATE_CHARACTER_REFERENCE,
|
61
|
+
GUMBO_ERR_SURROGATE_IN_INPUT_STREAM,
|
62
|
+
GUMBO_ERR_UNEXPECTED_CHARACTER_AFTER_DOCTYPE_SYSTEM_IDENTIFIER,
|
63
|
+
GUMBO_ERR_UNEXPECTED_CHARACTER_IN_ATTRIBUTE_NAME,
|
64
|
+
GUMBO_ERR_UNEXPECTED_CHARACTER_IN_UNQUOTED_ATTRIBUTE_VALUE,
|
65
|
+
GUMBO_ERR_UNEXPECTED_EQUALS_SIGN_BEFORE_ATTRIBUTE_NAME,
|
66
|
+
GUMBO_ERR_UNEXPECTED_NULL_CHARACTER,
|
67
|
+
GUMBO_ERR_UNEXPECTED_QUESTION_MARK_INSTEAD_OF_TAG_NAME,
|
68
|
+
GUMBO_ERR_UNEXPECTED_SOLIDUS_IN_TAG,
|
69
|
+
GUMBO_ERR_UNKNOWN_NAMED_CHARACTER_REFERENCE,
|
70
|
+
|
71
|
+
// Encoding errors.
|
72
|
+
GUMBO_ERR_UTF8_INVALID,
|
73
|
+
GUMBO_ERR_UTF8_TRUNCATED,
|
74
|
+
|
75
|
+
// Generic parser error.
|
76
|
+
GUMBO_ERR_PARSER,
|
77
|
+
} GumboErrorType;
|
78
|
+
|
79
|
+
// Additional data for tokenizer errors.
|
80
|
+
// This records the current state and codepoint encountered - this is usually
|
81
|
+
// enough to reconstruct what went wrong and provide a friendly error message.
|
82
|
+
typedef struct GumboInternalTokenizerError {
|
83
|
+
// The bad codepoint encountered.
|
84
|
+
int codepoint;
|
85
|
+
|
86
|
+
// The state that the tokenizer was in at the time.
|
87
|
+
GumboTokenizerEnum state;
|
88
|
+
} GumboTokenizerError;
|
89
|
+
|
90
|
+
// Additional data for parse errors.
|
91
|
+
typedef struct GumboInternalParserError {
|
92
|
+
// The type of input token that resulted in this error.
|
93
|
+
GumboTokenType input_type;
|
94
|
+
|
95
|
+
// The HTML tag of the input token. TAG_UNKNOWN if this was not a tag token.
|
96
|
+
GumboTag input_tag;
|
97
|
+
|
98
|
+
// The insertion mode that the parser was in at the time.
|
99
|
+
GumboInsertionMode parser_state;
|
100
|
+
|
101
|
+
// The tag stack at the point of the error. Note that this is an GumboVector
|
102
|
+
// of GumboTag's *stored by value* - cast the void* to an GumboTag directly to
|
103
|
+
// get at the tag.
|
104
|
+
GumboVector /* GumboTag */ tag_stack;
|
105
|
+
} GumboParserError;
|
106
|
+
|
107
|
+
// The overall error struct representing an error in decoding/tokenizing/parsing
|
108
|
+
// the HTML. This contains an enumerated type flag, a source position, and then
|
109
|
+
// a union of fields containing data specific to the error.
|
110
|
+
struct GumboInternalError {
|
111
|
+
// The type of error.
|
112
|
+
GumboErrorType type;
|
113
|
+
|
114
|
+
// The position within the source file where the error occurred.
|
115
|
+
GumboSourcePosition position;
|
116
|
+
|
117
|
+
// The piece of text that caused the error.
|
118
|
+
GumboStringPiece original_text;
|
119
|
+
|
120
|
+
// Type-specific error information.
|
121
|
+
union {
|
122
|
+
// Tokenizer errors.
|
123
|
+
GumboTokenizerError tokenizer;
|
124
|
+
|
125
|
+
// Parser errors.
|
126
|
+
GumboParserError parser;
|
127
|
+
} v;
|
128
|
+
};
|
129
|
+
|
130
|
+
// Adds a new error to the parser's error list, and returns a pointer to it so
|
131
|
+
// that clients can fill out the rest of its fields. May return NULL if we're
|
132
|
+
// already over the max_errors field specified in GumboOptions.
|
133
|
+
GumboError* gumbo_add_error(struct GumboInternalParser* parser);
|
134
|
+
|
135
|
+
// Initializes the errors vector in the parser.
|
136
|
+
void gumbo_init_errors(struct GumboInternalParser* errors);
|
137
|
+
|
138
|
+
// Frees all the errors in the 'errors_' field of the parser.
|
139
|
+
void gumbo_destroy_errors(struct GumboInternalParser* errors);
|
140
|
+
|
141
|
+
// Frees the memory used for a single GumboError.
|
142
|
+
void gumbo_error_destroy(GumboError* error);
|
143
|
+
|
144
|
+
#ifdef __cplusplus
|
145
|
+
}
|
146
|
+
#endif
|
147
|
+
|
148
|
+
#endif // GUMBO_ERROR_H_
|
@@ -0,0 +1,104 @@
|
|
1
|
+
/* ANSI-C code produced by gperf version 3.1 */
|
2
|
+
/* Command-line: gperf -m100 -n src/foreign_attrs.gperf */
|
3
|
+
/* Computed positions: -k'2,8' */
|
4
|
+
/* Filtered by: gperf-filter.sed */
|
5
|
+
|
6
|
+
#include "replacement.h"
|
7
|
+
#include "macros.h"
|
8
|
+
#include <string.h>
|
9
|
+
|
10
|
+
#define TOTAL_KEYWORDS 11
|
11
|
+
#define MIN_WORD_LENGTH 5
|
12
|
+
#define MAX_WORD_LENGTH 13
|
13
|
+
#define MIN_HASH_VALUE 0
|
14
|
+
#define MAX_HASH_VALUE 10
|
15
|
+
/* maximum key range = 11, duplicates = 0 */
|
16
|
+
|
17
|
+
static inline unsigned int
|
18
|
+
hash (register const char *str, register size_t len)
|
19
|
+
{
|
20
|
+
static const unsigned char asso_values[] =
|
21
|
+
{
|
22
|
+
11, 11, 11, 11, 11, 11, 11, 11, 11, 11,
|
23
|
+
11, 11, 11, 11, 11, 11, 11, 11, 11, 11,
|
24
|
+
11, 11, 11, 11, 11, 11, 11, 11, 11, 11,
|
25
|
+
11, 11, 11, 11, 11, 11, 11, 11, 11, 11,
|
26
|
+
11, 11, 11, 11, 11, 11, 11, 11, 11, 11,
|
27
|
+
11, 11, 11, 11, 11, 11, 11, 11, 11, 11,
|
28
|
+
11, 11, 11, 11, 11, 11, 11, 11, 11, 11,
|
29
|
+
11, 11, 11, 11, 11, 11, 11, 11, 11, 11,
|
30
|
+
11, 11, 11, 11, 11, 11, 11, 11, 11, 11,
|
31
|
+
11, 11, 11, 11, 11, 11, 11, 11, 11, 2,
|
32
|
+
11, 10, 11, 9, 7, 6, 11, 11, 1, 0,
|
33
|
+
11, 5, 11, 11, 4, 11, 11, 11, 11, 11,
|
34
|
+
11, 3, 11, 11, 11, 11, 11, 11, 11, 11,
|
35
|
+
11, 11, 11, 11, 11, 11, 11, 11, 11, 11,
|
36
|
+
11, 11, 11, 11, 11, 11, 11, 11, 11, 11,
|
37
|
+
11, 11, 11, 11, 11, 11, 11, 11, 11, 11,
|
38
|
+
11, 11, 11, 11, 11, 11, 11, 11, 11, 11,
|
39
|
+
11, 11, 11, 11, 11, 11, 11, 11, 11, 11,
|
40
|
+
11, 11, 11, 11, 11, 11, 11, 11, 11, 11,
|
41
|
+
11, 11, 11, 11, 11, 11, 11, 11, 11, 11,
|
42
|
+
11, 11, 11, 11, 11, 11, 11, 11, 11, 11,
|
43
|
+
11, 11, 11, 11, 11, 11, 11, 11, 11, 11,
|
44
|
+
11, 11, 11, 11, 11, 11, 11, 11, 11, 11,
|
45
|
+
11, 11, 11, 11, 11, 11, 11, 11, 11, 11,
|
46
|
+
11, 11, 11, 11, 11, 11, 11, 11, 11, 11,
|
47
|
+
11, 11, 11, 11, 11, 11
|
48
|
+
};
|
49
|
+
register unsigned int hval = 0;
|
50
|
+
|
51
|
+
switch (len)
|
52
|
+
{
|
53
|
+
default:
|
54
|
+
hval += asso_values[(unsigned char)str[7]];
|
55
|
+
/*FALLTHROUGH*/
|
56
|
+
case 7:
|
57
|
+
case 6:
|
58
|
+
case 5:
|
59
|
+
case 4:
|
60
|
+
case 3:
|
61
|
+
case 2:
|
62
|
+
hval += asso_values[(unsigned char)str[1]];
|
63
|
+
break;
|
64
|
+
}
|
65
|
+
return hval;
|
66
|
+
}
|
67
|
+
|
68
|
+
const ForeignAttrReplacement *
|
69
|
+
gumbo_get_foreign_attr_replacement (register const char *str, register size_t len)
|
70
|
+
{
|
71
|
+
static const unsigned char lengthtable[] =
|
72
|
+
{
|
73
|
+
5, 11, 9, 13, 10, 10, 10, 11, 10, 8, 8
|
74
|
+
};
|
75
|
+
static const ForeignAttrReplacement wordlist[] =
|
76
|
+
{
|
77
|
+
{"xmlns", "xmlns", GUMBO_ATTR_NAMESPACE_XMLNS},
|
78
|
+
{"xmlns:xlink", "xlink", GUMBO_ATTR_NAMESPACE_XMLNS},
|
79
|
+
{"xml:space", "space", GUMBO_ATTR_NAMESPACE_XML},
|
80
|
+
{"xlink:actuate", "actuate", GUMBO_ATTR_NAMESPACE_XLINK},
|
81
|
+
{"xlink:type", "type", GUMBO_ATTR_NAMESPACE_XLINK},
|
82
|
+
{"xlink:href", "href", GUMBO_ATTR_NAMESPACE_XLINK},
|
83
|
+
{"xlink:role", "role", GUMBO_ATTR_NAMESPACE_XLINK},
|
84
|
+
{"xlink:title", "title", GUMBO_ATTR_NAMESPACE_XLINK},
|
85
|
+
{"xlink:show", "show", GUMBO_ATTR_NAMESPACE_XLINK},
|
86
|
+
{"xml:lang", "lang", GUMBO_ATTR_NAMESPACE_XML},
|
87
|
+
{"xml:base", "base", GUMBO_ATTR_NAMESPACE_XML}
|
88
|
+
};
|
89
|
+
|
90
|
+
if (len <= MAX_WORD_LENGTH && len >= MIN_WORD_LENGTH)
|
91
|
+
{
|
92
|
+
register unsigned int key = hash (str, len);
|
93
|
+
|
94
|
+
if (key <= MAX_HASH_VALUE)
|
95
|
+
if (len == lengthtable[key])
|
96
|
+
{
|
97
|
+
register const char *s = wordlist[key].from;
|
98
|
+
|
99
|
+
if (s && *str == *s && !memcmp (str + 1, s + 1, len - 1))
|
100
|
+
return &wordlist[key];
|
101
|
+
}
|
102
|
+
}
|
103
|
+
return 0;
|
104
|
+
}
|
@@ -0,0 +1,27 @@
|
|
1
|
+
%{
|
2
|
+
#include "replacement.h"
|
3
|
+
#include "macros.h"
|
4
|
+
%}
|
5
|
+
|
6
|
+
%struct-type
|
7
|
+
%omit-struct-type
|
8
|
+
%compare-lengths
|
9
|
+
%readonly-tables
|
10
|
+
%null-strings
|
11
|
+
%includes
|
12
|
+
%define lookup-function-name gumbo_get_foreign_attr_replacement
|
13
|
+
%define slot-name from
|
14
|
+
ForeignAttrReplacement;
|
15
|
+
|
16
|
+
%%
|
17
|
+
"xlink:actuate", "actuate", GUMBO_ATTR_NAMESPACE_XLINK
|
18
|
+
"xlink:href", "href", GUMBO_ATTR_NAMESPACE_XLINK
|
19
|
+
"xlink:role", "role", GUMBO_ATTR_NAMESPACE_XLINK
|
20
|
+
"xlink:show", "show", GUMBO_ATTR_NAMESPACE_XLINK
|
21
|
+
"xlink:title", "title", GUMBO_ATTR_NAMESPACE_XLINK
|
22
|
+
"xlink:type", "type", GUMBO_ATTR_NAMESPACE_XLINK
|
23
|
+
"xml:base", "base", GUMBO_ATTR_NAMESPACE_XML
|
24
|
+
"xml:lang", "lang", GUMBO_ATTR_NAMESPACE_XML
|
25
|
+
"xml:space", "space", GUMBO_ATTR_NAMESPACE_XML
|
26
|
+
"xmlns", "xmlns", GUMBO_ATTR_NAMESPACE_XMLNS
|
27
|
+
"xmlns:xlink", "xlink", GUMBO_ATTR_NAMESPACE_XMLNS
|
@@ -0,0 +1,33 @@
|
|
1
|
+
#ifndef GUMBO_INSERTION_MODE_H_
|
2
|
+
#define GUMBO_INSERTION_MODE_H_
|
3
|
+
|
4
|
+
// https://html.spec.whatwg.org/multipage/parsing.html#insertion-mode
|
5
|
+
// If new enum values are added, be sure to update the kTokenHandlers
|
6
|
+
// dispatch table in parser.c.
|
7
|
+
typedef enum {
|
8
|
+
GUMBO_INSERTION_MODE_INITIAL,
|
9
|
+
GUMBO_INSERTION_MODE_BEFORE_HTML,
|
10
|
+
GUMBO_INSERTION_MODE_BEFORE_HEAD,
|
11
|
+
GUMBO_INSERTION_MODE_IN_HEAD,
|
12
|
+
GUMBO_INSERTION_MODE_IN_HEAD_NOSCRIPT,
|
13
|
+
GUMBO_INSERTION_MODE_AFTER_HEAD,
|
14
|
+
GUMBO_INSERTION_MODE_IN_BODY,
|
15
|
+
GUMBO_INSERTION_MODE_TEXT,
|
16
|
+
GUMBO_INSERTION_MODE_IN_TABLE,
|
17
|
+
GUMBO_INSERTION_MODE_IN_TABLE_TEXT,
|
18
|
+
GUMBO_INSERTION_MODE_IN_CAPTION,
|
19
|
+
GUMBO_INSERTION_MODE_IN_COLUMN_GROUP,
|
20
|
+
GUMBO_INSERTION_MODE_IN_TABLE_BODY,
|
21
|
+
GUMBO_INSERTION_MODE_IN_ROW,
|
22
|
+
GUMBO_INSERTION_MODE_IN_CELL,
|
23
|
+
GUMBO_INSERTION_MODE_IN_SELECT,
|
24
|
+
GUMBO_INSERTION_MODE_IN_SELECT_IN_TABLE,
|
25
|
+
GUMBO_INSERTION_MODE_IN_TEMPLATE,
|
26
|
+
GUMBO_INSERTION_MODE_AFTER_BODY,
|
27
|
+
GUMBO_INSERTION_MODE_IN_FRAMESET,
|
28
|
+
GUMBO_INSERTION_MODE_AFTER_FRAMESET,
|
29
|
+
GUMBO_INSERTION_MODE_AFTER_AFTER_BODY,
|
30
|
+
GUMBO_INSERTION_MODE_AFTER_AFTER_FRAMESET
|
31
|
+
} GumboInsertionMode;
|
32
|
+
|
33
|
+
#endif // GUMBO_INSERTION_MODE_H_
|
@@ -0,0 +1,91 @@
|
|
1
|
+
#ifndef MACROS_H
|
2
|
+
#define MACROS_H
|
3
|
+
|
4
|
+
#if (!defined(__STDC_VERSION__) || !(__STDC_VERSION__ >= 199901L)) \
|
5
|
+
&& !defined(_WIN32) && !defined(__cplusplus)
|
6
|
+
# error C99 compiler required
|
7
|
+
#endif
|
8
|
+
|
9
|
+
#if defined(_WIN32)
|
10
|
+
# define inline __inline
|
11
|
+
# define __func__ __FUNCTION__
|
12
|
+
#endif
|
13
|
+
|
14
|
+
// Calculate the number of elements in an array.
|
15
|
+
// The extra division on the third line is a trick to help prevent
|
16
|
+
// passing a pointer to the first element of an array instead of a
|
17
|
+
// reference to the array itself.
|
18
|
+
#define ARRAY_COUNT(x) ( \
|
19
|
+
(sizeof(x) / sizeof((x)[0])) \
|
20
|
+
/ ((size_t)(!(sizeof(x) % sizeof((x)[0])))) \
|
21
|
+
)
|
22
|
+
|
23
|
+
#ifdef NDEBUG
|
24
|
+
#define UNUSED_IF_NDEBUG(x) (void)(x)
|
25
|
+
#else
|
26
|
+
#define UNUSED_IF_NDEBUG(x)
|
27
|
+
#endif
|
28
|
+
|
29
|
+
#ifdef __GNUC__
|
30
|
+
#define GNUC_AT_LEAST(major, minor) ( \
|
31
|
+
(__GNUC__ > major) \
|
32
|
+
|| ((__GNUC__ == major) && (__GNUC_MINOR__ >= minor)) )
|
33
|
+
#else
|
34
|
+
#define GNUC_AT_LEAST(major, minor) 0
|
35
|
+
#endif
|
36
|
+
|
37
|
+
#ifdef __has_attribute
|
38
|
+
#define HAS_ATTRIBUTE(x) __has_attribute(x)
|
39
|
+
#else
|
40
|
+
#define HAS_ATTRIBUTE(x) 0
|
41
|
+
#endif
|
42
|
+
|
43
|
+
#if GNUC_AT_LEAST(3, 0) || HAS_ATTRIBUTE(unused) || defined(__TINYC__)
|
44
|
+
#define UNUSED __attribute__((__unused__))
|
45
|
+
#else
|
46
|
+
#define UNUSED
|
47
|
+
#endif
|
48
|
+
|
49
|
+
#if GNUC_AT_LEAST(3, 0)
|
50
|
+
#define MALLOC __attribute__((__malloc__))
|
51
|
+
#define PRINTF(x) __attribute__((__format__(__printf__, (x), (x + 1))))
|
52
|
+
#define PURE __attribute__((__pure__))
|
53
|
+
#define CONST_FN __attribute__((__const__))
|
54
|
+
#else
|
55
|
+
#define MALLOC
|
56
|
+
#define PRINTF(x)
|
57
|
+
#define PURE
|
58
|
+
#define CONST_FN
|
59
|
+
#endif
|
60
|
+
|
61
|
+
#define UNUSED_ARG(x) unused__ ## x UNUSED
|
62
|
+
|
63
|
+
#if GNUC_AT_LEAST(3, 0) && defined(__OPTIMIZE__)
|
64
|
+
#define likely(x) __builtin_expect(!!(x), 1)
|
65
|
+
#define unlikely(x) __builtin_expect(!!(x), 0)
|
66
|
+
#else
|
67
|
+
#define likely(x) (x)
|
68
|
+
#define unlikely(x) (x)
|
69
|
+
#endif
|
70
|
+
|
71
|
+
#if GNUC_AT_LEAST(3, 3) || HAS_ATTRIBUTE(nonnull)
|
72
|
+
#define NONNULL_ARGS __attribute__((__nonnull__))
|
73
|
+
#else
|
74
|
+
#define NONNULL_ARGS
|
75
|
+
#endif
|
76
|
+
|
77
|
+
#if GNUC_AT_LEAST(3, 4) || HAS_ATTRIBUTE(warn_unused_result)
|
78
|
+
#define WARN_UNUSED_RESULT __attribute__((__warn_unused_result__))
|
79
|
+
#else
|
80
|
+
#define WARN_UNUSED_RESULT
|
81
|
+
#endif
|
82
|
+
|
83
|
+
#if GNUC_AT_LEAST(5, 0) || HAS_ATTRIBUTE(returns_nonnull)
|
84
|
+
#define RETURNS_NONNULL __attribute__((__returns_nonnull__))
|
85
|
+
#else
|
86
|
+
#define RETURNS_NONNULL
|
87
|
+
#endif
|
88
|
+
|
89
|
+
#define XMALLOC MALLOC RETURNS_NONNULL
|
90
|
+
|
91
|
+
#endif // ndef MACROS_H
|