PyPI - lxml - Versions diffs - 5.2.0__cp310-cp310-win32.whl → 5.2.2__cp310-cp310-win32.whl - Mend

lxml 5.2.0__cp310-cp310-win32.whl → 5.2.2__cp310-cp310-win32.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (89) hide show

lxml/ElementInclude.py +244 -244
lxml/__init__.py +22 -22
lxml/_elementpath.cp310-win32.pyd +0 -0
lxml/_elementpath.py +341 -341
lxml/apihelpers.pxi +1793 -1793
lxml/builder.cp310-win32.pyd +0 -0
lxml/builder.py +232 -232
lxml/classlookup.pxi +580 -580
lxml/cleanup.pxi +215 -215
lxml/cssselect.py +101 -101
lxml/debug.pxi +90 -90
lxml/docloader.pxi +178 -178
lxml/doctestcompare.py +488 -488
lxml/dtd.pxi +478 -478
lxml/etree.cp310-win32.pyd +0 -0
lxml/etree.h +6 -6
lxml/etree.pyx +3732 -3711
lxml/extensions.pxi +833 -833
lxml/html/ElementSoup.py +10 -10
lxml/html/__init__.py +1923 -1923
lxml/html/_diffcommand.py +86 -86
lxml/html/_html5builder.py +100 -100
lxml/html/_setmixin.py +56 -56
lxml/html/builder.py +133 -133
lxml/html/clean.py +21 -21
lxml/html/defs.py +135 -135
lxml/html/diff.cp310-win32.pyd +0 -0
lxml/html/diff.py +878 -878
lxml/html/formfill.py +299 -299
lxml/html/html5parser.py +260 -260
lxml/html/soupparser.py +314 -314
lxml/html/usedoctest.py +13 -13
lxml/includes/c14n.pxd +25 -25
lxml/includes/config.pxd +3 -3
lxml/includes/dtdvalid.pxd +18 -18
lxml/includes/etree_defs.h +379 -379
lxml/includes/etreepublic.pxd +237 -237
lxml/includes/htmlparser.pxd +56 -56
lxml/includes/lxml-version.h +1 -1
lxml/includes/relaxng.pxd +64 -64
lxml/includes/schematron.pxd +34 -34
lxml/includes/tree.pxd +494 -494
lxml/includes/uri.pxd +5 -5
lxml/includes/xinclude.pxd +22 -22
lxml/includes/xmlerror.pxd +852 -852
lxml/includes/xmlparser.pxd +265 -265
lxml/includes/xmlschema.pxd +35 -35
lxml/includes/xpath.pxd +136 -136
lxml/includes/xslt.pxd +190 -190
lxml/isoschematron/__init__.py +348 -348
lxml/isoschematron/resources/rng/iso-schematron.rng +709 -709
lxml/isoschematron/resources/xsl/RNG2Schtrn.xsl +75 -75
lxml/isoschematron/resources/xsl/iso-schematron-xslt1/iso_abstract_expand.xsl +312 -312
lxml/isoschematron/resources/xsl/iso-schematron-xslt1/iso_dsdl_include.xsl +1159 -1159
lxml/isoschematron/resources/xsl/iso-schematron-xslt1/iso_schematron_message.xsl +54 -54
lxml/isoschematron/resources/xsl/iso-schematron-xslt1/iso_schematron_skeleton_for_xslt1.xsl +1796 -1796
lxml/isoschematron/resources/xsl/iso-schematron-xslt1/iso_svrl_for_xslt1.xsl +588 -588
lxml/iterparse.pxi +438 -438
lxml/lxml.etree.h +6 -6
lxml/nsclasses.pxi +281 -281
lxml/objectify.cp310-win32.pyd +0 -0
lxml/objectify.pyx +2145 -2145
lxml/objectpath.pxi +332 -332
lxml/parser.pxi +1994 -1994
lxml/parsertarget.pxi +180 -180
lxml/proxy.pxi +619 -619
lxml/public-api.pxi +178 -178
lxml/pyclasslookup.py +3 -3
lxml/readonlytree.pxi +565 -565
lxml/relaxng.pxi +165 -165
lxml/sax.cp310-win32.pyd +0 -0
lxml/sax.py +275 -275
lxml/saxparser.pxi +875 -875
lxml/schematron.pxi +168 -168
lxml/serializer.pxi +1871 -1871
lxml/usedoctest.py +13 -13
lxml/xinclude.pxi +67 -67
lxml/xmlerror.pxi +1654 -1654
lxml/xmlid.pxi +179 -179
lxml/xmlschema.pxi +215 -215
lxml/xpath.pxi +487 -487
lxml/xslt.pxi +950 -950
lxml/xsltext.pxi +242 -242
{lxml-5.2.0.dist-info → lxml-5.2.2.dist-info}/LICENSE.txt +29 -29
{lxml-5.2.0.dist-info → lxml-5.2.2.dist-info}/LICENSES.txt +29 -29
{lxml-5.2.0.dist-info → lxml-5.2.2.dist-info}/METADATA +9 -17
{lxml-5.2.0.dist-info → lxml-5.2.2.dist-info}/RECORD +89 -89
{lxml-5.2.0.dist-info → lxml-5.2.2.dist-info}/WHEEL +0 -0
{lxml-5.2.0.dist-info → lxml-5.2.2.dist-info}/top_level.txt +0 -0

lxml/cleanup.pxi CHANGED Viewed

@@ -1,215 +1,215 @@
-# functions for tree cleanup and removing elements from subtrees
-def cleanup_namespaces(tree_or_element, top_nsmap=None, keep_ns_prefixes=None):
-    """cleanup_namespaces(tree_or_element, top_nsmap=None, keep_ns_prefixes=None)
-    Remove all namespace declarations from a subtree that are not used
-    by any of the elements or attributes in that tree.
-    If a 'top_nsmap' is provided, it must be a mapping from prefixes
-    to namespace URIs.  These namespaces will be declared on the top
-    element of the subtree before running the cleanup, which allows
-    moving namespace declarations to the top of the tree.
-    If a 'keep_ns_prefixes' is provided, it must be a list of prefixes.
-    These prefixes will not be removed as part of the cleanup.
-    """
-    element = _rootNodeOrRaise(tree_or_element)
-    c_element = element._c_node
-    if top_nsmap:
-        doc = element._doc
-        # declare namespaces from nsmap, then apply them to the subtree
-        _setNodeNamespaces(c_element, doc, None, top_nsmap)
-        moveNodeToDocument(doc, c_element.doc, c_element)
-    keep_ns_prefixes = (
-        set([_utf8(prefix) for prefix in keep_ns_prefixes])
-        if keep_ns_prefixes else None)
-    _removeUnusedNamespaceDeclarations(c_element, keep_ns_prefixes)
-def strip_attributes(tree_or_element, *attribute_names):
-    """strip_attributes(tree_or_element, *attribute_names)
-    Delete all attributes with the provided attribute names from an
-    Element (or ElementTree) and its descendants.
-    Attribute names can contain wildcards as in `_Element.iter`.
-    Example usage::
-        strip_attributes(root_element,
-                         'simpleattr',
-                         '{http://some/ns}attrname',
-                         '{http://other/ns}*')
-    """
-    cdef _MultiTagMatcher matcher
-    element = _rootNodeOrRaise(tree_or_element)
-    if not attribute_names:
-        return
-    matcher = _MultiTagMatcher.__new__(_MultiTagMatcher, attribute_names)
-    matcher.cacheTags(element._doc)
-    if matcher.rejectsAllAttributes():
-        return
-    _strip_attributes(element._c_node, matcher)
-cdef _strip_attributes(xmlNode* c_node, _MultiTagMatcher matcher):
-    cdef xmlAttr* c_attr
-    cdef xmlAttr* c_next_attr
-    tree.BEGIN_FOR_EACH_ELEMENT_FROM(c_node, c_node, 1)
-    if c_node.type == tree.XML_ELEMENT_NODE:
-        c_attr = c_node.properties
-        while c_attr is not NULL:
-            c_next_attr = c_attr.next
-            if matcher.matchesAttribute(c_attr):
-                tree.xmlRemoveProp(c_attr)
-            c_attr = c_next_attr
-    tree.END_FOR_EACH_ELEMENT_FROM(c_node)
-def strip_elements(tree_or_element, *tag_names, bint with_tail=True):
-    """strip_elements(tree_or_element, *tag_names, with_tail=True)
-    Delete all elements with the provided tag names from a tree or
-    subtree.  This will remove the elements and their entire subtree,
-    including all their attributes, text content and descendants.  It
-    will also remove the tail text of the element unless you
-    explicitly set the ``with_tail`` keyword argument option to False.
-    Tag names can contain wildcards as in `_Element.iter`.
-    Note that this will not delete the element (or ElementTree root
-    element) that you passed even if it matches.  It will only treat
-    its descendants.  If you want to include the root element, check
-    its tag name directly before even calling this function.
-    Example usage::
-        strip_elements(some_element,
-            'simpletagname',             # non-namespaced tag
-            '{http://some/ns}tagname',   # namespaced tag
-            '{http://some/other/ns}*'    # any tag from a namespace
-            lxml.etree.Comment           # comments
-            )
-    """
-    cdef _MultiTagMatcher matcher
-    doc = _documentOrRaise(tree_or_element)
-    element = _rootNodeOrRaise(tree_or_element)
-    if not tag_names:
-        return
-    matcher = _MultiTagMatcher.__new__(_MultiTagMatcher, tag_names)
-    matcher.cacheTags(doc)
-    if matcher.rejectsAll():
-        return
-    if isinstance(tree_or_element, _ElementTree):
-        # include PIs and comments next to the root node
-        if matcher.matchesType(tree.XML_COMMENT_NODE):
-            _removeSiblings(element._c_node, tree.XML_COMMENT_NODE, with_tail)
-        if matcher.matchesType(tree.XML_PI_NODE):
-            _removeSiblings(element._c_node, tree.XML_PI_NODE, with_tail)
-    _strip_elements(doc, element._c_node, matcher, with_tail)
-cdef _strip_elements(_Document doc, xmlNode* c_node, _MultiTagMatcher matcher,
-                     bint with_tail):
-    cdef xmlNode* c_child
-    cdef xmlNode* c_next
-    tree.BEGIN_FOR_EACH_ELEMENT_FROM(c_node, c_node, 1)
-    if c_node.type == tree.XML_ELEMENT_NODE:
-        # we run through the children here to prevent any problems
-        # with the tree iteration which would occur if we unlinked the
-        # c_node itself
-        c_child = _findChildForwards(c_node, 0)
-        while c_child is not NULL:
-            c_next = _nextElement(c_child)
-            if matcher.matches(c_child):
-                if c_child.type == tree.XML_ELEMENT_NODE:
-                    if not with_tail:
-                        tree.xmlUnlinkNode(c_child)
-                    _removeNode(doc, c_child)
-                else:
-                    if with_tail:
-                        _removeText(c_child.next)
-                    tree.xmlUnlinkNode(c_child)
-                    attemptDeallocation(c_child)
-            c_child = c_next
-    tree.END_FOR_EACH_ELEMENT_FROM(c_node)
-def strip_tags(tree_or_element, *tag_names):
-    """strip_tags(tree_or_element, *tag_names)
-    Delete all elements with the provided tag names from a tree or
-    subtree.  This will remove the elements and their attributes, but
-    *not* their text/tail content or descendants.  Instead, it will
-    merge the text content and children of the element into its
-    parent.
-    Tag names can contain wildcards as in `_Element.iter`.
-    Note that this will not delete the element (or ElementTree root
-    element) that you passed even if it matches.  It will only treat
-    its descendants.
-    Example usage::
-        strip_tags(some_element,
-            'simpletagname',             # non-namespaced tag
-            '{http://some/ns}tagname',   # namespaced tag
-            '{http://some/other/ns}*'    # any tag from a namespace
-            Comment                      # comments (including their text!)
-            )
-    """
-    cdef _MultiTagMatcher matcher
-    doc = _documentOrRaise(tree_or_element)
-    element = _rootNodeOrRaise(tree_or_element)
-    if not tag_names:
-        return
-    matcher = _MultiTagMatcher.__new__(_MultiTagMatcher, tag_names)
-    matcher.cacheTags(doc)
-    if matcher.rejectsAll():
-        return
-    if isinstance(tree_or_element, _ElementTree):
-        # include PIs and comments next to the root node
-        if matcher.matchesType(tree.XML_COMMENT_NODE):
-            _removeSiblings(element._c_node, tree.XML_COMMENT_NODE, 0)
-        if matcher.matchesType(tree.XML_PI_NODE):
-            _removeSiblings(element._c_node, tree.XML_PI_NODE, 0)
-    _strip_tags(doc, element._c_node, matcher)
-cdef _strip_tags(_Document doc, xmlNode* c_node, _MultiTagMatcher matcher):
-    cdef xmlNode* c_child
-    cdef xmlNode* c_next
-    tree.BEGIN_FOR_EACH_ELEMENT_FROM(c_node, c_node, 1)
-    if c_node.type == tree.XML_ELEMENT_NODE:
-        # we run through the children here to prevent any problems
-        # with the tree iteration which would occur if we unlinked the
-        # c_node itself
-        c_child = _findChildForwards(c_node, 0)
-        while c_child is not NULL:
-            if not matcher.matches(c_child):
-                c_child = _nextElement(c_child)
-                continue
-            if c_child.type == tree.XML_ELEMENT_NODE:
-                c_next = _findChildForwards(c_child, 0) or _nextElement(c_child)
-                _replaceNodeByChildren(doc, c_child)
-                if not attemptDeallocation(c_child):
-                    if c_child.nsDef is not NULL:
-                        # make namespaces absolute
-                        moveNodeToDocument(doc, doc._c_doc, c_child)
-                c_child = c_next
-            else:
-                c_next = _nextElement(c_child)
-                tree.xmlUnlinkNode(c_child)
-                attemptDeallocation(c_child)
-                c_child = c_next
-    tree.END_FOR_EACH_ELEMENT_FROM(c_node)
+# functions for tree cleanup and removing elements from subtrees
+def cleanup_namespaces(tree_or_element, top_nsmap=None, keep_ns_prefixes=None):
+    """cleanup_namespaces(tree_or_element, top_nsmap=None, keep_ns_prefixes=None)
+    Remove all namespace declarations from a subtree that are not used
+    by any of the elements or attributes in that tree.
+    If a 'top_nsmap' is provided, it must be a mapping from prefixes
+    to namespace URIs.  These namespaces will be declared on the top
+    element of the subtree before running the cleanup, which allows
+    moving namespace declarations to the top of the tree.
+    If a 'keep_ns_prefixes' is provided, it must be a list of prefixes.
+    These prefixes will not be removed as part of the cleanup.
+    """
+    element = _rootNodeOrRaise(tree_or_element)
+    c_element = element._c_node
+    if top_nsmap:
+        doc = element._doc
+        # declare namespaces from nsmap, then apply them to the subtree
+        _setNodeNamespaces(c_element, doc, None, top_nsmap)
+        moveNodeToDocument(doc, c_element.doc, c_element)
+    keep_ns_prefixes = (
+        set([_utf8(prefix) for prefix in keep_ns_prefixes])
+        if keep_ns_prefixes else None)
+    _removeUnusedNamespaceDeclarations(c_element, keep_ns_prefixes)
+def strip_attributes(tree_or_element, *attribute_names):
+    """strip_attributes(tree_or_element, *attribute_names)
+    Delete all attributes with the provided attribute names from an
+    Element (or ElementTree) and its descendants.
+    Attribute names can contain wildcards as in `_Element.iter`.
+    Example usage::
+        strip_attributes(root_element,
+                         'simpleattr',
+                         '{http://some/ns}attrname',
+                         '{http://other/ns}*')
+    """
+    cdef _MultiTagMatcher matcher
+    element = _rootNodeOrRaise(tree_or_element)
+    if not attribute_names:
+        return
+    matcher = _MultiTagMatcher.__new__(_MultiTagMatcher, attribute_names)
+    matcher.cacheTags(element._doc)
+    if matcher.rejectsAllAttributes():
+        return
+    _strip_attributes(element._c_node, matcher)
+cdef _strip_attributes(xmlNode* c_node, _MultiTagMatcher matcher):
+    cdef xmlAttr* c_attr
+    cdef xmlAttr* c_next_attr
+    tree.BEGIN_FOR_EACH_ELEMENT_FROM(c_node, c_node, 1)
+    if c_node.type == tree.XML_ELEMENT_NODE:
+        c_attr = c_node.properties
+        while c_attr is not NULL:
+            c_next_attr = c_attr.next
+            if matcher.matchesAttribute(c_attr):
+                tree.xmlRemoveProp(c_attr)
+            c_attr = c_next_attr
+    tree.END_FOR_EACH_ELEMENT_FROM(c_node)
+def strip_elements(tree_or_element, *tag_names, bint with_tail=True):
+    """strip_elements(tree_or_element, *tag_names, with_tail=True)
+    Delete all elements with the provided tag names from a tree or
+    subtree.  This will remove the elements and their entire subtree,
+    including all their attributes, text content and descendants.  It
+    will also remove the tail text of the element unless you
+    explicitly set the ``with_tail`` keyword argument option to False.
+    Tag names can contain wildcards as in `_Element.iter`.
+    Note that this will not delete the element (or ElementTree root
+    element) that you passed even if it matches.  It will only treat
+    its descendants.  If you want to include the root element, check
+    its tag name directly before even calling this function.
+    Example usage::
+        strip_elements(some_element,
+            'simpletagname',             # non-namespaced tag
+            '{http://some/ns}tagname',   # namespaced tag
+            '{http://some/other/ns}*'    # any tag from a namespace
+            lxml.etree.Comment           # comments
+            )
+    """
+    cdef _MultiTagMatcher matcher
+    doc = _documentOrRaise(tree_or_element)
+    element = _rootNodeOrRaise(tree_or_element)
+    if not tag_names:
+        return
+    matcher = _MultiTagMatcher.__new__(_MultiTagMatcher, tag_names)
+    matcher.cacheTags(doc)
+    if matcher.rejectsAll():
+        return
+    if isinstance(tree_or_element, _ElementTree):
+        # include PIs and comments next to the root node
+        if matcher.matchesType(tree.XML_COMMENT_NODE):
+            _removeSiblings(element._c_node, tree.XML_COMMENT_NODE, with_tail)
+        if matcher.matchesType(tree.XML_PI_NODE):
+            _removeSiblings(element._c_node, tree.XML_PI_NODE, with_tail)
+    _strip_elements(doc, element._c_node, matcher, with_tail)
+cdef _strip_elements(_Document doc, xmlNode* c_node, _MultiTagMatcher matcher,
+                     bint with_tail):
+    cdef xmlNode* c_child
+    cdef xmlNode* c_next
+    tree.BEGIN_FOR_EACH_ELEMENT_FROM(c_node, c_node, 1)
+    if c_node.type == tree.XML_ELEMENT_NODE:
+        # we run through the children here to prevent any problems
+        # with the tree iteration which would occur if we unlinked the
+        # c_node itself
+        c_child = _findChildForwards(c_node, 0)
+        while c_child is not NULL:
+            c_next = _nextElement(c_child)
+            if matcher.matches(c_child):
+                if c_child.type == tree.XML_ELEMENT_NODE:
+                    if not with_tail:
+                        tree.xmlUnlinkNode(c_child)
+                    _removeNode(doc, c_child)
+                else:
+                    if with_tail:
+                        _removeText(c_child.next)
+                    tree.xmlUnlinkNode(c_child)
+                    attemptDeallocation(c_child)
+            c_child = c_next
+    tree.END_FOR_EACH_ELEMENT_FROM(c_node)
+def strip_tags(tree_or_element, *tag_names):
+    """strip_tags(tree_or_element, *tag_names)
+    Delete all elements with the provided tag names from a tree or
+    subtree.  This will remove the elements and their attributes, but
+    *not* their text/tail content or descendants.  Instead, it will
+    merge the text content and children of the element into its
+    parent.
+    Tag names can contain wildcards as in `_Element.iter`.
+    Note that this will not delete the element (or ElementTree root
+    element) that you passed even if it matches.  It will only treat
+    its descendants.
+    Example usage::
+        strip_tags(some_element,
+            'simpletagname',             # non-namespaced tag
+            '{http://some/ns}tagname',   # namespaced tag
+            '{http://some/other/ns}*'    # any tag from a namespace
+            Comment                      # comments (including their text!)
+            )
+    """
+    cdef _MultiTagMatcher matcher
+    doc = _documentOrRaise(tree_or_element)
+    element = _rootNodeOrRaise(tree_or_element)
+    if not tag_names:
+        return
+    matcher = _MultiTagMatcher.__new__(_MultiTagMatcher, tag_names)
+    matcher.cacheTags(doc)
+    if matcher.rejectsAll():
+        return
+    if isinstance(tree_or_element, _ElementTree):
+        # include PIs and comments next to the root node
+        if matcher.matchesType(tree.XML_COMMENT_NODE):
+            _removeSiblings(element._c_node, tree.XML_COMMENT_NODE, 0)
+        if matcher.matchesType(tree.XML_PI_NODE):
+            _removeSiblings(element._c_node, tree.XML_PI_NODE, 0)
+    _strip_tags(doc, element._c_node, matcher)
+cdef _strip_tags(_Document doc, xmlNode* c_node, _MultiTagMatcher matcher):
+    cdef xmlNode* c_child
+    cdef xmlNode* c_next
+    tree.BEGIN_FOR_EACH_ELEMENT_FROM(c_node, c_node, 1)
+    if c_node.type == tree.XML_ELEMENT_NODE:
+        # we run through the children here to prevent any problems
+        # with the tree iteration which would occur if we unlinked the
+        # c_node itself
+        c_child = _findChildForwards(c_node, 0)
+        while c_child is not NULL:
+            if not matcher.matches(c_child):
+                c_child = _nextElement(c_child)
+                continue
+            if c_child.type == tree.XML_ELEMENT_NODE:
+                c_next = _findChildForwards(c_child, 0) or _nextElement(c_child)
+                _replaceNodeByChildren(doc, c_child)
+                if not attemptDeallocation(c_child):
+                    if c_child.nsDef is not NULL:
+                        # make namespaces absolute
+                        moveNodeToDocument(doc, doc._c_doc, c_child)
+                c_child = c_next
+            else:
+                c_next = _nextElement(c_child)
+                tree.xmlUnlinkNode(c_child)
+                attemptDeallocation(c_child)
+                c_child = c_next
+    tree.END_FOR_EACH_ELEMENT_FROM(c_node)

lxml/cssselect.py CHANGED Viewed

@@ -1,101 +1,101 @@
-"""CSS Selectors based on XPath.
-This module supports selecting XML/HTML tags based on CSS selectors.
-See the `CSSSelector` class for details.
-This is a thin wrapper around cssselect 0.7 or later.
-"""
-from . import etree
-try:
-    import cssselect as external_cssselect
-except ImportError:
-    raise ImportError(
-        'cssselect does not seem to be installed. '
-        'See https://pypi.org/project/cssselect/')
-SelectorSyntaxError = external_cssselect.SelectorSyntaxError
-ExpressionError = external_cssselect.ExpressionError
-SelectorError = external_cssselect.SelectorError
-__all__ = ['SelectorSyntaxError', 'ExpressionError', 'SelectorError',
-           'CSSSelector']
-class LxmlTranslator(external_cssselect.GenericTranslator):
-    """
-    A custom CSS selector to XPath translator with lxml-specific extensions.
-    """
-    def xpath_contains_function(self, xpath, function):
-        # Defined there, removed in later drafts:
-        # http://www.w3.org/TR/2001/CR-css3-selectors-20011113/#content-selectors
-        if function.argument_types() not in (['STRING'], ['IDENT']):
-            raise ExpressionError(
-                "Expected a single string or ident for :contains(), got %r"
-                % function.arguments)
-        value = function.arguments[0].value
-        return xpath.add_condition(
-            'contains(__lxml_internal_css:lower-case(string(.)), %s)'
-            % self.xpath_literal(value.lower()))
-class LxmlHTMLTranslator(LxmlTranslator, external_cssselect.HTMLTranslator):
-    """
-    lxml extensions + HTML support.
-    """
-def _make_lower_case(context, s):
-    return s.lower()
-ns = etree.FunctionNamespace('http://codespeak.net/lxml/css/')
-ns.prefix = '__lxml_internal_css'
-ns['lower-case'] = _make_lower_case
-class CSSSelector(etree.XPath):
-    """A CSS selector.
-    Usage::
-        >>> from lxml import etree, cssselect
-        >>> select = cssselect.CSSSelector("a tag > child")
-        >>> root = etree.XML("<a><b><c/><tag><child>TEXT</child></tag></b></a>")
-        >>> [ el.tag for el in select(root) ]
-        ['child']
-    To use CSS namespaces, you need to pass a prefix-to-namespace
-    mapping as ``namespaces`` keyword argument::
-        >>> rdfns = 'http://www.w3.org/1999/02/22-rdf-syntax-ns#'
-        >>> select_ns = cssselect.CSSSelector('root > rdf|Description',
-        ...                                   namespaces={'rdf': rdfns})
-        >>> rdf = etree.XML((
-        ...     '<root xmlns:rdf="%s">'
-        ...       '<rdf:Description>blah</rdf:Description>'
-        ...     '</root>') % rdfns)
-        >>> [(el.tag, el.text) for el in select_ns(rdf)]
-        [('{http://www.w3.org/1999/02/22-rdf-syntax-ns#}Description', 'blah')]
-    """
-    def __init__(self, css, namespaces=None, translator='xml'):
-        if translator == 'xml':
-            translator = LxmlTranslator()
-        elif translator == 'html':
-            translator = LxmlHTMLTranslator()
-        elif translator == 'xhtml':
-            translator = LxmlHTMLTranslator(xhtml=True)
-        path = translator.css_to_xpath(css)
-        super().__init__(path, namespaces=namespaces)
-        self.css = css
-    def __repr__(self):
-        return '<%s %x for %r>' % (
-            self.__class__.__name__,
-            abs(id(self)),
-            self.css)
+"""CSS Selectors based on XPath.
+This module supports selecting XML/HTML tags based on CSS selectors.
+See the `CSSSelector` class for details.
+This is a thin wrapper around cssselect 0.7 or later.
+"""
+from . import etree
+try:
+    import cssselect as external_cssselect
+except ImportError:
+    raise ImportError(
+        'cssselect does not seem to be installed. '
+        'See https://pypi.org/project/cssselect/')
+SelectorSyntaxError = external_cssselect.SelectorSyntaxError
+ExpressionError = external_cssselect.ExpressionError
+SelectorError = external_cssselect.SelectorError
+__all__ = ['SelectorSyntaxError', 'ExpressionError', 'SelectorError',
+           'CSSSelector']
+class LxmlTranslator(external_cssselect.GenericTranslator):
+    """
+    A custom CSS selector to XPath translator with lxml-specific extensions.
+    """
+    def xpath_contains_function(self, xpath, function):
+        # Defined there, removed in later drafts:
+        # http://www.w3.org/TR/2001/CR-css3-selectors-20011113/#content-selectors
+        if function.argument_types() not in (['STRING'], ['IDENT']):
+            raise ExpressionError(
+                "Expected a single string or ident for :contains(), got %r"
+                % function.arguments)
+        value = function.arguments[0].value
+        return xpath.add_condition(
+            'contains(__lxml_internal_css:lower-case(string(.)), %s)'
+            % self.xpath_literal(value.lower()))
+class LxmlHTMLTranslator(LxmlTranslator, external_cssselect.HTMLTranslator):
+    """
+    lxml extensions + HTML support.
+    """
+def _make_lower_case(context, s):
+    return s.lower()
+ns = etree.FunctionNamespace('http://codespeak.net/lxml/css/')
+ns.prefix = '__lxml_internal_css'
+ns['lower-case'] = _make_lower_case
+class CSSSelector(etree.XPath):
+    """A CSS selector.
+    Usage::
+        >>> from lxml import etree, cssselect
+        >>> select = cssselect.CSSSelector("a tag > child")
+        >>> root = etree.XML("<a><b><c/><tag><child>TEXT</child></tag></b></a>")
+        >>> [ el.tag for el in select(root) ]
+        ['child']
+    To use CSS namespaces, you need to pass a prefix-to-namespace
+    mapping as ``namespaces`` keyword argument::
+        >>> rdfns = 'http://www.w3.org/1999/02/22-rdf-syntax-ns#'
+        >>> select_ns = cssselect.CSSSelector('root > rdf|Description',
+        ...                                   namespaces={'rdf': rdfns})
+        >>> rdf = etree.XML((
+        ...     '<root xmlns:rdf="%s">'
+        ...       '<rdf:Description>blah</rdf:Description>'
+        ...     '</root>') % rdfns)
+        >>> [(el.tag, el.text) for el in select_ns(rdf)]
+        [('{http://www.w3.org/1999/02/22-rdf-syntax-ns#}Description', 'blah')]
+    """
+    def __init__(self, css, namespaces=None, translator='xml'):
+        if translator == 'xml':
+            translator = LxmlTranslator()
+        elif translator == 'html':
+            translator = LxmlHTMLTranslator()
+        elif translator == 'xhtml':
+            translator = LxmlHTMLTranslator(xhtml=True)
+        path = translator.css_to_xpath(css)
+        super().__init__(path, namespaces=namespaces)
+        self.css = css
+    def __repr__(self):
+        return '<%s %x for %r>' % (
+            self.__class__.__name__,
+            abs(id(self)),
+            self.css)

lxml 5.2.0__cp310-cp310-win32.whl → 5.2.2__cp310-cp310-win32.whl

lxml 5.2.0__cp310-cp310-win32.whl → 5.2.2__cp310-cp310-win32.whl