maxml 1.0.2__py3-none-any.whl → 1.0.4__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
maxml/__init__.py CHANGED
@@ -1,2 +1,4 @@
1
1
  from maxml.element import Element
2
2
  from maxml.namespace import Namespace
3
+ from maxml.enumerations import Escape
4
+ from maxml.exceptions import MaXMLError
maxml/element/__init__.py CHANGED
@@ -2,9 +2,15 @@ from __future__ import annotations
2
2
 
3
3
  from maxml.namespace import Namespace
4
4
  from maxml.logging import logger
5
+ from maxml.enumerations import (
6
+ Context,
7
+ Escape,
8
+ )
9
+ from maxml.exceptions import MaXMLError
5
10
 
6
11
  from classicist import hybridmethod
7
12
 
13
+ import re
8
14
 
9
15
  logger = logger.getChild(__name__)
10
16
 
@@ -22,7 +28,7 @@ class Element(object):
22
28
  _mixed: bool = False
23
29
 
24
30
  @hybridmethod
25
- def register_namespace(self, prefix: str, uri: str):
31
+ def register_namespace(self, prefix: str, uri: str, promoted: bool = False):
26
32
  """Supports registering namespaces globally for the module or per instance
27
33
  depending on whether the method is called on the class directly or whether it is
28
34
  called on a specific instance of the class.
@@ -68,6 +74,9 @@ class Element(object):
68
74
  if not isinstance(uri, str):
69
75
  raise TypeError("The 'uri' argument must have a string value!")
70
76
 
77
+ if not isinstance(promoted, bool):
78
+ raise TypeError("The 'promoted' argument must have a boolean value!")
79
+
71
80
  for namespace in self._namespaces:
72
81
  if namespace.prefix == prefix:
73
82
  if namespace.uri == uri:
@@ -77,12 +86,12 @@ class Element(object):
77
86
  )
78
87
  break
79
88
  else:
80
- raise ValueError(
81
- "The '%s' namespace has already been registered with a different URI!"
82
- % (prefix)
89
+ raise MaXMLError(
90
+ "The '%s' namespace, %s, has already been registered with a different URI: %s!"
91
+ % (prefix, uri, namespace.uri)
83
92
  )
84
93
  else:
85
- if namespace := Namespace(prefix=prefix, uri=uri):
94
+ if namespace := Namespace(prefix=prefix, uri=uri, promoted=promoted):
86
95
  self._namespaces.add(namespace)
87
96
 
88
97
  def __init__(
@@ -170,7 +179,7 @@ class Element(object):
170
179
 
171
180
  break
172
181
  else:
173
- raise ValueError(
182
+ raise MaXMLError(
174
183
  f"No namespace has been registered for the '{prefix}' prefix associated with the '{name}' element!"
175
184
  )
176
185
 
@@ -180,7 +189,7 @@ class Element(object):
180
189
  if namespace.uri == uri:
181
190
  break
182
191
  else:
183
- namespace = Namespace(prefix=prefix, uri=uri)
192
+ namespace = Namespace(prefix=prefix, uri=uri, promoted=False)
184
193
 
185
194
  self.__class__._namespaces.add(namespace)
186
195
 
@@ -557,6 +566,7 @@ class Element(object):
557
566
  pretty: bool = False,
558
567
  indent: str | int = None,
559
568
  encoding: str = None,
569
+ escape: Escape = Escape.All,
560
570
  **kwargs,
561
571
  ) -> str | bytes:
562
572
  """Supports serializing the current Element tree to a string or to a bytes array
@@ -565,6 +575,11 @@ class Element(object):
565
575
  if not isinstance(pretty, bool):
566
576
  raise TypeError("The 'pretty' argument must have a boolean value!")
567
577
 
578
+ if not isinstance(escape, Escape):
579
+ raise TypeError(
580
+ "The 'escape' argument must reference an Escape enumeration option!"
581
+ )
582
+
568
583
  if indent is None:
569
584
  indent = 2
570
585
 
@@ -585,10 +600,54 @@ class Element(object):
585
600
  elif not isinstance(encoding, str):
586
601
  raise TypeError("The 'encoding' argument must have a string value!")
587
602
 
603
+ def escaper(value: str, context: Context, escape: Escape) -> str:
604
+ """Helper method to escape special characters in XML attributes and text."""
605
+
606
+ if isinstance(value, str):
607
+ pass
608
+ elif hasattr(value, "__str__"):
609
+ value = str(value)
610
+ else:
611
+ raise TypeError(
612
+ "The 'value' argument must have a string value or a value that can be cast to a string!"
613
+ )
614
+
615
+ replacements: dict[str, str] = {
616
+ "&": "&",
617
+ "<": "&lt;",
618
+ ">": "&gt;",
619
+ '"': "&quot;",
620
+ "'": "&apos;",
621
+ }
622
+
623
+ if context is Context.Attribute:
624
+ # Required replacements for element attribute values
625
+ required: list[str] = ["&", "<", '"']
626
+ elif context is Context.Text:
627
+ # Required replacements for element text
628
+ required: list[str] = ["&", "<"]
629
+ else:
630
+ # Require all replacements for other contexts
631
+ required: list[str] = [key for key in replacements]
632
+
633
+ for search, replacement in replacements.items():
634
+ if (escape is Escape.All) or (search in required):
635
+ if search == "&":
636
+ # Ensure only standalone "&" characters are replaced, ignoring
637
+ # any that are part of an XML special character escape sequence
638
+ value = re.sub(
639
+ r"&(?!(([a-z]+|#x?[0-9a-fA-F]+);))", replacement, value
640
+ )
641
+ else:
642
+ value = value.replace(search, replacement)
643
+
644
+ return value
645
+
588
646
  def stringify(
589
647
  element: Element,
590
648
  depth: int,
591
649
  pretty: bool = False,
650
+ escape: Escape = Escape.All,
592
651
  indent: str = None,
593
652
  **kwargs,
594
653
  ) -> str:
@@ -606,7 +665,7 @@ class Element(object):
606
665
  # Add any promoted namespaces (those which should proceed any attributes)
607
666
  count = len(element.namespaced)
608
667
  for index, namespace in enumerate(element.namespaced, start=1):
609
- if not namespace.promoted:
668
+ if namespace.promoted is False:
610
669
  continue
611
670
 
612
671
  if pretty and count > 1 and (newline or (index > 1 and index <= count)):
@@ -624,6 +683,8 @@ class Element(object):
624
683
  string += f"\n{indent * (depth + 2)}"
625
684
  newline = True
626
685
 
686
+ value = escaper(value, context=Context.Attribute, escape=escape)
687
+
627
688
  string += f' {key}="{value}"'
628
689
 
629
690
  # Add any non-promoted namespaces (those which can follow any attributes)
@@ -633,7 +694,7 @@ class Element(object):
633
694
  newline = True
634
695
 
635
696
  for index, namespace in enumerate(element.namespaced, start=1):
636
- if namespace.promoted:
697
+ if namespace.promoted is True:
637
698
  continue
638
699
 
639
700
  if pretty and count > 1 and (newline or (index > 1 and index <= count)):
@@ -656,7 +717,7 @@ class Element(object):
656
717
 
657
718
  # Include the element's text content, if any
658
719
  if element.text and (element.mixed or not element.children):
659
- string += element.text
720
+ string += escaper(element.text, context=Context.Text, escape=escape)
660
721
 
661
722
  # Include the element's children, if any
662
723
  if element.children and (element.mixed or not element.text):
@@ -669,6 +730,7 @@ class Element(object):
669
730
  depth=(depth + 1),
670
731
  pretty=pretty,
671
732
  indent=indent,
733
+ escape=escape,
672
734
  **kwargs,
673
735
  )
674
736
 
@@ -684,6 +746,7 @@ class Element(object):
684
746
  depth=0,
685
747
  pretty=pretty,
686
748
  indent=indent,
749
+ escape=escape,
687
750
  **kwargs,
688
751
  )
689
752
 
@@ -0,0 +1,25 @@
1
+ from enumerific import Enumeration, auto
2
+
3
+
4
+ class Context(Enumeration):
5
+ """List of XML contexts, to denote the XML context currently being processed."""
6
+
7
+ Unknown = auto()
8
+ Root = auto(description="Document root node")
9
+ Prolog = auto(description="Document declaration (prolog)")
10
+ Instruction = auto(description="Document processing instruction")
11
+ DocType = auto(description="Document type")
12
+ Element = auto(description="Element comprising opening/closing or self-closing tag")
13
+ TagOpen = auto(description="Opening tag of an element (maybe self-closing)")
14
+ TagClose = auto(description="Closing tag of an element")
15
+ Attribute = auto(description="Attribute held by an element's tag")
16
+ Text = auto(description="Text held between an element's opening and closing tags")
17
+ Data = auto(description="Data held in a CDATA section")
18
+ Comment = auto(description="Comment held in a comment section")
19
+
20
+
21
+ class Escape(Enumeration):
22
+ """List of XML special character escape modes."""
23
+
24
+ All = auto(description="Escape all XML special characters")
25
+ Required = auto(description="Escpae only required XML special characters")
@@ -0,0 +1,2 @@
1
+ class MaXMLError(Exception):
2
+ pass
@@ -14,7 +14,7 @@ class Namespace(object):
14
14
  _uri: str = None
15
15
  _promoted: bool = False
16
16
 
17
- def __init__(self, prefix: str, uri: str):
17
+ def __init__(self, prefix: str, uri: str, promoted: bool = False):
18
18
  """Initialize the Namespace class"""
19
19
 
20
20
  if not isinstance(prefix, str):
@@ -27,6 +27,11 @@ class Namespace(object):
27
27
 
28
28
  self._uri = uri
29
29
 
30
+ if not isinstance(promoted, bool):
31
+ raise TypeError("The 'promoted' argument must have a boolean value!")
32
+
33
+ self._promoted = promoted
34
+
30
35
  def __str__(self) -> str:
31
36
  """Return a string representation of the class for debugging purposes."""
32
37
 
maxml/version.txt CHANGED
@@ -1 +1 @@
1
- 1.0.2
1
+ 1.0.4
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: maxml
3
- Version: 1.0.2
3
+ Version: 1.0.4
4
4
  Summary: A streamlined pure Python XML serializer.
5
5
  Author: Daniel Sissman
6
6
  License-Expression: MIT
@@ -115,10 +115,10 @@ The `Element` class constructor `Element(...)` takes the following arguments:
115
115
 
116
116
  The `Element` class provides the following methods:
117
117
 
118
- * `register_namespace(prefix: str, uri: str)` The `register_namespace()` method
119
- supports registering namespaces globally for the module or per instance depending
120
- on whether the method is called on the class directly or whether it is called on a
121
- specific instance of the class.
118
+ * `register_namespace(prefix: str, uri: str, promoted: bool = False)`
119
+ The `register_namespace()` method supports registering namespaces globally for the
120
+ module or per instance depending on whether the method is called on the class
121
+ directly or whether it is called on a specific instance of the class.
122
122
 
123
123
  If a namespace is registered globally for the module, the registered namespaces
124
124
  become available for use by any instance of the class created within the program
@@ -132,6 +132,12 @@ The `Element` class provides the following methods:
132
132
 
133
133
  Each namespace consists of a prefix which can be used to prefix element names
134
134
  and the URI associated with that namespace prefix.
135
+
136
+ Optionally, a namespace can be marked as promoted during registration, which will
137
+ result in the namespace being serialized into the XML before any attributes on the
138
+ element. Namespaces that are not marked as promoted will appear after attributes.
139
+ Namespace promotion can be enabled for a given namespace during registration by
140
+ passing the optional `promoted` keyword argument with the value of `True`.
135
141
 
136
142
  For example, the 'rdf' prefix is associated with the following canonical URI:
137
143
  "http://www.w3.org/1999/02/22-rdf-syntax-ns#"
@@ -0,0 +1,12 @@
1
+ maxml/__init__.py,sha256=9wLSTIlZTXinpBr9ABp_PUWhfxubtNM89Iac2VCNet8,150
2
+ maxml/version.txt,sha256=rqWtvvV0eFJzxPOcG3aHz4AZk-DLa_Z4GkFonk7bsgw,5
3
+ maxml/element/__init__.py,sha256=TDHieGdGX6ypTWq885ilJgO-sRUt4AT8twa3w9MElOM,26396
4
+ maxml/enumerations/__init__.py,sha256=N15XKtEZp2cFwqq_1GXyODqoOE--z9WukZGt_rFur2E,1153
5
+ maxml/exceptions/__init__.py,sha256=qMI3bIXJe6zDXzRnxdW3v6wbxSYfd1oK-9lnxvZzzjQ,38
6
+ maxml/logging/__init__.py,sha256=AMpvZEQH9GIBe8609sMwb2T64rovpkRRCc9rs2kHy8g,52
7
+ maxml/namespace/__init__.py,sha256=1TT9vo6iWQyxEOLPzvHd_cf4i5_w3F-tdOm_k-VABQM,4067
8
+ maxml-1.0.4.dist-info/METADATA,sha256=UTM15oNsmwGV5YFujZhMYBXKGIF8U8D_BQ34OVENOj4,16626
9
+ maxml-1.0.4.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
10
+ maxml-1.0.4.dist-info/top_level.txt,sha256=ZFK3SmCc04Dzhl9QkO_hVBAEiHwCNrwn8X_PINWE9C4,6
11
+ maxml-1.0.4.dist-info/zip-safe,sha256=AbpHGcgLb-kRsJGnwFEktk7uzpZOCcBY74-YBdrKVGs,1
12
+ maxml-1.0.4.dist-info/RECORD,,
@@ -1,10 +0,0 @@
1
- maxml/__init__.py,sha256=QuUB-oFrPKRZ4XzPuk4Mt8r35EMx652PALyAeWvQXIo,72
2
- maxml/version.txt,sha256=v-wuNFg62n5q8stzmT-3Wj9xR6bJQ-X_X1xClPxXe5A,5
3
- maxml/element/__init__.py,sha256=8N6ePtw7nOX6VVQ0eG5mmDJkBXo8S1qwVF3k9X2OmLo,23843
4
- maxml/logging/__init__.py,sha256=AMpvZEQH9GIBe8609sMwb2T64rovpkRRCc9rs2kHy8g,52
5
- maxml/namespace/__init__.py,sha256=iZqHWuGi09KtMTr7wHiyTQLXB2TFljUir8wZGLi2b60,3882
6
- maxml-1.0.2.dist-info/METADATA,sha256=J9F0r0aKB7prWv2tALoHhPRtFYCUXm096UOdoRQW5Fc,16193
7
- maxml-1.0.2.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
8
- maxml-1.0.2.dist-info/top_level.txt,sha256=ZFK3SmCc04Dzhl9QkO_hVBAEiHwCNrwn8X_PINWE9C4,6
9
- maxml-1.0.2.dist-info/zip-safe,sha256=AbpHGcgLb-kRsJGnwFEktk7uzpZOCcBY74-YBdrKVGs,1
10
- maxml-1.0.2.dist-info/RECORD,,
File without changes