PyPI - json-repair - Versions diffs - 0.29.3__tar.gz → 0.29.5__tar.gz - Mend

json-repair 0.29.3__tar.gz → 0.29.5__tar.gz

Files changed (21) hide show

{json_repair-0.29.3/src/json_repair.egg-info → json_repair-0.29.5}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.1
 Name: json_repair
-Version: 0.29.3
+Version: 0.29.5
 Summary: A package to repair broken json strings
 Author-email: Stefano Baccianella <4247706+mangiucugna@users.noreply.github.com>
 License: MIT License

{json_repair-0.29.3 → json_repair-0.29.5}/pyproject.toml RENAMED Viewed

@@ -3,7 +3,7 @@ requires = ["setuptools>=61.0"]
 build-backend = "setuptools.build_meta"
 [project]
 name = "json_repair"
-version = "0.29.3"
+version = "0.29.5"
 license = {file = "LICENSE"}
 authors = [
   { name="Stefano Baccianella", email="4247706+mangiucugna@users.noreply.github.com" },

json_repair-0.29.5/src/json_repair/json_context.py ADDED Viewed

@@ -0,0 +1,45 @@
+from enum import Enum, auto
+from typing import List, Optional
+class ContextValues(Enum):
+    OBJECT_KEY = auto()
+    OBJECT_VALUE = auto()
+    ARRAY = auto()
+class JsonContext:
+    def __init__(self) -> None:
+        self.context: List[ContextValues] = []
+        self.current: Optional[ContextValues] = None
+        self.empty: bool = True
+    def set(self, value: ContextValues) -> None:
+        """
+        Set a new context value.
+        Args:
+            value (ContextValues): The context value to be added.
+        Returns:
+            None
+        """
+        # If a value is provided update the context variable and save in stack
+        if value:
+            self.context.append(value)
+            self.current = value
+            self.empty = False
+    def reset(self) -> None:
+        """
+        Remove the most recent context value.
+        Returns:
+            None
+        """
+        try:
+            self.context.pop()
+            self.current = self.context[-1]
+        except IndexError:
+            self.current = None
+            self.empty = True

{json_repair-0.29.3 → json_repair-0.29.5}/src/json_repair/json_parser.py RENAMED Viewed

@@ -34,7 +34,8 @@ class JSONParser:
             self.logger: List[Dict[str, str]] = []
             self.log = self._log
         else:
-            self.log = self.noop
+            # No-op
+            self.log = lambda *args, **kwargs: None
     def parse(
         self,
@@ -88,12 +89,10 @@ class JSONParser:
                 )
                 return ""
             # <string> starts with a quote
-            elif not self.context.is_empty() and (
-                char in ['"', "'", "“"] or char.isalpha()
-            ):
+            elif not self.context.empty and (char in ['"', "'", "“"] or char.isalpha()):
                 return self.parse_string()
             # <number> starts with [0-9] or minus
-            elif not self.context.is_empty() and (
+            elif not self.context.empty and (
                 char.isdigit() or char == "-" or char == "."
             ):
                 return self.parse_number()
@@ -234,8 +233,9 @@ class JSONParser:
         elif char.isalnum():
             # This could be a <boolean> and not a string. Because (T)rue or (F)alse or (N)ull are valid
             # But remember, object keys are only of type string
-            if char.lower() in ["t", "f", "n"] and not self.context.is_current(
-                ContextValues.OBJECT_KEY
+            if (
+                char.lower() in ["t", "f", "n"]
+                and self.context.current != ContextValues.OBJECT_KEY
             ):
                 value = self.parse_boolean_or_null()
                 if value != "":
@@ -255,15 +255,13 @@ class JSONParser:
         if self.get_char_at() == lstring_delimiter:
             # If it's an empty key, this was easy
             if (
-                self.context.is_current(ContextValues.OBJECT_KEY)
+                self.context.current == ContextValues.OBJECT_KEY
                 and self.get_char_at(1) == ":"
             ):
                 self.index += 1
                 return ""
             # Find the next delimiter
-            i = self.skip_to_character(
-                character=rstring_delimiter, idx=1, move_main_index=False
-            )
+            i = self.skip_to_character(character=rstring_delimiter, idx=1)
             next_c = self.get_char_at(i)
             # Now check that the next character is also a delimiter to ensure that we have "".....""
             # In that case we ignore this rstring delimiter
@@ -296,22 +294,23 @@ class JSONParser:
         while char and char != rstring_delimiter:
             if (
                 missing_quotes
-                and self.context.is_current(ContextValues.OBJECT_KEY)
+                and self.context.current == ContextValues.OBJECT_KEY
                 and (char == ":" or char.isspace())
             ):
                 self.log(
                     "While parsing a string missing the left delimiter in object key context, we found a :, stopping here",
                 )
                 break
-            if self.context.is_current(ContextValues.OBJECT_VALUE) and char in [
+            if self.context.current == ContextValues.OBJECT_VALUE and char in [
                 ",",
                 "}",
             ]:
                 rstring_delimiter_missing = True
                 # check if this is a case in which the closing comma is NOT missing instead
-                i = self.skip_to_character(
-                    character=rstring_delimiter, idx=1, move_main_index=False
-                )
+                i = self.skip_to_character(character=rstring_delimiter, idx=1)
+                # If the rstring_delimeter is escaped then it's not what we are looking for
+                while self.get_char_at(i - 1) == "\\":
+                    i = self.skip_to_character(character=rstring_delimiter, idx=i + 1)
                 next_c = self.get_char_at(i)
                 if next_c:
                     i += 1
@@ -345,8 +344,9 @@ class JSONParser:
                         "While parsing a string, we found a doubled quote, ignoring it"
                     )
                     self.index += 1
-                elif missing_quotes and self.context.is_current(
-                    ContextValues.OBJECT_VALUE
+                elif (
+                    missing_quotes
+                    and self.context.current == ContextValues.OBJECT_VALUE
                 ):
                     # In case of missing starting quote I need to check if the delimeter is the end or the beginning of a key
                     i = 1
@@ -387,20 +387,20 @@ class JSONParser:
                         # If we are in an object context, let's check for the right delimiters
                         if (
                             (
-                                self.context.is_any(ContextValues.OBJECT_KEY)
+                                ContextValues.OBJECT_KEY in self.context.context
                                 and next_c in [":", "}"]
                             )
                             or (
-                                self.context.is_any(ContextValues.OBJECT_VALUE)
+                                ContextValues.OBJECT_VALUE in self.context.context
                                 and next_c == "}"
                             )
                             or (
-                                self.context.is_any(ContextValues.ARRAY)
+                                ContextValues.ARRAY in self.context.context
                                 and next_c in ["]", ","]
                             )
                             or (
                                 check_comma_in_object_value
-                                and self.context.is_current(ContextValues.OBJECT_VALUE)
+                                and self.context.current == ContextValues.OBJECT_VALUE
                                 and next_c == ","
                             )
                         ):
@@ -408,13 +408,17 @@ class JSONParser:
                         i += 1
                         next_c = self.get_char_at(i)
                     # If we stopped for a comma in object_value context, let's check if find a "} at the end of the string
-                    if next_c == "," and self.context.is_current(
-                        ContextValues.OBJECT_VALUE
+                    if (
+                        next_c == ","
+                        and self.context.current == ContextValues.OBJECT_VALUE
                     ):
                         i += 1
-                        i = self.skip_to_character(
-                            character=rstring_delimiter, idx=i, move_main_index=False
-                        )
+                        i = self.skip_to_character(character=rstring_delimiter, idx=i)
+                        # If the rstring_delimeter is escaped then it's not what we are looking for
+                        while self.get_char_at(i - 1) == "\\":
+                            i = self.skip_to_character(
+                                character=rstring_delimiter, idx=i + 1
+                            )
                         next_c = self.get_char_at(i)
                         # Ok now I found a delimiter, let's skip whitespaces and see if next we find a }
                         i += 1
@@ -429,16 +433,19 @@ class JSONParser:
                             self.index += 1
                             char = self.get_char_at()
                     elif next_c == rstring_delimiter:
-                        if self.context.is_current(ContextValues.OBJECT_VALUE):
+                        if self.context.current == ContextValues.OBJECT_VALUE:
                             # But this might not be it! This could be just a missing comma
                             # We found a delimiter and we need to check if this is a key
                             # so find a rstring_delimiter and a colon after
                             i += 1
                             i = self.skip_to_character(
-                                character=rstring_delimiter,
-                                idx=i,
-                                move_main_index=False,
+                                character=rstring_delimiter, idx=i
                             )
+                            # If the rstring_delimeter is escaped then it's not what we are looking for
+                            while self.get_char_at(i - 1) == "\\":
+                                i = self.skip_to_character(
+                                    character=rstring_delimiter, idx=i + 1
+                                )
                             i += 1
                             next_c = self.get_char_at(i)
                             while next_c and next_c != ":":
@@ -462,7 +469,7 @@ class JSONParser:
         if (
             char
             and missing_quotes
-            and self.context.is_current(ContextValues.OBJECT_KEY)
+            and self.context.current == ContextValues.OBJECT_KEY
             and char.isspace()
         ):
             self.log(
@@ -488,7 +495,7 @@ class JSONParser:
         number_str = ""
         number_chars = set("0123456789-.eE/,")
         char = self.get_char_at()
-        is_array = self.context.is_current(ContextValues.ARRAY)
+        is_array = self.context.current == ContextValues.ARRAY
         while char and char in number_chars and (char != "," or not is_array):
             number_str += char
             self.index += 1
@@ -561,9 +568,7 @@ class JSONParser:
                 return idx
         return idx
-    def skip_to_character(
-        self, character: str, idx: int = 0, move_main_index=True
-    ) -> int:
+    def skip_to_character(self, character: str, idx: int = 0) -> int:
         """
         This function quickly iterates to find a character, syntactic sugar to make the code more concise
         """
@@ -572,10 +577,7 @@ class JSONParser:
         except IndexError:
             return idx
         while char != character:
-            if move_main_index:  # pragma: no cover
-                self.index += 1
-            else:
-                idx += 1
+            idx += 1
             try:
                 char = self.json_str[self.index + idx]
             except IndexError:
@@ -593,6 +595,3 @@ class JSONParser:
                 "context": context,
             }
         )
-    def noop(*args: Any, **kwargs: Any) -> None:
-        pass

{json_repair-0.29.3 → json_repair-0.29.5/src/json_repair.egg-info}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.1
 Name: json_repair
-Version: 0.29.3
+Version: 0.29.5
 Summary: A package to repair broken json strings
 Author-email: Stefano Baccianella <4247706+mangiucugna@users.noreply.github.com>
 License: MIT License

{json_repair-0.29.3 → json_repair-0.29.5}/tests/test_performance.py RENAMED Viewed

@@ -19,7 +19,7 @@ def test_true_true_correct(benchmark):
   mean_time = benchmark.stats.get("median")
   # Define your time threshold in seconds
-  max_time = 2 / 10 ** 3  # 2 millisecond
+  max_time = 1.8 / 10 ** 3  # 1.8 millisecond
   # Assert that the average time is below the threshold
   assert mean_time < max_time, f"Benchmark exceeded threshold: {mean_time:.3f}s > {max_time:.3f}s"
@@ -31,7 +31,7 @@ def test_true_true_incorrect(benchmark):
   mean_time = benchmark.stats.get("median")
   # Define your time threshold in seconds
-  max_time = 2 / 10 ** 3  # 2 millisecond
+  max_time = 1.8 / 10 ** 3  # 1.8 millisecond
   # Assert that the average time is below the threshold
   assert mean_time < max_time, f"Benchmark exceeded threshold: {mean_time:.3f}s > {max_time:.3f}s"
@@ -53,7 +53,7 @@ def test_true_false_incorrect(benchmark):
   mean_time = benchmark.stats.get("median")
   # Define your time threshold in seconds
-  max_time = 2 / 10 ** 3  # 2 millisecond
+  max_time = 1.8 / 10 ** 3  # 1.8 millisecond
   # Assert that the average time is below the threshold
   assert mean_time < max_time, f"Benchmark exceeded threshold: {mean_time:.3f}s > {max_time:.3f}s"
@@ -64,7 +64,7 @@ def test_false_true_correct(benchmark):
   mean_time = benchmark.stats.get("median")
   # Define your time threshold in seconds
-  max_time = 2 / 10 ** 3  # 2 millisecond
+  max_time = 1.8 / 10 ** 3  # 1.8 millisecond
   # Assert that the average time is below the threshold
   assert mean_time < max_time, f"Benchmark exceeded threshold: {mean_time:.3f}s > {max_time:.3f}s"
@@ -75,7 +75,7 @@ def test_false_true_incorrect(benchmark):
   mean_time = benchmark.stats.get("median")
   # Define your time threshold in seconds
-  max_time = 2 / 10 ** 3  # 2 millisecond
+  max_time = 1.8 / 10 ** 3  # 1.8 millisecond
   # Assert that the average time is below the threshold
   assert mean_time < max_time, f"Benchmark exceeded threshold: {mean_time:.3f}s > {max_time:.3f}s"
@@ -97,7 +97,7 @@ def test_false_false_incorrect(benchmark):
   mean_time = benchmark.stats.get("median")
   # Define your time threshold in seconds
-  max_time = 2 / 10 ** 3  # 2 millisecond
+  max_time = 1.8 / 10 ** 3  # 1.8 millisecond
   # Assert that the average time is below the threshold
   assert mean_time < max_time, f"Benchmark exceeded threshold: {mean_time:.3f}s > {max_time:.3f}s"

json_repair-0.29.3/src/json_repair/json_context.py DELETED Viewed

@@ -1,69 +0,0 @@
-from enum import Enum, auto
-from typing import List
-class ContextValues(Enum):
-    OBJECT_KEY = auto()
-    OBJECT_VALUE = auto()
-    ARRAY = auto()
-class JsonContext:
-    def __init__(self) -> None:
-        self.context: List[ContextValues] = []
-    def set(self, value: ContextValues) -> None:
-        """
-        Set a new context value.
-        Args:
-            value (ContextValues): The context value to be added.
-        Returns:
-            None
-        """
-        # If a value is provided update the context variable and save in stack
-        if value:
-            self.context.append(value)
-    def reset(self) -> None:
-        """
-        Remove the most recent context value.
-        Returns:
-            None
-        """
-        self.context.pop()
-    def is_current(self, context: ContextValues) -> bool:
-        """
-        Check if the given context is the current (most recent) context.
-        Args:
-            context (ContextValues): The context value to check.
-        Returns:
-            bool: True if the given context is the same as the most recent context in the stack, False otherwise.
-        """
-        return self.context[-1] == context
-    def is_any(self, context: ContextValues) -> bool:
-        """
-        Check if the given context exists anywhere in the context stack.
-        Args:
-            context (ContextValues): The context value to check.
-        Returns:
-            bool: True if the given context exists in the stack, False otherwise.
-        """
-        return context in self.context
-    def is_empty(self) -> bool:
-        """
-        Check if the context stack is empty.
-        Returns:
-            bool: True if the context stack is empty, False otherwise.
-        """
-        return len(self.context) == 0