PyPI - json-repair - Versions diffs - 0.30.2__tar.gz → 0.31.0__tar.gz - Mend

json-repair 0.30.2.tar.gz → 0.31.0.tar.gz

Files changed (20) hide show

{json_repair-0.30.2/src/json_repair.egg-info → json_repair-0.31.0}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.1
 Name: json_repair
-Version: 0.30.2
+Version: 0.31.0
 Summary: A package to repair broken json strings
 Author-email: Stefano Baccianella <4247706+mangiucugna@users.noreply.github.com>
 License: MIT License

{json_repair-0.30.2 → json_repair-0.31.0}/pyproject.toml RENAMED Viewed

@@ -3,7 +3,7 @@ requires = ["setuptools>=61.0"]
 build-backend = "setuptools.build_meta"
 [project]
 name = "json_repair"
-version = "0.30.2"
+version = "0.31.0"
 license = {file = "LICENSE"}
 authors = [
   { name="Stefano Baccianella", email="4247706+mangiucugna@users.noreply.github.com" },

{json_repair-0.30.2 → json_repair-0.31.0}/src/json_repair/json_parser.py RENAMED Viewed

@@ -322,11 +322,24 @@ class JSONParser:
                     else:
                         # OK but this could still be some garbage at the end of the string
                         # So we need to check if we find a new lstring_delimiter afterwards
-                        # If we do, this is a missing delimiter
+                        # If we do, maybe this is a missing delimiter
                         i = self.skip_to_character(character=lstring_delimiter, idx=i)
+                        if doubled_quotes:
+                            i = self.skip_to_character(
+                                character=lstring_delimiter, idx=i
+                            )
                         next_c = self.get_char_at(i)
                         if not next_c:
                             rstring_delimiter_missing = False
+                        else:
+                            # But again, this could just be something a bit stupid like "lorem, "ipsum" sic"
+                            # Check if we find a : afterwards (skipping space)
+                            i = self.skip_whitespaces_at(
+                                idx=i + 1, move_main_index=False
+                            )
+                            next_c = self.get_char_at(i)
+                            if next_c and next_c != ":":
+                                rstring_delimiter_missing = False
                 else:
                     # There could be a case in which even the next key:value is missing delimeters
                     # because it might be a systemic issue with the output
@@ -362,6 +375,13 @@ class JSONParser:
                         "While parsing a string missing the left delimiter in object value context, we found a , or } and we couldn't determine that a right delimiter was present. Stopping here",
                     )
                     break
+            if char == "]" and ContextValues.ARRAY in self.context.context:
+                # We found the end of an array and we are in array context
+                # So let's check if we find a rstring_delimiter forward otherwise end early
+                i = self.skip_to_character(rstring_delimiter)
+                if not self.get_char_at(i):
+                    # No delimiter found
+                    break
             string_acc += char
             self.index += 1
             char = self.get_char_at()

{json_repair-0.30.2 → json_repair-0.31.0/src/json_repair.egg-info}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.1
 Name: json_repair
-Version: 0.30.2
+Version: 0.31.0
 Summary: A package to repair broken json strings
 Author-email: Stefano Baccianella <4247706+mangiucugna@users.noreply.github.com>
 License: MIT License

{json_repair-0.30.2 → json_repair-0.31.0}/tests/test_json_repair.py RENAMED Viewed

@@ -108,6 +108,7 @@ def test_missing_and_mixed_quotes():
     assert repair_json('{"key": value "key2" : "value2" ') == '{"key": "value", "key2": "value2"}'
     assert repair_json('{"key": "lorem ipsum ... "sic " tamet. ...}') ==  '{"key": "lorem ipsum ... \\"sic \\" tamet. ..."}'
     assert repair_json('{"key": value , }') == '{"key": "value"}'
+    assert repair_json('{"comment": "lorem, "ipsum" sic "tamet". To improve"}') == '{"comment": "lorem, \\"ipsum\\" sic \\"tamet\\". To improve"}'
 def test_array_edge_cases():
     assert repair_json("[1, 2, 3,") == "[1, 2, 3]"
@@ -119,6 +120,7 @@ def test_array_edge_cases():
     assert repair_json('{"employees":["John", "Anna",') == '{"employees": ["John", "Anna"]}'
     assert repair_json('{"employees":["John", "Anna", "Peter') == '{"employees": ["John", "Anna", "Peter"]}'
     assert repair_json('{"key1": {"key2": [1, 2, 3') == '{"key1": {"key2": [1, 2, 3]}}'
+    assert repair_json('{"key": ["value]}') == '{"key": ["value"]}'
 def test_escaping():
     assert repair_json("'\"'") == '""'
@@ -134,7 +136,7 @@ def test_object_edge_cases():
     assert repair_json('{"value_1": true, COMMENT "value_2": "data"}') == '{"value_1": true, "value_2": "data"}'
     assert repair_json('{"value_1": true, SHOULD_NOT_EXIST "value_2": "data" AAAA }') == '{"value_1": true, "value_2": "data"}'
     assert repair_json('{"" : true, "key2": "value2"}') == '{"": true, "key2": "value2"}'
-    assert repair_json('{""answer"":[{""traits"":''Female aged 60+'',""answer1"":""5""}]}') == '{"answer": [{"traits": "Female aged 60+", "answer1": "5"}]}'
+    assert repair_json("""{""answer"":[{""traits"":''Female aged 60+'',""answer1"":""5""}]}""") == '{"answer": [{"traits": "Female aged 60+", "answer1": "5"}]}'
     assert repair_json('{ "words": abcdef", "numbers": 12345", "words2": ghijkl" }') == '{"words": "abcdef", "numbers": 12345, "words2": "ghijkl"}'
     assert repair_json('''{"number": 1,"reason": "According...""ans": "YES"}''') == '{"number": 1, "reason": "According...", "ans": "YES"}'
     assert repair_json('''{ "a" : "{ b": {} }" }''') == '{"a": "{ b"}'

{json_repair-0.30.2 → json_repair-0.31.0}/tests/test_performance.py RENAMED Viewed

@@ -97,7 +97,7 @@ def test_false_false_incorrect(benchmark):
   mean_time = benchmark.stats.get("median")
   # Define your time threshold in seconds
-  max_time = 1.8 / 10 ** 3  # 1.8 millisecond
+  max_time = 1.9 / 10 ** 3  # 1.9 millisecond
   # Assert that the average time is below the threshold
   assert mean_time < max_time, f"Benchmark exceeded threshold: {mean_time:.3f}s > {max_time:.3f}s"