PyPI - json-repair - Versions diffs - 0.5.0__tar.gz → 0.6.0__tar.gz - Mend

json-repair 0.5.0__tar.gz → 0.6.0__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (13) hide show

{json_repair-0.5.0/src/json_repair.egg-info → json_repair-0.6.0}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.1
 Name: json_repair
-Version: 0.5.0
+Version: 0.6.0
 Summary: A package to repair broken json strings
 Author-email: Stefano Baccianella <4247706+mangiucugna@users.noreply.github.com>
 License: MIT License

{json_repair-0.5.0 → json_repair-0.6.0}/pyproject.toml RENAMED Viewed

@@ -3,7 +3,7 @@ requires = ["setuptools>=61.0"]
 build-backend = "setuptools.build_meta"
 [project]
 name = "json_repair"
-version = "0.5.0"
+version = "0.6.0"
 license = {file = "LICENSE"}
 authors = [
   { name="Stefano Baccianella", email="4247706+mangiucugna@users.noreply.github.com" },

{json_repair-0.5.0 → json_repair-0.6.0}/src/json_repair/json_repair.py RENAMED Viewed

@@ -111,6 +111,11 @@ class JSONParser:
                     use_single_quotes=(self.json_str[self.index] == "'")
                 )
+                # This can happen sometimes like { "": "value" }
+                if key == "" and self.get_char_at() == ":":
+                    key = "empty_placeholder"
+                    break
             # We reached the end here
             if key == "}":
                 continue
@@ -197,6 +202,7 @@ class JSONParser:
         # * It iterated over the entire sequence
         # * If we are fixing missing quotes in an object, when it finds the special terminators
         char = self.get_char_at()
+        fix_broken_markdown_link = False
         while char and char != string_terminator:
             if fixed_quotes:
                 if self.context == "object_key" and (char == ":" or char.isspace()):
@@ -205,6 +211,17 @@ class JSONParser:
                     break
             self.index += 1
             char = self.get_char_at()
+            # ChatGPT sometimes forget to quote links in markdown like: { "content": "[LINK]("https://google.com")" }
+            if char == string_terminator and (
+                fix_broken_markdown_link
+                or (
+                    self.index - 2 > 0
+                    and self.json_str[self.index - 2 : self.index] == "]("
+                )
+            ):
+                fix_broken_markdown_link = not fix_broken_markdown_link
+                self.index += 1
+                char = self.get_char_at()
         if char and fixed_quotes and self.context == "object_key" and char.isspace():
             self.skip_whitespaces_at()

{json_repair-0.5.0 → json_repair-0.6.0/src/json_repair.egg-info}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.1
 Name: json_repair
-Version: 0.5.0
+Version: 0.6.0
 Summary: A package to repair broken json strings
 Author-email: Stefano Baccianella <4247706+mangiucugna@users.noreply.github.com>
 License: MIT License

{json_repair-0.5.0 → json_repair-0.6.0}/tests/test_json_repair.py RENAMED Viewed

@@ -49,6 +49,8 @@ def test_repair_json():
     assert repair_json("{") == "{}"
     assert repair_json('{"') == '{"": ""}'
     assert repair_json('["') == '[]'
+    assert repair_json("'\"'") == '"\\\""'
+    assert repair_json("'string\"") == '"string\\\""'
     assert repair_json('{foo: [}') == '{"foo": []}'
     assert repair_json('{"key": "value:value"}') == '{"key": "value:value"}'
     assert (
@@ -79,6 +81,15 @@ def test_repair_json():
     }
     # Test with garbage comments
     assert repair_json('{"value_1": true, SHOULD_NOT_EXIST "value_2": "data" AAAA }') == '{"value_1": true, "value_2": "data"}'
+    assert {
+        repair_json('{"" : true, "key2": "value2"}') == '{" ": true, "key2": "value_2"}'
+    }
+    assert {
+        repair_json('{"": true, "key2": "value2"}') == '{"empty_placeholder": true, "key2": "value_2"}'
+    }
+    #Test markdown stupidities from ChatGPT
+    assert repair_json('{ "content": "[LINK]("https://google.com")" }') == '{"content": "[LINK](\\"https://google.com\\")"}'
@@ -137,6 +148,9 @@ def test_repair_json_with_objects():
     #Test with garbage comments
     assert repair_json('{"value_1": true, SHOULD_NOT_EXIST "value_2": "data" AAAA }', True) == {'value_1': True, 'value_2': 'data'}
+    #Test markdown stupidities from ChatGPT
+    assert repair_json('{ "content": "[LINK]("https://google.com")" }', True) == { "content": "[LINK](\"https://google.com\")"}
 def test_repair_json_corner_cases_generate_by_gpt():
     # Test with nested JSON

{json_repair-0.5.0 → json_repair-0.6.0}/tests/test_performance.py RENAMED Viewed

@@ -282,7 +282,7 @@ def test_true_true(benchmark):
   mean_time = benchmark.stats.get("median")
   # Define your time threshold in seconds (100ms in this case)
-  max_time = 1 / 10 ** 6  # 1 microsecond
+  max_time = 1.1 / 10 ** 6  # 1.1 microsecond
   # Assert that the average time is below the threshold
   assert mean_time < max_time, f"Benchmark exceeded threshold: {mean_time:.3f}s > {max_time:.3f}s"
@@ -293,7 +293,7 @@ def test_true_false(benchmark):
   mean_time = benchmark.stats.get("median")
   # Define your time threshold in seconds (100ms in this case)
-  max_time = 160 * (1 / 10 ** 6)  # 160 microsecond
+  max_time = 180 * (1 / 10 ** 6)  # 180 microsecond
   # Assert that the average time is below the threshold
   assert mean_time < max_time, f"Benchmark exceeded threshold: {mean_time:.3f}s > {max_time:.3f}s"
@@ -304,7 +304,7 @@ def test_false_true(benchmark):
   mean_time = benchmark.stats.get("median")
   # Define your time threshold in seconds (ms in this case)
-  max_time = 0.9 / 10 ** 3  # 0.9 millisecond
+  max_time = 1 / 10 ** 3  # 1 millisecond
   # Assert that the average time is below the threshold
   assert mean_time < max_time, f"Benchmark exceeded threshold: {mean_time:.3f}s > {max_time:.3f}s"
@@ -315,7 +315,7 @@ def test_false_false(benchmark):
   mean_time = benchmark.stats.get("median")
   # Define your time threshold in seconds (100ms in this case)
-  max_time = 190 * (1 / 10 ** 6)  # 190 microsecond
+  max_time = 210 * (1 / 10 ** 6)  # 210 microsecond
   # Assert that the average time is below the threshold
   assert mean_time < max_time, f"Benchmark exceeded threshold: {mean_time:.3f}s > {max_time:.3f}s"

{json_repair-0.5.0 → json_repair-0.6.0}/LICENSE RENAMED Viewed

File without changes

{json_repair-0.5.0 → json_repair-0.6.0}/README.md RENAMED Viewed

File without changes

{json_repair-0.5.0 → json_repair-0.6.0}/setup.cfg RENAMED Viewed

File without changes

{json_repair-0.5.0 → json_repair-0.6.0}/src/json_repair/__init__.py RENAMED Viewed

File without changes

{json_repair-0.5.0 → json_repair-0.6.0}/src/json_repair.egg-info/SOURCES.txt RENAMED Viewed

File without changes

{json_repair-0.5.0 → json_repair-0.6.0}/src/json_repair.egg-info/dependency_links.txt RENAMED Viewed

File without changes

{json_repair-0.5.0 → json_repair-0.6.0}/src/json_repair.egg-info/top_level.txt RENAMED Viewed

File without changes

json-repair 0.5.0__tar.gz → 0.6.0__tar.gz

json-repair 0.5.0__tar.gz → 0.6.0__tar.gz