PyPI - csv-detective - Versions diffs - 0.7.5.dev1277__py3-none-any.whl → 0.7.5.dev1298__py3-none-any.whl - Mend

csv-detective 0.7.5.dev1277__py3-none-any.whl → 0.7.5.dev1298__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (31) hide show

tests/test_file.py CHANGED Viewed

@@ -28,7 +28,7 @@ def test_columns_output_on_file():
         "STRUCTURED_INFO",
         "GEO_INFO",
     ]
-    assert output["total_lines"] == 414
+    assert output["total_lines"] == 404
     assert output["nb_duplicates"] == 7
     assert output["columns"]["NOMCOM"]["format"] == "commune"
     assert output["columns"]["NOMDEP"]["format"] == "departement"
@@ -48,7 +48,7 @@ def test_profile_output_on_file():
     )
     assert all(
         [
-            c in list(output["profile"]["NUMCOM"].keys())
+            c in list(output["profile"]["TXCOUVGLO_COM_2014"].keys())
             for c in [
                 "min",
                 "max",
@@ -60,12 +60,22 @@ def test_profile_output_on_file():
             ]
         ]
     )
-    assert len(output["profile"]["NOMCOM"].keys()) == 3
-    assert output["profile"]["NUMCOM"]["min"] == 1001
-    assert output["profile"]["NUMCOM"]["max"] == 6125
-    assert round(output["profile"]["NUMCOM"]["mean"]) == 1245
-    assert round(output["profile"]["NUMCOM"]["std"]) == 363
-    assert output["profile"]["TXCOUVGLO_COM_2014"]["nb_distinct"] == 296
+    assert not any(
+        [
+            c in list(output["profile"]["NUMCOM"].keys())
+            for c in [
+                    "min",
+                    "max",
+                    "mean",
+                    "std",
+            ]
+        ]
+    )
+    assert output["profile"]["TXCOUVGLO_COM_2014"]["min"] == 0.0
+    assert output["profile"]["TXCOUVGLO_COM_2014"]["max"] == 200.2
+    assert round(output["profile"]["TXCOUVGLO_COM_2014"]["mean"]) == 60
+    assert round(output["profile"]["TXCOUVGLO_COM_2014"]["std"]) == 36
+    assert output["profile"]["TXCOUVGLO_COM_2014"]["nb_distinct"] == 290
     assert output["profile"]["TXCOUVGLO_COM_2014"]["nb_missing_values"] == 3
     assert output["profile"]["GEO_INFO"]["nb_distinct"] == 1
@@ -175,7 +185,7 @@ def mocked_responses():
     "params",
     # ideally we'd like to do the same with params_others but pandas.read_excel uses urllib
     # which doesn't support the way we mock the response, TBC
-    params_csv + [("a_test_file.csv", {"separator": ";", "header_row_idx": 2, "total_lines": 414})]
+    params_csv + [("a_test_file.csv", {"separator": ";", "header_row_idx": 2, "total_lines": 404})]
 )
 def test_urls(mocked_responses, params):
     file_name, checks = params

tests/test_structure.py CHANGED Viewed

@@ -1,6 +1,7 @@
 import os
 # flake8: noqa
 from csv_detective import detect_fields, detect_labels
+from csv_detective.load_tests import return_all_tests
 def tests_conformity():
@@ -29,3 +30,8 @@ def tests_conformity():
                 .replace("/", ".")
             )
             assert "_is" in dir(_package)
+def test_all_tests_have_unique_name():
+    names = [t.__name__.split(".")[-1] for t in return_all_tests("ALL", "detect_fields")]
+    assert len(names) == len(set(names))

tests/test_validation.py ADDED Viewed

@@ -0,0 +1,18 @@
+import json
+import pandas as pd
+from csv_detective.validate import validate
+def test_validation():
+    with open("tests/data/a_test_file.json", "r") as f:
+        previous_analysis = json.load(f)
+    is_valid, table, analysis = validate(
+        "tests/data/a_test_file.csv",
+        previous_analysis=previous_analysis,
+        num_rows=-1,
+    )
+    assert is_valid is True
+    assert isinstance(table, pd.DataFrame)
+    assert isinstance(analysis, dict)

{csv_detective-0.7.5.dev1277.data → csv_detective-0.7.5.dev1298.data}/data/share/csv_detective/LICENSE.AGPL.txt RENAMED Viewed

File without changes

{csv_detective-0.7.5.dev1277.data → csv_detective-0.7.5.dev1298.data}/data/share/csv_detective/README.md RENAMED Viewed

File without changes

{csv_detective-0.7.5.dev1277.dist-info → csv_detective-0.7.5.dev1298.dist-info}/entry_points.txt RENAMED Viewed

File without changes

{csv_detective-0.7.5.dev1277.dist-info → csv_detective-0.7.5.dev1298.dist-info}/licenses/LICENSE.AGPL.txt RENAMED Viewed

File without changes

{csv_detective-0.7.5.dev1277.dist-info → csv_detective-0.7.5.dev1298.dist-info}/top_level.txt RENAMED Viewed

File without changes

csv-detective 0.7.5.dev1277__py3-none-any.whl → 0.7.5.dev1298__py3-none-any.whl

csv-detective 0.7.5.dev1277__py3-none-any.whl → 0.7.5.dev1298__py3-none-any.whl