PyPI - csv-detective - Versions diffs - 0.7.5.dev1307__py3-none-any.whl → 0.7.5.dev1330__py3-none-any.whl - Mend

csv-detective 0.7.5.dev1307__py3-none-any.whl → 0.7.5.dev1330__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (68) hide show

tests/test_validation.py CHANGED Viewed

@@ -1,18 +1,99 @@
 import json
 import pandas as pd
+import pytest
+from csv_detective.explore_csv import validate_then_detect
 from csv_detective.validate import validate
-def test_validation():
+def set_nested_value(source_dict: dict, key_chain: list[str], value):
+    current_dict = source_dict
+    for key in key_chain[:-1]:
+        if key not in current_dict:
+            current_dict[key] = {}
+        current_dict = current_dict[key]
+    current_dict[key_chain[-1]] = value
+def get_nested_value(source_dict: dict, key_chain: list[str]):
+    result = source_dict
+    for k in key_chain:
+        result = result[k]
+    return result
+@pytest.mark.parametrize(
+    "_params",
+    (
+        ((True, pd.DataFrame, dict), {}),
+        ((False, None, None), {"separator": "|"}),
+        ((False, None, None), {"encoding": "unknown"}),
+        ((False, None, None), {"header": ["a", "b"]}),
+        ((False, pd.DataFrame, dict), {
+            "columns.NUMCOM": {
+                "python_type": "int",
+                "format": "int",
+                "score": 1.0,
+            },
+        }),
+    ),
+)
+def test_validation(_params):
+    (should_be_valid, table_type, analysis_type), modif_previous_analysis = _params
     with open("tests/data/a_test_file.json", "r") as f:
         previous_analysis = json.load(f)
+    for dotkey in modif_previous_analysis:
+        keys = dotkey.split(".")
+        set_nested_value(previous_analysis, keys, modif_previous_analysis[dotkey])
     is_valid, table, analysis = validate(
         "tests/data/a_test_file.csv",
         previous_analysis=previous_analysis,
         num_rows=-1,
+        sep=previous_analysis.get("separator"),
+        encoding=previous_analysis.get("encoding"),
+    )
+    assert is_valid == should_be_valid
+    if table_type is None:
+        assert table is None
+    else:
+        assert isinstance(table, table_type)
+    if analysis_type is None:
+        assert analysis is None
+    else:
+        assert isinstance(analysis, analysis_type)
+@pytest.mark.parametrize(
+    "modif_previous_analysis",
+    (
+        {"separator": "|"},
+        {"encoding": "unknown"},
+        {"header": ["a", "b"]},
+        {
+            "columns.NUMCOM": {
+                "python_type": "int",
+                "format": "int",
+                "score": 1.0,
+            },
+        },
+    ),
+)
+def test_validate_then_detect(modif_previous_analysis):
+    with open("tests/data/a_test_file.json", "r") as f:
+        previous_analysis = json.load(f)
+    valid_values = {}
+    for dotkey in modif_previous_analysis:
+        keys = dotkey.split(".")
+        valid_values[dotkey] = get_nested_value(previous_analysis, keys)
+        set_nested_value(previous_analysis, keys, modif_previous_analysis[dotkey])
+    analysis = validate_then_detect(
+        "tests/data/a_test_file.csv",
+        previous_analysis=previous_analysis,
+        num_rows=-1,
+        output_profile=True,
+        save_results=False,
     )
-    assert is_valid is True
-    assert isinstance(table, pd.DataFrame)
-    assert isinstance(analysis, dict)
+    # checking that if not valid, the analysis has managed to retrieve the right values
+    for dotkey in modif_previous_analysis:
+        assert get_nested_value(analysis, dotkey.split(".")) == valid_values[dotkey]

{csv_detective-0.7.5.dev1307.data → csv_detective-0.7.5.dev1330.data}/data/share/csv_detective/LICENSE.AGPL.txt RENAMED Viewed

File without changes

{csv_detective-0.7.5.dev1307.data → csv_detective-0.7.5.dev1330.data}/data/share/csv_detective/README.md RENAMED Viewed

File without changes

{csv_detective-0.7.5.dev1307.dist-info → csv_detective-0.7.5.dev1330.dist-info}/entry_points.txt RENAMED Viewed

File without changes

{csv_detective-0.7.5.dev1307.dist-info → csv_detective-0.7.5.dev1330.dist-info}/licenses/LICENSE.AGPL.txt RENAMED Viewed

File without changes

{csv_detective-0.7.5.dev1307.dist-info → csv_detective-0.7.5.dev1330.dist-info}/top_level.txt RENAMED Viewed

File without changes

csv-detective 0.7.5.dev1307__py3-none-any.whl → 0.7.5.dev1330__py3-none-any.whl

csv-detective 0.7.5.dev1307__py3-none-any.whl → 0.7.5.dev1330__py3-none-any.whl