PyPI - csv-detective - Versions diffs - 0.10.4.dev1__py3-none-any.whl → 0.10.12674__py3-none-any.whl - Mend

csv-detective 0.10.4.dev1__py3-none-any.whl → 0.10.12674__py3-none-any.whl

This diff compares the contents of two publicly available versions of a package, as released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those versions as they appear in the public registry.

Files changed (103)

csv_detective/detection/__init__.py +0 -0
csv_detective/detection/columns.py +0 -0
csv_detective/detection/encoding.py +0 -0
csv_detective/detection/engine.py +0 -0
csv_detective/detection/formats.py +0 -2
csv_detective/detection/headers.py +14 -12
csv_detective/detection/rows.py +1 -1
csv_detective/detection/separator.py +0 -0
csv_detective/detection/variables.py +0 -0
csv_detective/explore_csv.py +4 -15
csv_detective/format.py +1 -1
csv_detective/formats/__init__.py +0 -0
csv_detective/formats/adresse.py +0 -0
csv_detective/formats/binary.py +0 -0
csv_detective/formats/booleen.py +0 -0
csv_detective/formats/code_commune_insee.py +0 -0
csv_detective/formats/code_csp_insee.py +0 -0
csv_detective/formats/code_departement.py +0 -0
csv_detective/formats/code_fantoir.py +0 -0
csv_detective/formats/code_import.py +0 -0
csv_detective/formats/code_postal.py +0 -0
csv_detective/formats/code_region.py +0 -0
csv_detective/formats/code_rna.py +0 -0
csv_detective/formats/code_waldec.py +0 -0
csv_detective/formats/commune.py +0 -0
csv_detective/formats/csp_insee.py +0 -0
csv_detective/formats/date.py +1 -10
csv_detective/formats/date_fr.py +0 -0
csv_detective/formats/datetime_aware.py +0 -0
csv_detective/formats/datetime_naive.py +0 -0
csv_detective/formats/datetime_rfc822.py +0 -0
csv_detective/formats/departement.py +0 -0
csv_detective/formats/email.py +0 -0
csv_detective/formats/float.py +0 -0
csv_detective/formats/geojson.py +0 -0
csv_detective/formats/insee_ape700.py +0 -0
csv_detective/formats/insee_canton.py +0 -0
csv_detective/formats/int.py +0 -0
csv_detective/formats/iso_country_code_alpha2.py +0 -0
csv_detective/formats/iso_country_code_alpha3.py +0 -0
csv_detective/formats/iso_country_code_numeric.py +0 -0
csv_detective/formats/jour_de_la_semaine.py +0 -0
csv_detective/formats/json.py +0 -0
csv_detective/formats/latitude_l93.py +0 -0
csv_detective/formats/latitude_wgs.py +0 -0
csv_detective/formats/latitude_wgs_fr_metropole.py +0 -0
csv_detective/formats/latlon_wgs.py +0 -0
csv_detective/formats/longitude_l93.py +0 -0
csv_detective/formats/longitude_wgs.py +0 -0
csv_detective/formats/longitude_wgs_fr_metropole.py +0 -0
csv_detective/formats/lonlat_wgs.py +0 -0
csv_detective/formats/mois_de_lannee.py +0 -0
csv_detective/formats/money.py +0 -0
csv_detective/formats/mongo_object_id.py +0 -0
csv_detective/formats/pays.py +0 -0
csv_detective/formats/percent.py +0 -0
csv_detective/formats/region.py +0 -0
csv_detective/formats/sexe.py +0 -0
csv_detective/formats/siren.py +0 -0
csv_detective/formats/siret.py +0 -0
csv_detective/formats/tel_fr.py +0 -0
csv_detective/formats/uai.py +0 -0
csv_detective/formats/url.py +0 -0
csv_detective/formats/username.py +0 -0
csv_detective/formats/uuid.py +0 -0
csv_detective/formats/year.py +0 -0
csv_detective/output/__init__.py +0 -0
csv_detective/output/dataframe.py +2 -2
csv_detective/output/example.py +0 -0
csv_detective/output/profile.py +1 -1
csv_detective/output/schema.py +0 -0
csv_detective/output/utils.py +0 -0
csv_detective/parsing/__init__.py +0 -0
csv_detective/parsing/columns.py +5 -9
csv_detective/parsing/compression.py +0 -0
csv_detective/parsing/csv.py +0 -0
csv_detective/parsing/excel.py +1 -1
csv_detective/parsing/load.py +12 -11
csv_detective/validate.py +36 -71
{csv_detective-0.10.4.dev1.dist-info → csv_detective-0.10.12674.dist-info}/METADATA +18 -15
{csv_detective-0.10.4.dev1.dist-info → csv_detective-0.10.12674.dist-info}/RECORD +22 -41
csv_detective-0.10.12674.dist-info/WHEEL +4 -0
{csv_detective-0.10.4.dev1.dist-info → csv_detective-0.10.12674.dist-info}/entry_points.txt +1 -0
csv_detective-0.10.4.dev1.dist-info/WHEEL +0 -5
csv_detective-0.10.4.dev1.dist-info/licenses/LICENSE +0 -21
csv_detective-0.10.4.dev1.dist-info/top_level.txt +0 -3
tests/__init__.py +0 -0
tests/data/a_test_file.csv +0 -407
tests/data/a_test_file.json +0 -394
tests/data/b_test_file.csv +0 -7
tests/data/c_test_file.csv +0 -2
tests/data/csv_file +0 -7
tests/data/file.csv.gz +0 -0
tests/data/file.ods +0 -0
tests/data/file.xls +0 -0
tests/data/file.xlsx +0 -0
tests/data/xlsx_file +0 -0
tests/test_example.py +0 -67
tests/test_fields.py +0 -175
tests/test_file.py +0 -469
tests/test_labels.py +0 -26
tests/test_structure.py +0 -45
tests/test_validation.py +0 -163

csv_detective/validate.py CHANGED Viewed

@@ -1,13 +1,10 @@
 import logging
-from collections import defaultdict
 import pandas as pd
 from csv_detective.format import FormatsManager
 from csv_detective.parsing.columns import MAX_NUMBER_CATEGORICAL_VALUES, test_col_val
-# VALIDATION_CHUNK_SIZE is bigger than (analysis) CHUNK_SIZE because
-# it's faster to validate so we can afford to load more rows
 VALIDATION_CHUNK_SIZE = int(1e5)
 logging.basicConfig(level=logging.INFO)
@@ -19,9 +16,9 @@ def validate(
     previous_analysis: dict,
     verbose: bool = False,
     skipna: bool = True,
-) -> tuple[bool, dict | None, dict[str, pd.Series] | None]:
+) -> tuple[bool, pd.DataFrame | None, dict | None, dict[str, pd.Series] | None]:
     """
-    Verify is the given file has the same fields and formats as in the given analysis.
+    Verify is the given file has the same fields and types as in the given analysis.
     Args:
         file_path: the path of the file to validate
@@ -29,15 +26,6 @@ def validate(
         verbose: whether the code displays the steps it's going through
         skipna: whether to ignore NaN values in the checks
     """
-    if verbose:
-        logging.info(f"Checking given formats exist")
-    for col_name, detected in previous_analysis["columns"].items():
-        if detected["format"] == "string":
-            continue
-        elif detected["format"] not in formats:
-            if verbose:
-                logging.warning(f"> Unknown format `{detected['format']}` in analysis")
-            return False, None, None
     try:
         if previous_analysis.get("separator"):
             # loading the table in chunks
@@ -70,94 +58,71 @@ def validate(
                 ]
             )
             analysis = {k: v for k, v in previous_analysis.items() if k in ["engine", "sheet_name"]}
+        first_chunk = next(chunks)
         analysis.update(
             {k: v for k, v in previous_analysis.items() if k in ["header_row_idx", "header"]}
         )
     except Exception as e:
         if verbose:
             logging.warning(f"> Could not load the file with previous analysis values: {e}")
-        return False, None, None
+        return False, None, None, None
     if verbose:
         logging.info("Comparing table with the previous analysis")
+        logging.info("- Checking if all columns match")
+    if len(first_chunk.columns) != len(previous_analysis["header"]) or any(
+        list(first_chunk.columns)[k] != previous_analysis["header"][k]
+        for k in range(len(previous_analysis["header"]))
+    ):
+        if verbose:
+            logging.warning("> Columns do not match, proceeding with full analysis")
+        return False, None, None, None
+    if verbose:
         logging.info(
             f"Testing previously detected formats on chunks of {VALIDATION_CHUNK_SIZE} rows"
         )
-    # will contain hashes of each row of the file as index and the number of times
-    # each hash was seen as values; used to compute nb_duplicates
-    row_hashes_count = pd.Series()
-    # will contain the number of times each value of each column is seen in the whole file
-    # used for profile to read the file only once
-    # naming it "count" to be iso with how col_values are made in detect_formats
-    col_values: defaultdict[str, pd.Series] = defaultdict(lambda: pd.Series(name="count"))
+    # hashing rows to get nb_duplicates
+    row_hashes_count = pd.util.hash_pandas_object(first_chunk, index=False).value_counts()
+    # getting values for profile to read the file only once
+    col_values = {col: first_chunk[col].value_counts(dropna=False) for col in first_chunk.columns}
     analysis["total_lines"] = 0
-    checked_values: dict[str, int] = {col_name: 0 for col_name in previous_analysis["columns"]}
-    valid_values: dict[str, int] = {col_name: 0 for col_name in previous_analysis["columns"]}
-    for idx, chunk in enumerate(chunks):
+    for idx, chunk in enumerate([first_chunk, *chunks]):
         if verbose:
-            logging.info(f"- Testing chunk number {idx}")
-        if idx == 0:
-            if verbose:
-                logging.info("Checking if all columns match")
-            if len(chunk.columns) != len(previous_analysis["header"]) or any(
-                list(chunk.columns)[k] != previous_analysis["header"][k]
-                for k in range(len(previous_analysis["header"]))
-            ):
-                if verbose:
-                    logging.warning("> Columns in the file do not match those of the analysis")
-                return False, None, None
+            logging.info(f"> Testing chunk number {idx}")
         analysis["total_lines"] += len(chunk)
         row_hashes_count = row_hashes_count.add(
             pd.util.hash_pandas_object(chunk, index=False).value_counts(),
             fill_value=0,
         )
-        for col_name, detected in previous_analysis["columns"].items():
+        for col in chunk.columns:
+            col_values[col] = col_values[col].add(
+                chunk[col].value_counts(dropna=False),
+                fill_value=0,
+            )
+        for col_name, args in previous_analysis["columns"].items():
             if verbose:
-                logging.info(f"- Testing {col_name} for {detected['format']}")
-            if detected["format"] == "string":
+                logging.info(f"- Testing {col_name} for {args['format']}")
+            if args["format"] == "string":
                 # no test for columns that have not been recognized as a specific format
                 continue
-            to_check = chunk[col_name].dropna() if skipna else chunk[col_name]
-            chunk_valid_values = sum(to_check.apply(formats[detected["format"]].func))
-            if formats[detected["format"]].proportion == 1 and chunk_valid_values < len(to_check):
-                # we can early stop in this case, not all values are valid while we want 100%
+            test_result: float = test_col_val(
+                serie=chunk[col_name],
+                format=formats[args["format"]],
+                skipna=skipna,
+            )
+            if not bool(test_result):
                 if verbose:
-                    logging.warning(
-                        f"> Test failed for column {col_name} with format {detected['format']}"
-                    )
-                return False, None, None
-            checked_values[col_name] += len(to_check)
-            valid_values[col_name] += chunk_valid_values
-            col_values[col_name] = (
-                col_values[col_name]
-                .add(
-                    chunk[col_name].value_counts(dropna=False),
-                    fill_value=0,
-                )
-                .rename_axis(col_name)
-            )  # rename_axis because *sometimes* pandas doesn't pass on the column's name ¯\_(ツ)_/¯
-        del chunk
-    # finally we loop through the formats that accept less than 100% valid values to check the proportion
-    for col_name, detected in previous_analysis["columns"].items():
-        if (
-            checked_values[col_name] > 0
-            and valid_values[col_name] / checked_values[col_name]
-            < formats[detected["format"]].proportion
-        ):
-            if verbose:
-                logging.warning(
-                    f"> Test failed for column {col_name} with format {detected['format']}"
-                )
-            return False, None, None
+                    logging.warning("> Test failed, proceeding with full analysis")
+                return False, first_chunk, analysis, None
     if verbose:
         logging.info("> All checks successful")
     analysis["nb_duplicates"] = sum(row_hashes_count > 1)
-    del row_hashes_count
     analysis["categorical"] = [
         col for col, values in col_values.items() if len(values) <= MAX_NUMBER_CATEGORICAL_VALUES
     ]
     return (
         True,
+        first_chunk,
         analysis
         | {
             k: previous_analysis[k]

{csv_detective-0.10.4.dev1.dist-info → csv_detective-0.10.12674.dist-info}/METADATA RENAMED Viewed

@@ -1,29 +1,32 @@
-Metadata-Version: 2.4
+Metadata-Version: 2.3
 Name: csv-detective
-Version: 0.10.4.dev1
+Version: 0.10.12674
 Summary: Detect tabular files column content
-Author-email: "data.gouv.fr" <opendatateam@data.gouv.fr>
-License: MIT
-Project-URL: Source, https://github.com/datagouv/csv-detective
 Keywords: CSV,data processing,encoding,guess,parser,tabular
-Requires-Python: <3.15,>=3.10
-Description-Content-Type: text/markdown
-License-File: LICENSE
-Requires-Dist: dateparser<2,>=1.2.0
+Author: data.gouv.fr
+Author-email: data.gouv.fr <opendatateam@data.gouv.fr>
+License: MIT
+Requires-Dist: dateparser>=1.2.0,<2
 Requires-Dist: faust-cchardet==2.1.19
-Requires-Dist: pandas<3,>=2.2.0
-Requires-Dist: python-dateutil<3,>=2.8.2
-Requires-Dist: Unidecode<2,>=1.3.6
+Requires-Dist: pandas>=2.2.0,<3
+Requires-Dist: python-dateutil>=2.8.2,<3
+Requires-Dist: unidecode>=1.3.6,<2
 Requires-Dist: openpyxl>=3.1.5
 Requires-Dist: xlrd>=2.0.1
 Requires-Dist: odfpy>=1.4.1
-Requires-Dist: requests<3,>=2.32.3
+Requires-Dist: requests>=2.32.3,<3
 Requires-Dist: python-magic>=0.4.27
 Requires-Dist: frformat==0.4.0
-Requires-Dist: Faker>=33.0.0
+Requires-Dist: faker>=33.0.0
 Requires-Dist: rstr>=3.2.2
 Requires-Dist: more-itertools>=10.8.0
-Dynamic: license-file
+Requires-Dist: pytest>=8.3.0 ; extra == 'dev'
+Requires-Dist: responses>=0.25.0 ; extra == 'dev'
+Requires-Dist: ruff>=0.9.3 ; extra == 'dev'
+Requires-Python: >=3.10, <3.15
+Project-URL: Source, https://github.com/datagouv/csv-detective
+Provides-Extra: dev
+Description-Content-Type: text/markdown
 # CSV Detective

{csv_detective-0.10.4.dev1.dist-info → csv_detective-0.10.12674.dist-info}/RECORD RENAMED Viewed

@@ -1,18 +1,16 @@
 csv_detective/__init__.py,sha256=zlYElTOp_I2_VG7ZdOTuAu0wuCXSc0cr3sH6gtk2bcg,152
 csv_detective/cli.py,sha256=mu5anmBmaDk52_uZGiA4T37wYZCuV43gZAepjs1Cqzc,1389
-csv_detective/explore_csv.py,sha256=M8jabAP08raPY438v5UeBqJy3bBudTeuo-UNe2unWyE,7639
-csv_detective/format.py,sha256=VTdwg4gp9pq6WYhbkCxv9X2hXq0fMrzfooFchmIL0as,2911
-csv_detective/utils.py,sha256=RJ_zFOJ1DRY8HtDrKPiCdNk5gU6-KwOrOKOyfSkBZZY,1118
-csv_detective/validate.py,sha256=7k0GC5AsTn5BbsRChetZZDmnTGiYLe40qPKiP3GruYs,7495
 csv_detective/detection/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 csv_detective/detection/columns.py,sha256=_JtZHBr3aoEmSWh2xVe2ISnt-G7hpnA9vqlvcaGd0Go,2887
 csv_detective/detection/encoding.py,sha256=KZ8W8BPfZAq9UiP5wgaeupYa5INU8KPz98E2L3XpX2Y,999
 csv_detective/detection/engine.py,sha256=wQeDKpp2DKF-HcS1R8H6GgQyaUgQme4szPtEHgAjBII,1552
-csv_detective/detection/formats.py,sha256=cgECpxRaygwnedPhOteG1P_697qCoceeDrKK9G_O-u8,4812
-csv_detective/detection/headers.py,sha256=lnbWRxkI6rdyoWGtmxSfsPkqNjS0Nlpgw-pVevtmBP0,899
-csv_detective/detection/rows.py,sha256=JQsmKP8-i8wzcZIWI_13LUer5mpYRIqaKg6qW01ZO3A,750
+csv_detective/detection/formats.py,sha256=9aIE4gwTN8c8pa-kofeJ7zalo8NqjGZabYD-G79kV5I,4734
+csv_detective/detection/headers.py,sha256=95pTL524Sy5PGxyQ03ofFUaamvlmkxTJQe8u6HfzOkU,1051
+csv_detective/detection/rows.py,sha256=quf3ZTTFPOo09H-faZ9cRKibb1QGHEKHlpivFRx2Va4,742
 csv_detective/detection/separator.py,sha256=XjeDBqhiBxVfkCPJKem9BAgJqs_hOgQltc_pxrH_-Tg,1547
 csv_detective/detection/variables.py,sha256=-QtZOB96z3pWbqnZ-c1RU3yzoYqcO61A0JzeS6JbkxY,3576
+csv_detective/explore_csv.py,sha256=qSf6N3tbp43BUMJF5wiXz3aYKaTez6ro-75KL2Arci4,7174
+csv_detective/format.py,sha256=VglcxWBmjTvWNMhwSUZDfMdJcK9lAUum64Jxvm70AJ4,2898
 csv_detective/formats/__init__.py,sha256=Egiy29kcG3Oz2eE2maYhD3wP29zOSOWyRlOpGD5LGvU,318
 csv_detective/formats/adresse.py,sha256=79tIXeC1AUjUG9m0XGZUcP_BXvmLgd1M8XVfxgLNGDE,1966
 csv_detective/formats/binary.py,sha256=26qrbqv_Dqu0LhVPpQOz2xzglxse7Nz5EasbQ0xP38c,715
@@ -28,7 +26,12 @@ csv_detective/formats/code_rna.py,sha256=o6Kptrux6T2bSnWHi7MBCqIfVKbMMeN4dHlxxzk
 csv_detective/formats/code_waldec.py,sha256=j4-xpj_73c7IdgLoZJY_kRVj3HkpB7RFfGPN4NwPmVo,303
 csv_detective/formats/commune.py,sha256=QVscVy5Ij9kdzKJgIG2aFC_v1IRsov5M9Zkj_SHDWgs,541
 csv_detective/formats/csp_insee.py,sha256=y1w9zPQvijQi5v1Cuye0aX87ZVDC4FeFx1YC0dLqqp8,688
-csv_detective/formats/date.py,sha256=caMMvcqkbON8Cxp9oDYZsfmkSXuu-PiiJi8YUbypBso,3167
+csv_detective/formats/data/csp_insee.txt,sha256=kgKaKc-5PHu5U4--ugLjpFyMNtTU9CGdZ9ANU3YAsM4,32879
+csv_detective/formats/data/insee_ape700.txt,sha256=-_N-zAmcT7rK7ACRfsrM01Ton4_XtZGcNk-7lU28VHU,4397
+csv_detective/formats/data/iso_country_code_alpha2.txt,sha256=mLt_qcQ6D8hfy9zdi7fAK_zON1ojReKlKMA8c2VDoRU,752
+csv_detective/formats/data/iso_country_code_alpha3.txt,sha256=XFPdGBsyZCBg4D8IDn6VgwsycCwYVfuqPbyHfNeqGv0,1003
+csv_detective/formats/data/iso_country_code_numeric.txt,sha256=sdGpn0PqDMlc59-7prThkihHrf7mwB6j5uEHpxGvLFE,1003
+csv_detective/formats/date.py,sha256=Q6w1azLKNshJJVLOPBHj-77ZinXYMW_EKp_BGDshLLE,2802
 csv_detective/formats/date_fr.py,sha256=YnNXSgT6QekfTUJoS5yuRX8LeK-fmVDgLgVP9cP0e4M,505
 csv_detective/formats/datetime_aware.py,sha256=izKo6CA-MNIzmmM3Br4-FOESyqCS_YYK8N4V9D6CVEI,1909
 csv_detective/formats/datetime_naive.py,sha256=DZ0apAm3vIy4cdm5DynAeRueI_8rhuHYQtAOZ5yyZ5k,1681
@@ -68,44 +71,22 @@ csv_detective/formats/url.py,sha256=m3i_XhFRFaAxSACS05XfciQ-oyTCsP_0TASShCY2t7A,
 csv_detective/formats/username.py,sha256=6qviaFOtF2wg-gtvs0N8548JxFNE67Ue3a0JD0Kv7TQ,261
 csv_detective/formats/uuid.py,sha256=LxkRZFAOlfig5KKrravO9bgyYjmRBegzOtGyzjopVNc,352
 csv_detective/formats/year.py,sha256=tMc2HHr6Jga3PGWjmeHweK3G17DsjkIpIUUkCecXAm4,362
-csv_detective/formats/data/csp_insee.txt,sha256=kgKaKc-5PHu5U4--ugLjpFyMNtTU9CGdZ9ANU3YAsM4,32879
-csv_detective/formats/data/insee_ape700.txt,sha256=-_N-zAmcT7rK7ACRfsrM01Ton4_XtZGcNk-7lU28VHU,4397
-csv_detective/formats/data/iso_country_code_alpha2.txt,sha256=mLt_qcQ6D8hfy9zdi7fAK_zON1ojReKlKMA8c2VDoRU,752
-csv_detective/formats/data/iso_country_code_alpha3.txt,sha256=XFPdGBsyZCBg4D8IDn6VgwsycCwYVfuqPbyHfNeqGv0,1003
-csv_detective/formats/data/iso_country_code_numeric.txt,sha256=sdGpn0PqDMlc59-7prThkihHrf7mwB6j5uEHpxGvLFE,1003
 csv_detective/output/__init__.py,sha256=ALSq_tgX7rGyh--7rmbKz8wHkmResN0h7mNujndow3w,2103
-csv_detective/output/dataframe.py,sha256=juBMdj0eiL8c3OrJJ3kCf15Qs4-CFQfHqh91FnVbG9E,3656
+csv_detective/output/dataframe.py,sha256=QX5vplx0AOKgnwwJ6dKvDHWRX9IGPStax-svXEyweJ8,3584
 csv_detective/output/example.py,sha256=8LWheSBYCeDFfarbnmzBrdCbTd8Alh1U4pfXMKfabOw,8630
-csv_detective/output/profile.py,sha256=R9YMl-dANde69RXkFlZpvMDBsX7e1SyMAnlW8p1XNNM,4984
+csv_detective/output/profile.py,sha256=ADr5DwuvwcBYxugjN38fHm11l6ivfzGHXPd8a87Ht-s,4985
 csv_detective/output/schema.py,sha256=XoKljXPXP00DfqPCiz1ydwTHYGAFsvNxnaPCNBuuBIo,10443
 csv_detective/output/utils.py,sha256=tbji3dEH7bDc6gLCeVSVquqU3xaHA1CQOMuaJT4Hub8,3297
 csv_detective/parsing/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-csv_detective/parsing/columns.py,sha256=MFtEJFLsFdlKdM5AXtgXbf5p6HRW6DuOC4XnxhFMpIY,9344
+csv_detective/parsing/columns.py,sha256=rb5JywbKnYCT3Jb0ZaG1BnyPVtB3gy5mSD-K7qcOl8I,9257
 csv_detective/parsing/compression.py,sha256=Fnw5tj-PpBNI8NYsWj5gD-DUoWcVLnsVpiKm9MpxmIA,350
 csv_detective/parsing/csv.py,sha256=5rw6gXZFQC1T4NT9CnW0AumidrYOkF8kjrfWGmk949I,1716
-csv_detective/parsing/excel.py,sha256=pX6dbhAdAdbRpoGcrGsL1lSaF-fbzEb4WcvwcCGEgFw,6978
-csv_detective/parsing/load.py,sha256=1Fk43ikIOJwtWJUY-e8oNeNOk4MMtpmZV7s-VbQBS1k,4345
+csv_detective/parsing/excel.py,sha256=tb65I78tdYlZci_tzvvQt8U6bZSYKjeVdn2CEvsET1o,6972
+csv_detective/parsing/load.py,sha256=f-8aKiNpy_47qg4Lq-UZUR4NNrbJ_-KEGvcUQZ8cmb0,4317
 csv_detective/parsing/text.py,sha256=yDAcop5xJQc25UtbZcV0guHXAZQfm-H8WuJORTy8Rr8,1734
-csv_detective-0.10.4.dev1.dist-info/licenses/LICENSE,sha256=A1dQrzxyxRHRih02KwibWj1khQyF7GeA6SqdOU87Gk4,1088
-tests/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-tests/test_example.py,sha256=uTWswvUzBWEADGXZmMAdZvKhKvIjvT5zWOVVABgCDN4,1987
-tests/test_fields.py,sha256=DSI-ZXDcRt69iZArYZZAr_3OEb-qvwgOVBZxmYAKIkI,5918
-tests/test_file.py,sha256=Ov9NGvZQxeoehxTpfcsnwEybebM0tnbmcRsFwe46cjg,15277
-tests/test_labels.py,sha256=lgxRbLrGV1C-MkASf3KIQ120BG-UHzFQ4pqDWaeBvaw,539
-tests/test_structure.py,sha256=XDbviuuvk-0Mu9Y9PI6He2e5hry2dXVJ6yBVwEqF_2o,1043
-tests/test_validation.py,sha256=309k3Axgbp-1Wh6qvCj2BpeMBp3HXzLi5j9UKm1bRQs,5384
-tests/data/a_test_file.csv,sha256=SOHjseGYqZer9yu3Bd3oS12Vw8MFsebo0BzrLZ_R4Cc,68871
-tests/data/a_test_file.json,sha256=fB9bCpAMFPxFw8KxHRFlgRqjYG819QVGrCQWxQvwkvo,10542
-tests/data/b_test_file.csv,sha256=wJGX62KhYjZi62De2XjZWClAzeRFEBsg3ET0IPX1BNU,98
-tests/data/c_test_file.csv,sha256=dz6axMyFscHIWR2Brqia_jvlBfQ30l1rFrxvcTqsmJ8,36
-tests/data/csv_file,sha256=nMAQx2PrQliu3czifCHXLyruZbvCNTyYqwZ4JYzImqA,70
-tests/data/file.csv.gz,sha256=mfGfqG5mGlojCs05A0IF7IUZe5r87bAe2FuQ0Uh5ZMI,108
-tests/data/file.ods,sha256=4dR7zWptz5djALIBVeWHQ20GaZNfA63fevIJGFIk1_U,11832
-tests/data/file.xls,sha256=QYmNX3FF0QfcQSzYQMtaMJaepJf5EZpDa1miKc4wMdQ,21495
-tests/data/file.xlsx,sha256=naWzL02PK4pdIjMzfEyfSW9GQhkYYd_e7bpJvB8Pb2w,8314
-tests/data/xlsx_file,sha256=NyOyN_rIe7ryJuHQLqjxVdKCc8V4s5pxyHl6wWFykCM,8305
-csv_detective-0.10.4.dev1.dist-info/METADATA,sha256=le1Rn1JIh8MoIf_RTc3Fi9DOOlvug4eR-Mwpw4AK0To,10925
-csv_detective-0.10.4.dev1.dist-info/WHEEL,sha256=wUyA8OaulRlbfwMtmQsvNngGrxQHAvkKcvRmdizlJi0,92
-csv_detective-0.10.4.dev1.dist-info/entry_points.txt,sha256=JjweTReFqKJmuvkegzlew2j3D5pZzfxvbEGOtGVGmaY,56
-csv_detective-0.10.4.dev1.dist-info/top_level.txt,sha256=KDI4gyOpkmormGgUvSWrE3jen2e0unIsxR2b96DRvcw,25
-csv_detective-0.10.4.dev1.dist-info/RECORD,,
+csv_detective/utils.py,sha256=RJ_zFOJ1DRY8HtDrKPiCdNk5gU6-KwOrOKOyfSkBZZY,1118
+csv_detective/validate.py,sha256=CjZXhhDP-n6wGgEqbwrGRqebU8L5bidwnvQp-TbnvFA,5424
+csv_detective-0.10.12674.dist-info/WHEEL,sha256=XjEbIc5-wIORjWaafhI6vBtlxDBp7S9KiujWF1EM7Ak,79
+csv_detective-0.10.12674.dist-info/entry_points.txt,sha256=1J86TQNCanjsLMboAufdEUla03qEQaC9QmVGYgt2FCQ,57
+csv_detective-0.10.12674.dist-info/METADATA,sha256=TZIyuSI6QBmDeZoNZdYqarZ2R_GvaGazjB5WSkt8PFI,11060
+csv_detective-0.10.12674.dist-info/RECORD,,

csv_detective-0.10.12674.dist-info/WHEEL ADDED Viewed

@@ -0,0 +1,4 @@
+Wheel-Version: 1.0
+Generator: uv 0.9.25
+Root-Is-Purelib: true
+Tag: py3-none-any

{csv_detective-0.10.4.dev1.dist-info → csv_detective-0.10.12674.dist-info}/entry_points.txt RENAMED Viewed

@@ -1,2 +1,3 @@
 [console_scripts]
 csv_detective = csv_detective.cli:run

csv_detective-0.10.4.dev1.dist-info/WHEEL DELETED Viewed

@@ -1,5 +0,0 @@
-Wheel-Version: 1.0
-Generator: setuptools (80.10.2)
-Root-Is-Purelib: true
-Tag: py3-none-any

csv_detective-0.10.4.dev1.dist-info/licenses/LICENSE DELETED Viewed

@@ -1,21 +0,0 @@
-MIT License
-Copyright (c) 2025 data.gouv.fr
-Permission is hereby granted, free of charge, to any person obtaining a copy
-of this software and associated documentation files (the "Software"), to deal
-in the Software without restriction, including without limitation the rights
-to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
-copies of the Software, and to permit persons to whom the Software is
-furnished to do so, subject to the following conditions:
-The above copyright notice and this permission notice shall be included in all
-copies or substantial portions of the Software.
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
-AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
-OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
-SOFTWARE.

csv_detective-0.10.4.dev1.dist-info/top_level.txt DELETED Viewed

@@ -1,3 +0,0 @@
-csv_detective
-dist
-tests

tests/__init__.py DELETED Viewed

File without changes

csv-detective 0.10.4.dev1__py3-none-any.whl → 0.10.12674__py3-none-any.whl

csv-detective 0.10.4.dev1__py3-none-any.whl → 0.10.12674__py3-none-any.whl