PyPI - pointblank - Versions diffs - 0.13.4__py3-none-any.whl → 0.15.0__py3-none-any.whl - Mend

pointblank 0.13.4__py3-none-any.whl → 0.15.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (39) hide show

pointblank/__init__.py +4 -0
pointblank/_constants.py +117 -0
pointblank/_constants_translations.py +487 -2
pointblank/_interrogation.py +1065 -12
pointblank/_spec_utils.py +1015 -0
pointblank/_utils.py +17 -7
pointblank/_utils_ai.py +875 -0
pointblank/assistant.py +1 -1
pointblank/cli.py +128 -115
pointblank/column.py +1 -1
pointblank/data/api-docs.txt +1838 -130
pointblank/data/validations/README.md +108 -0
pointblank/data/validations/complex_preprocessing.json +54 -0
pointblank/data/validations/complex_preprocessing.pkl +0 -0
pointblank/data/validations/generate_test_files.py +127 -0
pointblank/data/validations/multiple_steps.json +83 -0
pointblank/data/validations/multiple_steps.pkl +0 -0
pointblank/data/validations/narwhals_function.json +28 -0
pointblank/data/validations/narwhals_function.pkl +0 -0
pointblank/data/validations/no_preprocessing.json +83 -0
pointblank/data/validations/no_preprocessing.pkl +0 -0
pointblank/data/validations/pandas_compatible.json +28 -0
pointblank/data/validations/pandas_compatible.pkl +0 -0
pointblank/data/validations/preprocessing_functions.py +46 -0
pointblank/data/validations/simple_preprocessing.json +57 -0
pointblank/data/validations/simple_preprocessing.pkl +0 -0
pointblank/datascan.py +4 -4
pointblank/draft.py +52 -3
pointblank/scan_profile.py +6 -6
pointblank/schema.py +8 -82
pointblank/thresholds.py +1 -1
pointblank/validate.py +3069 -437
{pointblank-0.13.4.dist-info → pointblank-0.15.0.dist-info}/METADATA +67 -8
pointblank-0.15.0.dist-info/RECORD +56 -0
pointblank-0.13.4.dist-info/RECORD +0 -39
{pointblank-0.13.4.dist-info → pointblank-0.15.0.dist-info}/WHEEL +0 -0
{pointblank-0.13.4.dist-info → pointblank-0.15.0.dist-info}/entry_points.txt +0 -0
{pointblank-0.13.4.dist-info → pointblank-0.15.0.dist-info}/licenses/LICENSE +0 -0
{pointblank-0.13.4.dist-info → pointblank-0.15.0.dist-info}/top_level.txt +0 -0

pointblank/_utils.py CHANGED Viewed

@@ -102,7 +102,7 @@ def _get_tbl_type(data: FrameT | Any) -> str:
                 if "read_parquet" in tbl_name:
                     return "parquet"
-            else:
+            else:  # pragma: no cover
                 return "duckdb"
         return backend
@@ -274,10 +274,10 @@ def _copy_dataframe(df):
         import copy
         return copy.deepcopy(df)
-    except Exception:
+    except Exception:  # pragma: no cover
         # If all else fails, return the original DataFrame
         # This is better than crashing the validation
-        return df
+        return df  # pragma: no cover
 def _convert_to_narwhals(df: FrameT) -> nw.DataFrame:
@@ -670,18 +670,23 @@ def _get_api_text() -> str:
         "Validate.col_vals_outside",
         "Validate.col_vals_in_set",
         "Validate.col_vals_not_in_set",
+        "Validate.col_vals_increasing",
+        "Validate.col_vals_decreasing",
         "Validate.col_vals_null",
         "Validate.col_vals_not_null",
         "Validate.col_vals_regex",
+        "Validate.col_vals_within_spec",
         "Validate.col_vals_expr",
-        "Validate.col_exists",
         "Validate.rows_distinct",
         "Validate.rows_complete",
+        "Validate.col_exists",
         "Validate.col_schema_match",
         "Validate.row_count_match",
         "Validate.col_count_match",
+        "Validate.tbl_match",
         "Validate.conjointly",
         "Validate.specially",
+        "Validate.prompt",
     ]
     column_selection_exported = [
@@ -702,6 +707,7 @@ def _get_api_text() -> str:
     interrogation_exported = [
         "Validate.interrogate",
+        "Validate.set_tbl",
         "Validate.get_tabular_report",
         "Validate.get_step_report",
         "Validate.get_json_report",
@@ -735,6 +741,7 @@ def _get_api_text() -> str:
     yaml_exported = [
         "yaml_interrogate",
         "validate_yaml",
+        "yaml_to_python",
     ]
     utility_exported = [
@@ -742,6 +749,8 @@ def _get_api_text() -> str:
         "get_row_count",
         "get_action_metadata",
         "get_validation_summary",
+        "write_file",
+        "read_file",
         "config",
     ]
@@ -786,9 +795,10 @@ datasets included in the package can be accessed via the `load_dataset()` functi
 the `assistant()` function to get help with Pointblank."""
     yaml_desc = """The *YAML* group contains functions that allow for the use of YAML to orchestrate
-validation workflows. The `yaml_interrogate()` function can be used to run a validation workflow from
-YAML strings or files. The `validate_yaml()` function checks if the YAML configuration
-passes its own validity checks."""
+validation workflows. The `yaml_interrogate()` function can be used to run a validation workflow
+from YAML strings or files. The `validate_yaml()` function checks if the YAML configuration passes
+its own validity checks. The `yaml_to_python()` function converts YAML configuration to equivalent
+Python code."""
     utility_desc = """The Utility Functions group contains functions that are useful for accessing
 metadata about the target data. Use `get_column_count()` or `get_row_count()` to get the number of

pointblank 0.13.4__py3-none-any.whl → 0.15.0__py3-none-any.whl

pointblank 0.13.4__py3-none-any.whl → 0.15.0__py3-none-any.whl