data-sitter 0.1.1__tar.gz → 0.1.3__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (32)
  1. {data_sitter-0.1.1 → data_sitter-0.1.3}/PKG-INFO +1 -1
  2. {data_sitter-0.1.1 → data_sitter-0.1.3}/README.md +1 -1
  3. {data_sitter-0.1.1 → data_sitter-0.1.3}/data_sitter/Contract.py +9 -4
  4. {data_sitter-0.1.1 → data_sitter-0.1.3}/data_sitter/FieldResolver.py +2 -1
  5. data_sitter-0.1.3/data_sitter/Validation.py +30 -0
  6. {data_sitter-0.1.1 → data_sitter-0.1.3}/data_sitter/cli.py +1 -1
  7. {data_sitter-0.1.1 → data_sitter-0.1.3}/data_sitter/field_types/BaseField.py +12 -5
  8. {data_sitter-0.1.1 → data_sitter-0.1.3}/data_sitter.egg-info/PKG-INFO +1 -1
  9. {data_sitter-0.1.1 → data_sitter-0.1.3}/data_sitter.egg-info/SOURCES.txt +1 -0
  10. {data_sitter-0.1.1 → data_sitter-0.1.3}/pyproject.toml +1 -1
  11. {data_sitter-0.1.1 → data_sitter-0.1.3}/setup.py +1 -1
  12. {data_sitter-0.1.1 → data_sitter-0.1.3}/data_sitter/__init__.py +0 -0
  13. {data_sitter-0.1.1 → data_sitter-0.1.3}/data_sitter/field_types/FloatField.py +0 -0
  14. {data_sitter-0.1.1 → data_sitter-0.1.3}/data_sitter/field_types/IntegerField.py +0 -0
  15. {data_sitter-0.1.1 → data_sitter-0.1.3}/data_sitter/field_types/NumericField.py +0 -0
  16. {data_sitter-0.1.1 → data_sitter-0.1.3}/data_sitter/field_types/StringField.py +0 -0
  17. {data_sitter-0.1.1 → data_sitter-0.1.3}/data_sitter/field_types/__init__.py +0 -0
  18. {data_sitter-0.1.1 → data_sitter-0.1.3}/data_sitter/rules/MatchedRule.py +0 -0
  19. {data_sitter-0.1.1 → data_sitter-0.1.3}/data_sitter/rules/Parser/RuleParser.py +0 -0
  20. {data_sitter-0.1.1 → data_sitter-0.1.3}/data_sitter/rules/Parser/__init__.py +0 -0
  21. {data_sitter-0.1.1 → data_sitter-0.1.3}/data_sitter/rules/Parser/alias_parameters_parser.py +0 -0
  22. {data_sitter-0.1.1 → data_sitter-0.1.3}/data_sitter/rules/Parser/parser_utils.py +0 -0
  23. {data_sitter-0.1.1 → data_sitter-0.1.3}/data_sitter/rules/Rule.py +0 -0
  24. {data_sitter-0.1.1 → data_sitter-0.1.3}/data_sitter/rules/RuleRegistry.py +0 -0
  25. {data_sitter-0.1.1 → data_sitter-0.1.3}/data_sitter/rules/__init__.py +0 -0
  26. {data_sitter-0.1.1 → data_sitter-0.1.3}/data_sitter/utils/__init__.py +0 -0
  27. {data_sitter-0.1.1 → data_sitter-0.1.3}/data_sitter/utils/logger_config.py +0 -0
  28. {data_sitter-0.1.1 → data_sitter-0.1.3}/data_sitter.egg-info/dependency_links.txt +0 -0
  29. {data_sitter-0.1.1 → data_sitter-0.1.3}/data_sitter.egg-info/entry_points.txt +0 -0
  30. {data_sitter-0.1.1 → data_sitter-0.1.3}/data_sitter.egg-info/requires.txt +0 -0
  31. {data_sitter-0.1.1 → data_sitter-0.1.3}/data_sitter.egg-info/top_level.txt +0 -0
  32. {data_sitter-0.1.1 → data_sitter-0.1.3}/setup.cfg +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.2
2
2
  Name: data-sitter
3
- Version: 0.1.1
3
+ Version: 0.1.3
4
4
  Summary: A Python library that reads data contracts and generates Pydantic models for seamless data validation.
5
5
  Author-email: Lázaro Pereira Candea <lazaro@candea.es>
6
6
  Requires-Dist: python-dotenv==1.0.1
@@ -48,7 +48,7 @@ contract_dict = {
48
48
  }
49
49
 
50
50
  contract = Contract.from_dict(contract_dict)
51
- pydantic_contract = contract.get_pydantic_model()
51
+ pydantic_contract = contract.pydantic_model
52
52
  ```
53
53
 
54
54
  ### Using Rule References
@@ -3,6 +3,7 @@ from functools import cached_property
3
3
 
4
4
  from pydantic import BaseModel
5
5
 
6
+ from .Validation import Validation
6
7
  from .field_types import BaseField
7
8
  from .FieldResolver import FieldResolver
8
9
  from .rules import MatchedRule, RuleRegistry, RuleParser
@@ -68,10 +69,13 @@ class Contract:
68
69
  return rules
69
70
 
70
71
  def model_validate(self, item: dict):
71
- pydantic_model = self.get_pydantic_model()
72
- return pydantic_model.model_validate(item).model_dump()
72
+ return self.pydantic_model.model_validate(item).model_dump()
73
73
 
74
- def get_pydantic_model(self) -> BaseModel:
74
+ def validate(self, item: dict) -> Validation:
75
+ return Validation.validate(self.pydantic_model, item)
76
+
77
+ @cached_property
78
+ def pydantic_model(self) -> BaseModel:
75
79
  return type(self.name, (BaseModel,), {
76
80
  "__annotations__": {
77
81
  field_name: field_validator.get_annotation()
@@ -97,5 +101,6 @@ class Contract:
97
101
  ]
98
102
  }
99
103
  for field_name, field_validator in self.field_validators.items()
100
- ]
104
+ ],
105
+ "values": self.rule_parser.values
101
106
  }
@@ -32,7 +32,8 @@ class FieldResolver:
32
32
  return matched_rules
33
33
 
34
34
  def get_field_validator(self, field_name: str, parsed_rules: List[str]) -> BaseField:
35
- validator = self.field_class(field_name)
35
+ is_optional = "Validate Not Null" not in parsed_rules
36
+ validator = self.field_class(field_name, is_optional)
36
37
  matched_rules = self.get_matched_rules(parsed_rules)
37
38
  for matched_rule in matched_rules:
38
39
  matched_rule.add_to_instance(validator)
@@ -0,0 +1,30 @@
1
+
2
+ from collections import defaultdict
3
+ from typing import Any, Dict, List, Type
4
+
5
+ from pydantic import BaseModel, ValidationError
6
+
7
+
8
+ class Validation():
9
+ row: Dict[str, Any]
10
+ errors: Dict[str, List[str]]
11
+
12
+ def __init__(self, row: dict, errors: dict = None):
13
+ self.row = row
14
+ self.errors = errors or {}
15
+
16
+ def to_dict(self) -> dict:
17
+ return {"row": self.row, "errors": self.errors}
18
+
19
+ @classmethod
20
+ def validate(cls, model: Type[BaseModel], item: dict) -> "Validation":
21
+ try:
22
+ row = model(**item) # Validate the row
23
+ return Validation(row=row.model_dump())
24
+ except ValidationError as e:
25
+ errors = defaultdict(list)
26
+ for error in e.errors():
27
+ field = error['loc'][0] # Extract the field name
28
+ msg = error['msg']
29
+ errors[field].append(msg)
30
+ return Validation(row=item, errors=dict(errors))
@@ -23,7 +23,7 @@ def main():
23
23
  contract_path = Path(args.contract)
24
24
  contract_dict = json.loads(contract_path.read_text(encoding))
25
25
  contract = Contract.from_dict(contract_dict)
26
- pydantic_contract = contract.get_pydantic_model()
26
+ pydantic_contract = contract.pydantic_model
27
27
 
28
28
  if file_path.suffix == '.csv':
29
29
  with open(file_path, encoding=encoding) as f:
@@ -1,12 +1,14 @@
1
1
  from abc import ABC
2
- from typing import Annotated, List, Type
2
+ from typing import Annotated, List, Optional, Type
3
3
 
4
4
  from pydantic import AfterValidator
5
5
  from ..rules import register_rule, register_field
6
6
 
7
7
 
8
- def aggregated_validator(validators: List[callable]):
8
+ def aggregated_validator(validators: List[callable], is_optional: bool):
9
9
  def _validator(value):
10
+ if is_optional and value is None:
11
+ return value
10
12
  for validator_func in validators:
11
13
  validator_func(value)
12
14
  return value
@@ -15,18 +17,22 @@ def aggregated_validator(validators: List[callable]):
15
17
  @register_field
16
18
  class BaseField(ABC):
17
19
  name: str
20
+ is_optional: bool
18
21
  validators = None
19
22
  field_type = None
20
23
 
21
- def __init__(self, name) -> None:
24
+ def __init__(self, name: str, is_optional: bool) -> None:
22
25
  self.name = name
26
+ self.is_optional = is_optional
23
27
  self.validators = []
24
28
 
25
29
  @register_rule("Validate Not Null")
26
30
  def validator_not_null(self):
27
31
  def _validator(value):
32
+ if self.is_optional:
33
+ return value
28
34
  if value is None:
29
- raise ValueError()
35
+ raise ValueError("Value cannot be null")
30
36
  return value
31
37
 
32
38
  self.validators.append(_validator)
@@ -36,7 +42,8 @@ class BaseField(ABC):
36
42
  validator(value)
37
43
 
38
44
  def get_annotation(self):
39
- return Annotated[self.field_type, AfterValidator(aggregated_validator(self.validators))]
45
+ field_type = Optional[self.field_type] if self.is_optional else self.field_type
46
+ return Annotated[field_type, AfterValidator(aggregated_validator(self.validators, self.is_optional))]
40
47
 
41
48
  @classmethod
42
49
  def get_parents(cls: Type["BaseField"]) -> List[Type["BaseField"]]:
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.2
2
2
  Name: data-sitter
3
- Version: 0.1.1
3
+ Version: 0.1.3
4
4
  Summary: A Python library that reads data contracts and generates Pydantic models for seamless data validation.
5
5
  Author-email: Lázaro Pereira Candea <lazaro@candea.es>
6
6
  Requires-Dist: python-dotenv==1.0.1
@@ -3,6 +3,7 @@ pyproject.toml
3
3
  setup.py
4
4
  data_sitter/Contract.py
5
5
  data_sitter/FieldResolver.py
6
+ data_sitter/Validation.py
6
7
  data_sitter/__init__.py
7
8
  data_sitter/cli.py
8
9
  data_sitter.egg-info/PKG-INFO
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
4
4
 
5
5
  [project]
6
6
  name = 'data-sitter'
7
- version = "0.1.1"
7
+ version = "0.1.3"
8
8
  description = "A Python library that reads data contracts and generates Pydantic models for seamless data validation."
9
9
  authors = [
10
10
  {name = 'Lázaro Pereira Candea', email = 'lazaro@candea.es'},
@@ -3,7 +3,7 @@ from setuptools import setup, find_packages
3
3
 
4
4
  setup(
5
5
  name='data-sitter',
6
- version='0.1.1',
6
+ version='0.1.3',
7
7
  packages=find_packages(),
8
8
  install_requires=[
9
9
  # Keep this in sync with pyproject.toml
File without changes