PyPI - vtlengine - Versions diffs - 1.0.0__py3-none-any.whl → 1.0.1__py3-none-any.whl - Mend

vtlengine 1.0.0py3-none-any.whl → 1.0.1py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of vtlengine might be problematic. Click here for more details.

Files changed (54) hide show

vtlengine/API/_InternalApi.py +153 -100
vtlengine/API/__init__.py +109 -67
vtlengine/AST/ASTConstructor.py +188 -98
vtlengine/AST/ASTConstructorModules/Expr.py +306 -200
vtlengine/AST/ASTConstructorModules/ExprComponents.py +172 -102
vtlengine/AST/ASTConstructorModules/Terminals.py +158 -95
vtlengine/AST/ASTEncoders.py +1 -1
vtlengine/AST/ASTTemplate.py +8 -9
vtlengine/AST/ASTVisitor.py +8 -12
vtlengine/AST/DAG/__init__.py +43 -35
vtlengine/AST/DAG/_words.py +4 -4
vtlengine/AST/Grammar/lexer.py +732 -142
vtlengine/AST/Grammar/parser.py +2188 -826
vtlengine/AST/Grammar/tokens.py +128 -128
vtlengine/AST/VtlVisitor.py +7 -4
vtlengine/AST/__init__.py +22 -11
vtlengine/DataTypes/NumericTypesHandling.py +5 -4
vtlengine/DataTypes/TimeHandling.py +194 -301
vtlengine/DataTypes/__init__.py +304 -218
vtlengine/Exceptions/__init__.py +52 -27
vtlengine/Exceptions/messages.py +134 -62
vtlengine/Interpreter/__init__.py +781 -487
vtlengine/Model/__init__.py +165 -121
vtlengine/Operators/Aggregation.py +156 -95
vtlengine/Operators/Analytic.py +115 -59
vtlengine/Operators/Assignment.py +7 -4
vtlengine/Operators/Boolean.py +27 -32
vtlengine/Operators/CastOperator.py +177 -131
vtlengine/Operators/Clause.py +137 -99
vtlengine/Operators/Comparison.py +148 -117
vtlengine/Operators/Conditional.py +149 -98
vtlengine/Operators/General.py +68 -47
vtlengine/Operators/HROperators.py +91 -72
vtlengine/Operators/Join.py +217 -118
vtlengine/Operators/Numeric.py +89 -44
vtlengine/Operators/RoleSetter.py +16 -15
vtlengine/Operators/Set.py +61 -36
vtlengine/Operators/String.py +213 -139
vtlengine/Operators/Time.py +334 -216
vtlengine/Operators/Validation.py +117 -76
vtlengine/Operators/__init__.py +340 -213
vtlengine/Utils/__init__.py +195 -40
vtlengine/__init__.py +1 -1
vtlengine/files/output/__init__.py +15 -6
vtlengine/files/output/_time_period_representation.py +10 -9
vtlengine/files/parser/__init__.py +77 -52
vtlengine/files/parser/_rfc_dialect.py +6 -5
vtlengine/files/parser/_time_checking.py +46 -37
vtlengine-1.0.1.dist-info/METADATA +236 -0
vtlengine-1.0.1.dist-info/RECORD +58 -0
{vtlengine-1.0.dist-info → vtlengine-1.0.1.dist-info}/WHEEL +1 -1
vtlengine-1.0.dist-info/METADATA +0 -104
vtlengine-1.0.dist-info/RECORD +0 -58
{vtlengine-1.0.dist-info → vtlengine-1.0.1.dist-info}/LICENSE.md +0 -0

vtlengine/Operators/__init__.py CHANGED Viewed

@@ -1,19 +1,29 @@
 import os
 from copy import copy
-from typing import Any, Union
-from vtlengine.DataTypes import COMP_NAME_MAPPING, ScalarType, \
-    binary_implicit_promotion, check_binary_implicit_promotion, check_unary_implicit_promotion, \
-    unary_implicit_promotion, SCALAR_TYPES_CLASS_REVERSE
-from vtlengine.DataTypes.TimeHandling import TimeIntervalHandler, TimePeriodHandler, DURATION_MAPPING
+from typing import Any, Union, Optional
+from vtlengine.DataTypes import (
+    COMP_NAME_MAPPING,
+    binary_implicit_promotion,
+    check_binary_implicit_promotion,
+    check_unary_implicit_promotion,
+    unary_implicit_promotion,
+    SCALAR_TYPES_CLASS_REVERSE,
+)
+from vtlengine.DataTypes.TimeHandling import (
+    TimeIntervalHandler,
+    TimePeriodHandler,
+    DURATION_MAPPING,
+)
 from vtlengine.AST.Grammar.tokens import CEIL, FLOOR, ROUND, EQ, NEQ, GT, GTE, LT, LTE, XOR, OR, AND
 from vtlengine.Exceptions import SemanticError
-if os.environ.get("SPARK", False):
-    import pyspark.pandas as pd
-else:
-    import pandas as pd
+# if os.environ.get("SPARK", False):
+#     import pyspark.pandas as pd
+# else:
+#     import pandas as pd
+import pandas as pd
 from vtlengine.Model import Component, Dataset, Role, Scalar, DataComponent, ScalarSet
@@ -31,35 +41,36 @@ only_semantic = False
 class Operator:
     """Superclass for all operators"""
-    op = None
-    py_op = None
-    spark_op = None
-    type_to_check = None
-    return_type = None
+    op: Any = None
+    py_op: Any = None
+    spark_op: Any = None
+    type_to_check: Any = None
+    return_type: Any = None
     @classmethod
-    def analyze(cls, *args, **kwargs):
+    def analyze(cls, *args: Any, **kwargs: Any) -> Any:
         if only_semantic:
             return cls.validate(*args, **kwargs)
         return cls.evaluate(*args, **kwargs)
     @classmethod
-    def cast_time_types(cls, data_type: ScalarType, series: pd.Series) -> pd.Series:
+    def cast_time_types(cls, data_type: Any, series: Any) -> Any:
         if cls.op not in BINARY_COMPARISON_OPERATORS:
             return series
         if data_type.__name__ == "TimeInterval":
-            series = series.map(lambda x: TimeIntervalHandler.from_iso_format(x),
-                                na_action='ignore')
+            series = series.map(
+                lambda x: TimeIntervalHandler.from_iso_format(x), na_action="ignore"
+            )
         elif data_type.__name__ == "TimePeriod":
-            series = series.map(lambda x: TimePeriodHandler(x),
-                                na_action='ignore')
+            series = series.map(lambda x: TimePeriodHandler(x), na_action="ignore")
         elif data_type.__name__ == "Duration":
-            series = series.map(lambda x: DURATION_MAPPING[x],
-                                na_action='ignore')
+            series = series.map(lambda x: DURATION_MAPPING[x], na_action="ignore")
         return series
     @classmethod
-    def cast_time_types_scalar(cls, data_type: ScalarType, value: str):
+    def cast_time_types_scalar(cls, data_type: Any, value: str) -> Any:
         if cls.op not in BINARY_COMPARISON_OPERATORS:
             return value
         if data_type.__name__ == "TimeInterval":
@@ -75,55 +86,59 @@ class Operator:
     @classmethod
     def modify_measure_column(cls, result: Dataset) -> None:
         """
-        If an Operator change the data type of the Variable it is applied to (e.g., from string to number),
-        the result Data Set cannot maintain this Variable as it happens in the previous cases,
-        because a Variable cannot have different data types in different Data Sets.
-        As a consequence, the converted variable cannot follow the same rules described in the sections above and must be replaced,
-        in the result Data Set, by another Variable of the proper data type.
-        For sake of simplicity, the operators changing the data type are allowed only on mono-measure operand Data Sets, so that the conversion happens on just one Measure.
-        A default generic Measure is assigned by default to the result Data Set, depending on the data type of the result (the default Measure Variables are reported in the table below).
+        If an Operator change the data type of the Variable it is applied to (e.g., from string to
+        number), the result Data Set cannot maintain this Variable as it happens in the previous
+        cases, because a Variable cannot have different data types in different Data Sets.
+        As a consequence, the converted variable cannot follow the same rules described in the
+        sections above and must be replaced, in the result Data Set, by another Variable of the
+        proper data type.
+        For sake of simplicity, the operators changing the data type are allowed only on
+        mono-measure operand Data Sets, so that the conversion happens on just one Measure.
+        A default generic Measure is assigned by default to the result Data Set, depending on the
+        data type of the result (the default Measure Variables are reported in the table below).
         Function used by the evaluate function when a dataset is involved
         """
-        if len(result.get_measures()) == 1 and cls.return_type is not None:
+        if len(result.get_measures()) == 1 and cls.return_type is not None and result is not None:
             measure_name = result.get_measures_names()[0]
             components = list(result.components.keys())
-            columns = list(result.data.columns)
+            columns = list(result.data.columns) if result.data is not None else []
             for column in columns:
-                if column not in set(components):
+                if column not in set(components) and result.data is not None:
                     result.data[measure_name] = result.data[column]
                     del result.data[column]
     @classmethod
-    def validate_dataset_type(cls, dataset: Dataset) -> None:
+    def validate_dataset_type(cls, *args: Any) -> None:
         raise Exception("Method should be implemented by inheritors")
     @classmethod
-    def validate_component_type(cls, component: DataComponent) -> None:
+    def validate_component_type(cls, *args: Any) -> None:
         raise Exception("Method should be implemented by inheritors")
     @classmethod
-    def validate_scalar_type(cls, scalar: Scalar) -> None:
+    def validate_scalar_type(cls, *args: Any) -> None:
         raise Exception("Method should be implemented by inheritors")
     @classmethod
-    def validate(cls, *args, **kwargs):
+    def validate(cls, *args: Any, **kwargs: Any) -> Any:
         raise Exception("Method should be implemented by inheritors")
     @classmethod
-    def evaluate(cls, *args, **kwargs):
+    def evaluate(cls, *args: Any, **kwargs: Any) -> Any:
         raise Exception("Method should be implemented by inheritors")
     @classmethod
-    def scalar_validation(cls, *args) -> None:
+    def scalar_validation(cls, *args: Any) -> Any:
         raise Exception("Method should be implemented by inheritors")
     @classmethod
-    def component_validation(cls, *args) -> None:
+    def component_validation(cls, *args: Any) -> Any:
         raise Exception("Method should be implemented by inheritors")
     @classmethod
-    def validate_type_compatibility(cls, *args) -> bool:
+    def validate_type_compatibility(cls, *args: Any) -> bool:
         if len(args) == 1:
             operand = args[0]
             return check_unary_implicit_promotion(operand, cls.type_to_check, cls.return_type)
@@ -133,7 +148,7 @@ class Operator:
         raise Exception("Method should be implemented by inheritors")
     @classmethod
-    def type_validation(cls, *args) -> ScalarType:
+    def type_validation(cls, *args: Any) -> Any:
         if len(args) == 1:
             operand = args[0]
             return unary_implicit_promotion(operand, cls.type_to_check, cls.return_type)
@@ -143,26 +158,37 @@ class Operator:
         raise Exception("Method should be implemented by inheritors")
     @classmethod
-    def apply_return_type_dataset(cls, *args) -> None:
+    def apply_return_type_dataset(cls, *args: Any) -> None:
         raise Exception("Method should be implemented by inheritors")
     @classmethod
-    def apply_return_type(cls, *args):
+    def apply_return_type(cls, *args: Any) -> None:
         raise Exception("Method should be implemented by inheritors")
-def _id_type_promotion_join_keys(c_left: Component, c_right: Component, join_key: str,
-                                 left_data: pd.DataFrame,
-                                 right_data: pd.DataFrame) -> None:
-    left_type_name = c_left.data_type.__name__
-    right_type_name = c_right.data_type.__name__
+def _id_type_promotion_join_keys(
+    c_left: Component,
+    c_right: Component,
+    join_key: str,
+    left_data: Optional[pd.DataFrame] = None,
+    right_data: Optional[pd.DataFrame] = None,
+) -> None:
+    if left_data is None:
+        left_data = pd.DataFrame()
+    if right_data is None:
+        right_data = pd.DataFrame()
+    left_type_name: str = str(c_left.data_type.__name__)
+    right_type_name: str = str(c_right.data_type.__name__)
     if left_type_name == right_type_name or len(left_data) == 0 or len(right_data) == 0:
         left_data[join_key] = left_data[join_key].astype(object)
         right_data[join_key] = right_data[join_key].astype(object)
         return
-    if ((left_type_name == "Integer" and right_type_name == "Number") or
-            (left_type_name == "Number" and right_type_name == "Integer")):
+    if (left_type_name == "Integer" and right_type_name == "Number") or (
+        left_type_name == "Number" and right_type_name == "Integer"
+    ):
         left_data[join_key] = left_data[join_key].map(lambda x: int(float(x)))
         right_data[join_key] = right_data[join_key].map(lambda x: int(float(x)))
     elif left_type_name == "String" and right_type_name in ("Integer", "Number"):
@@ -173,7 +199,8 @@ def _id_type_promotion_join_keys(c_left: Component, c_right: Component, join_key
     right_data[join_key] = right_data[join_key].astype(object)
-def _handle_str_number(x: Union[str, int, float]) -> Union[int, float]:
+def _handle_str_number(x: Union[str, int, float]) -> Union[str, int, float]:
     if isinstance(x, int):
         return x
     try:
@@ -188,15 +215,16 @@ def _handle_str_number(x: Union[str, int, float]) -> Union[int, float]:
 class Binary(Operator):
     @classmethod
-    def op_func(cls, x: Any, y: Any) -> Any:
+    def op_func(cls, *args: Any) -> Any:
+        x, y = args
         if pd.isnull(x) or pd.isnull(y):
             return None
         return cls.py_op(x, y)
     @classmethod
-    def apply_operation_two_series(cls,
-                                   left_series: Any,
-                                   right_series: Any) -> Any:
+    def apply_operation_two_series(cls, left_series: Any, right_series: Any) -> Any:
         if os.getenv("SPARK", False):
             if cls.spark_op is None:
                 cls.spark_op = cls.py_op
@@ -206,26 +234,32 @@ class Binary(Operator):
             result.loc[nulls] = None
             return result
         result = list(map(cls.op_func, left_series.values, right_series.values))
-        return pd.Series(result, index=list(range(len(result))),
-                         dtype=object)
+        return pd.Series(result, index=list(range(len(result))), dtype=object)
     @classmethod
-    def apply_operation_series_scalar(cls, series: pd.Series, scalar: Any,
-                                      series_left: bool) -> Any:
+    def apply_operation_series_scalar(
+        cls,
+        series: Any,
+        scalar: Scalar,
+        series_left: bool,
+    ) -> Any:
         if scalar is None:
             return pd.Series(None, index=series.index)
         if series_left:
-            return series.map(lambda x: cls.py_op(x, scalar), na_action='ignore')
+            return series.map(lambda x: cls.py_op(x, scalar), na_action="ignore")
         else:
-            return series.map(lambda x: cls.py_op(scalar, x), na_action='ignore')
+            return series.map(lambda x: cls.py_op(scalar, x), na_action="ignore")
     @classmethod
-    def validate(cls, left_operand: ALL_MODEL_DATA_TYPES, right_operand: ALL_MODEL_DATA_TYPES):
+    def validate(cls, *args: Any) -> Any:
         """
         The main function for validate, applies the implicit promotion (or check it), and
         can do a semantic check too.
         Returns an operand.
         """
+        left_operand, right_operand = args
         if isinstance(left_operand, Dataset) and isinstance(right_operand, Dataset):
             return cls.dataset_validation(left_operand, right_operand)
         if isinstance(left_operand, Dataset) and isinstance(right_operand, Scalar):
@@ -234,29 +268,23 @@ class Binary(Operator):
             return cls.dataset_scalar_validation(right_operand, left_operand)
         if isinstance(left_operand, Scalar) and isinstance(right_operand, Scalar):
             return cls.scalar_validation(left_operand, right_operand)
         if isinstance(left_operand, DataComponent) and isinstance(right_operand, DataComponent):
             return cls.component_validation(left_operand, right_operand)
         if isinstance(left_operand, DataComponent) and isinstance(right_operand, Scalar):
             return cls.component_scalar_validation(left_operand, right_operand)
         if isinstance(left_operand, Scalar) and isinstance(right_operand, DataComponent):
             return cls.component_scalar_validation(right_operand, left_operand)
         # In operator
         if isinstance(left_operand, Dataset) and isinstance(right_operand, ScalarSet):
             return cls.dataset_set_validation(left_operand, right_operand)
         if isinstance(left_operand, Scalar) and isinstance(right_operand, ScalarSet):
             return cls.scalar_set_validation(left_operand, right_operand)
         if isinstance(left_operand, DataComponent) and isinstance(right_operand, ScalarSet):
             return cls.component_set_validation(left_operand, right_operand)
     @classmethod
     def dataset_validation(cls, left_operand: Dataset, right_operand: Dataset) -> Dataset:
         left_identifiers = left_operand.get_identifiers_names()
         right_identifiers = right_operand.get_identifiers_names()
@@ -268,8 +296,9 @@ class Binary(Operator):
         right_measures_names = [measure.name for measure in right_measures]
         if left_measures_names != right_measures_names:
-            raise SemanticError("1-1-14-1", op=cls.op, left=left_measures_names,
-                                right=right_measures_names)
+            raise SemanticError(
+                "1-1-14-1", op=cls.op, left=left_measures_names, right=right_measures_names
+            )
         elif len(left_measures) == 0:
             raise SemanticError("1-1-1-8", op=cls.op, name=left_operand.name)
         for left_measure, right_measure in zip(left_measures, right_measures):
@@ -288,9 +317,11 @@ class Binary(Operator):
         # Deleting extra identifiers that we do not need anymore
         base_operand = right_operand if use_right_components else left_operand
-        result_components = {component_name: copy(component) for component_name, component in
-                             base_operand.components.items()
-                             if component.role in [Role.IDENTIFIER, Role.MEASURE]}
+        result_components = {
+            component_name: copy(component)
+            for component_name, component in base_operand.components.items()
+            if component.role in [Role.IDENTIFIER, Role.MEASURE]
+        }
         for comp in [x for x in result_components.values() if x.role == Role.MEASURE]:
             if comp.name in left_operand.components and comp.name in right_operand.components:
@@ -303,57 +334,66 @@ class Binary(Operator):
         return result_dataset
     @classmethod
-    def dataset_scalar_validation(cls, dataset: Dataset, scalar: Scalar):
+    def dataset_scalar_validation(cls, dataset: Dataset, scalar: Scalar) -> Dataset:
         if len(dataset.get_measures()) == 0:
             raise SemanticError("1-1-1-8", op=cls.op, name=dataset.name)
-        result_components = {comp_name: copy(comp) for comp_name, comp in
-                             dataset.components.items() if
-                             comp.role in [Role.IDENTIFIER, Role.MEASURE]}
-        result_dataset = Dataset(name="result", components=result_components,
-                                 data=None)
+        result_components = {
+            comp_name: copy(comp)
+            for comp_name, comp in dataset.components.items()
+            if comp.role in [Role.IDENTIFIER, Role.MEASURE]
+        }
+        result_dataset = Dataset(name="result", components=result_components, data=None)
         cls.apply_return_type_dataset(result_dataset, dataset, scalar)
         return result_dataset
     @classmethod
     def scalar_validation(cls, left_operand: Scalar, right_operand: Scalar) -> Scalar:
-        if not cls.validate_type_compatibility(left_operand.data_type, right_operand.data_type):
-            raise SemanticError("1-1-1-2", )
-        return Scalar(name="result",
-                      data_type=cls.type_validation(left_operand.data_type,
-                                                    right_operand.data_type),
-                      value=None)
-    @classmethod
-    def component_validation(cls, left_operand: DataComponent,
-                             right_operand: DataComponent) -> DataComponent:
+        if not cls.validate_type_compatibility(left_operand.data_type, right_operand.data_type):
+            raise SemanticError(
+                "1-1-1-2",
+            )
+        return Scalar(
+            name="result",
+            data_type=cls.type_validation(left_operand.data_type, right_operand.data_type),
+            value=None,
+        )
+    @classmethod
+    def component_validation(
+        cls, left_operand: DataComponent, right_operand: DataComponent
+    ) -> DataComponent:
         """
         Validates the compatibility between the types of the components and the operator
         :param left_operand: The left component
         :param right_operand: The right component
         :return: The result data type of the validation
         """
-        result_data_type = cls.type_validation(left_operand.data_type, right_operand.data_type)
-        result = DataComponent(name="result",
-                               data_type=result_data_type,
-                               data=None,
-                               role=left_operand.role,
-                               nullable=(left_operand.nullable or right_operand.nullable))
+        result_data_type = cls.type_validation(left_operand.data_type, right_operand.data_type)
+        result = DataComponent(
+            name="result",
+            data_type=result_data_type,
+            data=None,
+            role=left_operand.role,
+            nullable=(left_operand.nullable or right_operand.nullable),
+        )
         return result
     @classmethod
-    def component_scalar_validation(cls, component: DataComponent, scalar: Scalar):
-        cls.type_validation(component.data_type, scalar.data_type)
-        result = DataComponent(name=component.name,
-                               data_type=cls.type_validation(component.data_type, scalar.data_type),
-                               data=None, role=component.role,
-                               nullable=component.nullable or scalar is None)
+    def component_scalar_validation(cls, component: DataComponent, scalar: Scalar) -> DataComponent:
+        cls.type_validation(component.data_type, scalar.data_type)
+        result = DataComponent(
+            name=component.name,
+            data_type=cls.type_validation(component.data_type, scalar.data_type),
+            data=None,
+            role=component.role,
+            nullable=component.nullable or scalar is None,
+        )
         return result
     @classmethod
@@ -363,37 +403,44 @@ class Binary(Operator):
             raise SemanticError("1-1-1-8", op=cls.op, name=dataset.name)
         for measure in dataset.get_measures():
             cls.type_validation(measure.data_type, scalar_set.data_type)
+        result_components = {
+            comp_name: copy(comp)
+            for comp_name, comp in dataset.components.items()
+            if comp.role in [Role.IDENTIFIER, Role.MEASURE]
+        }
-        result_components = {comp_name: copy(comp) for comp_name, comp in
-                             dataset.components.items() if
-                             comp.role in [Role.IDENTIFIER, Role.MEASURE]}
-        result_dataset = Dataset(name="result", components=result_components,
-                                 data=None)
+        result_dataset = Dataset(name="result", components=result_components, data=None)
         cls.apply_return_type_dataset(result_dataset, dataset, scalar_set)
         return result_dataset
     @classmethod
-    def component_set_validation(cls, component: DataComponent,
-                                 scalar_set: ScalarSet) -> DataComponent:
-        cls.type_validation(component.data_type, scalar_set.data_type)
-        result = DataComponent(name="result", data_type=cls.type_validation(component.data_type,
-                                                                            scalar_set.data_type),
-                               data=None,
-                               role=Role.MEASURE, nullable=component.nullable)
+    def component_set_validation(
+        cls, component: DataComponent, scalar_set: ScalarSet
+    ) -> DataComponent:
+        cls.type_validation(component.data_type, scalar_set.data_type)
+        result = DataComponent(
+            name="result",
+            data_type=cls.type_validation(component.data_type, scalar_set.data_type),
+            data=None,
+            role=Role.MEASURE,
+            nullable=component.nullable,
+        )
         return result
     @classmethod
-    def scalar_set_validation(cls, scalar: Scalar, scalar_set: ScalarSet):
+    def scalar_set_validation(cls, scalar: Scalar, scalar_set: ScalarSet) -> Scalar:
         cls.type_validation(scalar.data_type, scalar_set.data_type)
-        return Scalar(name="result",
-                      data_type=cls.type_validation(scalar.data_type, scalar_set.data_type),
-                      value=None)
+        return Scalar(
+            name="result",
+            data_type=cls.type_validation(scalar.data_type, scalar_set.data_type),
+            value=None,
+        )
     # The following class method implements the type promotion
     @classmethod
-    def type_validation(cls, left_type: ScalarType, right_type: ScalarType) -> ScalarType:
+    def type_validation(cls, left_type: Any, right_type: Any) -> Any:
         """
         Validates the compatibility between the types of the operands and the operator
         and give us the result ScalarType of the promotion
@@ -404,11 +451,12 @@ class Binary(Operator):
         :return: result ScalarType or exception
         """
         return binary_implicit_promotion(left_type, right_type, cls.type_to_check, cls.return_type)
     # The following class method checks the type promotion
     @classmethod
-    def validate_type_compatibility(cls, left: ScalarType, right: ScalarType) -> bool:
+    def validate_type_compatibility(cls, left: Any, right: Any) -> bool:
         """
         Validates the compatibility between the types of the operands and the operator
         (implicit type promotion : check_binary_implicit_type_promotion)
@@ -418,17 +466,19 @@ class Binary(Operator):
         :return: True if the types are compatible, False otherwise
         """
         return check_binary_implicit_promotion(left, right, cls.type_to_check, cls.return_type)
     @classmethod
     def apply_return_type_dataset(
-            cls, result_dataset: Dataset, left_operand: Dataset,
-            right_operand: Union[Dataset, Scalar, ScalarSet]
+        cls, result_dataset: Dataset, left_operand: Any, right_operand: Any
     ) -> None:
         """
         Used in dataset's validation.
-        Changes the result dataset and give us his final form (#TODO: write this explanation in a better way)
+        Changes the result dataset and give us his final form
+        (#TODO: write this explanation in a better way)
         """
         changed_allowed = cls.op in MONOMEASURE_CHANGED_ALLOWED
         is_mono_measure = len(result_dataset.get_measures()) == 1
         for measure in result_dataset.get_measures():
@@ -444,22 +494,24 @@ class Binary(Operator):
                     name=COMP_NAME_MAPPING[result_data_type],
                     data_type=result_data_type,
                     role=Role.MEASURE,
-                    nullable=measure.nullable
+                    nullable=measure.nullable,
                 )
                 result_dataset.delete_component(measure.name)
                 result_dataset.add_component(component)
                 if result_dataset.data is not None:
                     result_dataset.data.rename(columns={measure.name: component.name}, inplace=True)
-            elif (changed_allowed is False and
-                  is_mono_measure is False and
-                  left_type.promotion_changed_type(result_data_type)
+            elif (
+                changed_allowed is False
+                and is_mono_measure is False
+                and left_type.promotion_changed_type(result_data_type)
             ):
                 raise SemanticError("1-1-1-4", op=cls.op)
             else:
                 measure.data_type = result_data_type
     @classmethod
-    def dataset_evaluation(cls, left_operand: Dataset, right_operand: Dataset):
+    def dataset_evaluation(cls, left_operand: Dataset, right_operand: Dataset) -> Dataset:
         result_dataset = cls.dataset_validation(left_operand, right_operand)
         use_right_as_base = False
@@ -471,49 +523,65 @@ class Binary(Operator):
             base_operand_data = left_operand.data
             other_operand_data = right_operand.data
-        join_keys = list(set(left_operand.get_identifiers_names()).intersection(
-            right_operand.get_identifiers_names()))
+        join_keys = list(
+            set(left_operand.get_identifiers_names()).intersection(
+                right_operand.get_identifiers_names()
+            )
+        )
         for join_key in join_keys:
-            _id_type_promotion_join_keys(left_operand.get_component(join_key),
-                                         right_operand.get_component(join_key),
-                                         join_key, base_operand_data, other_operand_data)
+            _id_type_promotion_join_keys(
+                left_operand.get_component(join_key),
+                right_operand.get_component(join_key),
+                join_key,
+                base_operand_data,
+                other_operand_data,
+            )
         try:
             # Merge the data
-            result_data: pd.DataFrame = pd.merge(
-                base_operand_data, other_operand_data,
-                how='inner', on=join_keys,
-                suffixes=('_x', '_y'))
+            if base_operand_data is None or other_operand_data is None:
+                result_data: pd.DataFrame = pd.DataFrame()
+            else:
+                result_data = pd.merge(
+                    base_operand_data,
+                    other_operand_data,
+                    how="inner",
+                    on=join_keys,
+                    suffixes=("_x", "_y"),
+                )
         except ValueError as e:
             raise Exception(f"Error merging datasets on Binary Operator: {str(e)}")
         # Measures are the same, using left operand measures names
         for measure in left_operand.get_measures():
-            result_data[measure.name + '_x'] = cls.cast_time_types(measure.data_type,
-                                                                   result_data[measure.name + '_x'])
-            result_data[measure.name + '_y'] = cls.cast_time_types(measure.data_type,
-                                                                   result_data[measure.name + '_y'])
+            result_data[measure.name + "_x"] = cls.cast_time_types(
+                measure.data_type, result_data[measure.name + "_x"]
+            )
+            result_data[measure.name + "_y"] = cls.cast_time_types(
+                measure.data_type, result_data[measure.name + "_y"]
+            )
             if use_right_as_base:
                 result_data[measure.name] = cls.apply_operation_two_series(
-                    result_data[measure.name + '_y'],
-                    result_data[measure.name + '_x'])
+                    result_data[measure.name + "_y"], result_data[measure.name + "_x"]
+                )
             else:
                 result_data[measure.name] = cls.apply_operation_two_series(
-                    result_data[measure.name + '_x'],
-                    result_data[measure.name + '_y'])
-            result_data = result_data.drop([measure.name + '_x', measure.name + '_y'], axis=1)
+                    result_data[measure.name + "_x"], result_data[measure.name + "_y"]
+                )
+            result_data = result_data.drop([measure.name + "_x", measure.name + "_y"], axis=1)
         # Delete attributes from the result data
         attributes = list(
-            set(left_operand.get_attributes_names()).union(right_operand.get_attributes_names()))
+            set(left_operand.get_attributes_names()).union(right_operand.get_attributes_names())
+        )
         for att in attributes:
             if att in result_data.columns:
                 result_data = result_data.drop(att, axis=1)
-            if att + '_x' in result_data.columns:
-                result_data = result_data.drop(att + '_x', axis=1)
-            if att + '_y' in result_data.columns:
-                result_data = result_data.drop(att + '_y', axis=1)
+            if att + "_x" in result_data.columns:
+                result_data = result_data.drop(att + "_x", axis=1)
+            if att + "_y" in result_data.columns:
+                result_data = result_data.drop(att + "_y", axis=1)
         result_dataset.data = result_data
         cls.modify_measure_column(result_dataset)
@@ -522,25 +590,31 @@ class Binary(Operator):
     @classmethod
     def scalar_evaluation(cls, left_operand: Scalar, right_operand: Scalar) -> Scalar:
         result_scalar = cls.scalar_validation(left_operand, right_operand)
         result_scalar.value = cls.op_func(left_operand.value, right_operand.value)
         return result_scalar
     @classmethod
-    def dataset_scalar_evaluation(cls, dataset: Dataset, scalar: Scalar,
-                                  dataset_left=True) -> Dataset:
+    def dataset_scalar_evaluation(
+        cls, dataset: Dataset, scalar: Scalar, dataset_left: bool = True
+    ) -> Dataset:
         result_dataset = cls.dataset_scalar_validation(dataset, scalar)
-        result_data = dataset.data.copy()
+        result_data = dataset.data.copy() if dataset.data is not None else pd.DataFrame()
         result_dataset.data = result_data
         scalar_value = cls.cast_time_types_scalar(scalar.data_type, scalar.value)
         for measure in dataset.get_measures():
             measure_data = cls.cast_time_types(measure.data_type, result_data[measure.name].copy())
-            if measure.data_type.__name__ == "Duration" and not isinstance(scalar_value, int):
+            if measure.data_type.__name__.__str__() == "Duration" and not isinstance(
+                scalar_value, int
+            ):
                 scalar_value = DURATION_MAPPING[scalar_value]
             result_dataset.data[measure.name] = cls.apply_operation_series_scalar(
-                measure_data, scalar_value, dataset_left)
+                measure_data, scalar_value, dataset_left
+            )
         result_dataset.data = result_data
         cols_to_keep = dataset.get_identifiers_names() + dataset.get_measures_names()
@@ -549,34 +623,53 @@ class Binary(Operator):
         return result_dataset
     @classmethod
-    def component_evaluation(cls, left_operand: DataComponent,
-                             right_operand: DataComponent) -> DataComponent:
+    def component_evaluation(
+        cls, left_operand: DataComponent, right_operand: DataComponent
+    ) -> DataComponent:
         result_component = cls.component_validation(left_operand, right_operand)
-        left_data = cls.cast_time_types(left_operand.data_type, left_operand.data.copy())
-        right_data = cls.cast_time_types(right_operand.data_type, right_operand.data.copy())
+        left_data = cls.cast_time_types(
+            left_operand.data_type,
+            left_operand.data.copy() if left_operand.data is not None else pd.Series(),
+        )
+        right_data = cls.cast_time_types(
+            right_operand.data_type,
+            right_operand.data.copy() if right_operand.data is not None else pd.Series(),
+        )
         result_component.data = cls.apply_operation_two_series(left_data, right_data)
         return result_component
     @classmethod
-    def component_scalar_evaluation(cls, component: DataComponent, scalar: Scalar,
-                                    component_left: bool) -> DataComponent:
+    def component_scalar_evaluation(
+        cls, component: DataComponent, scalar: Scalar, component_left: bool = True
+    ) -> DataComponent:
         result_component = cls.component_scalar_validation(component, scalar)
-        comp_data = cls.cast_time_types(component.data_type, component.data.copy())
+        comp_data = cls.cast_time_types(
+            component.data_type,
+            component.data.copy() if component.data is not None else pd.Series(),
+        )
         scalar_value = cls.cast_time_types_scalar(scalar.data_type, scalar.value)
-        if component.data_type.__name__ == "Duration" and not isinstance(scalar_value, int):
+        if component.data_type.__name__.__str__() == "Duration" and not isinstance(
+            scalar_value, int
+        ):
             scalar_value = DURATION_MAPPING[scalar_value]
-        result_component.data = cls.apply_operation_series_scalar(comp_data,
-                                                                  scalar_value, component_left)
+        result_component.data = cls.apply_operation_series_scalar(
+            comp_data, scalar_value, component_left
+        )
         return result_component
     @classmethod
     def dataset_set_evaluation(cls, dataset: Dataset, scalar_set: ScalarSet) -> Dataset:
         result_dataset = cls.dataset_set_validation(dataset, scalar_set)
-        result_data = dataset.data.copy()
+        result_data = dataset.data.copy() if dataset.data is not None else pd.DataFrame()
         for measure_name in dataset.get_measures_names():
-            result_data[measure_name] = cls.apply_operation_two_series(dataset.data[measure_name],
-                                                                       scalar_set)
+            if dataset.data is not None:
+                result_data[measure_name] = cls.apply_operation_two_series(
+                    dataset.data[measure_name], scalar_set
+                )
         cols_to_keep = dataset.get_identifiers_names() + dataset.get_measures_names()
         result_dataset.data = result_data[cols_to_keep]
@@ -585,28 +678,32 @@ class Binary(Operator):
         return result_dataset
     @classmethod
-    def component_set_evaluation(cls, component: DataComponent,
-                                 scalar_set: ScalarSet) -> DataComponent:
+    def component_set_evaluation(
+        cls, component: DataComponent, scalar_set: ScalarSet
+    ) -> DataComponent:
         result_component = cls.component_set_validation(component, scalar_set)
-        result_component.data = cls.apply_operation_two_series(component.data.copy(),
-                                                               scalar_set)
+        result_component.data = cls.apply_operation_two_series(
+            component.data.copy() if component.data is not None else pd.Series(), scalar_set
+        )
         return result_component
     @classmethod
     def scalar_set_evaluation(cls, scalar: Scalar, scalar_set: ScalarSet) -> Scalar:
         result_scalar = cls.scalar_set_validation(scalar, scalar_set)
         result_scalar.value = cls.op_func(scalar.value, scalar_set)
         return result_scalar
     @classmethod
-    def evaluate(cls, left_operand: ALL_MODEL_DATA_TYPES,
-                 right_operand: ALL_MODEL_DATA_TYPES) -> ALL_MODEL_DATA_TYPES:
+    def evaluate(cls, left_operand: Any, right_operand: Any) -> Any:
         """
         Evaluate the operation (based on validation output)
         :param left_operand: The left operand
         :param right_operand: The right operand
         :return: The result of the operation
         """
         if isinstance(left_operand, Dataset) and isinstance(right_operand, Dataset):
             return cls.dataset_evaluation(left_operand, right_operand)
         if isinstance(left_operand, Scalar) and isinstance(right_operand, Scalar):
@@ -615,23 +712,18 @@ class Binary(Operator):
             return cls.dataset_scalar_evaluation(left_operand, right_operand, dataset_left=True)
         if isinstance(left_operand, Scalar) and isinstance(right_operand, Dataset):
             return cls.dataset_scalar_evaluation(right_operand, left_operand, dataset_left=False)
         if isinstance(left_operand, DataComponent) and isinstance(right_operand, DataComponent):
             return cls.component_evaluation(left_operand, right_operand)
         if isinstance(left_operand, DataComponent) and isinstance(right_operand, Scalar):
             return cls.component_scalar_evaluation(left_operand, right_operand, component_left=True)
         if isinstance(left_operand, Scalar) and isinstance(right_operand, DataComponent):
-            return cls.component_scalar_evaluation(right_operand, left_operand,
-                                                   component_left=False)
+            return cls.component_scalar_evaluation(
+                right_operand, left_operand, component_left=False
+            )
         if isinstance(left_operand, Dataset) and isinstance(right_operand, ScalarSet):
             return cls.dataset_set_evaluation(left_operand, right_operand)
         if isinstance(left_operand, DataComponent) and isinstance(right_operand, ScalarSet):
             return cls.component_set_evaluation(left_operand, right_operand)
         if isinstance(left_operand, Scalar) and isinstance(right_operand, ScalarSet):
             return cls.scalar_set_evaluation(left_operand, right_operand)
@@ -639,21 +731,27 @@ class Binary(Operator):
 class Unary(Operator):
     @classmethod
-    def op_func(cls, x: Any) -> Any:
+    def op_func(cls, *args: Any) -> Any:
+        x = args[0]
         return None if pd.isnull(x) else cls.py_op(x)
     @classmethod
     def apply_operation_component(cls, series: Any) -> Any:
-        """Applies the operation to a component"""
-        return series.map(cls.py_op, na_action='ignore')
+        """
+        Applies the operation to a component
+        """
+        return series.map(cls.py_op, na_action="ignore")
     @classmethod
-    def validate(cls, operand: ALL_MODEL_DATA_TYPES):
+    def validate(cls, operand: Any) -> Any:
         """
         The main function for validate, applies the implicit promotion (or check it), and
         can do a semantic check too.
         Returns an operand.
         """
         if isinstance(operand, Dataset):
             return cls.dataset_validation(operand)
         elif isinstance(operand, DataComponent):
@@ -663,12 +761,15 @@ class Unary(Operator):
     @classmethod
     def dataset_validation(cls, operand: Dataset) -> Dataset:
         cls.validate_dataset_type(operand)
         if len(operand.get_measures()) == 0:
             raise SemanticError("1-1-1-8", op=cls.op, name=operand.name)
-        result_components = {comp_name: copy(comp) for comp_name, comp in
-                             operand.components.items() if
-                             comp.role in [Role.IDENTIFIER, Role.MEASURE]}
+        result_components = {
+            comp_name: copy(comp)
+            for comp_name, comp in operand.components.items()
+            if comp.role in [Role.IDENTIFIER, Role.MEASURE]
+        }
         result_dataset = Dataset(name="result", components=result_components, data=None)
         cls.apply_return_type_dataset(result_dataset, operand)
@@ -676,46 +777,64 @@ class Unary(Operator):
     @classmethod
     def scalar_validation(cls, operand: Scalar) -> Scalar:
         result_type = cls.type_validation(operand.data_type)
         result = Scalar(name="result", data_type=result_type, value=None)
         return result
     @classmethod
     def component_validation(cls, operand: DataComponent) -> DataComponent:
         result_type = cls.type_validation(operand.data_type)
-        result = DataComponent(name="result", data_type=result_type, data=None,
-                               role=operand.role, nullable=operand.nullable)
+        result = DataComponent(
+            name="result",
+            data_type=result_type,
+            data=None,
+            role=operand.role,
+            nullable=operand.nullable,
+        )
         return result
     # The following class method implements the type promotion
     @classmethod
-    def type_validation(cls, operand: ScalarType) -> ScalarType:
+    def type_validation(cls, operand: Any) -> Any:
         return unary_implicit_promotion(operand, cls.type_to_check, cls.return_type)
     # The following class method checks the type promotion
     @classmethod
-    def validate_type_compatibility(cls, operand: ScalarType) -> bool:
+    def validate_type_compatibility(cls, operand: Any) -> bool:
         return check_unary_implicit_promotion(operand, cls.type_to_check, cls.return_type)
     @classmethod
     def validate_dataset_type(cls, dataset: Dataset) -> None:
         if cls.type_to_check is not None:
             for measure in dataset.get_measures():
                 if not cls.validate_type_compatibility(measure.data_type):
-                    raise SemanticError("1-1-1-3",
-                                        op=cls.op, entity=measure.role.value,
-                                        name=measure.name,
-                                        target_type=SCALAR_TYPES_CLASS_REVERSE[cls.type_to_check])
+                    raise SemanticError(
+                        "1-1-1-3",
+                        op=cls.op,
+                        entity=measure.role.value,
+                        name=measure.name,
+                        target_type=SCALAR_TYPES_CLASS_REVERSE[cls.type_to_check],
+                    )
     @classmethod
     def validate_scalar_type(cls, scalar: Scalar) -> None:
-        if (cls.type_to_check is not None and not cls.validate_type_compatibility(
-                scalar.data_type)):
-            raise SemanticError("1-1-1-5", op=cls.op, name=scalar.name,
-                                type=SCALAR_TYPES_CLASS_REVERSE[scalar.data_type])
+        if cls.type_to_check is not None and not cls.validate_type_compatibility(scalar.data_type):
+            raise SemanticError(
+                "1-1-1-5",
+                op=cls.op,
+                name=scalar.name,
+                type=SCALAR_TYPES_CLASS_REVERSE[scalar.data_type],
+            )
     @classmethod
     def apply_return_type_dataset(cls, result_dataset: Dataset, operand: Dataset) -> None:
         changed_allowed = cls.op in MONOMEASURE_CHANGED_ALLOWED
         is_mono_measure = len(operand.get_measures()) == 1
         for measure in result_dataset.get_measures():
@@ -727,20 +846,23 @@ class Unary(Operator):
                     name=COMP_NAME_MAPPING[result_data_type],
                     data_type=result_data_type,
                     role=Role.MEASURE,
-                    nullable=measure.nullable
+                    nullable=measure.nullable,
                 )
                 result_dataset.delete_component(measure.name)
                 result_dataset.add_component(component)
                 if result_dataset.data is not None:
                     result_dataset.data.rename(columns={measure.name: component.name}, inplace=True)
-            elif changed_allowed is False and is_mono_measure is False and operand_type.promotion_changed_type(
-                    result_data_type):
+            elif (
+                changed_allowed is False
+                and is_mono_measure is False
+                and operand_type.promotion_changed_type(result_data_type)
+            ):
                 raise SemanticError("1-1-1-4", op=cls.op)
             else:
                 measure.data_type = result_data_type
     @classmethod
-    def evaluate(cls, operand: ALL_MODEL_DATA_TYPES) -> ALL_MODEL_DATA_TYPES:
+    def evaluate(cls, operand: ALL_MODEL_DATA_TYPES) -> Any:
         if isinstance(operand, Dataset):
             return cls.dataset_evaluation(operand)
@@ -751,8 +873,9 @@ class Unary(Operator):
     @classmethod
     def dataset_evaluation(cls, operand: Dataset) -> Dataset:
         result_dataset = cls.dataset_validation(operand)
-        result_data = operand.data.copy()
+        result_data = operand.data.copy() if operand.data is not None else pd.DataFrame()
         for measure_name in operand.get_measures_names():
             result_data[measure_name] = cls.apply_operation_component(result_data[measure_name])
@@ -765,12 +888,16 @@ class Unary(Operator):
     @classmethod
     def scalar_evaluation(cls, operand: Scalar) -> Scalar:
         result_scalar = cls.scalar_validation(operand)
         result_scalar.value = cls.op_func(operand.value)
         return result_scalar
     @classmethod
     def component_evaluation(cls, operand: DataComponent) -> DataComponent:
         result_component = cls.component_validation(operand)
-        result_component.data = cls.apply_operation_component(operand.data.copy())
+        result_component.data = cls.apply_operation_component(
+            operand.data.copy() if operand.data is not None else pd.Series()
+        )
         return result_component

vtlengine 1.0.0__py3-none-any.whl → 1.0.1__py3-none-any.whl

Potentially problematic release.

vtlengine 1.0.0py3-none-any.whl → 1.0.1py3-none-any.whl