pydpm_xl 0.1.10__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (94)
  1. py_dpm/AST/ASTConstructor.py +503 -0
  2. py_dpm/AST/ASTObjects.py +827 -0
  3. py_dpm/AST/ASTTemplate.py +101 -0
  4. py_dpm/AST/ASTVisitor.py +13 -0
  5. py_dpm/AST/MLGeneration.py +588 -0
  6. py_dpm/AST/ModuleAnalyzer.py +79 -0
  7. py_dpm/AST/ModuleDependencies.py +203 -0
  8. py_dpm/AST/WhereClauseChecker.py +12 -0
  9. py_dpm/AST/__init__.py +0 -0
  10. py_dpm/AST/check_operands.py +302 -0
  11. py_dpm/DataTypes/ScalarTypes.py +324 -0
  12. py_dpm/DataTypes/TimeClasses.py +370 -0
  13. py_dpm/DataTypes/TypePromotion.py +195 -0
  14. py_dpm/DataTypes/__init__.py +0 -0
  15. py_dpm/Exceptions/__init__.py +0 -0
  16. py_dpm/Exceptions/exceptions.py +84 -0
  17. py_dpm/Exceptions/messages.py +114 -0
  18. py_dpm/OperationScopes/OperationScopeService.py +247 -0
  19. py_dpm/OperationScopes/__init__.py +0 -0
  20. py_dpm/Operators/AggregateOperators.py +138 -0
  21. py_dpm/Operators/BooleanOperators.py +30 -0
  22. py_dpm/Operators/ClauseOperators.py +159 -0
  23. py_dpm/Operators/ComparisonOperators.py +69 -0
  24. py_dpm/Operators/ConditionalOperators.py +362 -0
  25. py_dpm/Operators/NumericOperators.py +101 -0
  26. py_dpm/Operators/Operator.py +388 -0
  27. py_dpm/Operators/StringOperators.py +27 -0
  28. py_dpm/Operators/TimeOperators.py +53 -0
  29. py_dpm/Operators/__init__.py +0 -0
  30. py_dpm/Utils/ValidationsGenerationUtils.py +429 -0
  31. py_dpm/Utils/__init__.py +0 -0
  32. py_dpm/Utils/operands_mapping.py +73 -0
  33. py_dpm/Utils/operator_mapping.py +89 -0
  34. py_dpm/Utils/tokens.py +172 -0
  35. py_dpm/Utils/utils.py +2 -0
  36. py_dpm/ValidationsGeneration/PropertiesConstraintsProcessor.py +190 -0
  37. py_dpm/ValidationsGeneration/Utils.py +364 -0
  38. py_dpm/ValidationsGeneration/VariantsProcessor.py +265 -0
  39. py_dpm/ValidationsGeneration/__init__.py +0 -0
  40. py_dpm/ValidationsGeneration/auxiliary_functions.py +98 -0
  41. py_dpm/__init__.py +61 -0
  42. py_dpm/api/__init__.py +140 -0
  43. py_dpm/api/ast_generator.py +438 -0
  44. py_dpm/api/complete_ast.py +241 -0
  45. py_dpm/api/data_dictionary_validation.py +577 -0
  46. py_dpm/api/migration.py +77 -0
  47. py_dpm/api/semantic.py +224 -0
  48. py_dpm/api/syntax.py +182 -0
  49. py_dpm/client.py +106 -0
  50. py_dpm/data_handlers.py +99 -0
  51. py_dpm/db_utils.py +117 -0
  52. py_dpm/grammar/__init__.py +0 -0
  53. py_dpm/grammar/dist/__init__.py +0 -0
  54. py_dpm/grammar/dist/dpm_xlLexer.interp +428 -0
  55. py_dpm/grammar/dist/dpm_xlLexer.py +804 -0
  56. py_dpm/grammar/dist/dpm_xlLexer.tokens +106 -0
  57. py_dpm/grammar/dist/dpm_xlParser.interp +249 -0
  58. py_dpm/grammar/dist/dpm_xlParser.py +5224 -0
  59. py_dpm/grammar/dist/dpm_xlParser.tokens +106 -0
  60. py_dpm/grammar/dist/dpm_xlParserListener.py +742 -0
  61. py_dpm/grammar/dist/dpm_xlParserVisitor.py +419 -0
  62. py_dpm/grammar/dist/listeners.py +10 -0
  63. py_dpm/grammar/dpm_xlLexer.g4 +435 -0
  64. py_dpm/grammar/dpm_xlParser.g4 +260 -0
  65. py_dpm/migration.py +282 -0
  66. py_dpm/models.py +2139 -0
  67. py_dpm/semantics/DAG/DAGAnalyzer.py +158 -0
  68. py_dpm/semantics/DAG/__init__.py +0 -0
  69. py_dpm/semantics/SemanticAnalyzer.py +320 -0
  70. py_dpm/semantics/Symbols.py +223 -0
  71. py_dpm/semantics/__init__.py +0 -0
  72. py_dpm/utils/__init__.py +0 -0
  73. py_dpm/utils/ast_serialization.py +481 -0
  74. py_dpm/views/data_types.sql +12 -0
  75. py_dpm/views/datapoints.sql +65 -0
  76. py_dpm/views/hierarchy_operand_reference.sql +11 -0
  77. py_dpm/views/hierarchy_preconditions.sql +13 -0
  78. py_dpm/views/hierarchy_variables.sql +26 -0
  79. py_dpm/views/hierarchy_variables_context.sql +14 -0
  80. py_dpm/views/key_components.sql +18 -0
  81. py_dpm/views/module_from_table.sql +11 -0
  82. py_dpm/views/open_keys.sql +13 -0
  83. py_dpm/views/operation_info.sql +27 -0
  84. py_dpm/views/operation_list.sql +18 -0
  85. py_dpm/views/operations_versions_from_module_version.sql +30 -0
  86. py_dpm/views/precondition_info.sql +17 -0
  87. py_dpm/views/report_type_operand_reference_info.sql +18 -0
  88. py_dpm/views/subcategory_info.sql +17 -0
  89. py_dpm/views/table_info.sql +19 -0
  90. pydpm_xl-0.1.10.dist-info/LICENSE +674 -0
  91. pydpm_xl-0.1.10.dist-info/METADATA +50 -0
  92. pydpm_xl-0.1.10.dist-info/RECORD +94 -0
  93. pydpm_xl-0.1.10.dist-info/WHEEL +4 -0
  94. pydpm_xl-0.1.10.dist-info/entry_points.txt +3 -0
py_dpm/Utils/ValidationsGenerationUtils.py
@@ -0,0 +1,429 @@
+ import json
+ from itertools import groupby
+
+ import pandas as pd
+
+ from py_dpm.Utils.tokens import CELL_COMPONENTS, COLUMN, COLUMN_CODE, EXISTENCE_REPORT, \
+     HIERARCHY_REPORT, ROW, ROW_CODE, SHEET, SHEET_CODE, SIGN_REPORT
+ from py_dpm.ValidationsGeneration.Utils import ExternalDataExistence, ExternalDataHierarchies, \
+     ExternalDataSign
+
+
+ def from_generate_to_response(validations):
+     """
+     Deduplicates the generated validations by expression, merging the operation
+     codes and subcategories of duplicate expressions into a single entry.
+     """
+     response_validations = {}
+     for validation in validations:
+         if validation['expression'] not in response_validations:
+             response_validations[validation['expression']] = validation
+         else:
+             for op_code in validation['operation_code']:
+                 if op_code not in response_validations[validation['expression']]['operation_code']:
+                     response_validations[validation['expression']]['operation_code'].append(op_code)
+             # The original compared the whole subcategory_id list; the membership
+             # check is on its first element, matching what is appended below.
+             if validation['subcategory_id'][0] not in response_validations[validation['expression']]['subcategory_id']:
+                 response_validations[validation['expression']]['subcategory_id'].append(validation['subcategory_id'][0])
+                 response_validations[validation['expression']]['subcategory_code'].append(validation['subcategory_code'][0])
+     response_validations_list = list(response_validations.values())
+     return response_validations_list
+
+
+ def generate_report_validation_view(validations, report_type):
+     report_type_list = [HIERARCHY_REPORT, SIGN_REPORT, EXISTENCE_REPORT]
+     if report_type not in report_type_list:
+         raise ValueError(f"report_type must be one of {report_type_list}")
+
+     if report_type == HIERARCHY_REPORT:
+         external_data = ExternalDataHierarchies()
+         # TODO: Check this. The original filtered rejected_rules with the
+         # proposed_rules mask; each frame is filtered on its own 'Type' column here.
+         proposed = external_data.proposed_rules[external_data.proposed_rules['Type'] == 'Hierarchy']
+         rejected = external_data.rejected_rules[external_data.rejected_rules['Type'] == 'Hierarchy']
+     elif report_type == SIGN_REPORT:
+         external_data = ExternalDataSign()
+         proposed = external_data.proposed_rules
+         rejected = external_data.rejected_rules
+     else:
+         external_data = ExternalDataExistence()
+         proposed = external_data.proposed_rules
+         rejected = external_data.rejected_rules
+
+     matched = {"number_validations": 0}
+     unmatched = {"number_validations": 0}
+     review = {"number_validations": 0}
+
+     # subcategory tracking was present but disabled in the original source
+     for validation in validations:
+         valdict = {
+             "operation_code": validation['operation_code'],
+             "expression": validation['expression'],
+             "status": validation['status']
+         }
+
+         if valdict['status'] != 'Correct':
+             if valdict['expression'] not in review:
+                 review[valdict['expression']] = valdict
+             review['number_validations'] += 1
+         elif valdict['operation_code'] != []:
+             if valdict['expression'] not in matched:
+                 matched[valdict['expression']] = valdict
+             matched['number_validations'] += 1
+         else:
+             if valdict['expression'] not in unmatched:
+                 unmatched[valdict['expression']] = valdict
+             unmatched['number_validations'] += 1
+
+     matched_codes = []
+     for val in matched:
+         if val != 'number_validations':
+             matched_codes += matched[val]['operation_code']
+
+     proposed_not_generated = proposed[~proposed['ID'].isin(matched_codes)]
+     rejected_not_generated = rejected[~rejected['ID'].isin(matched_codes)]
+
+     with open('./development/data/' + report_type + '_matched.json', 'w') as fp:
+         json.dump(matched, fp, indent=4)
+     with open('./development/data/' + report_type + '_unmatched.json', 'w') as fp:
+         json.dump(unmatched, fp, indent=4)
+     with open('./development/data/' + report_type + '_review.json', 'w') as fp:
+         json.dump(review, fp, indent=4)
+
+     proposed_not_generated.to_csv('./development/data/' + report_type + '_proposed_not_generated.csv', index=False)
+     rejected_not_generated.to_csv('./development/data/' + report_type + '_rejected_not_generated.csv', index=False)
+
+
+ class ValidationsGenerationUtils:
+     """
+     Common methods used by the different validation generation processes.
+     """
+
+     @classmethod
+     def get_components_to_group(cls, datapoints_variable: pd.DataFrame):
+         """
+         Gets the cell components to group by.
+         :param datapoints_variable: dataframe with the datapoints to group
+         :return: a list with the cell components to group by
+         """
+         component_values = datapoints_variable[CELL_COMPONENTS]
+         components_to_group = []
+         components_to_check = []
+         for cell_component in CELL_COMPONENTS:
+             if not component_values[cell_component].isnull().all():
+                 components_to_check.append(cell_component)
+
+         if len(components_to_check):
+             if len(components_to_check) == 1:
+                 return []
+
+             for cell_component in components_to_check:
+                 duplicated = component_values.duplicated(
+                     subset=[comp for comp in components_to_check if comp != cell_component],
+                     keep=False)
+                 if not duplicated.all():
+                     components_to_group.append(cell_component)
+         return components_to_group
+
+     @classmethod
+     def group_cells(cls, datapoints_variable: pd.DataFrame, datapoints_table: pd.DataFrame):
+         """
+         Gets the cell groups from the datapoints, grouping them when necessary.
+         :param datapoints_variable: datapoints of the variable
+         :param datapoints_table: datapoints of the table associated with the table code of the operand
+         :return: a list with the rows, cols and sheets of each group
+         """
+         components_to_group = cls.get_components_to_group(datapoints_variable=datapoints_variable)
+         result_lst = []
+         if not len(components_to_group) or len(components_to_group) > 2:
+             rows, cols, sheets = cls.group_cell_components(datapoints_variable=datapoints_variable,
+                                                            datapoints_table=datapoints_table)
+             result_lst.append((rows, cols, sheets))
+
+         elif len(components_to_group) == 1:
+             for key, group_df in datapoints_variable.groupby(components_to_group[0], dropna=False):
+                 rows, cols, sheets = cls.group_cell_components(datapoints_variable=group_df,
+                                                                datapoints_table=datapoints_table)
+                 result_lst.append((rows, cols, sheets))
+         else:
+             ref_component = components_to_group[0]
+             second_group_component = components_to_group[1]
+             third_component = [component for component in CELL_COMPONENTS if component not in components_to_group][0]
+
+             reference_prefix = ROW if ref_component == ROW_CODE else COLUMN if ref_component == COLUMN_CODE else SHEET
+             second_component_prefix = ROW if second_group_component == ROW_CODE else COLUMN if second_group_component == COLUMN_CODE else SHEET
+             third_component_prefix = ROW if third_component == ROW_CODE else COLUMN if third_component == COLUMN_CODE else SHEET
+
+             datapoints_variable = datapoints_variable.sort_values([ref_component, second_group_component])
+
+             components_dict = {}
+             for value in datapoints_variable[ref_component].unique().tolist():
+                 components_dict[value] = datapoints_variable[datapoints_variable[ref_component] == value][
+                     second_group_component].unique().tolist()
+
+             # group reference component values by second group component values
+             for keys_values, group_values in groupby(components_dict.items(), key=lambda x: sorted(x[1])):
+                 group_values = [v[0] for v in group_values]
+                 reference_component_grouping = cls.group_cell_component_elements(reference_prefix, group_values,
+                                                                                  datapoints_table[ref_component])
+                 second_component_grouping = cls.group_cell_component_elements(second_component_prefix, keys_values,
+                                                                               datapoints_table[second_group_component])
+                 third_component_grouping = None
+                 if not datapoints_variable[third_component].isnull().all():
+                     third_values = datapoints_variable[
+                         datapoints_variable[ref_component].isin(group_values) & datapoints_variable[
+                             second_group_component].isin(keys_values)][third_component].unique().tolist()
+                     third_component_grouping = cls.group_cell_component_elements(third_component_prefix, third_values,
+                                                                                  datapoints_table[third_component])
+
+                 rows = reference_component_grouping if reference_prefix == ROW else second_component_grouping if second_component_prefix == ROW else third_component_grouping
+                 cols = reference_component_grouping if reference_prefix == COLUMN else second_component_grouping if second_component_prefix == COLUMN else third_component_grouping
+                 sheets = reference_component_grouping if reference_prefix == SHEET else second_component_grouping if second_component_prefix == SHEET else third_component_grouping
+                 result_lst.append((rows, cols, sheets))
+
+         return result_lst
+
+     @classmethod
+     def group_cells_test(cls, datapoints_variable: pd.DataFrame, datapoints_table: pd.DataFrame):
+         """
+         Gets the cell groups from the datapoints, grouping them when necessary.
+         :param datapoints_variable: datapoints of the variable
+         :param datapoints_table: datapoints of the table associated with the table code of the operand
+         :return: a list with the rows, cols, sheets and cell ids of each group
+         """
+         components_to_group = cls.get_components_to_group(datapoints_variable=datapoints_variable)
+         result_lst = []
+         if not len(components_to_group) or len(components_to_group) > 2:
+             is_several_vals, filtered_df = cls._several_validations_checker(datapoints_variable)
+             if is_several_vals:
+                 for df in filtered_df:
+                     rows, cols, sheets = cls.group_cell_components(datapoints_variable=df,
+                                                                    datapoints_table=datapoints_table)
+                     result_lst.append((rows, cols, sheets, df['cell_id'].to_list()))
+             else:
+                 rows, cols, sheets = cls.group_cell_components(datapoints_variable=datapoints_variable,
+                                                                datapoints_table=datapoints_table)
+                 result_lst.append((rows, cols, sheets, datapoints_variable['cell_id'].to_list()))
+
+         elif len(components_to_group) == 1:
+             for key, group_df in datapoints_variable.groupby(components_to_group[0], dropna=False):
+                 rows, cols, sheets = cls.group_cell_components(datapoints_variable=group_df,
+                                                                datapoints_table=datapoints_table)
+                 result_lst.append((rows, cols, sheets, group_df['cell_id'].to_list()))
+         else:
+             ref_component = components_to_group[0]
+             second_group_component = components_to_group[1]
+             third_component = [component for component in CELL_COMPONENTS if component not in components_to_group][0]
+
+             reference_prefix = ROW if ref_component == ROW_CODE else COLUMN if ref_component == COLUMN_CODE else SHEET
+             second_component_prefix = ROW if second_group_component == ROW_CODE else COLUMN if second_group_component == COLUMN_CODE else SHEET
+             third_component_prefix = ROW if third_component == ROW_CODE else COLUMN if third_component == COLUMN_CODE else SHEET
+
+             datapoints_variable = datapoints_variable.sort_values([ref_component, second_group_component])
+
+             components_dict = {}
+             for value in datapoints_variable[ref_component].unique().tolist():
+                 components_dict[value] = datapoints_variable[datapoints_variable[ref_component] == value][
+                     second_group_component].unique().tolist()
+
+             # group reference component values by second group component values
+             for keys_values, group_values in groupby(components_dict.items(), key=lambda x: sorted(x[1])):
+                 group_values = [v[0] for v in group_values]
+                 reference_component_grouping = cls.group_cell_component_elements(reference_prefix, group_values,
+                                                                                  datapoints_table[ref_component])
+                 second_component_grouping = cls.group_cell_component_elements(second_component_prefix, keys_values,
+                                                                               datapoints_table[second_group_component])
+                 third_component_grouping = None
+                 if not datapoints_variable[third_component].isnull().all():
+                     third_values = datapoints_variable[
+                         datapoints_variable[ref_component].isin(group_values) & datapoints_variable[
+                             second_group_component].isin(keys_values)][third_component].unique().tolist()
+                     third_component_grouping = cls.group_cell_component_elements(third_component_prefix, third_values,
+                                                                                  datapoints_table[third_component])
+
+                 rows = reference_component_grouping if reference_prefix == ROW else second_component_grouping if second_component_prefix == ROW else third_component_grouping
+                 cols = reference_component_grouping if reference_prefix == COLUMN else second_component_grouping if second_component_prefix == COLUMN else third_component_grouping
+                 sheets = reference_component_grouping if reference_prefix == SHEET else second_component_grouping if second_component_prefix == SHEET else third_component_grouping
+                 result_lst.append((rows, cols, sheets, datapoints_variable['cell_id'].to_list()))  # TODO: Check this
+
+         return result_lst
+
+     @classmethod
+     def group_cell_components(cls, datapoints_variable, datapoints_table):
+         """
+         Extracts the cell components, grouping them when necessary.
+         :param datapoints_variable: datapoints of the variable
+         :param datapoints_table: datapoints of the table associated with the table code of the operand
+         :return: rows, cols and sheets of the operand
+         """
+         rows = cls.group_cell_component_elements(ROW, datapoints_variable[ROW_CODE].tolist(),
+                                                  datapoints_table[ROW_CODE])
+         cols = cls.group_cell_component_elements(COLUMN, datapoints_variable[COLUMN_CODE].tolist(),
+                                                  datapoints_table[COLUMN_CODE])
+         sheets = cls.group_cell_component_elements(SHEET, datapoints_variable[SHEET_CODE].tolist(),
+                                                    datapoints_table[SHEET_CODE])
+         return rows, cols, sheets
+
+     @classmethod
+     def group_cell_component_elements(cls, cell_component_prefix: str, cell_component_elements: list,
+                                       datapoints: pd.Series):
+         """
+         Groups the elements of a cell component.
+         :param cell_component_prefix: cell component name to be operated on
+         :param cell_component_elements: values of the operand cell component associated with the
+             cell_component_prefix argument
+         :param datapoints: values of the table cell component associated with the cell_component_prefix argument
+         :return: the cell component, grouped when necessary
+         """
+         unique_values = set(cell_component_elements)
+         if len(unique_values) == 0:
+             return None
+         elif len(unique_values) == 1:
+             if cell_component_elements[0]:
+                 return cell_component_prefix + str(cell_component_elements[0])
+             return None
+
+         cell_component_elements.sort()
+         cell_component_all_unique_values = datapoints.drop_duplicates().tolist()
+         datapoints_cell_component = datapoints[
+             datapoints.between(cell_component_elements[0], cell_component_elements[-1])]
+
+         # every value of the table component is referenced: collapse to a wildcard
+         if len(unique_values) == len(cell_component_all_unique_values):
+             return f"{cell_component_prefix}*"
+
+         # a contiguous block of the table component is referenced: collapse to a range
+         if len(unique_values) == len(datapoints_cell_component.drop_duplicates()):
+             return f"{cell_component_prefix}{cell_component_elements[0]}-{cell_component_elements[-1]}"
+
+         return '(' + ', '.join([f"{cell_component_prefix}{component}" for component in sorted(unique_values)]) + ')'
+
+     @classmethod
+     def write_cell(cls, table_code, rows, cols, sheets):
+         """
+         Returns a string that represents a cell expression.
+         :param table_code: table code
+         :param rows: expression rows
+         :param cols: expression cols
+         :param sheets: expression sheets
+         """
+         table_code = f"t{table_code}" if table_code else None
+         cell_components = [components for components in (table_code, rows, cols, sheets) if components]
+         if len(cell_components):
+             cell_info = ', '.join(cell_components)
+             return '{' + cell_info + '}'
+         return ""
+
+     @classmethod
+     def write_cell_with_asterisk(cls, table_code, rows, cols, sheets, reference_data):
+         """
+         Returns a string that represents a cell expression, replacing full ranges with asterisks.
+         :param table_code: table code
+         :param rows: expression rows
+         :param cols: expression cols
+         :param sheets: expression sheets
+         :param reference_data: table datapoints used to decide whether a range covers the whole component
+         """
+         # check if * is needed
+         if rows and "-" in rows:
+             rows = replace_range_by_asterisk(rows, reference_data[ROW_CODE], ROW)
+         if cols and "-" in cols:
+             cols = replace_range_by_asterisk(cols, reference_data[COLUMN_CODE], COLUMN)
+         if sheets and "-" in sheets:
+             sheets = replace_range_by_asterisk(sheets, reference_data[SHEET_CODE], SHEET)
+
+         table_code = f"t{table_code}" if table_code else None
+         cell_components = [components for components in (table_code, rows, cols, sheets) if components]
+         if len(cell_components):
+             cell_info = ', '.join(cell_components)
+             return '{' + cell_info + '}'
+         return None
+
+     @classmethod
+     def _several_validations_checker(cls, df) -> (bool, pd.DataFrame):
+         """
+         Checks whether the dataframe holds several validations.
+         :param df: dataframe with validations
+         :return: a tuple (True, list of filtered dataframes) if the dataframe holds
+             several validations, (False, None) otherwise
+         """
+         # TODO: Check this, example F_18.00.b sign validations
+         checker = 0
+         checker_component = []
+         for c_component in CELL_COMPONENTS:
+             if df[c_component].nunique() > 1:
+                 checker += 1
+                 checker_component.append(c_component)
+         if checker == 2:
+             results = _two_components_checker(df, checker_component)
+             if results:
+                 return True, results
+         if checker == 3:
+             # TODO: To implement; not necessary for now because there are no sign
+             # validations (without components to group) with 3 components
+             pass
+
+         return False, None
+
+ def _two_components_checker(df, checker_component) -> list:
+     """
+     Groups the values of two cell components into sets of related validations.
+     :param df: dataframe with validations
+     :param checker_component: the two cell components that have more than one value
+     :return: a list of filtered dataframes, one per group of related component values
+     """
+     results = []
+     for idx, _ in enumerate(checker_component):
+         # pair each component with the other one (the -1 wraps around)
+         component_group = checker_component[idx - 1]
+         other_component = checker_component[idx]
+         group_df = df.groupby(component_group)
+         dict_related = {}
+         dict_values = {}
+         for group_key, group in group_df:
+             dict_values[group_key] = group[other_component].unique().tolist()
+
+         for key, values in dict_values.items():
+             dict_related[key] = []
+             for other_key, other_values in dict_values.items():
+                 if key != other_key and set(values) == set(other_values):
+                     dict_related[key].append(other_key)
+         components_grouped_list = [(k, *v) for k, v in dict_related.items()]
+         components_grouped_sorted = [sorted(x) for x in components_grouped_list]
+         components_grouped_sorted = [tuple(x) for x in components_grouped_sorted]
+         components_set = set(components_grouped_sorted)
+
+         if len(components_set) > 1:
+             for elto in components_set:
+                 results.append(df[df[component_group].isin(elto)])
+
+     return results
+
+ def replace_range_by_asterisk(expression, df_component, component_prefix):
+     """
+     Replaces a range expression with an asterisk when the range covers every value of the component.
+     :param expression: expression to be replaced
+     :param df_component: table values of the component
+     :param component_prefix: prefix of the component (row, column or sheet)
+     :return: the expression, with the range replaced by an asterisk when possible
+     """
+     sorted_list = sorted(df_component.drop_duplicates().to_list())
+     first_element_expression = expression.split("-")[0][1:]
+     last_element_expression = expression.split("-")[1]
+     if len(sorted_list) > 1 and first_element_expression == sorted_list[0] \
+             and last_element_expression == sorted_list[-1]:
+         return component_prefix + "*"
+
+     return expression
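For orientation, here is a minimal usage sketch of the grouping helpers above. It is an illustration, not part of the package diff: the table code and component values are hypothetical, and it assumes the ROW token resolves to the "r" prefix used in cell expressions.

import pandas as pd

from py_dpm.Utils.ValidationsGenerationUtils import ValidationsGenerationUtils

# Hypothetical table layout: all row codes the table defines.
table_rows = pd.Series(["010", "020", "030", "040"])

# Every row referenced -> collapsed to a wildcard.
ValidationsGenerationUtils.group_cell_component_elements("r", ["010", "020", "030", "040"], table_rows)
# -> "r*"

# A contiguous subset -> collapsed to a range.
ValidationsGenerationUtils.group_cell_component_elements("r", ["010", "020", "030"], table_rows)
# -> "r010-030"

# A non-contiguous subset -> an explicit list.
ValidationsGenerationUtils.group_cell_component_elements("r", ["010", "030"], table_rows)
# -> "(r010, r030)"

# The grouped components are then assembled into a cell expression.
ValidationsGenerationUtils.write_cell("F_18.00", "r010-030", "c010", None)
# -> "{tF_18.00, r010-030, c010}"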
py_dpm/Utils/operands_mapping.py
@@ -0,0 +1,73 @@
+ import itertools
+ import string
+ from typing import Union
+
+ from py_dpm.AST.ASTObjects import PreconditionItem, VarID
+
+
+ class LabelHandler:
+     _instance = None
+     labels = None
+     operands_labels = None
+
+     def __new__(cls):
+         if not isinstance(cls._instance, cls):
+             cls._instance = object.__new__(cls)
+             cls.labels = iter_all_strings()
+             cls.operands_labels = {}
+             cls.labels_type = {}
+         return cls._instance
+
+     @classmethod
+     def reset_instance(cls):
+         cls.labels.close()
+         cls.labels = iter_all_strings()
+         cls.operands_labels = {}
+         cls.labels_type = {}
+
+
+ def iter_all_strings():
+     # yields "A", "B", ..., "Z", "AA", "AB", ... in spreadsheet-column order
+     for size in itertools.count(1):
+         for s in itertools.product(string.ascii_uppercase, repeat=size):
+             yield "".join(s)
+
+
+ def set_operand_label(label: str, operand: Union[str, VarID, PreconditionItem]):
+     # The original annotation was Union[str, VarID]; PreconditionItem is added
+     # to match the isinstance branch below.
+     if isinstance(operand, VarID):
+         LabelHandler().operands_labels[label] = generate_operand_expression(operand)
+         LabelHandler().labels_type[label] = 'single'
+     elif isinstance(operand, PreconditionItem):
+         LabelHandler().operands_labels[label] = f"v_{operand.variable_code}"
+         LabelHandler().labels_type[label] = 'single'
+     else:
+         LabelHandler().operands_labels[label] = operand
+         LabelHandler().labels_type[label] = 'not_single'
+
+
+ def generate_operand_expression(operand: VarID):
+     operand_expression = "{ "
+     operand_expression += f"t{operand.table}"
+     if operand.rows:
+         operand_expression += f", {','.join(['r' + x for x in operand.rows])}"
+     if operand.cols:
+         operand_expression += f", {','.join(['c' + x for x in operand.cols])}"
+     if operand.sheets:
+         operand_expression += f", {','.join(['s' + x for x in operand.sheets])}"
+     operand_expression += " }"
+     return operand_expression
+
+
+ def get_operand_from_label(label: str):
+     if label in LabelHandler().operands_labels:
+         return LabelHandler().operands_labels[label]
+     return None
+
+
+ def get_type_from_label(label: str):
+     if label in LabelHandler().labels_type:
+         return LabelHandler().labels_type[label]
+     return None
+
+
+ def generate_new_label():
+     label = next(LabelHandler().labels)
+     return f"$@{label}#"
py_dpm/Utils/operator_mapping.py
@@ -0,0 +1,89 @@
+ from py_dpm.Operators.AggregateOperators import Avg, Count, MaxAggr, Median, MinAggr, Sum
+ from py_dpm.Operators.BooleanOperators import And, Not, Or, Xor
+ from py_dpm.Operators.ClauseOperators import Get, Rename, Where
+ from py_dpm.Operators.ComparisonOperators import Equal, Greater, GreaterEqual, In, IsNull, Less, LessEqual, Match, NotEqual
+ from py_dpm.Operators.ConditionalOperators import Filter, IfOperator, Nvl
+ from py_dpm.Operators.NumericOperators import AbsoluteValue, BinMinus, BinPlus, Div, Exponential, Logarithm, \
+     Max, Min, Mult, NaturalLogarithm, Power, SquareRoot, UnMinus, UnPlus
+ from py_dpm.Operators.StringOperators import Concatenate, Len
+ from py_dpm.Operators.TimeOperators import TimeShift
+ from .tokens import *
+
+ BIN_OP_MAPPING = {
+     # Boolean operators
+     AND: And,
+     OR: Or,
+     XOR: Xor,
+
+     # Comparison operators
+     EQ: Equal,
+     NEQ: NotEqual,
+     GT: Greater,
+     GTE: GreaterEqual,
+     LT: Less,
+     LTE: LessEqual,
+     IN: In,
+     MATCH: Match,
+
+     # Numeric operators
+     PLUS: BinPlus,
+     MINUS: BinMinus,
+     MULT: Mult,
+     DIV: Div,
+     POW: Power,
+     LOG: Logarithm,
+
+     # Conditional operator
+     NVL: Nvl,
+
+     # String operators
+     CONCATENATE: Concatenate
+ }
+
+ UNARY_OP_MAPPING = {
+     # Boolean operators
+     NOT: Not,
+
+     # Numeric operators
+     PLUS: UnPlus,
+     MINUS: UnMinus,
+     ABS: AbsoluteValue,
+     EXP: Exponential,
+     LN: NaturalLogarithm,
+     SQRT: SquareRoot,
+
+     # Comparison operators
+     ISNULL: IsNull,
+
+     # String operators
+     LENGTH: Len
+ }
+
+ AGGR_OP_MAPPING = {
+     MAX_AGGR: MaxAggr,
+     MIN_AGGR: MinAggr,
+     SUM: Sum,
+     COUNT: Count,
+     AVG: Avg,
+     MEDIAN: Median
+ }
+
+ CLAUSE_OP_MAPPING = {
+     WHERE: Where,
+     RENAME: Rename,
+     GET: Get
+ }
+
+ TIME_OPERATORS = {
+     TIME_SHIFT: TimeShift
+ }
+
+ CONDITIONAL_OP_MAPPING = {
+     IF: IfOperator,
+     FILTER: Filter
+ }
+
+ COMPLEX_OP_MAPPING = {
+     MAX: Max,
+     MIN: Min
+ }
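As a rough illustration of how these dictionaries are meant to be used (presumably by the AST construction code, which is an assumption): an operator token is looked up in the mapping that matches its arity, yielding the operator class. The token names come from the star-imported tokens module.

from py_dpm.Utils.operator_mapping import BIN_OP_MAPPING, UNARY_OP_MAPPING
from py_dpm.Utils.tokens import MINUS, PLUS

BIN_OP_MAPPING[PLUS]     # -> BinPlus   (binary "+")
UNARY_OP_MAPPING[MINUS]  # -> UnMinus   (unary "-")
# The same token can map to different operators depending on arity,
# which is why binary and unary lookups live in separate dictionaries.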