squirrels 0.4.0-py3-none-any.whl → 0.5.0-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

Files changed (125)
  1. dateutils/__init__.py +6 -0
  2. dateutils/_enums.py +25 -0
  3. squirrels/dateutils.py → dateutils/_implementation.py +58 -111
  4. dateutils/types.py +6 -0
  5. squirrels/__init__.py +13 -11
  6. squirrels/_api_routes/__init__.py +5 -0
  7. squirrels/_api_routes/auth.py +271 -0
  8. squirrels/_api_routes/base.py +165 -0
  9. squirrels/_api_routes/dashboards.py +150 -0
  10. squirrels/_api_routes/data_management.py +145 -0
  11. squirrels/_api_routes/datasets.py +257 -0
  12. squirrels/_api_routes/oauth2.py +298 -0
  13. squirrels/_api_routes/project.py +252 -0
  14. squirrels/_api_server.py +256 -450
  15. squirrels/_arguments/__init__.py +0 -0
  16. squirrels/_arguments/init_time_args.py +108 -0
  17. squirrels/_arguments/run_time_args.py +147 -0
  18. squirrels/_auth.py +960 -0
  19. squirrels/_command_line.py +126 -45
  20. squirrels/_compile_prompts.py +147 -0
  21. squirrels/_connection_set.py +48 -26
  22. squirrels/_constants.py +68 -38
  23. squirrels/_dashboards.py +160 -0
  24. squirrels/_data_sources.py +570 -0
  25. squirrels/_dataset_types.py +84 -0
  26. squirrels/_exceptions.py +29 -0
  27. squirrels/_initializer.py +177 -80
  28. squirrels/_logging.py +115 -0
  29. squirrels/_manifest.py +208 -79
  30. squirrels/_model_builder.py +69 -0
  31. squirrels/_model_configs.py +74 -0
  32. squirrels/_model_queries.py +52 -0
  33. squirrels/_models.py +926 -367
  34. squirrels/_package_data/base_project/.env +42 -0
  35. squirrels/_package_data/base_project/.env.example +42 -0
  36. squirrels/_package_data/base_project/assets/expenses.db +0 -0
  37. squirrels/_package_data/base_project/connections.yml +16 -0
  38. squirrels/_package_data/base_project/dashboards/dashboard_example.py +34 -0
  39. squirrels/_package_data/base_project/dashboards/dashboard_example.yml +22 -0
  40. squirrels/{package_data → _package_data}/base_project/docker/.dockerignore +5 -2
  41. squirrels/{package_data → _package_data}/base_project/docker/Dockerfile +3 -3
  42. squirrels/{package_data → _package_data}/base_project/docker/compose.yml +1 -1
  43. squirrels/_package_data/base_project/duckdb_init.sql +10 -0
  44. squirrels/{package_data/base_project/.gitignore → _package_data/base_project/gitignore} +3 -2
  45. squirrels/_package_data/base_project/macros/macros_example.sql +17 -0
  46. squirrels/_package_data/base_project/models/builds/build_example.py +26 -0
  47. squirrels/_package_data/base_project/models/builds/build_example.sql +16 -0
  48. squirrels/_package_data/base_project/models/builds/build_example.yml +57 -0
  49. squirrels/_package_data/base_project/models/dbviews/dbview_example.sql +12 -0
  50. squirrels/_package_data/base_project/models/dbviews/dbview_example.yml +26 -0
  51. squirrels/_package_data/base_project/models/federates/federate_example.py +37 -0
  52. squirrels/_package_data/base_project/models/federates/federate_example.sql +19 -0
  53. squirrels/_package_data/base_project/models/federates/federate_example.yml +65 -0
  54. squirrels/_package_data/base_project/models/sources.yml +38 -0
  55. squirrels/{package_data → _package_data}/base_project/parameters.yml +56 -40
  56. squirrels/_package_data/base_project/pyconfigs/connections.py +14 -0
  57. squirrels/{package_data → _package_data}/base_project/pyconfigs/context.py +21 -40
  58. squirrels/_package_data/base_project/pyconfigs/parameters.py +141 -0
  59. squirrels/_package_data/base_project/pyconfigs/user.py +44 -0
  60. squirrels/_package_data/base_project/seeds/seed_categories.yml +15 -0
  61. squirrels/_package_data/base_project/seeds/seed_subcategories.csv +15 -0
  62. squirrels/_package_data/base_project/seeds/seed_subcategories.yml +21 -0
  63. squirrels/_package_data/base_project/squirrels.yml.j2 +61 -0
  64. squirrels/_package_data/templates/dataset_results.html +112 -0
  65. squirrels/_package_data/templates/oauth_login.html +271 -0
  66. squirrels/_package_data/templates/squirrels_studio.html +20 -0
  67. squirrels/_package_loader.py +8 -4
  68. squirrels/_parameter_configs.py +104 -103
  69. squirrels/_parameter_options.py +348 -0
  70. squirrels/_parameter_sets.py +57 -47
  71. squirrels/_parameters.py +1664 -0
  72. squirrels/_project.py +721 -0
  73. squirrels/_py_module.py +7 -5
  74. squirrels/_schemas/__init__.py +0 -0
  75. squirrels/_schemas/auth_models.py +167 -0
  76. squirrels/_schemas/query_param_models.py +75 -0
  77. squirrels/{_api_response_models.py → _schemas/response_models.py} +126 -47
  78. squirrels/_seeds.py +35 -16
  79. squirrels/_sources.py +110 -0
  80. squirrels/_utils.py +248 -73
  81. squirrels/_version.py +1 -1
  82. squirrels/arguments.py +7 -0
  83. squirrels/auth.py +4 -0
  84. squirrels/connections.py +3 -0
  85. squirrels/dashboards.py +2 -81
  86. squirrels/data_sources.py +14 -631
  87. squirrels/parameter_options.py +13 -348
  88. squirrels/parameters.py +14 -1266
  89. squirrels/types.py +16 -0
  90. squirrels-0.5.0.dist-info/METADATA +113 -0
  91. squirrels-0.5.0.dist-info/RECORD +97 -0
  92. {squirrels-0.4.0.dist-info → squirrels-0.5.0.dist-info}/WHEEL +1 -1
  93. squirrels-0.5.0.dist-info/entry_points.txt +3 -0
  94. {squirrels-0.4.0.dist-info → squirrels-0.5.0.dist-info/licenses}/LICENSE +1 -1
  95. squirrels/_authenticator.py +0 -85
  96. squirrels/_dashboards_io.py +0 -61
  97. squirrels/_environcfg.py +0 -84
  98. squirrels/arguments/init_time_args.py +0 -40
  99. squirrels/arguments/run_time_args.py +0 -208
  100. squirrels/package_data/assets/favicon.ico +0 -0
  101. squirrels/package_data/assets/index.css +0 -1
  102. squirrels/package_data/assets/index.js +0 -58
  103. squirrels/package_data/base_project/assets/expenses.db +0 -0
  104. squirrels/package_data/base_project/connections.yml +0 -7
  105. squirrels/package_data/base_project/dashboards/dashboard_example.py +0 -32
  106. squirrels/package_data/base_project/dashboards.yml +0 -10
  107. squirrels/package_data/base_project/env.yml +0 -29
  108. squirrels/package_data/base_project/models/dbviews/dbview_example.py +0 -47
  109. squirrels/package_data/base_project/models/dbviews/dbview_example.sql +0 -22
  110. squirrels/package_data/base_project/models/federates/federate_example.py +0 -21
  111. squirrels/package_data/base_project/models/federates/federate_example.sql +0 -3
  112. squirrels/package_data/base_project/pyconfigs/auth.py +0 -45
  113. squirrels/package_data/base_project/pyconfigs/connections.py +0 -19
  114. squirrels/package_data/base_project/pyconfigs/parameters.py +0 -95
  115. squirrels/package_data/base_project/seeds/seed_subcategories.csv +0 -15
  116. squirrels/package_data/base_project/squirrels.yml.j2 +0 -94
  117. squirrels/package_data/templates/index.html +0 -18
  118. squirrels/project.py +0 -378
  119. squirrels/user_base.py +0 -55
  120. squirrels-0.4.0.dist-info/METADATA +0 -117
  121. squirrels-0.4.0.dist-info/RECORD +0 -60
  122. squirrels-0.4.0.dist-info/entry_points.txt +0 -4
  123. /squirrels/{package_data → _package_data}/base_project/assets/weather.db +0 -0
  124. /squirrels/{package_data → _package_data}/base_project/seeds/seed_categories.csv +0 -0
  125. /squirrels/{package_data → _package_data}/base_project/tmp/.gitignore +0 -0
squirrels/_data_sources.py (new file)
@@ -0,0 +1,570 @@
+ from __future__ import annotations
+ from dataclasses import dataclass
+ from enum import Enum
+ import polars as pl, typing as t, abc
+
+ from . import _parameter_configs as pc, _parameter_options as po
+ from ._exceptions import ConfigurationError
+
+ class SourceEnum(Enum):
+     CONNECTION = "connection"
+     SEEDS = "seeds"
+     VDL = "vdl"
+
+
+ @dataclass
+ class DataSource(metaclass=abc.ABCMeta):
+     """
+     Abstract class for lookup tables coming from a database
+     """
+     _table_or_query: str
+     _id_col: str | None
+     _source: SourceEnum
+     _user_group_col: str | None
+     _parent_id_col: str | None
+     _connection: str | None
+
+     @abc.abstractmethod
+     def __init__(
+         self, table_or_query: str, *, id_col: str | None = None, source: SourceEnum = SourceEnum.CONNECTION,
+         user_group_col: str | None = None, parent_id_col: str | None = None, connection: str | None = None, **kwargs
+     ) -> None:
+         self._table_or_query = table_or_query
+         self._id_col = id_col
+         self._source = source
+         self._user_group_col = user_group_col
+         self._parent_id_col = parent_id_col
+         self._connection = connection
+
+     def _get_connection_name(self, default_conn_name: str) -> str:
+         return self._connection if self._connection is not None else default_conn_name
+
+     def _get_query(self) -> str:
+         """
+         Get the "table_or_query" attribute as a select query
+
+         Returns:
+             str: The converted select query
+         """
+         if self._table_or_query.strip().lower().startswith('select '):
+             query = self._table_or_query
+         else:
+             query = f'SELECT * FROM {self._table_or_query}'
+         return query
+
+     @abc.abstractmethod
+     def _convert(self, ds_param: pc.DataSourceParameterConfig, df: pl.DataFrame) -> pc.ParameterConfig:
+         """
+         An abstract method for converting itself into a parameter
+         """
+         pass
+
+     def _validate_parameter_type(self, ds_param: pc.DataSourceParameterConfig, target_parameter_type: t.Type[pc.ParameterConfig]) -> None:
+         if ds_param.parameter_type != target_parameter_type:
+             parameter_type_name = ds_param.parameter_type.__name__
+             datasource_type_name = self.__class__.__name__
+             raise ConfigurationError(f'Invalid widget type "{parameter_type_name}" for {datasource_type_name}')
+
+     def _get_aggregated_df(self, df: pl.DataFrame, columns_to_include: t.Iterable[str]) -> pl.DataFrame:
+         if self._id_col is None:
+             return df
+
+         agg_rules = []
+         for column in columns_to_include:
+             if column is not None:
+                 agg_rules.append(pl.first(column))
+         if self._user_group_col is not None:
+             agg_rules.append(pl.col(self._user_group_col))
+         if self._parent_id_col is not None:
+             agg_rules.append(pl.col(self._parent_id_col))
+
+         try:
+             df_agg = df.group_by(self._id_col).agg(agg_rules).sort(by=self._id_col)
+         except pl.exceptions.ColumnNotFoundError as e:
+             raise ConfigurationError(e)
+
+         return df_agg
+
+     def _get_key_from_record(self, key: str | None, record: dict[t.Hashable, t.Any], default: t.Any) -> t.Any:
+         return record[key] if key is not None else default
+
+     def _get_key_from_record_as_list(self, key: str | None, record: dict[t.Hashable, t.Any]) -> t.Iterable[str]:
+         value = self._get_key_from_record(key, record, list())
+         return [str(x) for x in value]
+
+
+ @dataclass
+ class _SelectionDataSource(DataSource):
+     """
+     Abstract class for selection parameter data sources
+     """
+     _options_col: str
+     _order_by_col: str | None
+     _is_default_col: str | None
+     _custom_cols: dict[str, str]
+
+     @abc.abstractmethod
+     def __init__(
+         self, table_or_query: str, id_col: str, options_col: str, *, order_by_col: str | None = None,
+         is_default_col: str | None = None, custom_cols: dict[str, str] = {}, source: SourceEnum = SourceEnum.CONNECTION,
+         user_group_col: str | None = None, parent_id_col: str | None = None, connection: str | None = None,
+         **kwargs
+     ) -> None:
+         super().__init__(
+             table_or_query, id_col=id_col, source=source, user_group_col=user_group_col, parent_id_col=parent_id_col,
+             connection=connection
+         )
+         self._options_col = options_col
+         self._order_by_col = order_by_col
+         self._is_default_col = is_default_col
+         self._custom_cols = custom_cols
+
+     def _get_all_options(self, df: pl.DataFrame) -> t.Sequence[po.SelectParameterOption]:
+         columns = [self._options_col, self._order_by_col, self._is_default_col, *self._custom_cols.values()]
+         df_agg = self._get_aggregated_df(df, columns)
+
+         if self._order_by_col is None:
+             df_agg = df_agg.sort(by=self._id_col)
+         else:
+             df_agg = df_agg.sort(by=self._order_by_col)
+
+         def get_is_default(record: dict[t.Hashable, t.Any]) -> bool:
+             return int(record[self._is_default_col]) == 1 if self._is_default_col is not None else False
+
+         def get_custom_fields(record: dict[t.Hashable, t.Any]) -> dict[str, t.Any]:
+             result = {}
+             for key, val in self._custom_cols.items():
+                 result[key] = record[val]
+             return result
+
+         records = df_agg.to_pandas().to_dict("records")
+         return tuple(
+             po.SelectParameterOption(
+                 str(record[self._id_col]), str(record[self._options_col]),
+                 is_default=get_is_default(record), custom_fields=get_custom_fields(record),
+                 user_groups=self._get_key_from_record_as_list(self._user_group_col, record),
+                 parent_option_ids=self._get_key_from_record_as_list(self._parent_id_col, record)
+             )
+             for record in records
+         )
+
+
+ @dataclass
+ class SelectDataSource(_SelectionDataSource):
+     """
+     Lookup table for select parameter options
+     """
+
+     def __init__(
+         self, table_or_query: str, id_col: str, options_col: str, *, order_by_col: str | None = None,
+         is_default_col: str | None = None, custom_cols: dict[str, str] = {}, source: SourceEnum = SourceEnum.CONNECTION,
+         user_group_col: str | None = None, parent_id_col: str | None = None, connection: str | None = None,
+         **kwargs
+     ) -> None:
+         """
+         Constructor for SelectDataSource
+
+         Arguments:
+             table_or_query: Either the name of the table to use, or a query to run
+             id_col: The column name of the id
+             options_col: The column name of the options
+             order_by_col: The column name to order the options by. Orders by the id_col instead if this is None
+             is_default_col: The column name that indicates which options are the default
+             custom_cols: Dictionary of attribute to column name for custom fields for the SelectParameterOption
+             source: The source to fetch data from. Must be "connection", "seeds", or "vdl". Defaults to "connection"
+             user_group_col: The column name of the user group that the user is in for this option to be valid
+             parent_id_col: The column name of the parent option id that must be selected for this option to be valid
+             connection: Name of the connection to use defined in connections.py
+         """
+         super().__init__(
+             table_or_query, id_col, options_col, order_by_col=order_by_col, is_default_col=is_default_col, custom_cols=custom_cols,
+             source=source, user_group_col=user_group_col, parent_id_col=parent_id_col, connection=connection
+         )
+
+     def _convert(self, ds_param: pc.DataSourceParameterConfig, df: pl.DataFrame) -> pc.SelectionParameterConfig:
+         """
+         Method to convert the associated DataSourceParameterConfig into a SingleSelectParameterConfig or MultiSelectParameterConfig
+
+         Arguments:
+             ds_param: The parameter to convert
+             df: The dataframe containing the parameter options data
+
+         Returns:
+             The converted parameter
+         """
+         all_options = self._get_all_options(df)
+         if ds_param.parameter_type == pc.SingleSelectParameterConfig:
+             return pc.SingleSelectParameterConfig(
+                 ds_param.name, ds_param.label, all_options, description=ds_param.description,
+                 user_attribute=ds_param.user_attribute, parent_name=ds_param.parent_name, **ds_param.extra_args
+             )
+         elif ds_param.parameter_type == pc.MultiSelectParameterConfig:
+             return pc.MultiSelectParameterConfig(
+                 ds_param.name, ds_param.label, all_options, description=ds_param.description,
+                 user_attribute=ds_param.user_attribute, parent_name=ds_param.parent_name, **ds_param.extra_args
+             )
+         else:
+             raise ConfigurationError(f'Invalid widget type "{ds_param.parameter_type}" for SelectDataSource')
+
+
+ @dataclass
+ class DateDataSource(DataSource):
+     """
+     Lookup table for date parameter default options
+     """
+     _default_date_col: str
+     _date_format: str
+
+     def __init__(
+         self, table_or_query: str, default_date_col: str, *, min_date_col: str | None = None,
+         max_date_col: str | None = None, date_format: str = '%Y-%m-%d', id_col: str | None = None,
+         source: SourceEnum = SourceEnum.CONNECTION, user_group_col: str | None = None, parent_id_col: str | None = None,
+         connection: str | None = None, **kwargs
+     ) -> None:
+         """
+         Constructor for DateDataSource
+
+         Arguments:
+             table_or_query: Either the name of the table to use, or a query to run
+             default_date_col: The column name of the default date
+             date_format: The format of the default date(s). Defaults to '%Y-%m-%d'
+             id_col: The column name of the id
+             source: The source to fetch data from. Must be "connection", "seeds", or "vdl". Defaults to "connection"
+             user_group_col: The column name of the user group that the user is in for this option to be valid
+             parent_id_col: The column name of the parent option id that the default date belongs to
+             connection: Name of the connection to use defined in connections.py
+         """
+         super().__init__(
+             table_or_query, id_col=id_col, source=source, user_group_col=user_group_col, parent_id_col=parent_id_col,
+             connection=connection
+         )
+         self._default_date_col = default_date_col
+         self._min_date_col = min_date_col
+         self._max_date_col = max_date_col
+         self._date_format = date_format
+
+     def _convert(self, ds_param: pc.DataSourceParameterConfig, df: pl.DataFrame) -> pc.DateParameterConfig:
+         """
+         Method to convert the associated DataSourceParameterConfig into a DateParameterConfig
+
+         Arguments:
+             ds_param: The parameter to convert
+             df: The dataframe containing the parameter options data
+
+         Returns:
+             The converted parameter
+         """
+         self._validate_parameter_type(ds_param, pc.DateParameterConfig)
+
+         columns = [self._default_date_col, self._min_date_col, self._max_date_col]
+         df_agg = self._get_aggregated_df(df, columns)
+
+         records = df_agg.to_pandas().to_dict("records")
+         options = tuple(
+             po.DateParameterOption(
+                 str(record[self._default_date_col]), date_format=self._date_format,
+                 min_date = str(record[self._min_date_col]) if self._min_date_col else None,
+                 max_date = str(record[self._max_date_col]) if self._max_date_col else None,
+                 user_groups=self._get_key_from_record_as_list(self._user_group_col, record),
+                 parent_option_ids=self._get_key_from_record_as_list(self._parent_id_col, record)
+             )
+             for record in records
+         )
+         return pc.DateParameterConfig(
+             ds_param.name, ds_param.label, options, description=ds_param.description, user_attribute=ds_param.user_attribute,
+             parent_name=ds_param.parent_name, **ds_param.extra_args
+         )
+
+
+ @dataclass
+ class DateRangeDataSource(DataSource):
+     """
+     Lookup table for date range parameter default options
+     """
+     _default_start_date_col: str
+     _default_end_date_col: str
+     _date_format: str
+
+     def __init__(
+         self, table_or_query: str, default_start_date_col: str, default_end_date_col: str, *, date_format: str = '%Y-%m-%d',
+         min_date_col: str | None = None, max_date_col: str | None = None, id_col: str | None = None, source: SourceEnum = SourceEnum.CONNECTION,
+         user_group_col: str | None = None, parent_id_col: str | None = None, connection: str | None = None, **kwargs
+     ) -> None:
+         """
+         Constructor for DateRangeDataSource
+
+         Arguments:
+             table_or_query: Either the name of the table to use, or a query to run
+             default_start_date_col: The column name of the default start date
+             default_end_date_col: The column name of the default end date
+             date_format: The format of the default date(s). Defaults to '%Y-%m-%d'
+             id_col: The column name of the id
+             source: The source to fetch data from. Must be "connection", "seeds", or "vdl". Defaults to "connection"
+             user_group_col: The column name of the user group that the user is in for this option to be valid
+             parent_id_col: The column name of the parent option id that the default date belongs to
+             connection: Name of the connection to use defined in connections.py
+         """
+         super().__init__(
+             table_or_query, id_col=id_col, source=source, user_group_col=user_group_col, parent_id_col=parent_id_col,
+             connection=connection
+         )
+         self._default_start_date_col = default_start_date_col
+         self._default_end_date_col = default_end_date_col
+         self._min_date_col = min_date_col
+         self._max_date_col = max_date_col
+         self._date_format = date_format
+
+     def _convert(self, ds_param: pc.DataSourceParameterConfig, df: pl.DataFrame) -> pc.DateRangeParameterConfig:
+         """
+         Method to convert the associated DataSourceParameterConfig into a DateRangeParameterConfig
+
+         Arguments:
+             ds_param: The parameter to convert
+             df: The dataframe containing the parameter options data
+
+         Returns:
+             The converted parameter
+         """
+         self._validate_parameter_type(ds_param, pc.DateRangeParameterConfig)
+
+         columns = [self._default_start_date_col, self._default_end_date_col, self._min_date_col, self._max_date_col]
+         df_agg = self._get_aggregated_df(df, columns)
+
+         records = df_agg.to_pandas().to_dict("records")
+         options = tuple(
+             po.DateRangeParameterOption(
+                 str(record[self._default_start_date_col]), str(record[self._default_end_date_col]),
+                 min_date=str(record[self._min_date_col]) if self._min_date_col else None,
+                 max_date=str(record[self._max_date_col]) if self._max_date_col else None,
+                 date_format=self._date_format,
+                 user_groups=self._get_key_from_record_as_list(self._user_group_col, record),
+                 parent_option_ids=self._get_key_from_record_as_list(self._parent_id_col, record)
+             )
+             for record in records
+         )
+         return pc.DateRangeParameterConfig(
+             ds_param.name, ds_param.label, options, description=ds_param.description, user_attribute=ds_param.user_attribute,
+             parent_name=ds_param.parent_name, **ds_param.extra_args
+         )
+
+
+ @dataclass
+ class _NumericDataSource(DataSource):
+     """
+     Abstract class for number or number range data sources
+     """
+     _min_value_col: str
+     _max_value_col: str
+     _increment_col: str | None
+
+     @abc.abstractmethod
+     def __init__(
+         self, table_or_query: str, min_value_col: str, max_value_col: str, *, increment_col: str | None = None,
+         id_col: str | None = None, source: SourceEnum = SourceEnum.CONNECTION, user_group_col: str | None = None,
+         parent_id_col: str | None = None, connection: str | None = None, **kwargs
+     ) -> None:
+         super().__init__(
+             table_or_query, id_col=id_col, source=source, user_group_col=user_group_col, parent_id_col=parent_id_col,
+             connection=connection
+         )
+         self._min_value_col = min_value_col
+         self._max_value_col = max_value_col
+         self._increment_col = increment_col
+
+
+ @dataclass
+ class NumberDataSource(_NumericDataSource):
+     """
+     Lookup table for number parameter default options
+     """
+     _default_value_col: str | None
+
+     def __init__(
+         self, table_or_query: str, min_value_col: str, max_value_col: str, *, increment_col: str | None = None,
+         default_value_col: str | None = None, id_col: str | None = None, source: SourceEnum = SourceEnum.CONNECTION,
+         user_group_col: str | None = None, parent_id_col: str | None = None, connection: str | None = None, **kwargs
+     ) -> None:
+         """
+         Constructor for NumberDataSource
+
+         Arguments:
+             table_or_query: Either the name of the table to use, or a query to run
+             min_value_col: The column name of the minimum value
+             max_value_col: The column name of the maximum value
+             increment_col: The column name of the increment value. Defaults to column of 1's if None
+             default_value_col: The column name of the default value. Defaults to min_value_col if None
+             id_col: The column name of the id
+             source: The source to fetch data from. Must be "connection", "seeds", or "vdl". Defaults to "connection"
+             user_group_col: The column name of the user group that the user is in for this option to be valid
+             parent_id_col: The column name of the parent option id that the default value belongs to
+             connection: Name of the connection to use defined in connections.py
+         """
+         super().__init__(
+             table_or_query, min_value_col, max_value_col, increment_col=increment_col, id_col=id_col, source=source,
+             user_group_col=user_group_col, parent_id_col=parent_id_col, connection=connection
+         )
+         self._default_value_col = default_value_col
+
+     def _convert(self, ds_param: pc.DataSourceParameterConfig, df: pl.DataFrame) -> pc.NumberParameterConfig:
+         """
+         Method to convert the associated DataSourceParameterConfig into a NumberParameterConfig
+
+         Arguments:
+             ds_param: The parameter to convert
+             df: The dataframe containing the parameter options data
+
+         Returns:
+             The converted parameter
+         """
+         self._validate_parameter_type(ds_param, pc.NumberParameterConfig)
+
+         columns = [self._min_value_col, self._max_value_col, self._increment_col, self._default_value_col]
+         df_agg = self._get_aggregated_df(df, columns)
+
+         records = df_agg.to_pandas().to_dict("records")
+         options = tuple(
+             po.NumberParameterOption(
+                 record[self._min_value_col], record[self._max_value_col],
+                 increment=self._get_key_from_record(self._increment_col, record, 1),
+                 default_value=self._get_key_from_record(self._default_value_col, record, None),
+                 user_groups=self._get_key_from_record_as_list(self._user_group_col, record),
+                 parent_option_ids=self._get_key_from_record_as_list(self._parent_id_col, record)
+             )
+             for record in records
+         )
+         return pc.NumberParameterConfig(
+             ds_param.name, ds_param.label, options, description=ds_param.description, user_attribute=ds_param.user_attribute,
+             parent_name=ds_param.parent_name, **ds_param.extra_args
+         )
+
+
+ @dataclass
+ class NumberRangeDataSource(_NumericDataSource):
+     """
+     Lookup table for number range parameter default options
+     """
+     _default_lower_value_col: str | None
+     _default_upper_value_col: str | None
+
+     def __init__(
+         self, table_or_query: str, min_value_col: str, max_value_col: str, *, increment_col: str | None = None,
+         default_lower_value_col: str | None = None, default_upper_value_col: str | None = None, id_col: str | None = None,
+         source: SourceEnum = SourceEnum.CONNECTION, user_group_col: str | None = None, parent_id_col: str | None = None,
+         connection: str | None = None, **kwargs
+     ) -> None:
+         """
+         Constructor for NumberRangeDataSource
+
+         Arguments:
+             table_or_query: Either the name of the table to use, or a query to run
+             min_value_col: The column name of the minimum value
+             max_value_col: The column name of the maximum value
+             increment_col: The column name of the increment value. Defaults to column of 1's if None
+             default_lower_value_col: The column name of the default lower value. Defaults to min_value_col if None
+             default_upper_value_col: The column name of the default upper value. Defaults to max_value_col if None
+             id_col: The column name of the id
+             source: The source to fetch data from. Must be "connection", "seeds", or "vdl". Defaults to "connection"
+             user_group_col: The column name of the user group that the user is in for this option to be valid
+             parent_id_col: The column name of the parent option id that the default value belongs to
+             connection: Name of the connection to use defined in connections.py
+         """
+         super().__init__(
+             table_or_query, min_value_col, max_value_col, increment_col=increment_col, id_col=id_col, source=source,
+             user_group_col=user_group_col, parent_id_col=parent_id_col, connection=connection
+         )
+         self._default_lower_value_col = default_lower_value_col
+         self._default_upper_value_col = default_upper_value_col
+
+     def _convert(self, ds_param: pc.DataSourceParameterConfig, df: pl.DataFrame) -> pc.NumberRangeParameterConfig:
+         """
+         Method to convert the associated DataSourceParameterConfig into a NumberRangeParameterConfig
+
+         Arguments:
+             ds_param: The parameter to convert
+             df: The dataframe containing the parameter options data
+
+         Returns:
+             The converted parameter
+         """
+         self._validate_parameter_type(ds_param, pc.NumberRangeParameterConfig)
+
+         columns = [self._min_value_col, self._max_value_col, self._increment_col, self._default_lower_value_col, self._default_upper_value_col]
+         df_agg = self._get_aggregated_df(df, columns)
+
+         records = df_agg.to_pandas().to_dict("records")
+         options = tuple(
+             po.NumberRangeParameterOption(
+                 record[self._min_value_col], record[self._max_value_col],
+                 increment=self._get_key_from_record(self._increment_col, record, 1),
+                 default_lower_value=self._get_key_from_record(self._default_lower_value_col, record, None),
+                 default_upper_value=self._get_key_from_record(self._default_upper_value_col, record, None),
+                 user_groups=self._get_key_from_record_as_list(self._user_group_col, record),
+                 parent_option_ids=self._get_key_from_record_as_list(self._parent_id_col, record)
+             )
+             for record in records
+         )
+         return pc.NumberRangeParameterConfig(
+             ds_param.name, ds_param.label, options, description=ds_param.description, user_attribute=ds_param.user_attribute,
+             parent_name=ds_param.parent_name, **ds_param.extra_args
+         )
+
+
+ @dataclass
+ class TextDataSource(DataSource):
+     """
+     Lookup table for text parameter default options
+     """
+     _default_text_col: str
+
+     def __init__(
+         self, table_or_query: str, default_text_col: str, *, id_col: str | None = None, source: SourceEnum = SourceEnum.CONNECTION,
+         user_group_col: str | None = None, parent_id_col: str | None = None, connection: str | None = None,
+         **kwargs
+     ) -> None:
+         """
+         Constructor for TextDataSource
+
+         Arguments:
+             table_or_query: Either the name of the table to use, or a query to run
+             default_text_col: The column name of the default text
+             id_col: The column name of the id
+             source: The source to fetch data from. Must be "connection", "seeds", or "vdl". Defaults to "connection"
+             user_group_col: The column name of the user group that the user is in for this option to be valid
+             parent_id_col: The column name of the parent option id that the default text belongs to
+             connection: Name of the connection to use defined in connections.py
+         """
+         super().__init__(
+             table_or_query, id_col=id_col, source=source, user_group_col=user_group_col, parent_id_col=parent_id_col,
+             connection=connection
+         )
+         self._default_text_col = default_text_col
+
+     def _convert(self, ds_param: pc.DataSourceParameterConfig, df: pl.DataFrame) -> pc.TextParameterConfig:
+         """
+         Method to convert the associated DataSourceParameterConfig into a TextParameterConfig
+
+         Arguments:
+             ds_param: The parameter to convert
+             df: The dataframe containing the parameter options data
+
+         Returns:
+             The converted parameter
+         """
+         self._validate_parameter_type(ds_param, pc.TextParameterConfig)
+
+         columns = [self._default_text_col]
+         df_agg = self._get_aggregated_df(df, columns)
+
+         records = df_agg.to_pandas().to_dict("records")
+         options = tuple(
+             po.TextParameterOption(
+                 default_text=str(record[self._default_text_col]),
+                 user_groups=self._get_key_from_record_as_list(self._user_group_col, record),
+                 parent_option_ids=self._get_key_from_record_as_list(self._parent_id_col, record)
+             )
+             for record in records
+         )
+         return pc.TextParameterConfig(
+             ds_param.name, ds_param.label, options, description=ds_param.description, user_attribute=ds_param.user_attribute,
+             parent_name=ds_param.parent_name, **ds_param.extra_args
+         )
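
As a quick orientation, here is a minimal usage sketch based on the SelectDataSource signature and the _get_query helper shown in the hunk above. The table and column names are hypothetical and the private import path is used only for illustration; this snippet is not code shipped in the release.

# Hypothetical example based on the constructor shown above; names are made up.
from squirrels._data_sources import SelectDataSource, SourceEnum

ds = SelectDataSource(
    "categories",                 # bare table name; a "SELECT ..." string would be used as-is
    id_col="category_id",
    options_col="category_name",
    source=SourceEnum.SEEDS,      # default is SourceEnum.CONNECTION; SourceEnum.VDL is also defined
)

# _get_query() wraps a bare table name in a SELECT statement
assert ds._get_query() == "SELECT * FROM categories"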
squirrels/_dataset_types.py (new file)
@@ -0,0 +1,84 @@
+ from typing import Callable, Literal
+ from dataclasses import dataclass, field
+ from functools import cached_property, lru_cache
+ import polars as pl
+
+ from ._model_configs import ModelConfig
+
+
+ @dataclass
+ class DatasetMetadata:
+     target_model_config: ModelConfig
+
+     @cached_property
+     def _json_repr(self) -> dict:
+         fields = []
+         for col in self.target_model_config.columns:
+             fields.append({
+                 "name": col.name,
+                 "type": col.type,
+                 "condition": col.condition,
+                 "description": col.description,
+                 "category": col.category.value
+             })
+
+         return {
+             "schema": {
+                 "fields": fields
+             },
+         }
+
+     def to_json(self) -> dict:
+         return self._json_repr
+
+
+ @dataclass
+ class DatasetResult(DatasetMetadata):
+     df: pl.DataFrame
+     to_json: Callable[[str, int, int], dict] = field(init=False)
+
+     def __post_init__(self):
+         self.to_json = lru_cache()(self._to_json)
+
+     def _to_json(self, orientation: Literal["records", "rows", "columns"], limit: int, offset: int) -> dict:
+         df = self.df.lazy()
+         if offset > 0:
+             df = df.filter(pl.col("_row_num") > offset)
+         if limit > 0:
+             df = df.limit(limit)
+         df = df.collect()
+
+         if orientation == "columns":
+             data = df.to_dict(as_series=False)
+         else:
+             data = df.to_dicts()
+             if orientation == "rows":
+                 data = [[row[col] for col in df.columns] for row in data]
+
+         column_details_by_name = {col.name: col for col in self.target_model_config.columns}
+         fields = []
+         for col in df.columns:
+             if col == "_row_num":
+                 fields.append({"name": "_row_num", "type": "integer", "description": "The row number of the dataset (starts at 1)", "category": "misc"})
+             elif col in column_details_by_name:
+                 column_details = column_details_by_name[col]
+                 fields.append({
+                     "name": col,
+                     "type": column_details.type,
+                     "description": column_details.description,
+                     "category": column_details.category.value
+                 })
+             else:
+                 fields.append({"name": col, "type": "unknown", "description": "", "category": "misc"})
+
+         return {
+             "schema": {
+                 "fields": fields
+             },
+             "total_num_rows": self.df.select(pl.len()).item(),
+             "data_details": {
+                 "num_rows": df.select(pl.len()).item(),
+                 "orientation": orientation
+             },
+             "data": data
+         }
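
To make the orientation handling in DatasetResult._to_json concrete, here is a small standalone sketch that mirrors the same polars reshaping steps shown above. The sample frame and its values are invented for illustration and are not part of the package.

import polars as pl

# Toy frame with the "_row_num" column that the offset filter above relies on.
df = pl.DataFrame({"_row_num": [1, 2, 3], "amount": [10.0, 20.5, 7.25]})

def reshape(df: pl.DataFrame, orientation: str, limit: int, offset: int):
    # Same steps as _to_json: offset via _row_num, then limit, then reshape.
    lf = df.lazy()
    if offset > 0:
        lf = lf.filter(pl.col("_row_num") > offset)
    if limit > 0:
        lf = lf.limit(limit)
    out = lf.collect()
    if orientation == "columns":
        return out.to_dict(as_series=False)      # {"col": [v1, v2, ...]}
    data = out.to_dicts()                        # "records": [{"col": v, ...}, ...]
    if orientation == "rows":
        data = [[row[col] for col in out.columns] for row in data]
    return data

print(reshape(df, "records", limit=2, offset=1))
# [{'_row_num': 2, 'amount': 20.5}, {'_row_num': 3, 'amount': 7.25}]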
squirrels/_exceptions.py (new file)
@@ -0,0 +1,29 @@
+ class InvalidInputError(Exception):
+     """
+     Use this exception when the error is due to providing invalid inputs to the REST API
+
+     Attributes:
+         status_code: The HTTP status code to return
+         error: A short error message that should never change in the future
+         error_description: A detailed error message (that is allowed to change in the future)
+     """
+     def __init__(self, status_code: int, error: str, error_description: str, *args) -> None:
+         self.status_code = status_code
+         self.error = error
+         self.error_description = error_description
+         super().__init__(error_description, *args)
+
+
+ class ConfigurationError(Exception):
+     """
+     Use this exception when the server error is due to errors in the squirrels project instead of the squirrels framework/library
+     """
+     pass
+
+
+ class FileExecutionError(Exception):
+     def __init__(self, message: str, error: Exception, *args) -> None:
+         t = " "
+         new_message = f"\n" + message + f"\n{t}Produced error message:\n{t}{t}{error} (see above for more details on handled exception)"
+         super().__init__(new_message, *args)
+         self.error = error
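
For context on how the InvalidInputError attributes are meant to be consumed, here is an illustrative sketch of raising the exception and turning it into an error payload. The validation rule, function name, and payload field names are assumptions for illustration, not code from this release.

from squirrels._exceptions import InvalidInputError

def lookup_dataset(dataset_name: str) -> dict:
    # Hypothetical validation; the real API routes define their own rules.
    if not dataset_name.isidentifier():
        raise InvalidInputError(400, "invalid_dataset_name",
                                f"'{dataset_name}' is not a valid dataset name")
    return {"dataset": dataset_name}

try:
    lookup_dataset("bad name!")
except InvalidInputError as e:
    status = e.status_code                                             # 400
    payload = {"error": e.error, "error_description": e.error_description}
    # "error" is the stable machine-readable code; the description may change over time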