PyPI - pyoframe - Versions diffs - 0.2.0__py3-none-any.whl → 1.0.0__py3-none-any.whl - Mend

pyoframe 0.2.0__py3-none-any.whl → 1.0.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (21) hide show

pyoframe/__init__.py +21 -14
pyoframe/_arithmetic.py +346 -238
pyoframe/_constants.py +463 -0
pyoframe/_core.py +2652 -0
pyoframe/_model.py +598 -0
pyoframe/_model_element.py +189 -0
pyoframe/_monkey_patch.py +82 -0
pyoframe/{objective.py → _objective.py} +50 -17
pyoframe/{util.py → _utils.py} +108 -129
pyoframe/_version.py +16 -3
{pyoframe-0.2.0.dist-info → pyoframe-1.0.0.dist-info}/METADATA +37 -31
pyoframe-1.0.0.dist-info/RECORD +15 -0
pyoframe/constants.py +0 -140
pyoframe/core.py +0 -1794
pyoframe/model.py +0 -408
pyoframe/model_element.py +0 -184
pyoframe/monkey_patch.py +0 -54
pyoframe-0.2.0.dist-info/RECORD +0 -15
{pyoframe-0.2.0.dist-info → pyoframe-1.0.0.dist-info}/WHEEL +0 -0
{pyoframe-0.2.0.dist-info → pyoframe-1.0.0.dist-info}/licenses/LICENSE +0 -0
{pyoframe-0.2.0.dist-info → pyoframe-1.0.0.dist-info}/top_level.txt +0 -0

pyoframe/_arithmetic.py CHANGED Viewed

@@ -1,99 +1,87 @@
-"""
-Defines helper functions for doing arithmetic operations on expressions (e.g. addition).
-"""
+"""Defines helper functions for doing arithmetic operations on expressions (e.g. addition)."""
+from __future__ import annotations
-from typing import TYPE_CHECKING, List, Optional
+from typing import TYPE_CHECKING
 import polars as pl
-from pyoframe.constants import (
+from pyoframe._constants import (
     COEF_KEY,
     CONST_TERM,
-    KEY_TYPE,
     QUAD_VAR_KEY,
     RESERVED_COL_KEYS,
     VAR_KEY,
     Config,
+    ExtrasStrategy,
     PyoframeError,
-    UnmatchedStrategy,
 )
 if TYPE_CHECKING:  # pragma: no cover
-    from pyoframe.core import Expression
+    from pyoframe._core import Expression
+# Mapping of how a sum of two expressions should propagate the extras strategy
+_extras_propagation_rules = {
+    (ExtrasStrategy.DROP, ExtrasStrategy.DROP): ExtrasStrategy.DROP,
+    (ExtrasStrategy.UNSET, ExtrasStrategy.UNSET): ExtrasStrategy.UNSET,
+    (ExtrasStrategy.KEEP, ExtrasStrategy.KEEP): ExtrasStrategy.KEEP,
+    (ExtrasStrategy.DROP, ExtrasStrategy.KEEP): ExtrasStrategy.UNSET,
+    (ExtrasStrategy.DROP, ExtrasStrategy.UNSET): ExtrasStrategy.DROP,
+    (ExtrasStrategy.KEEP, ExtrasStrategy.UNSET): ExtrasStrategy.KEEP,
+}
-def _multiply_expressions(self: "Expression", other: "Expression") -> "Expression":
-    """
-    Multiply two or more expressions together.
+def multiply(self: Expression, other: Expression) -> Expression:
+    """Multiplies two expressions together.
     Examples:
         >>> import pyoframe as pf
-        >>> m = pf.Model("min")
+        >>> m = pf.Model()
         >>> m.x1 = pf.Variable()
         >>> m.x2 = pf.Variable()
         >>> m.x3 = pf.Variable()
         >>> result = 5 * m.x1 * m.x2
         >>> result
-        <Expression size=1 dimensions={} terms=1 degree=2>
-        5 x2 * x1
+        <Expression terms=1 type=quadratic>
+        5 x2 * x1
         >>> result * m.x3
         Traceback (most recent call last):
         ...
-        pyoframe.constants.PyoframeError: Failed to multiply expressions:
-        <Expression size=1 dimensions={} terms=1 degree=2> * <Expression size=1 dimensions={} terms=1>
-        Due to error:
-        Cannot multiply a quadratic expression by a non-constant.
+        pyoframe._constants.PyoframeError: Cannot multiply the two expressions below because the result would be a cubic. Only quadratic or linear expressions are allowed.
+        Expression 1 (quadratic):   ((5 * x1) * x2)
+        Expression 2 (linear):      x3
     """
-    try:
-        return _multiply_expressions_core(self, other)
-    except PyoframeError as error:
-        raise PyoframeError(
-            "Failed to multiply expressions:\n"
-            + " * ".join(
-                e.to_str(include_header=True, include_data=False) for e in [self, other]
-            )
-            + "\nDue to error:\n"
-            + str(error)
-        ) from error
-def _add_expressions(*expressions: "Expression") -> "Expression":
-    try:
-        return _add_expressions_core(*expressions)
-    except PyoframeError as error:
+    self_degree, other_degree = self.degree(), other.degree()
+    product_degree = self_degree + other_degree
+    if product_degree > 2:
+        assert product_degree <= 4, (
+            "Unexpected because expressions should not exceed degree 2."
+        )
+        res_type = "cubic" if product_degree == 3 else "quartic"
         raise PyoframeError(
-            "Failed to add expressions:\n"
-            + " + ".join(
-                e.to_str(include_header=True, include_data=False) for e in expressions
-            )
-            + "\nDue to error:\n"
-            + str(error)
-        ) from error
+            f"""Cannot multiply the two expressions below because the result would be a {res_type}. Only quadratic or linear expressions are allowed.
+Expression 1 ({self.degree(return_str=True)}):\t{self.name}
+Expression 2 ({other.degree(return_str=True)}):\t{other.name}"""
+        )
+    if self_degree == 1 and other_degree == 1:
+        return _quadratic_multiplication(self, other)
-def _multiply_expressions_core(self: "Expression", other: "Expression") -> "Expression":
-    self_degree, other_degree = self.degree(), other.degree()
-    if self_degree + other_degree > 2:
-        # We know one of the two must be a quadratic since 1 + 1 is not greater than 2.
-        raise PyoframeError("Cannot multiply a quadratic expression by a non-constant.")
+    # save names to use in debug messages before any swapping occurs
+    self_name, other_name = self.name, other.name
     if self_degree < other_degree:
         self, other = other, self
         self_degree, other_degree = other_degree, self_degree
-    if other_degree == 1:
-        assert self_degree == 1, (
-            "This should always be true since the sum of degrees must be <=2."
-        )
-        return _quadratic_multiplication(self, other)
     assert other_degree == 0, (
         "This should always be true since other cases have already been handled."
     )
-    multiplier = other.data.drop(
-        VAR_KEY
-    )  # QUAD_VAR_KEY doesn't need to be dropped since we know it doesn't exist
-    dims = self.dimensions_unsafe
-    other_dims = other.dimensions_unsafe
+    # QUAD_VAR_KEY doesn't need to be dropped since we know it doesn't exist
+    multiplier = other.data.drop(VAR_KEY)
+    dims = self._dimensions_unsafe
+    other_dims = other._dimensions_unsafe
     dims_in_common = [dim for dim in dims if dim in other_dims]
     data = (
@@ -101,17 +89,19 @@ def _multiply_expressions_core(self: "Expression", other: "Expression") -> "Expr
             multiplier,
             on=dims_in_common if len(dims_in_common) > 0 else None,
             how="inner" if dims_in_common else "cross",
+            maintain_order=(
+                "left" if Config.maintain_order and dims_in_common else None
+            ),
         )
         .with_columns(pl.col(COEF_KEY) * pl.col(COEF_KEY + "_right"))
         .drop(COEF_KEY + "_right")
     )
-    return self._new(data)
+    return self._new(data, name=f"({self_name} * {other_name})")
-def _quadratic_multiplication(self: "Expression", other: "Expression") -> "Expression":
-    """
-    Multiply two expressions of degree 1.
+def _quadratic_multiplication(self: Expression, other: Expression) -> Expression:
+    """Multiplies two expressions of degree 1.
     Examples:
         >>> import polars as pl
@@ -122,18 +112,29 @@ def _quadratic_multiplication(self: "Expression", other: "Expression") -> "Expre
         >>> expr1 = df * m.x1
         >>> expr2 = df * m.x2 * 2 + 4
         >>> expr1 * expr2
-        <Expression size=3 dimensions={'dim': 3} terms=6 degree=2>
-        [1]: 4 x1 +2 x2 * x1
-        [2]: 8 x1 +8 x2 * x1
-        [3]: 12 x1 +18 x2 * x1
+        <Expression height=3 terms=6 type=quadratic>
+        ┌─────┬───────────────────┐
+        │ dim ┆ expression        │
+        │ (3) ┆                   │
+        ╞═════╪═══════════════════╡
+        │ 1   ┆ 4 x1 +2 x2 * x1   │
+        │ 2   ┆ 8 x1 +8 x2 * x1   │
+        │ 3   ┆ 12 x1 +18 x2 * x1 │
+        └─────┴───────────────────┘
         >>> (expr1 * expr2) - df * m.x1 * df * m.x2 * 2
-        <Expression size=3 dimensions={'dim': 3} terms=3>
-        [1]: 4 x1
-        [2]: 8 x1
-        [3]: 12 x1
+        <Expression height=3 terms=3 type=linear>
+        ┌─────┬────────────┐
+        │ dim ┆ expression │
+        │ (3) ┆            │
+        ╞═════╪════════════╡
+        │ 1   ┆ 4 x1       │
+        │ 2   ┆ 8 x1       │
+        │ 3   ┆ 12 x1      │
+        └─────┴────────────┘
     """
-    dims = self.dimensions_unsafe
-    other_dims = other.dimensions_unsafe
+    dims = self._dimensions_unsafe
+    other_dims = other._dimensions_unsafe
     dims_in_common = [dim for dim in dims if dim in other_dims]
     data = (
@@ -141,11 +142,14 @@ def _quadratic_multiplication(self: "Expression", other: "Expression") -> "Expre
             other.data,
             on=dims_in_common if len(dims_in_common) > 0 else None,
             how="inner" if dims_in_common else "cross",
+            maintain_order=(
+                "left" if Config.maintain_order and dims_in_common else None
+            ),
         )
         .with_columns(pl.col(COEF_KEY) * pl.col(COEF_KEY + "_right"))
         .drop(COEF_KEY + "_right")
         .rename({VAR_KEY + "_right": QUAD_VAR_KEY})
-        # Swap VAR_KEY and QUAD_VAR_KEY so that VAR_KEy is always the larger one
+        # Swap VAR_KEY and QUAD_VAR_KEY so that VAR_KEY is always the larger one
         .with_columns(
             pl.when(pl.col(VAR_KEY) < pl.col(QUAD_VAR_KEY))
             .then(pl.col(QUAD_VAR_KEY))
@@ -160,147 +164,87 @@ def _quadratic_multiplication(self: "Expression", other: "Expression") -> "Expre
     data = _sum_like_terms(data)
-    return self._new(data)
+    return self._new(data, name=f"({self.name} * {other.name})")
-def _add_expressions_core(*expressions: "Expression") -> "Expression":
-    # Mapping of how a sum of two expressions should propogate the unmatched strategy
-    propogatation_strategies = {
-        (UnmatchedStrategy.DROP, UnmatchedStrategy.DROP): UnmatchedStrategy.DROP,
-        (
-            UnmatchedStrategy.UNSET,
-            UnmatchedStrategy.UNSET,
-        ): UnmatchedStrategy.UNSET,
-        (UnmatchedStrategy.KEEP, UnmatchedStrategy.KEEP): UnmatchedStrategy.KEEP,
-        (UnmatchedStrategy.DROP, UnmatchedStrategy.KEEP): UnmatchedStrategy.UNSET,
-        (UnmatchedStrategy.DROP, UnmatchedStrategy.UNSET): UnmatchedStrategy.DROP,
-        (UnmatchedStrategy.KEEP, UnmatchedStrategy.UNSET): UnmatchedStrategy.KEEP,
-    }
+def add(*expressions: Expression) -> Expression:
+    """Add multiple expressions together."""
     assert len(expressions) > 1, "Need at least two expressions to add together."
-    dims = expressions[0].dimensions
-    if dims is None:
-        requires_join = False
-        dims = []
-    elif Config.disable_unmatched_checks:
-        requires_join = any(
-            expr.unmatched_strategy
-            not in (UnmatchedStrategy.KEEP, UnmatchedStrategy.UNSET)
-            for expr in expressions
-        )
+    if Config.disable_extras_checks:
+        no_checks_strats = (ExtrasStrategy.KEEP, ExtrasStrategy.UNSET)
     else:
-        requires_join = any(
-            expr.unmatched_strategy != UnmatchedStrategy.KEEP for expr in expressions
-        )
+        no_checks_strats = (ExtrasStrategy.KEEP,)
-    has_dim_conflict = any(
-        sorted(dims) != sorted(expr.dimensions_unsafe) for expr in expressions[1:]
+    no_extras_checks_required = (
+        all(expr._extras_strategy in no_checks_strats for expr in expressions)
+        # if only one dimensioned, then there is no such thing as extra labels,
+        # labels will be set by the only dimensioned expression
+        or sum(not expr.dimensionless for expr in expressions) <= 1
     )
-    # If we cannot use .concat compute the sum in a pairwise manner
-    if len(expressions) > 2 and (has_dim_conflict or requires_join):
-        result = expressions[0]
-        for expr in expressions[1:]:
-            result = _add_expressions_core(result, expr)
-        return result
-    if has_dim_conflict:
-        assert len(expressions) == 2
-        expressions = (
-            _add_dimension(expressions[0], expressions[1]),
-            _add_dimension(expressions[1], expressions[0]),
-        )
-        assert sorted(expressions[0].dimensions_unsafe) == sorted(
-            expressions[1].dimensions_unsafe
-        )
-    dims = expressions[0].dimensions_unsafe
-    # Check no dims conflict
-    assert all(
-        sorted(dims) == sorted(expr.dimensions_unsafe) for expr in expressions[1:]
+    has_dim_conflict = any(
+        sorted(expressions[0]._dimensions_unsafe) != sorted(expr._dimensions_unsafe)
+        for expr in expressions[1:]
     )
-    if requires_join:
-        assert len(expressions) == 2
-        assert dims != []
-        left, right = expressions[0], expressions[1]
-        # Order so that drop always comes before keep, and keep always comes before default
-        if (left.unmatched_strategy, right.unmatched_strategy) in (
-            (UnmatchedStrategy.UNSET, UnmatchedStrategy.DROP),
-            (UnmatchedStrategy.UNSET, UnmatchedStrategy.KEEP),
-            (UnmatchedStrategy.KEEP, UnmatchedStrategy.DROP),
-        ):
-            left, right = right, left
+    # If we cannot use .concat compute the sum in a pairwise manner, so far nobody uses this code
+    if len(expressions) > 2:  # pragma: no cover
+        assert False, "This code has not been tested."
+        if has_dim_conflict or not no_extras_checks_required:
+            result = expressions[0]
+            for expr in expressions[1:]:
+                result = add(result, expr)
+            return result
+        propagate_strat = expressions[0]._extras_strategy
+        dims = expressions[0]._dimensions_unsafe
+        expr_data = [expr.data for expr in expressions]
+    else:
+        left, right = expressions[0], expressions[1]
-        def get_indices(expr):
-            return expr.data.select(dims).unique(maintain_order=True)
+        if has_dim_conflict:
+            left_dims, right_dims = left._dimensions_unsafe, right._dimensions_unsafe
+            missing_left = [dim for dim in right_dims if dim not in left_dims]
+            missing_right = [dim for dim in left_dims if dim not in right_dims]
+            common_dims = [dim for dim in left_dims if dim in right_dims]
+            if not (
+                set(missing_left) <= set(left._allowed_new_dims)
+                and set(missing_right) <= set(right._allowed_new_dims)
+            ):
+                _raise_addition_error(
+                    left,
+                    right,
+                    f"their\n\tdimensions are different ({left_dims} != {right_dims})",
+                    "If this is intentional, use .over(…) to broadcast. Learn more at\n\thttps://bravos-power.github.io/pyoframe/latest/learn/concepts/addition/#adding-expressions-with-differing-dimensions-using-over",
+                )
-        left_data, right_data = left.data, right.data
+            left_old = left
+            if missing_left:
+                left = _broadcast(left, right, common_dims, missing_left)
+            if missing_right:
+                right = _broadcast(
+                    right, left_old, common_dims, missing_right, swapped=True
+                )
-        strat = (left.unmatched_strategy, right.unmatched_strategy)
+            assert sorted(left._dimensions_unsafe) == sorted(right._dimensions_unsafe)
-        propogate_strat = propogatation_strategies[strat]  # type: ignore
+        dims = left._dimensions_unsafe
-        if strat == (UnmatchedStrategy.DROP, UnmatchedStrategy.DROP):
-            left_data = left.data.join(get_indices(right), how="inner", on=dims)
-            right_data = right.data.join(get_indices(left), how="inner", on=dims)
-        elif strat == (UnmatchedStrategy.UNSET, UnmatchedStrategy.UNSET):
-            assert not Config.disable_unmatched_checks, (
-                "This code should not be reached when unmatched checks are disabled."
-            )
-            outer_join = get_indices(left).join(
-                get_indices(right),
-                how="full",
-                on=dims,
-            )
-            if outer_join.get_column(dims[0]).null_count() > 0:
-                raise PyoframeError(
-                    "Dataframe has unmatched values. If this is intentional, use .drop_unmatched() or .keep_unmatched()\n"
-                    + str(outer_join.filter(outer_join.get_column(dims[0]).is_null()))
-                )
-            if outer_join.get_column(dims[0] + "_right").null_count() > 0:
-                raise PyoframeError(
-                    "Dataframe has unmatched values. If this is intentional, use .drop_unmatched() or .keep_unmatched()\n"
-                    + str(
-                        outer_join.filter(
-                            outer_join.get_column(dims[0] + "_right").is_null()
-                        )
-                    )
-                )
-        elif strat == (UnmatchedStrategy.DROP, UnmatchedStrategy.KEEP):
-            left_data = get_indices(right).join(left.data, how="left", on=dims)
-        elif strat == (UnmatchedStrategy.DROP, UnmatchedStrategy.UNSET):
-            left_data = get_indices(right).join(left.data, how="left", on=dims)
-            if left_data.get_column(COEF_KEY).null_count() > 0:
-                raise PyoframeError(
-                    "Dataframe has unmatched values. If this is intentional, use .drop_unmatched() or .keep_unmatched()\n"
-                    + str(left_data.filter(left_data.get_column(COEF_KEY).is_null()))
-                )
-        elif strat == (UnmatchedStrategy.KEEP, UnmatchedStrategy.UNSET):
-            assert not Config.disable_unmatched_checks, (
-                "This code should not be reached when unmatched checks are disabled."
-            )
-            unmatched = right.data.join(get_indices(left), how="anti", on=dims)
-            if len(unmatched) > 0:
-                raise PyoframeError(
-                    "Dataframe has unmatched values. If this is intentional, use .drop_unmatched() or .keep_unmatched()\n"
-                    + str(unmatched)
-                )
-        else:  # pragma: no cover
-            assert False, "This code should've never been reached!"
-        expr_data = [left_data, right_data]
-    else:
-        propogate_strat = expressions[0].unmatched_strategy
-        expr_data = [expr.data for expr in expressions]
+        if not no_extras_checks_required:
+            expr_data, propagate_strat = _handle_extra_labels(left, right, dims)
+        else:
+            propagate_strat = left._extras_strategy
+            expr_data = (left.data, right.data)
     # Add quadratic column if it is needed and doesn't already exist
     if any(QUAD_VAR_KEY in df.columns for df in expr_data):
         expr_data = [
             (
-                df.with_columns(pl.lit(CONST_TERM).alias(QUAD_VAR_KEY).cast(KEY_TYPE))
+                df.with_columns(
+                    pl.lit(CONST_TERM).alias(QUAD_VAR_KEY).cast(Config.id_dtype)
+                )
                 if QUAD_VAR_KEY not in df.columns
                 else df
             )
@@ -315,71 +259,215 @@ def _add_expressions_core(*expressions: "Expression") -> "Expression":
     data = pl.concat(expr_data, how="vertical_relaxed")
     data = _sum_like_terms(data)
-    new_expr = expressions[0]._new(data)
-    new_expr.unmatched_strategy = propogate_strat
+    full_name = expressions[0].name
+    for expr in expressions[1:]:
+        name = expr.name
+        full_name += f" - {name[1:]}" if name[0] == "-" else f" + {name}"
+    new_expr = expressions[0]._new(data, name=f"({full_name})")
+    new_expr._extras_strategy = propagate_strat
     return new_expr
-def _add_dimension(self: "Expression", target: "Expression") -> "Expression":
-    target_dims = target.dimensions
-    if target_dims is None:
-        return self
-    dims = self.dimensions
-    if dims is None:
-        dims_in_common = []
-        missing_dims = target_dims
-    else:
-        dims_in_common = [dim for dim in dims if dim in target_dims]
-        missing_dims = [dim for dim in target_dims if dim not in dims]
+def _handle_extra_labels(
+    left: Expression, right: Expression, dims: list[str]
+) -> tuple[tuple[pl.DataFrame, pl.DataFrame], ExtrasStrategy]:
+    assert dims != []
+    # Order so that drop always comes before keep, and keep always comes before default
+    if swapped := (
+        (left._extras_strategy, right._extras_strategy)
+        in (
+            (ExtrasStrategy.UNSET, ExtrasStrategy.DROP),
+            (ExtrasStrategy.UNSET, ExtrasStrategy.KEEP),
+            (ExtrasStrategy.KEEP, ExtrasStrategy.DROP),
+        )
+    ):
+        left, right = right, left
-    # We're already at the size of our target
-    if not missing_dims:
-        return self
+    def get_labels(expr):
+        return expr.data.select(dims).unique(maintain_order=Config.maintain_order)
-    if not set(missing_dims) <= set(self.allowed_new_dims):
-        # TODO actually suggest using e.g. .add_dim("a", "b") instead of just "use .add_dim()"
-        raise PyoframeError(
-            f"Dataframe has missing dimensions {missing_dims}. If this is intentional, use .add_dim()\n{self.data}"
+    left_data, right_data = left.data, right.data
+    strat = (left._extras_strategy, right._extras_strategy)
+    if strat == (ExtrasStrategy.DROP, ExtrasStrategy.DROP):
+        left_data = left.data.join(
+            get_labels(right),
+            on=dims,
+            maintain_order="left" if Config.maintain_order else None,
+        )
+        right_data = right.data.join(
+            get_labels(left),
+            on=dims,
+            maintain_order="left" if Config.maintain_order else None,
         )
+    elif strat == (ExtrasStrategy.UNSET, ExtrasStrategy.UNSET):
+        assert not Config.disable_extras_checks, (
+            "This code should not be reached when checks for extra values are disabled."
+        )
+        left_labels, right_labels = get_labels(left), get_labels(right)
+        left_extras = left_labels.join(right_labels, how="anti", on=dims)
+        right_extras = right_labels.join(left_labels, how="anti", on=dims)
+        if len(left_extras) > 0:
+            _raise_extras_error(
+                left, right, left_extras, swapped, extras_on_right=False
+            )
+        if len(right_extras) > 0:
+            _raise_extras_error(left, right, right_extras, swapped)
+    elif strat == (ExtrasStrategy.DROP, ExtrasStrategy.KEEP):
+        left_data = get_labels(right).join(
+            left.data,
+            on=dims,
+            maintain_order="left" if Config.maintain_order else None,
+        )
+    elif strat == (ExtrasStrategy.DROP, ExtrasStrategy.UNSET):
+        right_labels = get_labels(right)
+        left_data = right_labels.join(
+            left.data,
+            how="left",
+            on=dims,
+            maintain_order="left" if Config.maintain_order else None,
+        )
+        if left_data.get_column(COEF_KEY).null_count() > 0:
+            _raise_extras_error(
+                left,
+                right,
+                right_labels.join(get_labels(left), how="anti", on=dims),
+                swapped,
+            )
-    target_data = target.data.select(target_dims).unique(maintain_order=True)
+    elif strat == (ExtrasStrategy.KEEP, ExtrasStrategy.UNSET):
+        assert not Config.disable_extras_checks, (
+            "This code should not be reached when checks for extra values are disabled."
+        )
+        extras = right.data.join(get_labels(left), how="anti", on=dims)
+        if len(extras) > 0:
+            _raise_extras_error(left, right, extras.select(dims), swapped)
+    else:  # pragma: no cover
+        assert False, "This code should've never been reached!"
+    if swapped:
+        left_data, right_data = right_data, left_data
+    return (left_data, right_data), _extras_propagation_rules[strat]
+def _raise_extras_error(
+    left: Expression,
+    right: Expression,
+    extra_labels: pl.DataFrame,
+    swapped: bool,
+    extras_on_right: bool = True,
+):
+    if swapped:
+        left, right = right, left
+        extras_on_right = not extras_on_right
+    expression_num = 2 if extras_on_right else 1
+    with Config.print_polars_config:
+        _raise_addition_error(
+            left,
+            right,
+            f"expression {expression_num} has extra labels",
+            f"Extra labels in expression {expression_num}:\n{extra_labels}\nUse .drop_extras() or .keep_extras() to indicate how the extra labels should be handled. Learn more at\n\thttps://bravos-power.github.io/pyoframe/latest/learn/concepts/addition",
+        )
-    if not dims_in_common:
-        return self._new(self.data.join(target_data, how="cross"))
-    # If drop, we just do an inner join to get into the shape of the other
-    if self.unmatched_strategy == UnmatchedStrategy.DROP:
-        return self._new(self.data.join(target_data, on=dims_in_common, how="inner"))
+def _raise_addition_error(
+    left: Expression, right: Expression, reason: str, postfix: str
+):
+    op = "add"
+    right_name = right.name
+    if right_name[0] == "-":
+        op = "subtract"
+        right_name = right_name[1:]
+    raise PyoframeError(
+        f"""Cannot {op} the two expressions below because {reason}.
+Expression 1:\t{left.name}
+Expression 2:\t{right_name}
+{postfix}
+"""
+    )
-    result = self.data.join(target_data, on=dims_in_common, how="left")
-    right_has_missing = result.get_column(missing_dims[0]).null_count() > 0
-    if right_has_missing:
-        raise PyoframeError(
-            f"Cannot add dimension {missing_dims} since it contains unmatched values. If this is intentional, consider using .drop_unmatched()"
+# TODO consider returning a dataframe instead of an expression to simplify code (e.g. avoid copy_flags)
+def _broadcast(
+    self: Expression,
+    target: Expression,
+    common_dims: list[str],
+    missing_dims: list[str],
+    swapped: bool = False,
+) -> Expression:
+    target_data = target.data.select(target._dimensions_unsafe).unique(
+        maintain_order=Config.maintain_order
+    )
+    if not common_dims:
+        res = self._new(self.data.join(target_data, how="cross"), name=self.name)
+        res._copy_flags(self)
+        return res
+    # If drop, we just do an inner join to get into the shape of the other
+    if self._extras_strategy == ExtrasStrategy.DROP:
+        res = self._new(
+            self.data.join(
+                target_data,
+                on=common_dims,
+                maintain_order="left" if Config.maintain_order else None,
+            ),
+            name=self.name,
+        )
+        res._copy_flags(self)
+        return res
+    result = self.data.join(
+        target_data,
+        on=common_dims,
+        how="left",
+        maintain_order="left" if Config.maintain_order else None,
+    )
+    if result.get_column(missing_dims[0]).null_count() > 0:
+        target_labels = target.data.select(target._dimensions_unsafe).unique(
+            maintain_order=Config.maintain_order
         )
-    return self._new(result)
+        _raise_extras_error(
+            self,
+            target,
+            target_labels.join(self.data, how="anti", on=common_dims),
+            swapped,
+        )
+    res = self._new(result, self.name)
+    res._copy_flags(self)
+    return res
 def _sum_like_terms(df: pl.DataFrame) -> pl.DataFrame:
     """Combines terms with the same variables."""
     dims = [c for c in df.columns if c not in RESERVED_COL_KEYS]
     var_cols = [VAR_KEY] + ([QUAD_VAR_KEY] if QUAD_VAR_KEY in df.columns else [])
-    df = df.group_by(dims + var_cols, maintain_order=True).sum()
+    df = df.group_by(dims + var_cols, maintain_order=Config.maintain_order).sum()
     return df
 def _simplify_expr_df(df: pl.DataFrame) -> pl.DataFrame:
-    """
-    Removes the quadratic column and terms with a zero coefficient, when applicable.
+    """Removes the quadratic column and terms with a zero coefficient, when applicable.
     Specifically, zero coefficient terms are always removed, except if they're the only terms in which case the expression contains a single term.
     The quadratic column is removed if the expression is not a quadratic.
     Examples:
         >>> import polars as pl
-        >>> df = pl.DataFrame({ VAR_KEY: [CONST_TERM, 1], QUAD_VAR_KEY: [CONST_TERM, 1], COEF_KEY: [1.0, 0]})
+        >>> df = pl.DataFrame(
+        ...     {
+        ...         VAR_KEY: [CONST_TERM, 1],
+        ...         QUAD_VAR_KEY: [CONST_TERM, 1],
+        ...         COEF_KEY: [1.0, 0],
+        ...     }
+        ... )
         >>> _simplify_expr_df(df)
         shape: (1, 2)
         ┌───────────────┬─────────┐
@@ -389,7 +477,21 @@ def _simplify_expr_df(df: pl.DataFrame) -> pl.DataFrame:
         ╞═══════════════╪═════════╡
         │ 0             ┆ 1.0     │
         └───────────────┴─────────┘
-        >>> df = pl.DataFrame({"t": [1, 1, 2, 2, 3, 3], VAR_KEY: [CONST_TERM, 1, CONST_TERM, 1, 1, 2], QUAD_VAR_KEY: [CONST_TERM, CONST_TERM, CONST_TERM, CONST_TERM, CONST_TERM, 1], COEF_KEY: [1, 0, 0, 0, 1, 0]})
+        >>> df = pl.DataFrame(
+        ...     {
+        ...         "t": [1, 1, 2, 2, 3, 3],
+        ...         VAR_KEY: [CONST_TERM, 1, CONST_TERM, 1, 1, 2],
+        ...         QUAD_VAR_KEY: [
+        ...             CONST_TERM,
+        ...             CONST_TERM,
+        ...             CONST_TERM,
+        ...             CONST_TERM,
+        ...             CONST_TERM,
+        ...             1,
+        ...         ],
+        ...         COEF_KEY: [1, 0, 0, 0, 1, 0],
+        ...     }
+        ... )
         >>> _simplify_expr_df(df)
         shape: (3, 3)
         ┌─────┬───────────────┬─────────┐
@@ -406,9 +508,14 @@ def _simplify_expr_df(df: pl.DataFrame) -> pl.DataFrame:
     if len(df_filtered) < len(df):
         dims = [c for c in df.columns if c not in RESERVED_COL_KEYS]
         if dims:
-            dim_values = df.select(dims).unique(maintain_order=True)
+            dim_values = df.select(dims).unique(maintain_order=Config.maintain_order)
             df = (
-                dim_values.join(df_filtered, on=dims, how="left")
+                dim_values.join(
+                    df_filtered,
+                    on=dims,
+                    how="left",
+                    maintain_order="left" if Config.maintain_order else None,
+                )
                 .with_columns(pl.col(COEF_KEY).fill_null(0))
                 .fill_null(CONST_TERM)
             )
@@ -417,7 +524,7 @@ def _simplify_expr_df(df: pl.DataFrame) -> pl.DataFrame:
             if df.is_empty():
                 df = pl.DataFrame(
                     {VAR_KEY: [CONST_TERM], COEF_KEY: [0]},
-                    schema={VAR_KEY: KEY_TYPE, COEF_KEY: pl.Float64},
+                    schema={VAR_KEY: Config.id_dtype, COEF_KEY: pl.Float64},
                 )
     if QUAD_VAR_KEY in df.columns and (df.get_column(QUAD_VAR_KEY) == CONST_TERM).all():
@@ -426,10 +533,11 @@ def _simplify_expr_df(df: pl.DataFrame) -> pl.DataFrame:
     return df
-def _get_dimensions(df: pl.DataFrame) -> Optional[List[str]]:
-    """
-    Returns the dimensions of the DataFrame. Reserved columns do not count as dimensions.
-    If there are no dimensions, returns None to force caller to handle this special case.
+def _get_dimensions(df: pl.DataFrame) -> list[str] | None:
+    """Returns the dimensions of the DataFrame.
+    Reserved columns do not count as dimensions. If there are no dimensions,
+    returns `None` to force caller to handle this special case.
     Examples:
         >>> import polars as pl

pyoframe 0.2.0__py3-none-any.whl → 1.0.0__py3-none-any.whl

pyoframe 0.2.0__py3-none-any.whl → 1.0.0__py3-none-any.whl