geometallurgy-0.4.12-py3-none-any.whl → geometallurgy-0.4.13-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (48)
  1. elphick/geomet/__init__.py +11 -11
  2. elphick/geomet/base.py +1133 -1133
  3. elphick/geomet/block_model.py +319 -358
  4. elphick/geomet/config/__init__.py +1 -1
  5. elphick/geomet/config/config_read.py +39 -39
  6. elphick/geomet/config/flowsheet_example_partition.yaml +31 -31
  7. elphick/geomet/config/flowsheet_example_simple.yaml +25 -25
  8. elphick/geomet/config/mc_config.yml +35 -35
  9. elphick/geomet/data/downloader.py +39 -39
  10. elphick/geomet/data/register.csv +12 -12
  11. elphick/geomet/datasets/__init__.py +2 -2
  12. elphick/geomet/datasets/datasets.py +47 -47
  13. elphick/geomet/datasets/downloader.py +40 -40
  14. elphick/geomet/datasets/register.csv +12 -12
  15. elphick/geomet/datasets/sample_data.py +196 -196
  16. elphick/geomet/extras.py +35 -35
  17. elphick/geomet/flowsheet/__init__.py +1 -1
  18. elphick/geomet/flowsheet/flowsheet.py +1216 -1216
  19. elphick/geomet/flowsheet/loader.py +99 -99
  20. elphick/geomet/flowsheet/operation.py +256 -256
  21. elphick/geomet/flowsheet/stream.py +39 -39
  22. elphick/geomet/interval_sample.py +641 -641
  23. elphick/geomet/io.py +379 -379
  24. elphick/geomet/plot.py +147 -147
  25. elphick/geomet/sample.py +28 -28
  26. elphick/geomet/utils/amenability.py +49 -49
  27. elphick/geomet/utils/block_model_converter.py +93 -93
  28. elphick/geomet/utils/components.py +136 -136
  29. elphick/geomet/utils/data.py +49 -49
  30. elphick/geomet/utils/estimates.py +108 -108
  31. elphick/geomet/utils/interp.py +193 -193
  32. elphick/geomet/utils/interp2.py +134 -134
  33. elphick/geomet/utils/layout.py +72 -72
  34. elphick/geomet/utils/moisture.py +61 -61
  35. elphick/geomet/utils/output.html +617 -0
  36. elphick/geomet/utils/pandas.py +378 -378
  37. elphick/geomet/utils/parallel.py +29 -29
  38. elphick/geomet/utils/partition.py +63 -63
  39. elphick/geomet/utils/size.py +51 -51
  40. elphick/geomet/utils/timer.py +80 -80
  41. elphick/geomet/utils/viz.py +56 -56
  42. elphick/geomet/validate.py.hide +176 -176
  43. {geometallurgy-0.4.12.dist-info → geometallurgy-0.4.13.dist-info}/LICENSE +21 -21
  44. {geometallurgy-0.4.12.dist-info → geometallurgy-0.4.13.dist-info}/METADATA +7 -5
  45. geometallurgy-0.4.13.dist-info/RECORD +49 -0
  46. {geometallurgy-0.4.12.dist-info → geometallurgy-0.4.13.dist-info}/WHEEL +1 -1
  47. geometallurgy-0.4.12.dist-info/RECORD +0 -48
  48. {geometallurgy-0.4.12.dist-info → geometallurgy-0.4.13.dist-info}/entry_points.txt +0 -0
elphick/geomet/interval_sample.py (the 641 removed and 641 added lines are identical; the file content is shown once)
@@ -1,641 +1,641 @@
from __future__ import annotations

import functools
import uuid
from pathlib import Path
from typing import Optional, Literal, Callable, Union, Iterable, TYPE_CHECKING

import numpy as np
import pandas as pd
from pandas import IntervalIndex
from pandas.core.indexes.frozen import FrozenList

import plotly.graph_objects as go
import plotly.express as px

import elphick.geomet.flowsheet.stream
from elphick.geomet.utils.amenability import amenability_index
from elphick.geomet.utils.interp import mass_preserving_interp
from elphick.geomet.utils.interp2 import mass_preserving_interp_2d
from elphick.geomet.utils.pandas import MeanIntervalIndex, weight_average, calculate_recovery, calculate_partition, \
    cumulate, mass_to_composition

from elphick.geomet.base import MassComposition

if TYPE_CHECKING:
    from elphick.geomet.flowsheet.stream import Stream


class IntervalSample(MassComposition):
    """
    A class to represent a sample of data with an interval index.
    This exposes methods to split the sample by a partition definition.
    """

    def __init__(self,
                 data: Optional[pd.DataFrame] = None,
                 name: Optional[str] = None,
                 moisture_in_scope: bool = True,
                 mass_wet_var: Optional[str] = None,
                 mass_dry_var: Optional[str] = None,
                 moisture_var: Optional[str] = None,
                 component_vars: Optional[list[str]] = None,
                 composition_units: Literal['%', 'ppm', 'ppb'] = '%',
                 components_as_symbols: bool = True,
                 ranges: Optional[dict[str, list]] = None,
                 config_file: Optional[Path] = None):

        super().__init__(data=data, name=name, moisture_in_scope=moisture_in_scope,
                         mass_wet_var=mass_wet_var, mass_dry_var=mass_dry_var,
                         moisture_var=moisture_var, component_vars=component_vars,
                         composition_units=composition_units, components_as_symbols=components_as_symbols,
                         ranges=ranges, config_file=config_file)

        # manage the interval indexes
        if self.data is not None:
            self.data = self._create_interval_indexes(data)

    def _create_interval_indexes(self, data: pd.DataFrame) -> pd.DataFrame:
        original_indexes = data.index.names
        interval_indexes = []
        for pair in self.config['intervals']['suffixes']:
            if data.index.names != FrozenList([None]):
                suffix_candidates: dict = {n: n.split('_')[-1].lower() for n in data.index.names}
                suffixes: dict = {k: v for k, v in suffix_candidates.items() if v in pair}
                if suffixes:
                    data.reset_index(list(suffixes.keys()), inplace=True)
                    num_interval_indexes: int = int(len(suffixes.keys()) / 2)
                    for i in range(0, num_interval_indexes * 2, 2):  # iterate the suffixed keys in (left, right) pairs
                        keys = list(suffixes.keys())[i: i + 2]
                        base_name: str = '_'.join(keys[0].split('_')[:-1])
                        index = IntervalIndex.from_arrays(left=data[keys[0]], right=data[keys[1]],
                                                          closed=self.config['intervals']['closed'])
                        index.name = base_name
                        # left and right names are only preserved for a single interval index.
                        # when a multiindex is used, the names are not preserved.
                        index.left.name = keys[0].split('_')[-1]
                        index.right.name = keys[1].split('_')[-1]
                        interval_indexes.append(index)

                        # drop the index columns from the dataframe columns
                        data.drop(columns=keys, inplace=True)

        if interval_indexes:
            new_indexes = {}  # Use dict to preserve order and uniqueness
            # we need to set the index to include the new interval index, but respect the order of the original.
            for i in original_indexes:
                if i.split('_')[0] not in [ii.name for ii in interval_indexes]:
                    new_indexes[i] = data.index.get_level_values(i)
                else:
                    # Find the corresponding interval index and add it to the new_indexes dict
                    for ii in interval_indexes:
                        if ii.name == i.split('_')[0]:
                            new_indexes[ii.name] = ii
                            break

            if len(new_indexes) > 1:
                data.index = pd.MultiIndex.from_frame(pd.DataFrame(new_indexes.values()).T, names=new_indexes.keys())
            else:
                data.index = list(new_indexes.values())[0]

        return data

    def split_by_partition(self, partition_definition: Union[pd.Series, Callable], name_1: str = 'preferred',
                           name_2: str = 'complement'):
        """
        Split the sample into two samples based on the partition definition.

        .. math::
            K = \\frac{{m_{preferred}}}{{m_{feed}}}

        :param partition_definition: A function that takes the fraction mean values and returns the partition
            number (K) as a series of values in the range [0, 1]. A 1D function must have an argument that
            matches the dimension of the interval index. A 2D function must have two arguments that match
            the dimensions of the interval index.
        :param name_1: The name of the first sample.
        :param name_2: The name of the second sample.
        :return: A tuple of two IntervalSamples.
        """

        # Check that the partition definition has the correct number of arguments and that the names match
        sample_fraction_dims = [col for col in self.mass_data.index.names if
                                isinstance(self.mass_data.index.get_level_values(col), pd.IntervalIndex)]
        fraction_means: pd.DataFrame = self.mass_data.index.to_frame()[sample_fraction_dims].apply(
            lambda x: MeanIntervalIndex(x).mean, axis=0)

        # Get the function from the partial object if necessary
        if isinstance(partition_definition, Callable):
            partition_func = partition_definition.func if isinstance(partition_definition,
                                                                     functools.partial) else partition_definition
            # Check that the required argument names are present in the IntervalIndex levels
            required_args = [col for col in partition_func.__code__.co_varnames if col in sample_fraction_dims]
            pn: pd.Series = pd.Series(partition_definition(**fraction_means[required_args]), name='K',
                                      index=self.mass_data.index)
        elif isinstance(partition_definition, pd.Series):
            required_args = partition_definition.index.names
            pn: pd.Series = partition_definition
        else:
            raise TypeError(f"The partition definition must be a function or a pandas Series:"
                            f" type = {type(partition_definition)}")
        for arg, dim in zip(required_args, sample_fraction_dims):
            if arg != dim:
                raise ValueError(f"The partition definition argument name does not match the index name. "
                                 f"Expected {dim}, found {arg}")

        self.to_stream()
        self: 'Stream'

        sample_1 = self.create_congruent_object(name=name_1).to_stream()
        sample_1.mass_data = self.mass_data.copy().multiply(pn, axis=0)
        sample_1.set_nodes([self.nodes[1], uuid.uuid4()])
        sample_2 = self.create_congruent_object(name=name_2)
        sample_2.mass_data = self.mass_data.copy().multiply((1 - pn), axis=0)
        sample_2.set_nodes([self.nodes[1], uuid.uuid4()])

        return sample_1, sample_2

    def is_2d_grid(self):
        """
        Check if the sample is a 2d grid.
        :return: True if the sample has 2 levels of intervals, False otherwise.
        """
        res = False
        if self.mass_data is not None and self.mass_data.index.nlevels >= 2:
            # get the type of the index levels
            level_types = [type(level) for level in self.mass_data.index.levels]
            # get the counts of each type
            level_counts = {level_type: level_types.count(level_type) for level_type in set(level_types)}
            # check if there are 2 interval levels
            res = level_counts.get(pd.IntervalIndex, 0) == 2

        return res

    @property
    def is_rectilinear_grid(self):
        """If rectilinear we can plot with a simple heatmap"""
        res = False
        if self.mass_data is not None and self.mass_data.index.nlevels >= 2:
            # Get the midpoints of the intervals for X and Y
            x_midpoints = self.mass_data.index.get_level_values(0).mid
            y_midpoints = self.mass_data.index.get_level_values(1).mid

            # Get unique midpoints for X and Y
            unique_x_midpoints = set(x_midpoints)
            unique_y_midpoints = set(y_midpoints)

            # Check if the grid is full (i.e., no steps in the lines that define the grid edges)
            # todo: fix this logic - it is not correct
            if len(unique_x_midpoints) == len(x_midpoints) and len(unique_y_midpoints) == len(y_midpoints):
                res = True
        return res

    def ideal_incremental_separation(self, discard_from: Literal["lowest", "highest"] = "lowest") -> pd.DataFrame:
        """Incrementally separate a fractionated sample.

        This method sorts in the provided direction, then incrementally removes and discards the first of the
        remaining fractions and recalculates the mass-composition and recovery of the portion remaining.
        This is equivalent to incrementally applying a perfect separation (partition) at every interval edge.

        This method is only applicable to a 1D object where the single dimension is a pd.Interval type.

        See also: ideal_incremental_composition, ideal_incremental_recovery.

        Args:
            discard_from: Defines the discarded direction. discard_from = "lowest" will discard the lowest value
                first, then the next lowest, etc.

        Returns:
            A pandas DataFrame
        """
        self._check_one_dim_interval()

        sample: pd.DataFrame = self.data

        is_decreasing: bool = sample.index.is_monotonic_decreasing
        if discard_from == "lowest":
            sample.sort_index(ascending=True, inplace=True)
            new_index: pd.Index = pd.Index(sample.index.left)
        else:
            sample.sort_index(ascending=False, inplace=True)
            new_index: pd.Index = pd.Index(sample.index.right)
        new_index.name = f"{sample.index.name}_cut-point"

        aggregated_chunks: list = []
        recovery_chunks: list = []
        head: pd.Series = sample.pipe(weight_average)

        for i, indx in enumerate(sample.index):
            tmp_composition: pd.DataFrame = sample.iloc[i:, :].pipe(weight_average).to_frame().T
            aggregated_chunks.append(tmp_composition)
            recovery_chunks.append(tmp_composition.pipe(calculate_recovery, df_ref=head.to_frame().T))

        res_composition: pd.DataFrame = pd.concat(aggregated_chunks).assign(attribute="composition").set_index(
            new_index)
        res_recovery: pd.DataFrame = pd.concat(recovery_chunks).assign(attribute="recovery").set_index(
            new_index)

        if is_decreasing:
            res_composition.sort_index(ascending=False, inplace=True)
            res_recovery.sort_index(ascending=False, inplace=True)

        res: pd.DataFrame = pd.concat([res_composition, res_recovery]).reset_index().set_index(
            [new_index.name, 'attribute'])

        return res

    def _check_one_dim_interval(self):
        if len(self.mass_data.index.names) != 1:
            raise NotImplementedError(f"This object is {self.mass_data.index.nlevels} dimensional. "
                                      f"Only 1D interval objects are valid")
        index_var: str = self.mass_data.index.name
        if not isinstance(self.mass_data.index, pd.IntervalIndex):
            raise NotImplementedError(f"The {index_var} of this object is not a pd.Interval. "
                                      f"Only 1D interval objects are valid")

    def _check_two_dim_interval(self):
        if len(self.mass_data.index.names) != 2:
            raise NotImplementedError(f"This object is {self.mass_data.index.nlevels} dimensional. "
                                      f"Only 2D interval objects are valid")
        for indx in self.mass_data.index.levels:
            if not isinstance(indx, pd.IntervalIndex):
                raise NotImplementedError(f"The {indx.name} of this object is not a pd.Interval. "
                                          f"Only 2D interval objects are valid")

    def ideal_incremental_composition(self, discard_from: Literal["lowest", "highest"] = "lowest") -> pd.DataFrame:
        """Incrementally separate a fractionated sample.

        This method sorts in the provided direction, then incrementally removes and discards the first of the
        remaining fractions and recalculates the mass-composition of the portion remaining.
        This is equivalent to incrementally applying a perfect separation (partition) at every interval edge.

        This method is only applicable to a 1D object where the single dimension is a pd.Interval type.

        See also: ideal_incremental_separation, ideal_incremental_recovery.

        Args:
            discard_from: Defines the discarded direction. discard_from = "lowest" will discard the lowest value
                first, then the next lowest, etc.

        Returns:
            A pandas DataFrame
        """
        df: pd.DataFrame = self.ideal_incremental_separation(discard_from=discard_from).query(
            'attribute=="composition"').droplevel('attribute')
        return df

    def ideal_incremental_recovery(self, discard_from: Literal["lowest", "highest"] = "lowest",
                                   apply_closure: bool = True) -> pd.DataFrame:
        """Incrementally separate a fractionated sample.

        This method sorts in the provided direction, then incrementally removes and discards the first of the
        remaining fractions and recalculates the recovery of the portion remaining.
        This is equivalent to incrementally applying a perfect separation (partition) at every interval edge.

        This method is only applicable to a 1D object where the single dimension is a pd.Interval type.

        See also: ideal_incremental_separation, ideal_incremental_composition.

        Args:
            discard_from: Defines the discarded direction. discard_from = "lowest" will discard the lowest value
                first, then the next lowest, etc.
            apply_closure: If True, add the missing record (zero recovery) that closes the recovery envelope.

        Returns:
            A pandas DataFrame
        """
        columns_to_drop: list[str] = ['mass_wet', 'H2O'] if self.moisture_in_scope else []
        df: pd.DataFrame = self.ideal_incremental_separation(discard_from=discard_from).query(
            'attribute=="recovery"').droplevel('attribute').rename(columns={'mass_dry': 'mass'}).drop(
            columns=columns_to_drop)
        if apply_closure:
            # add zero recovery record to close the envelope.
            indx = np.inf if df.index.min() == 0.0 else 0.0
            indx_name: str = df.index.name
            df = pd.concat([df, pd.Series(0, index=df.columns, name=indx).to_frame().T]).sort_index(ascending=True)
            df.index.name = indx_name
        return df

    def plot_heatmap(self, components: list[str], **kwargs):
        """
        Plot the sample as a heatmap.
        :param components: The list of components to plot.
        :param kwargs: Additional keyword arguments to pass to the plot method.
        :return: The plotly figure with the heatmap.
        """
        # if not self.is_rectilinear_grid:
        #     raise ValueError('The sample is not a rectilinear grid.')

        # convert IntervalIndex to nominal values df.index = df.index.map(lambda x: x.mid)

        x_label = self.mass_data.index.names[0]
        y_label = self.mass_data.index.names[1]
        z_label = self.mass_data.columns[0]

        # create a pivot table for the heatmap
        pivot_df = self.mass_data[components].copy().unstack()

        # Get the midpoints of the intervals for X and Y
        x_midpoints = [interval.mid for interval in self.mass_data.index.get_level_values(x_label)]
        y_midpoints = [interval.mid for interval in self.mass_data.index.get_level_values(y_label)]

        # Get interval edges for x and y axes
        x_edges = self._get_unique_edges(self.mass_data.index.get_level_values(x_label))
        y_edges = self._get_unique_edges(self.mass_data.index.get_level_values(y_label))

        # Create hover text
        hover_text = [[f"{x_label}: {x_mid}, {y_label}: {y_mid}, {z_label}: {z_val}"
                       for x_mid, z_val in zip(x_midpoints, z_values)]
                      for y_mid, z_values in zip(y_midpoints, pivot_df.values)]

        # plot the heatmap
        fig = go.Figure(data=go.Heatmap(
            z=pivot_df.values,
            x=x_edges,
            y=y_edges,
            text=hover_text,
            hoverinfo='text'))

        # update the layout to use a logarithmic axis for the size dimension
        if x_label == 'size':
            fig.update_layout(xaxis_type="log")
        elif y_label == 'size':
            fig.update_layout(yaxis_type="log")

        # set the title and x and y labels dynamically
        fig.update_layout(title=f'{self.name} Heatmap',
                          xaxis_title=self.mass_data.index.names[0],
                          yaxis_title=self.mass_data.index.names[1])

        return fig

    def plot_intervals(self,
                       variables: list[str],
                       cumulative: bool = True,
                       direction: str = 'descending',
                       show_edges: bool = True,
                       min_x: Optional[float] = None) -> go.Figure:
        """Plot the grade-tonnage curve.

        Mass and grade by bins for a cut-off variable.

        Args:
            variables: List of variables to include in the plot
            cumulative: If True, the results are cumulative weight averaged.
            direction: 'ascending'|'descending', if cumulative is True, the direction of accumulation
            show_edges: If True, show the edges on the plot. Applicable to cumulative plots only.
            min_x: Optional minimum value for the x-axis, useful to set a reasonable visual range with a log
                scaled x-axis when plotting size data
        """

        res: pd.DataFrame = self.data[variables]

        plot_kwargs: dict = dict(line_shape='vh')
        if cumulative:
            res = self.mass_data.pipe(cumulate, direction=direction).pipe(mass_to_composition)
            plot_kwargs = dict(line_shape='spline')

        interval_data: pd.DataFrame = res

        # Get the first IntervalIndex - TODO: specify or check...
        interval_index: Optional[pd.IntervalIndex] = None
        for level in range(interval_data.index.nlevels):
            if isinstance(interval_data.index.get_level_values(level), pd.IntervalIndex):
                interval_index = interval_data.index.get_level_values(level)
                break
        if interval_index is None:
            raise ValueError("No IntervalIndex found in the index levels")
        left_name: str = interval_index.left.name if interval_index.left.name else 'left'
        right_name: str = interval_index.right.name if interval_index.right.name else 'right'
        left: pd.Series = pd.Series(interval_index.left, name=left_name, index=interval_index)
        right: pd.Series = pd.Series(interval_index.right, name=right_name, index=interval_index)
        df_intervals = pd.concat([left, right, interval_data], axis='columns')
        x_var: str = interval_data.index.name
        if not cumulative:
            # append on the largest fraction right edge for display purposes
            is_ascending: bool = interval_index.is_monotonic_increasing
            df_end: pd.DataFrame = df_intervals.loc[df_intervals.index.max(), :].to_frame().T
            df_end[left_name] = df_end[right_name]
            df_end[right_name] = np.inf
            df = pd.concat([df_end.reset_index(drop=True), df_intervals], axis='index')
            df[interval_data.index.name] = df[left_name]
            df = df.sort_values(by=interval_data.index.name, ascending=is_ascending)
        else:
            if direction == 'ascending':
                x_var = right_name
            elif direction == 'descending':
                x_var = left_name
            df = df_intervals

        if res.index.name.lower() == 'size':
            if not min_x:
                min_x = interval_data.index.min().right / 2.0
            # set zero to the minimum x value (for display only) to enable the tooltips on that point.
            df.loc[df[x_var] == df[x_var].min(), x_var] = min_x
            hover_data = {'component': True,  # add other column, default formatting
                          x_var: ':.3f',  # add other column, customized formatting
                          'value': ':.2f'
                          }
            plot_kwargs = {**plot_kwargs,
                           **dict(log_x=True,
                                  range_x=[min_x, interval_data.index.max().right],
                                  hover_data=hover_data)}

        df = df[[x_var] + variables].melt(id_vars=[x_var], var_name='component')

        if cumulative and show_edges:
            plot_kwargs['markers'] = True

        fig = px.line(df, x=x_var, y='value', facet_row='component', **plot_kwargs)
        fig.for_each_annotation(lambda a: a.update(text=a.text.replace("component=", "")))
        fig.update_yaxes(matches=None)
        fig.update_layout(title=self.name)

        return fig

    @staticmethod
    def _get_unique_edges(interval_index):
        # Get the left and right edges of the intervals
        left_edges = interval_index.left.tolist()
        right_edges = interval_index.right.tolist()

        # Concatenate the two lists
        all_edges = left_edges + right_edges

        # Get the unique edges
        unique_edges = np.unique(all_edges)

        return unique_edges

    def plot_grade_recovery(self, target_analyte,
                            discard_from: Literal["lowest", "highest"] = "lowest",
                            title: Optional[str] = None,
                            ) -> go.Figure:
        """The grade-recovery plot.

        The grade-recovery curve is generated by assuming an ideal separation (for the chosen property, or dimension)
        at each fractional interval. It defines the theoretical maximum performance, which can only be improved if
        liberation is improved by comminution.

        This method is only applicable to a 1D object where the single dimension is a pd.Interval type.

        Args:
            target_analyte: The analyte of value.
            discard_from: Defines the discarded direction. discard_from = "lowest" will discard the lowest value
                first, then the next lowest, etc.
            title: Optional plot title

        Returns:
            A plotly.graph_objects figure
        """
        title = title if title is not None else 'Ideal Grade - Recovery'
        cols_to_drop: list[str] = ['mass_wet', 'mass_dry', 'H2O'] if self.moisture_in_scope else ['mass_dry']

        df: pd.DataFrame = self.ideal_incremental_separation(discard_from=discard_from)
        df_recovery: pd.DataFrame = df.loc[(slice(None), 'recovery'), [target_analyte, 'mass_dry']].droplevel(
            'attribute').rename(
            columns={'mass_dry': 'Yield', target_analyte: f"{target_analyte}_recovery"})
        df_composition: pd.DataFrame = df.loc[(slice(None), 'composition'), :].droplevel('attribute').drop(
            columns=cols_to_drop)

        df_plot: pd.DataFrame = pd.concat([df_recovery, df_composition], axis=1).reset_index()
        fig = px.line(df_plot, x=target_analyte,
                      y=f"{target_analyte}_recovery",
                      hover_data=df_plot.columns,
                      title=title)
        # fig.update_layout(xaxis_title=f"Grade of {target_analyte}", yaxis_title=f"Recovery of {target_analyte}",
        #                   title=title)

        return fig

    def plot_amenability(self, target_analyte: str,
                         discard_from: Literal["lowest", "highest"] = "lowest",
                         gangue_analytes: Optional[list[str]] = None,
                         title: Optional[str] = None,
                         ) -> go.Figure:
        """The yield-recovery plot.

        The yield-recovery curve provides an understanding of the amenability of a sample.

        This method is only applicable to a 1D object where the single dimension is a pd.Interval type.

        Args:
            target_analyte: The analyte of value.
            discard_from: Defines the discarded direction. discard_from = "lowest" will discard the lowest value
                first, then the next lowest, etc.
            gangue_analytes: The analytes to be rejected
            title: Optional plot title

        Returns:
            A plotly.graph_objects figure
        """
        title = title if title is not None else 'Amenability Plot'
        df: pd.DataFrame = self.ideal_incremental_recovery(discard_from=discard_from)
        amenability_indices: pd.Series = amenability_index(df, col_target=target_analyte, col_mass_recovery='mass')

        analytes = [col for col in df.columns if col != "mass"] if gangue_analytes is None else [
            target_analyte] + list(gangue_analytes)

        mass_rec: pd.Series = df["mass"]
        df = df[analytes]

        fig = go.Figure()
        for analyte in analytes:
            fig.add_trace(
                go.Scatter(x=mass_rec, y=df[analyte], mode="lines",
                           name=f"{analyte} ({round(amenability_indices[analyte], 2)})",
                           customdata=df.index.values,
                           hovertemplate='<b>Recovery: %{y:.3f}</b><br>Cut-point: %{customdata:.3f} '))
        fig.add_trace(go.Scatter(x=[0, 1], y=[0, 1], mode="lines", name='y=x',
                                 line=dict(shape='linear', color='gray', dash='dash'),
                                 ))
        fig.update_layout(xaxis_title='Yield (Mass Recovery)', yaxis_title='Recovery', title=title,
                          hovermode='x')
        return fig

    def calculate_partition(self, preferred: 'MassComposition') -> pd.DataFrame:
        """Calculate the partition number (K) [0, 1] of the preferred stream relative to self.

        .. math::
            K = \\frac{{m_{preferred}}}{{m_{feed}}}

        """
        self._check_one_dim_interval()
        return calculate_partition(df_feed=self.data, df_preferred=preferred.data,
                                   col_mass_dry='mass_dry')

    def resample_1d(self, interval_edges: Union[Iterable, int],
                    precision: Optional[int] = None,
                    include_original_edges: bool = False) -> 'IntervalSample':
        """Resample a 1D fractional dim/index.

        Args:
            interval_edges: The values of the new grid (interval edges). If an int, will up-sample by that factor;
                for example, a value of 10 will automatically define edges that create 10 x the resolution
                (up-sampled).
            precision: Optional integer for the number of decimal places to round the grid values to.
            include_original_edges: If True, include the original edges in the grid.

        Returns:
            A new IntervalSample object interpolated onto the new grid
        """

        # TODO: add support for supplementary variables

        # check that the index contains a single interval index
        self._check_one_dim_interval()

        df_upsampled: pd.DataFrame = mass_preserving_interp(self.mass_data,
                                                            interval_edges=interval_edges, precision=precision,
                                                            include_original_edges=include_original_edges,
                                                            mass_wet=None, mass_dry=self.mass_dry_var,
                                                            interval_data_as_mass=True)

        obj: IntervalSample = IntervalSample(df_upsampled, name=self.name, moisture_in_scope=False,
                                             mass_dry_var=self.mass_dry_var)
        obj.status.ranges = self.status.ranges
        return obj

    def resample_2d(self, interval_edges: dict[str, Iterable],
                    precision: Optional[int] = None) -> 'IntervalSample':
        """Resample a 2D fractional dim/index.

        Args:
            interval_edges: A dict keyed by index name containing the grid the data is resampled to.
            precision: Optional integer for the number of decimal places to round the grid values to.

        Returns:
            A new IntervalSample object interpolated onto the new grid
        """

        # TODO: add support for supplementary variables

        # check that the index contains two interval indexes
        self._check_two_dim_interval()

        df_upsampled_specific_mass: pd.DataFrame = mass_preserving_interp_2d(self._specific_mass(),
                                                                             interval_edges=interval_edges,
                                                                             precision=precision,
                                                                             mass_dry=self.mass_dry_var)

        # convert from specific mass to mass
        df_upsampled = df_upsampled_specific_mass.mul(self.mass_data[self.mass_dry_var].sum(), axis=0)
        df_upsampled[self.composition_columns] = df_upsampled[self.composition_columns].div(
            df_upsampled[self.mass_dry_var], axis=0).mul(self.composition_factor, axis=0)

        obj: IntervalSample = IntervalSample(df_upsampled, name=self.name, moisture_in_scope=False,
                                             mass_dry_var=self.mass_dry_var)
        if hasattr(obj, 'nodes'):
            obj.nodes = self.nodes
        obj.status.ranges = self.status.ranges
        return obj

    def _specific_mass(self) -> Optional[pd.DataFrame]:
        """Calculate the specific mass of the sample.

        Specific mass is the mass of the sample fractions divided by the mass of all fractions.
        The sum of the specific mass (for mass_dry) is 1.0 by definition.
        """
        res = None
        if self.data is not None:
            res = self.mass_data.div(self.mass_data[self.mass_dry_var].sum(), axis=0)
            if self.moisture_in_scope:
                res.drop(columns=[self.mass_wet_var], inplace=True)
        return res
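
For orientation, a few hedged usage sketches follow. They are minimal examples, not from the package documentation: the column names (mass_dry, Fe), the size grid, and the partition function are illustrative assumptions; the only requirements taken from the source above are a 1D pd.IntervalIndex and, for a callable partition, an argument name that matches the index name.

import numpy as np
import pandas as pd
from functools import partial

from elphick.geomet.interval_sample import IntervalSample

# a small 1D sample: dry mass and Fe grade by size fraction (values are illustrative)
df = pd.DataFrame({'mass_dry': [10.0, 20.0, 30.0, 40.0], 'Fe': [62.0, 60.0, 58.0, 55.0]},
                  index=pd.IntervalIndex.from_breaks([0.0, 0.5, 1.0, 2.0, 4.0],
                                                     closed='left', name='size'))
sample = IntervalSample(df, name='feed', moisture_in_scope=False, mass_dry_var='mass_dry')


def partition_coarse(size: np.ndarray, d50: float, ep: float) -> np.ndarray:
    # partition number K in [0, 1]: the fraction of each interval reporting to the
    # preferred stream; the first argument name must match the interval index name.
    # This Whiten-style efficiency curve is an assumed form, not the package's own.
    return 1.0 / (1.0 + np.exp(1.099 * (d50 - size) / ep))


coarse, fine = sample.split_by_partition(partial(partition_coarse, d50=1.0, ep=0.2),
                                         name_1='coarse', name_2='fine')

Any callable returning values in [0, 1], or an equivalently indexed pd.Series, plays the same role.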
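The ideal-separation methods operate on the same kind of 1D interval sample; a sketch under the same assumptions (the analyte name Fe is illustrative):

# mass and analyte recovery by cut-point, discarding the lowest fractions first
rec = sample.ideal_incremental_recovery(discard_from='lowest')

# the amenability (yield-recovery) plot for the value analyte
fig = sample.plot_amenability(target_analyte='Fe')
fig.show()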
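The grade-tonnage style view in plot_intervals can be sketched the same way; the variables and min_x below are assumptions suited to a log-scaled size axis:

# cumulative weight-averaged curves of dry mass and Fe across the size fractions
fig = sample.plot_intervals(variables=['mass_dry', 'Fe'], cumulative=True,
                            direction='descending', min_x=0.1)
fig.show()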
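Finally, a resampling sketch: per the resample_1d docstring, an integer up-samples by that factor, while an iterable supplies explicit interval edges (the edges below are illustrative):

# up-sample the size grid 10x, retaining the original edges
finer = sample.resample_1d(interval_edges=10, precision=3, include_original_edges=True)

# or interpolate onto an explicit grid of interval edges
custom = sample.resample_1d(interval_edges=[0.0, 0.25, 0.5, 1.0, 2.0, 4.0], precision=3)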