machinegnostics-0.0.1-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (93)
  1. __init__.py +0 -0
  2. machinegnostics/__init__.py +24 -0
  3. machinegnostics/magcal/__init__.py +37 -0
  4. machinegnostics/magcal/characteristics.py +460 -0
  5. machinegnostics/magcal/criteria_eval.py +268 -0
  6. machinegnostics/magcal/criterion.py +140 -0
  7. machinegnostics/magcal/data_conversion.py +381 -0
  8. machinegnostics/magcal/gcor.py +64 -0
  9. machinegnostics/magcal/gdf/__init__.py +2 -0
  10. machinegnostics/magcal/gdf/base_df.py +39 -0
  11. machinegnostics/magcal/gdf/base_distfunc.py +1202 -0
  12. machinegnostics/magcal/gdf/base_egdf.py +823 -0
  13. machinegnostics/magcal/gdf/base_eldf.py +830 -0
  14. machinegnostics/magcal/gdf/base_qgdf.py +1234 -0
  15. machinegnostics/magcal/gdf/base_qldf.py +1019 -0
  16. machinegnostics/magcal/gdf/cluster_analysis.py +456 -0
  17. machinegnostics/magcal/gdf/data_cluster.py +975 -0
  18. machinegnostics/magcal/gdf/data_intervals.py +853 -0
  19. machinegnostics/magcal/gdf/data_membership.py +536 -0
  20. machinegnostics/magcal/gdf/der_egdf.py +243 -0
  21. machinegnostics/magcal/gdf/distfunc_engine.py +841 -0
  22. machinegnostics/magcal/gdf/egdf.py +324 -0
  23. machinegnostics/magcal/gdf/eldf.py +297 -0
  24. machinegnostics/magcal/gdf/eldf_intv.py +609 -0
  25. machinegnostics/magcal/gdf/eldf_ma.py +627 -0
  26. machinegnostics/magcal/gdf/homogeneity.py +1218 -0
  27. machinegnostics/magcal/gdf/intv_engine.py +1523 -0
  28. machinegnostics/magcal/gdf/marginal_intv_analysis.py +558 -0
  29. machinegnostics/magcal/gdf/qgdf.py +289 -0
  30. machinegnostics/magcal/gdf/qldf.py +296 -0
  31. machinegnostics/magcal/gdf/scedasticity.py +197 -0
  32. machinegnostics/magcal/gdf/wedf.py +181 -0
  33. machinegnostics/magcal/gdf/z0_estimator.py +1047 -0
  34. machinegnostics/magcal/layer_base.py +42 -0
  35. machinegnostics/magcal/layer_history_base.py +74 -0
  36. machinegnostics/magcal/layer_io_process_base.py +238 -0
  37. machinegnostics/magcal/layer_param_base.py +448 -0
  38. machinegnostics/magcal/mg_weights.py +36 -0
  39. machinegnostics/magcal/sample_characteristics.py +532 -0
  40. machinegnostics/magcal/scale_optimization.py +185 -0
  41. machinegnostics/magcal/scale_param.py +313 -0
  42. machinegnostics/magcal/util/__init__.py +0 -0
  43. machinegnostics/magcal/util/dis_docstring.py +18 -0
  44. machinegnostics/magcal/util/logging.py +24 -0
  45. machinegnostics/magcal/util/min_max_float.py +34 -0
  46. machinegnostics/magnet/__init__.py +0 -0
  47. machinegnostics/metrics/__init__.py +28 -0
  48. machinegnostics/metrics/accu.py +61 -0
  49. machinegnostics/metrics/accuracy.py +67 -0
  50. machinegnostics/metrics/auto_correlation.py +183 -0
  51. machinegnostics/metrics/auto_covariance.py +204 -0
  52. machinegnostics/metrics/cls_report.py +130 -0
  53. machinegnostics/metrics/conf_matrix.py +93 -0
  54. machinegnostics/metrics/correlation.py +178 -0
  55. machinegnostics/metrics/cross_variance.py +167 -0
  56. machinegnostics/metrics/divi.py +82 -0
  57. machinegnostics/metrics/evalmet.py +109 -0
  58. machinegnostics/metrics/f1_score.py +128 -0
  59. machinegnostics/metrics/gmmfe.py +108 -0
  60. machinegnostics/metrics/hc.py +141 -0
  61. machinegnostics/metrics/mae.py +72 -0
  62. machinegnostics/metrics/mean.py +117 -0
  63. machinegnostics/metrics/median.py +122 -0
  64. machinegnostics/metrics/mg_r2.py +167 -0
  65. machinegnostics/metrics/mse.py +78 -0
  66. machinegnostics/metrics/precision.py +119 -0
  67. machinegnostics/metrics/r2.py +122 -0
  68. machinegnostics/metrics/recall.py +108 -0
  69. machinegnostics/metrics/rmse.py +77 -0
  70. machinegnostics/metrics/robr2.py +119 -0
  71. machinegnostics/metrics/std.py +144 -0
  72. machinegnostics/metrics/variance.py +101 -0
  73. machinegnostics/models/__init__.py +2 -0
  74. machinegnostics/models/classification/__init__.py +1 -0
  75. machinegnostics/models/classification/layer_history_log_reg.py +121 -0
  76. machinegnostics/models/classification/layer_io_process_log_reg.py +98 -0
  77. machinegnostics/models/classification/layer_mlflow_log_reg.py +107 -0
  78. machinegnostics/models/classification/layer_param_log_reg.py +275 -0
  79. machinegnostics/models/classification/mg_log_reg.py +273 -0
  80. machinegnostics/models/cross_validation.py +118 -0
  81. machinegnostics/models/data_split.py +106 -0
  82. machinegnostics/models/regression/__init__.py +2 -0
  83. machinegnostics/models/regression/layer_histroy_rob_reg.py +139 -0
  84. machinegnostics/models/regression/layer_io_process_rob_rig.py +88 -0
  85. machinegnostics/models/regression/layer_mlflow_rob_reg.py +134 -0
  86. machinegnostics/models/regression/layer_param_rob_reg.py +212 -0
  87. machinegnostics/models/regression/mg_lin_reg.py +253 -0
  88. machinegnostics/models/regression/mg_poly_reg.py +258 -0
  89. machinegnostics-0.0.1.dist-info/METADATA +246 -0
  90. machinegnostics-0.0.1.dist-info/RECORD +93 -0
  91. machinegnostics-0.0.1.dist-info/WHEEL +5 -0
  92. machinegnostics-0.0.1.dist-info/licenses/LICENSE +674 -0
  93. machinegnostics-0.0.1.dist-info/top_level.txt +2 -0
machinegnostics/magcal/criteria_eval.py
@@ -0,0 +1,268 @@
+ '''
+ ManGo - Machine Gnostics Library
+ Copyright (C) 2025 ManGo Team
+
+ Author: Nirmal Parmar
+ Machine Gnostics
+ '''
+
+ import numpy as np
+ from machinegnostics.magcal.characteristics import GnosticsCharacteristics
+ from machinegnostics.magcal.sample_characteristics import GnosticCharacteristicsSample
+ import logging
+ from machinegnostics.magcal.util.logging import get_logger
+
+ class CriteriaEvaluator:
+     """
+     A class to evaluate the performance of a model's fit to data using various statistical and information-theoretic metrics.
+
+     This class computes several evaluation metrics, including:
+     - Robust R-squared (RobR2): A robust measure of the goodness of fit.
+     - Geometric Mean of Model Fit Error (GMMFE): A measure of the average relative error between the observed and fitted values.
+     - Divergence Information (DivI): A measure of the divergence between the distributions of observed and fitted values.
+     - Evaluation Metric (EvalMet): A composite metric combining RobR2, GMMFE, and DivI.
+
+     The class also provides a method to generate a report summarizing these metrics.
+
+     Attributes:
+         y (np.ndarray): The observed data (ground truth).
+         y_fit (np.ndarray): The fitted data (model predictions).
+         w (np.ndarray): Weights for the data points. Defaults to an array of ones if not provided.
+         robr2 (float): The computed Robust R-squared value. Initialized to None.
+         gmmfe (float): The computed Geometric Mean of Model Fit Error. Initialized to None.
+         divI (float): The computed Divergence Information value. Initialized to None.
+         evalmet (float): The computed Evaluation Metric. Initialized to None.
+         _report (dict): A dictionary containing the computed metrics. Initialized to an empty dictionary.
+
+     Methods:
+         __init__(y, y_fit, w=None, verbose=False):
+             Initializes the CriteriaEvaluator with observed data, fitted data, optional weights, and a verbosity flag.
+
+         _robr2():
+             Computes the Robust R-squared (RobR2) value. This metric measures the proportion of variance in the observed data
+             explained by the fitted data, with robustness to outliers.
+
+         _gmmfe():
+             Computes the Geometric Mean of Model Fit Error (GMMFE). This metric quantifies the average relative error between
+             the observed and fitted values on a logarithmic scale.
+
+         _divI():
+             Computes the Divergence Information (DivI). This metric measures the divergence between the distributions of the
+             observed and fitted values using gnostic characteristics.
+
+         _evalmet():
+             Computes the Evaluation Metric (EvalMet) as a composite measure combining RobR2, GMMFE, and DivI.
+
+         generate_report():
+             Generates a report summarizing all computed metrics (RobR2, GMMFE, DivI, and EvalMet) in a dictionary format.
+
+     Usage:
+         Example 1: Basic Usage
+         -----------------------
+         y = np.array([1.0, 2.0, 3.0, 4.0, 5.0])
+         y_fit = np.array([1.1, 1.9, 3.2, 3.8, 5.1])
+         evaluator = CriteriaEvaluator(y, y_fit)
+
+         robr2 = evaluator._robr2()
+         print("Robust R-squared:", robr2)
+
+         gmmfe = evaluator._gmmfe()
+         print("Geometric Mean of Model Fit Error:", gmmfe)
+
+         divI = evaluator._divI()
+         print("Divergence Information:", divI)
+
+         evalmet = evaluator._evalmet()
+         print("Evaluation Metric:", evalmet)
+
+         report = evaluator.generate_report()
+         print("Report:", report)
+
+         Example 2: Using Weights
+         ------------------------
+         y = np.array([1.0, 2.0, 3.0, 4.0, 5.0])
+         y_fit = np.array([1.1, 1.9, 3.2, 3.8, 5.1])
+         weights = np.array([1, 2, 1, 2, 1])
+         evaluator = CriteriaEvaluator(y, y_fit, w=weights)
+
+         robr2 = evaluator._robr2()
+         print("Weighted Robust R-squared:", robr2)
+
+         gmmfe = evaluator._gmmfe()
+         print("Weighted Geometric Mean of Model Fit Error:", gmmfe)
+
+         divI = evaluator._divI()
+         print("Weighted Divergence Information:", divI)
+
+         evalmet = evaluator._evalmet()
+         print("Weighted Evaluation Metric:", evalmet)
+
+         report = evaluator.generate_report()
+         print("Weighted Report:", report)
+
+     Notes:
+         - The class assumes that `y` and `y_fit` are non-negative and of the same shape.
+         - The methods `_robr2`, `_gmmfe`, `_divI`, and `_evalmet` are designed to be called internally, but they can be
+           invoked directly if needed.
+         - The `generate_report` method ensures that all metrics are computed before generating the report.
+     """
+     def __init__(self, y, y_fit, w=None, verbose: bool = False):
+         self.y = np.asarray(y)
+         self.y_fit = np.asarray(y_fit)
+         self.w = np.ones_like(self.y) if w is None else np.asarray(w)
+         self.robr2 = None
+         self.gmmfe = None
+         self.divI = None
+         self.evalmet = None
+         self._report = {}
+
+         # logger setup
+         self.logger = get_logger(self.__class__.__name__, logging.DEBUG if verbose else logging.WARNING)
+         self.logger.debug(f"{self.__class__.__name__} initialized:")
+
+     def _robr2(self):
+         """
+         Computes the Robust R-squared (RobR2) value.
+
+         This metric measures the proportion of variance in the observed data explained by the fitted data,
+         with robustness to outliers. It is calculated as:
+
+         RobR2 = 1 - (weighted variance of the residuals / weighted variance of the observed data)
+
+         Returns:
+             float: The computed Robust R-squared value. A value closer to 1 indicates a better fit.
+         """
+         self.logger.info("Calculating Robust R-squared (RobR2).")
+         e = self.y - self.y_fit
+         e_bar = np.sum(self.w * e) / np.sum(self.w)
+         y_bar = np.sum(self.w * self.y) / np.sum(self.w)
+         num = np.sum(self.w * (e - e_bar) ** 2)
+         denom = np.sum(self.w * (self.y - y_bar) ** 2)
+         self.robr2 = (1 - num / denom) if denom != 0 else 0.0
+         self.logger.info(f"Robust R-squared (RobR2) calculated: {self.robr2}")
+         return self.robr2
+
+     def _gmmfe(self):
+         """
+         Computes the Geometric Mean of Model Fit Error (GMMFE).
+
+         This metric quantifies the average relative error between the observed and fitted values on a logarithmic scale.
+         It is robust to outliers and provides a measure of the average multiplicative error.
+
+         Returns:
+             float: The computed GMMFE value. A value closer to 1 indicates a better fit.
+         """
+         self.logger.info("Calculating Geometric Mean of Model Fit Error (GMMFE).")
+         epsilon = 1e-10  # Small value to prevent division by zero
+         # avoid log failure
+         zz = self.y / (self.y_fit + epsilon)
+         zz = np.clip(zz, epsilon, None)  # Clip values to avoid invalid log
+         log_ratios = np.abs(np.log(zz))
+         # avoid exp failure
+         log_ratios = np.clip(log_ratios, None, 100)  # Clip values to avoid invalid exp
+         self.gmmfe = np.exp(np.mean(log_ratios))
+         self.logger.info(f"Geometric Mean of Model Fit Error (GMMFE) calculated: {self.gmmfe}")
+         return self.gmmfe
+
+     def _divI(self):
+         """
+         Computes the Divergence Information (DivI).
+
+         This metric measures the divergence between the distributions of the observed and fitted values using gnostic characteristics.
+         It involves calculating the gnostic characteristics of the observed and fitted data, and then computing the divergence
+         in their information content.
+
+         Returns:
+             float: The computed Divergence Information value. A lower value indicates less divergence and a better fit.
+         """
+         self.logger.info("Calculating Divergence Information (DivI).")
+         gcs_y = GnosticCharacteristicsSample(data=self.y)
+         gcs_y_fit = GnosticCharacteristicsSample(data=self.y_fit)
+
+         # y_median = gcs_y._gnostic_median(case='i').root
+         # y_fit_median = gcs_y_fit._gnostic_median(case='i').root
+
+         y_median = np.median(self.y)  # NOTE: using numpy median for simplicity
+         y_fit_median = np.median(self.y_fit)
+
+         zy = self.y / y_median
+         zf = self.y_fit / y_fit_median
+
+         gc_y = GnosticsCharacteristics(zy)
+         gc_y_fit = GnosticsCharacteristics(zf)
+
+         qy, q1y = gc_y._get_q_q1()
+         qf, q1f = gc_y_fit._get_q_q1()
+
+         hi = gc_y._hi(q=qy, q1=q1y)
+         hi_fit = gc_y_fit._hi(q=qf, q1=q1f)
+
+         pi = gc_y._idistfun(hi)
+         pi_fit = gc_y_fit._idistfun(hi_fit)
+
+         epsilon = 1e-10  # Small value to prevent log(0)
+         pi = np.clip(pi, epsilon, 1 - epsilon)  # Clip values to avoid invalid log
+         pi_fit = np.clip(pi_fit, epsilon, 1 - epsilon)  # Clip values to avoid invalid log
+
+         Iy = gc_y._info_i(pi)
+         Iy_fit = gc_y_fit._info_i(pi_fit)
+
+         self.divI = np.mean(Iy / Iy_fit)
+         self.logger.info(f"Divergence Information (DivI) calculated: {self.divI}")
+         return self.divI
+
+     def _evalmet(self):
+         """
+         Computes the Evaluation Metric (EvalMet).
+
+         This is a composite metric that combines Robust R-squared (RobR2), Geometric Mean of Model Fit Error (GMMFE),
+         and Divergence Information (DivI). It is calculated as:
+
+         EvalMet = RobR2 / (GMMFE * DivI)
+
+         Returns:
+             float: The computed Evaluation Metric. A higher value indicates a better overall fit.
+         """
+         self.logger.info("Calculating Evaluation Metric (EvalMet).")
+         if self.robr2 is None:
+             self._robr2()
+         if self.gmmfe is None:
+             self._gmmfe()
+         if self.divI is None:
+             self._divI()
+         self.evalmet = self.robr2 / (self.gmmfe * self.divI)
+         self.logger.info(f"Evaluation Metric (EvalMet) calculated: {self.evalmet}")
+         return self.evalmet
+
+     def generate_report(self):
+         """
+         Generates a report summarizing all computed metrics.
+
+         This method ensures that all metrics (RobR2, GMMFE, DivI, and EvalMet) are computed before generating the report.
+         The report is returned as a dictionary containing the metric names and their corresponding values.
+
+         Returns:
+             dict: A dictionary containing the computed metrics:
+                 - "RobR2": Robust R-squared value.
+                 - "GMMFE": Geometric Mean of Model Fit Error.
+                 - "DivI": Divergence Information.
+                 - "EvalMet": Evaluation Metric.
+         """
+         self.logger.info("Generating evaluation report.")
+         if self.robr2 is None:
+             self._robr2()
+         if self.gmmfe is None:
+             self._gmmfe()
+         if self.divI is None:
+             self._divI()
+         if self.evalmet is None:
+             self._evalmet()
+
+         self._report = {
+             "RobR2": self.robr2,
+             "GMMFE": self.gmmfe,
+             "DivI": self.divI,
+             "EvalMet": self.evalmet
+         }
+         self.logger.info("Evaluation report generated.")
+         return self._report
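
For orientation, criteria_eval.py reduces its composite criterion to EvalMet = RobR2 / (GMMFE * DivI): RobR2 rewards explained variance, while GMMFE and DivI penalize multiplicative error and information divergence, and both equal 1 for a perfect fit. The sketch below re-derives the RobR2 and GMMFE pieces with plain NumPy so the arithmetic can be checked independently of the package. The helper names rob_r2 and gmmfe are illustrative only and not part of the machinegnostics API; DivI is omitted because it depends on the package's internal gnostic characteristics.

import numpy as np

def rob_r2(y, y_fit, w=None):
    # Weighted variance of the residuals relative to the weighted variance of the observations.
    y, y_fit = np.asarray(y, dtype=float), np.asarray(y_fit, dtype=float)
    w = np.ones_like(y) if w is None else np.asarray(w, dtype=float)
    e = y - y_fit
    e_bar = np.sum(w * e) / np.sum(w)
    y_bar = np.sum(w * y) / np.sum(w)
    denom = np.sum(w * (y - y_bar) ** 2)
    return 0.0 if denom == 0 else 1.0 - np.sum(w * (e - e_bar) ** 2) / denom

def gmmfe(y, y_fit, eps=1e-10):
    # Exponentiated mean absolute log-ratio of observed to fitted values; 1.0 means a perfect fit.
    ratio = np.clip(np.asarray(y, dtype=float) / (np.asarray(y_fit, dtype=float) + eps), eps, None)
    return float(np.exp(np.mean(np.abs(np.log(ratio)))))

y = np.array([1.0, 2.0, 3.0, 4.0, 5.0])
y_fit = np.array([1.1, 1.9, 3.2, 3.8, 5.1])
print(rob_r2(y, y_fit), gmmfe(y, y_fit))  # both close to 1 for this near-perfect fit

With DivI computed by the package itself, the same inputs passed to CriteriaEvaluator(y, y_fit).generate_report() should reproduce these two values under the "RobR2" and "GMMFE" keys.
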
machinegnostics/magcal/criterion.py
@@ -0,0 +1,140 @@
+ '''
+ ManGo - Machine Gnostics Library
+ Copyright (C) 2025 ManGo Team
+
+ Author: Nirmal Parmar
+ '''
+ import numpy as np
+
+
+ class GnosticCriterion:
+     """
+     A class to compute Gnostic Error Functions for Machine Gnostics Regression.
+     Reference: Table 19.2, p. 19-4, in the provided reference.
+     """
+
+     @staticmethod
+     def _compute_error(case: str, f_j=None, f_i=None, h_j=None, h_i=None):
+         """
+         Compute the error function based on the specified case.
+
+         Args:
+             case (str): The case to compute the error for ('Q1', 'E1', 'Q2', 'E2', 'Q3', 'E3').
+             f_j (float): Filtering weight for J cases.
+             f_i (float): Filtering weight for I cases.
+             h_j (float): Error function input for J cases.
+             h_i (float): Error function input for I cases.
+
+         Returns:
+             float: The computed error function value.
+         """
+         if case == 'Q1':
+             if f_j is None:
+                 raise ValueError("f_j is required for case Q1")
+             return f_j  # h_j = f_j
+
+         elif case == 'E1':
+             if f_i is None:
+                 raise ValueError("f_i is required for case E1")
+             return f_i  # h_i = f_i
+
+         elif case == 'Q2':
+             if f_j is None or h_j is None:
+                 raise ValueError("f_j and h_j are required for case Q2")
+             return f_j * np.arctan(h_j)  # f_j * arctan(h_j)
+
+         elif case == 'E2':
+             if f_i is None or h_i is None:
+                 raise ValueError("f_i and h_i are required for case E2")
+             return f_i * np.arctanh(h_i)  # f_i * arctanh(h_i)
+
+         elif case == 'Q3':
+             if f_j is None or h_j is None:
+                 raise ValueError("f_j and h_j are required for case Q3")
+             return np.sqrt(f_j) * h_j  # sqrt(f_j) * h_j
+
+         elif case == 'E3':
+             if f_i is None or h_i is None:
+                 raise ValueError("f_i and h_i are required for case E3")
+             return np.sqrt(f_i) * h_i  # sqrt(f_i) * h_i
+
+         else:
+             raise ValueError(f"Invalid case: {case}. Valid cases are 'Q1', 'E1', 'Q2', 'E2', 'Q3', 'E3'.")
+
+     @staticmethod
+     def _get_filtering_weight(case: str, f_j=None, f_i=None):
+         """
+         Calculate the filtering weight based on the specified case.
+
+         Args:
+             case (str): The case to compute the filtering weight for ('Q1', 'E1', 'Q2', 'E2', 'Q3', 'E3').
+             f_j (float): Filtering weight for J cases.
+             f_i (float): Filtering weight for I cases.
+
+         Returns:
+             float: The computed filtering weight.
+         """
+         if case == 'Q1':
+             if f_j is None:
+                 raise ValueError("f_j is required for case Q1")
+             return f_j  # Filtering weight is f_j
+
+         elif case == 'E1':
+             if f_i is None:
+                 raise ValueError("f_i is required for case E1")
+             return f_i**2  # Filtering weight is f_i^2
+
+         elif case == 'Q2':
+             return 1  # Filtering weight is 1
+
+         elif case == 'E2':
+             if f_i is None:
+                 raise ValueError("f_i is required for case E2")
+             return f_i  # Filtering weight is f_i
+
+         elif case == 'Q3':
+             if f_j is None:
+                 raise ValueError("f_j is required for case Q3")
+             return 1 / np.sqrt(f_j)  # Filtering weight is 1 / sqrt(f_j)
+
+         elif case == 'E3':
+             if f_i is None:
+                 raise ValueError("f_i is required for case E3")
+             return 1 / np.sqrt(f_i)  # Filtering weight is 1 / sqrt(f_i)
+
+         else:
+             raise ValueError(f"Invalid case: {case}. Valid cases are 'Q1', 'E1', 'Q2', 'E2', 'Q3', 'E3'.")
+
+     @staticmethod
+     def _get_gnostic_criterion(case: str, f_j=None, f_i=None, h_j=None, h_i=None, Ii=None, Ij=None):
+         """
+         Get the gnostic criterion based on the specified case.
+
+         Args:
+             case (str): The case to compute the gnostic criterion for ('Q1', 'E1', 'Q2', 'E2', 'Q3', 'E3').
+             f_j (float): Filtering weight for J cases.
+             f_i (float): Filtering weight for I cases.
+             h_j (float): Error function input for J cases.
+             h_i (float): Error function input for I cases.
+             Ii (float): Estimating information.
+             Ij (float): Quantifying information.
+
+         Returns:
+             float: The computed gnostic criterion value.
+
+         """
+         if case == 'Q1':
+             return h_i**2 / 2
+         elif case == 'E1':
+             return h_j**2 / 2
+         elif case == 'Q2':
+             return Ij
+         elif case == 'E2':
+             return Ii
+         elif case == 'Q3':
+             return f_j
+         elif case == 'E3':
+             return -f_i
+         else:
+             raise ValueError(f"Invalid case: {case}. Valid cases are 'Q1', 'E1', 'Q2', 'E2', 'Q3', 'E3'.")
+
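
To make the case table in criterion.py concrete, the snippet below exercises the three static helpers for the 'Q2' and 'E2' rows with scalar inputs. The values chosen for f_j, f_i, h_j, and h_i are arbitrary illustrations (h_i must lie in (-1, 1) because the E2 error uses arctanh); in the package these quantities would come from the gnostic characteristics of a data sample, and the leading-underscore methods are internal helpers called here only for demonstration.

from machinegnostics.magcal.criterion import GnosticCriterion

f_j, f_i = 0.8, 0.9   # illustrative filtering weights
h_j, h_i = 0.5, 0.4   # illustrative error-function inputs

err_q2 = GnosticCriterion._compute_error('Q2', f_j=f_j, h_j=h_j)   # f_j * arctan(h_j)
err_e2 = GnosticCriterion._compute_error('E2', f_i=f_i, h_i=h_i)   # f_i * arctanh(h_i)

w_q2 = GnosticCriterion._get_filtering_weight('Q2')                # always 1
w_e2 = GnosticCriterion._get_filtering_weight('E2', f_i=f_i)       # equals f_i

crit_q2 = GnosticCriterion._get_gnostic_criterion('Q2', Ij=0.2)    # returns the quantifying information Ij
crit_e2 = GnosticCriterion._get_gnostic_criterion('E2', Ii=0.3)    # returns the estimating information Ii

print(err_q2, err_e2, w_q2, w_e2, crit_q2, crit_e2)

Passing an unrecognized case string to _compute_error or _get_filtering_weight raises a ValueError, so the six labels above are the complete set.
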