PyPI - pcntoolkit - Versions diffs - 0.32.0__py3-none-any.whl - Mend

pcntoolkit 0.32.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (37) hide show

pcntoolkit/__init__.py +4 -0
pcntoolkit/configs.py +9 -0
pcntoolkit/dataio/__init__.py +1 -0
pcntoolkit/dataio/fileio.py +608 -0
pcntoolkit/model/KnuOp.py +48 -0
pcntoolkit/model/NP.py +88 -0
pcntoolkit/model/NPR.py +86 -0
pcntoolkit/model/SHASH.py +509 -0
pcntoolkit/model/__init__.py +6 -0
pcntoolkit/model/architecture.py +219 -0
pcntoolkit/model/bayesreg.py +585 -0
pcntoolkit/model/core.21290 +0 -0
pcntoolkit/model/gp.py +489 -0
pcntoolkit/model/hbr.py +1584 -0
pcntoolkit/model/rfa.py +245 -0
pcntoolkit/normative.py +1647 -0
pcntoolkit/normative_NP.py +336 -0
pcntoolkit/normative_model/__init__.py +6 -0
pcntoolkit/normative_model/norm_base.py +62 -0
pcntoolkit/normative_model/norm_blr.py +303 -0
pcntoolkit/normative_model/norm_gpr.py +112 -0
pcntoolkit/normative_model/norm_hbr.py +752 -0
pcntoolkit/normative_model/norm_np.py +333 -0
pcntoolkit/normative_model/norm_rfa.py +109 -0
pcntoolkit/normative_model/norm_utils.py +29 -0
pcntoolkit/normative_parallel.py +1420 -0
pcntoolkit/regression_model/blr/warp.py +1 -0
pcntoolkit/trendsurf.py +315 -0
pcntoolkit/util/__init__.py +1 -0
pcntoolkit/util/bspline.py +149 -0
pcntoolkit/util/hbr_utils.py +242 -0
pcntoolkit/util/utils.py +1698 -0
pcntoolkit-0.32.0.dist-info/LICENSE +674 -0
pcntoolkit-0.32.0.dist-info/METADATA +134 -0
pcntoolkit-0.32.0.dist-info/RECORD +37 -0
pcntoolkit-0.32.0.dist-info/WHEEL +4 -0
pcntoolkit-0.32.0.dist-info/entry_points.txt +5 -0

pcntoolkit/normative_model/norm_blr.py ADDED Viewed

@@ -0,0 +1,303 @@
+from __future__ import print_function
+from __future__ import division
+import os
+import sys
+import numpy as np
+import pandas as pd
+from ast import literal_eval
+try:  # run as a package if installed
+    from pcntoolkit.model.bayesreg import BLR
+    from pcntoolkit.normative_model.norm_base import NormBase
+    from pcntoolkit.dataio import fileio
+    from pcntoolkit.util.utils import create_poly_basis, WarpBoxCox, \
+        WarpAffine, WarpCompose, WarpSinArcsinh
+except ImportError:
+    pass
+    path = os.path.abspath(os.path.dirname(__file__))
+    if path not in sys.path:
+        sys.path.append(path)
+    del path
+    from model.bayesreg import BLR
+    from norm_base import NormBase
+    from dataio import fileio
+    from util.utils import create_poly_basis, WarpBoxCox, \
+        WarpAffine, WarpCompose, WarpSinArcsinh
+class NormBLR(NormBase):
+    """ Normative modelling based on Bayesian Linear Regression
+    """
+    def __init__(self,  **kwargs):
+        """
+        Initialize the NormBLR object.
+        This function initializes the NormBLR object with the given arguments. It requires a data matrix 'X' and optionally takes a target 'y' and parameters 'theta'.
+        It also configures the model order and heteroskedastic noise if specified in the arguments.
+        :param kwargs: Keyword arguments which should include:
+            - 'X': Data matrix. Must be specified.
+            - 'y': Target values. Optional.
+            - 'theta': Parameters for the model. Optional.
+            - 'optimizer': The optimization algorithm to use. Default is 'powell'.
+            - 'configparam' or 'model_order': The order of the model. Default is 1.
+            - 'varcovfile': File containing the variance-covariance matrix for heteroskedastic noise. Optional.
+        :raises ValueError: If 'X' is not specified in kwargs.
+        """
+        X = kwargs.pop('X', None)
+        y = kwargs.pop('y', None)
+        theta = kwargs.pop('theta', None)
+        if isinstance(theta, str):
+            theta = np.array(literal_eval(theta))
+        self.optim_alg = kwargs.get('optimizer', 'powell')
+        if X is None:
+            raise ValueError("Data matrix must be specified")
+        if len(X.shape) == 1:
+            self.D = 1
+        else:
+            self.D = X.shape[1]
+        # Parse model order
+        if kwargs is None:
+            model_order = 1
+        elif 'configparam' in kwargs:  # deprecated syntax
+            model_order = kwargs.pop('configparam')
+        elif 'model_order' in kwargs:
+            model_order = kwargs.pop('model_order')
+        else:
+            model_order = 1
+        # Force a default model order and check datatype
+        if model_order is None:
+            model_order = 1
+        if type(model_order) is not int:
+            model_order = int(model_order)
+        # configure heteroskedastic noise
+        if 'varcovfile' in kwargs:
+            var_cov_file = kwargs.get('varcovfile')
+            if var_cov_file.endswith('.pkl'):
+                self.var_covariates = pd.read_pickle(var_cov_file)
+            else:
+                self.var_covariates = np.loadtxt(var_cov_file)
+            if len(self.var_covariates.shape) == 1:
+                self.var_covariates = self.var_covariates[:, np.newaxis]
+            n_beta = self.var_covariates.shape[1]
+            self.var_groups = None
+        elif 'vargroupfile' in kwargs:
+            # configure variance groups (e.g. site specific variance)
+            var_groups_file = kwargs.pop('vargroupfile')
+            if var_groups_file.endswith('.pkl'):
+                self.var_groups = pd.read_pickle(var_groups_file)
+            else:
+                self.var_groups = np.loadtxt(var_groups_file)
+            var_ids = set(self.var_groups)
+            var_ids = sorted(list(var_ids))
+            n_beta = len(var_ids)
+        else:
+            self.var_groups = None
+            self.var_covariates = None
+            n_beta = 1
+        # are we using ARD?
+        if 'use_ard' in kwargs:
+            self.use_ard = kwargs.pop('use_ard')
+        else:
+            self.use_ard = False
+        if self.use_ard:
+            n_alpha = self.D * model_order
+        else:
+            n_alpha = 1
+        # Configure warped likelihood
+        if 'warp' in kwargs:
+            warp_str = kwargs.pop('warp')
+            if warp_str is None:
+                self.warp = None
+                n_gamma = 0
+            else:
+                # set up warp
+                exec('self.warp =' + warp_str + '()')
+                n_gamma = self.warp.get_n_params()
+        else:
+            self.warp = None
+            n_gamma = 0
+        self._n_params = n_alpha + n_beta + n_gamma
+        self._model_order = model_order
+        print("configuring BLR ( order", model_order, ")")
+        if (theta is None) or (len(theta) != self._n_params):
+            print("Using default hyperparameters")
+            self.theta0 = np.zeros(self._n_params)
+        else:
+            self.theta0 = theta
+        self.theta = self.theta0
+        # initialise the BLR object if the required parameters are present
+        if (theta is not None) and (y is not None):
+            Phi = create_poly_basis(X, self._model_order)
+            self.blr = BLR(theta=theta, X=Phi, y=y,
+                           warp=self.warp, **kwargs)
+        else:
+            self.blr = BLR(**kwargs)
+    @property
+    def n_params(self):
+        return self._n_params
+    @property
+    def neg_log_lik(self):
+        return self.blr.nlZ
+    def estimate(self, X, y, **kwargs):
+        """
+        Estimate the parameters of the model.
+        This function estimates the parameters of the model given the data matrix 'X' and target 'y'.
+        If 'theta' is provided in kwargs, it is used as the initial guess for the parameters.
+        Otherwise, the initial guess is set to the current value of 'self.theta'.
+        :param X: Data matrix.
+        :param y: Target values.
+        :param kwargs: Keyword arguments which may include:
+            - 'theta': Initial guess for the parameters. Optional.
+            - 'warp': String representing the warp function. It is removed from kwargs before passing to the BLR object.
+        :return: The instance of the NormBLR object.
+        """
+        theta = kwargs.pop('theta', None)
+        if isinstance(theta, str):
+            theta = np.array(literal_eval(theta))
+        # remove warp string to prevent it being passed to the blr object
+        kwargs.pop('warp', None)
+        Phi = create_poly_basis(X, self._model_order)
+        if len(y.shape) > 1:
+            y = y.ravel()
+        if theta is None:
+            theta = self.theta0
+            # (re-)initialize BLR object because parameters were not specified
+            self.blr = BLR(theta=theta, X=Phi, y=y,
+                           var_groups=self.var_groups,
+                           warp=self.warp, **kwargs)
+        self.theta = self.blr.estimate(theta, Phi, y,
+                                       var_covariates=self.var_covariates, **kwargs)
+        return self
+    def predict(self, Xs, X=None, y=None, **kwargs):
+        """
+        Predict the target values for the given test data.
+        This function predicts the target values for the given test data 'Xs' using the estimated parameters of the model.
+        If 'X' and 'y' are provided, they are used to update the model before prediction.
+        :param Xs: Test data matrix.
+        :param X: Training data matrix. Optional.
+        :param y: Training target values. Optional.
+        :param kwargs: Keyword arguments which may include:
+            - 'testvargroup': Variance groups for the test data. Optional.
+            - 'testvargroupfile': File containing the variance groups for the test data. Optional.
+            - 'testvarcov': Variance covariates for the test data. Optional.
+            - 'testvarcovfile': File containing the variance covariates for the test data. Optional.
+            - 'adaptresp': Responses to adapt to. Optional.
+            - 'adaptrespfile': File containing the responses to adapt to. Optional.
+            - 'adaptcov': Covariates to adapt to. Optional.
+            - 'adaptcovfile': File containing the covariates to adapt to. Optional.
+            - 'adaptvargroup': Variance groups to adapt to. Optional.
+            - 'adaptvargroupfile': File containing the variance groups to adapt to. Optional.
+        :return: The predicted target values for the test data.
+        """
+        theta = self.theta  # always use the estimated coefficients
+        # remove from kwargs to avoid downstream problems
+        kwargs.pop('theta', None)
+        Phis = create_poly_basis(Xs, self._model_order)
+        if X is None:
+            Phi = None
+        else:
+            Phi = create_poly_basis(X, self._model_order)
+        # process variance groups for the test data
+        if 'testvargroup' in kwargs:
+            var_groups_te = kwargs.pop('testvargroup')
+        else:
+            if 'testvargroupfile' in kwargs:
+                var_groups_test_file = kwargs.pop('testvargroupfile')
+                if var_groups_test_file.endswith('.pkl'):
+                    var_groups_te = pd.read_pickle(var_groups_test_file)
+                else:
+                    var_groups_te = np.loadtxt(var_groups_test_file)
+            else:
+                var_groups_te = None
+        # process test variance covariates
+        if 'testvarcov' in kwargs:
+            var_cov_te = kwargs.pop('testvarcov')
+        else:
+            if 'testvarcovfile' in kwargs:
+                var_cov_test_file = kwargs.get('testvarcovfile')
+                if var_cov_test_file.endswith('.pkl'):
+                    var_cov_te = pd.read_pickle(var_cov_test_file)
+                else:
+                    var_cov_te = np.loadtxt(var_cov_test_file)
+            else:
+                var_cov_te = None
+        # do we want to adjust the responses?
+        if 'adaptresp' in kwargs:
+            y_adapt = kwargs.pop('adaptresp')
+        else:
+            if 'adaptrespfile' in kwargs:
+                y_adapt = fileio.load(kwargs.pop('adaptrespfile'))
+                if len(y_adapt.shape) == 1:
+                    y_adapt = y_adapt[:, np.newaxis]
+            else:
+                y_adapt = None
+        if 'adaptcov' in kwargs:
+            X_adapt = kwargs.pop('adaptcov')
+            Phi_adapt = create_poly_basis(X_adapt, self._model_order)
+        else:
+            if 'adaptcovfile' in kwargs:
+                X_adapt = fileio.load(kwargs.pop('adaptcovfile'))
+                Phi_adapt = create_poly_basis(X_adapt, self._model_order)
+            else:
+                Phi_adapt = None
+        if 'adaptvargroup' in kwargs:
+            var_groups_ad = kwargs.pop('adaptvargroup')
+        else:
+            if 'adaptvargroupfile' in kwargs:
+                var_groups_adapt_file = kwargs.pop('adaptvargroupfile')
+                if var_groups_adapt_file.endswith('.pkl'):
+                    var_groups_ad = pd.read_pickle(var_groups_adapt_file)
+                else:
+                    var_groups_ad = np.loadtxt(var_groups_adapt_file)
+            else:
+                var_groups_ad = None
+        if y_adapt is None:
+            yhat, s2 = self.blr.predict(theta, Phi, y, Phis,
+                                        var_groups_test=var_groups_te,
+                                        var_covariates_test=var_cov_te,
+                                        **kwargs)
+        else:
+            yhat, s2 = self.blr.predict_and_adjust(theta, Phi_adapt, y_adapt, Phis,
+                                                   var_groups_test=var_groups_te,
+                                                   var_groups_adapt=var_groups_ad,
+                                                   **kwargs)
+        return yhat, s2

pcntoolkit/normative_model/norm_gpr.py ADDED Viewed

@@ -0,0 +1,112 @@
+from __future__ import print_function
+from __future__ import division
+import os
+import sys
+import numpy as np
+try:  # run as a package if installed
+    from pcntoolkit.model.gp import GPR, CovSum
+    from pcntoolkit.normative_model.norm_base import NormBase
+except ImportError:
+    pass
+    path = os.path.abspath(os.path.dirname(__file__))
+    if path not in sys.path:
+        sys.path.append(path)
+    del path
+    from model.gp import GPR, CovSum
+    from norm_base import NormBase
+class NormGPR(NormBase):
+    """ Classical GPR-based normative modelling approach
+    """
+    def __init__(self, **kwargs):  # X=None, y=None, theta=None,
+        """
+        Initialize the NormGPR object.
+        This function initializes the NormGPR object with the given arguments. It requires a data matrix 'X' and optionally takes a target 'y' and parameters 'theta'.
+        It also initializes the covariance function and the Gaussian Process Regression (GPR) model.
+        :param kwargs: Keyword arguments which should include:
+            - 'X': Data matrix. Must be specified.
+            - 'y': Target values. Optional.
+            - 'theta': Parameters for the model. Optional.
+        """
+        X = kwargs.pop('X', None)
+        y = kwargs.pop('y', None)
+        theta = kwargs.pop('theta', None)
+        self.covfunc = CovSum(X, ('CovLin', 'CovSqExpARD'))
+        self.theta0 = np.zeros(self.covfunc.get_n_params() + 1)
+        self.theta = self.theta0
+        if (theta is not None) and (X is not None) and (y is not None):
+            self.gpr = GPR(theta, self.covfunc, X, y)
+            self._n_params = self.covfunc.get_n_params() + 1
+        else:
+            self.gpr = GPR()
+    @property
+    def n_params(self):
+        if not hasattr(self, '_n_params'):
+            self._n_params = self.covfunc.get_n_params() + 1
+        return self._n_params
+    @property
+    def neg_log_lik(self):
+        return self.gpr.nlZ
+    def estimate(self, X, y, **kwargs):
+        """
+        Estimate the parameters of the Gaussian Process Regression model.
+        This function estimates the parameters of the Gaussian Process Regression (GPR) model given the data matrix 'X' and target 'y'.
+        If 'theta' is provided in kwargs, it is used as the initial guess for the parameters.
+        Otherwise, the initial guess is set to the current value of 'self.theta0'.
+        :param X: Data matrix.
+        :param y: Target values.
+        :param kwargs: Keyword arguments which may include:
+            - 'theta': Initial guess for the parameters. Optional.
+        :return: The instance of the NormGPR object.
+        """
+        theta = kwargs.pop('theta', None)
+        if theta is None:
+            theta = self.theta0
+            self.gpr = GPR(theta, self.covfunc, X, y)
+        self.theta = self.gpr.estimate(theta, self.covfunc, X, y)
+        return self
+    def predict(self, Xs, X, y, **kwargs):
+        """
+        Predict the target values for the given test data.
+        This function predicts the target values for the given test data 'Xs' using the estimated parameters of the Gaussian Process Regression (GPR) model.
+        If 'X' and 'y' are provided, they are used to update the model before prediction.
+        If 'theta' is provided in kwargs, it is used as the parameters for prediction.
+        Otherwise, the current value of 'self.theta' is used.
+        :param Xs: Test data matrix.
+        :param X: Training data matrix. Optional.
+        :param y: Training target values. Optional.
+        :param kwargs: Keyword arguments which may include:
+            - 'theta': Parameters for prediction. Optional.
+        :return: A tuple containing the predicted target values and the marginal variances for the test data.
+        """
+        theta = kwargs.pop('theta', None)
+        if theta is None:
+            theta = self.theta
+        yhat, s2 = self.gpr.predict(theta, X, y, Xs)
+        # only return the marginal variances
+        if len(s2.shape) == 2:
+            s2 = np.diag(s2)
+        return yhat, s2