PyPI - sgptools - Versions diffs - 1.2.0__py3-none-any.whl → 2.0.0__py3-none-any.whl - Mend

sgptools 1.2.0py3-none-any.whl → 2.0.0py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (34) hide show

sgptools/__init__.py +3 -4
sgptools/core/__init__.py +1 -0
sgptools/{models/core → core}/augmented_gpr.py +11 -17
sgptools/{models/core → core}/augmented_sgpr.py +27 -34
sgptools/core/osgpr.py +417 -0
sgptools/core/transformations.py +699 -0
sgptools/kernels/__init__.py +0 -8
sgptools/kernels/attentive_kernel.py +214 -69
sgptools/kernels/neural_kernel.py +268 -92
sgptools/kernels/neural_network.py +127 -28
sgptools/methods.py +1047 -0
sgptools/objectives.py +275 -0
sgptools/utils/__init__.py +0 -9
sgptools/utils/data.py +452 -149
sgptools/utils/gpflow.py +335 -174
sgptools/utils/metrics.py +375 -102
sgptools/utils/misc.py +145 -111
sgptools/utils/tsp.py +224 -84
sgptools-2.0.0.dist-info/METADATA +216 -0
sgptools-2.0.0.dist-info/RECORD +23 -0
{sgptools-1.2.0.dist-info → sgptools-2.0.0.dist-info}/WHEEL +1 -1
sgptools/models/__init__.py +0 -10
sgptools/models/bo.py +0 -118
sgptools/models/cma_es.py +0 -121
sgptools/models/continuous_sgp.py +0 -68
sgptools/models/core/__init__.py +0 -9
sgptools/models/core/osgpr.py +0 -291
sgptools/models/core/transformations.py +0 -434
sgptools/models/greedy_mi.py +0 -115
sgptools/models/greedy_sgp.py +0 -97
sgptools-1.2.0.dist-info/METADATA +0 -39
sgptools-1.2.0.dist-info/RECORD +0 -27
{sgptools-1.2.0.dist-info → sgptools-2.0.0.dist-info/licenses}/LICENSE.txt +0 -0
{sgptools-1.2.0.dist-info → sgptools-2.0.0.dist-info}/top_level.txt +0 -0

sgptools/objectives.py ADDED Viewed

@@ -0,0 +1,275 @@
+import tensorflow as tf
+import numpy as np
+import gpflow
+from typing import Type, Any, Dict
+def jitter_fn(cov: tf.Tensor, jitter: float = 1e-6) -> tf.Tensor:
+    """
+    Adds a small positive value (jitter) to the diagonal of a covariance matrix
+    for numerical stability. This prevents issues with ill-conditioned matrices
+    during computations like Cholesky decomposition or determinant calculation.
+    Args:
+        cov (tf.Tensor): The input covariance matrix. Expected to be a square matrix.
+        jitter (float): The small positive value to add to the diagonal. Defaults to 1e-6.
+    Returns:
+        tf.Tensor: The covariance matrix with jitter added to its diagonal.
+    Usage:
+        ```python
+        # Example covariance matrix
+        cov_matrix = tf.constant([[1.0, 0.5], [0.5, 1.0]], dtype=tf.float64)
+        # Add default jitter
+        jittered_cov = jitter_fn(cov_matrix)
+        # Add custom jitter
+        custom_jittered_cov = jitter_fn(cov_matrix, jitter=1e-5)
+        ```
+    """
+    cov = tf.linalg.set_diag(cov, tf.linalg.diag_part(cov) + jitter)
+    return cov
+class Objective:
+    """
+    Base class for objective functions used in optimization.
+    Subclasses must implement the `__call__` method to define the objective.
+    """
+    def __init__(self, X_objective: np.ndarray, kernel: gpflow.kernels.Kernel,
+                 noise_variance: float, **kwargs: Any):
+        """
+        Initializes the base objective. This constructor primarily serves to define
+        the expected parameters for all objective subclasses.
+        Args:
+            X_objective (np.ndarray): The input data points that define the context or
+                                      environment for which the objective is calculated.
+                                      Shape: (N, D) where N is number of points, D is dimension.
+            kernel (gpflow.kernels.Kernel): The GPflow kernel function used in the objective.
+            noise_variance (float): The observed data noise variance.
+            **kwargs: Arbitrary keyword arguments.
+        """
+        pass
+    def __call__(self, X: tf.Tensor) -> tf.Tensor:
+        """
+        Computes the objective value for a given set of input points `X`.
+        This method must be implemented by subclasses.
+        Args:
+            X (tf.Tensor): The input points for which the objective is to be computed.
+                           Shape: (M, D) where M is number of points, D is dimension.
+        Returns:
+            tf.Tensor: The computed objective value.
+        Raises:
+            NotImplementedError: If the method is not implemented by a subclass.
+        """
+        raise NotImplementedError
+    def update(self, kernel: gpflow.kernels.Kernel,
+               noise_variance: float) -> None:
+        """
+        Updates the kernel and noise variance parameters used by the objective function.
+        This method should be overridden by subclasses if they maintain internal state
+        that needs updating (e.g., cached kernel matrices or jitter values).
+        Args:
+            kernel (gpflow.kernels.Kernel): The updated GPflow kernel function.
+            noise_variance (float): The updated data noise variance.
+        """
+        pass
+class MI(Objective):
+    """
+    Computes the Mutual Information (MI) between a fixed set of objective points
+    (`X_objective`) and a variable set of input points (`X`).
+    MI is calculated as:
+    $MI(X; X_{objective}) = log|K(X,X)| + log|K(X_{objective},X_{objective})| - log|K(X \cup X_{objective}, X \cup X_{objective})|$
+    Jitter is added to the diagonal of the covariance matrices to ensure numerical stability.
+    """
+    def __init__(self,
+                 X_objective: np.ndarray,
+                 kernel: gpflow.kernels.Kernel,
+                 noise_variance: float,
+                 jitter: float = 1e-6,
+                 **kwargs: Any):
+        """
+        Initializes the Mutual Information (MI) objective.
+        Args:
+            X_objective (np.ndarray): The fixed set of data points (e.g., candidate locations
+                                      or training data points) against which MI is computed.
+                                      Shape: (N, D).
+            kernel (gpflow.kernels.Kernel): The GPflow kernel function to compute covariances.
+            noise_variance (float): The observed data noise variance, which is added to the jitter.
+            jitter (float): A small positive value to add for numerical stability to covariance
+                            matrix diagonals. Defaults to 1e-6.
+            **kwargs: Arbitrary keyword arguments.
+        """
+        self.X_objective = tf.constant(X_objective, dtype=tf.float64)
+        self.kernel = kernel
+        self.noise_variance = noise_variance
+        # Total jitter includes the noise variance
+        self._base_jitter = jitter
+        self.jitter_fn = lambda cov: jitter_fn(
+            cov, jitter=self._base_jitter + self.noise_variance)
+    def __call__(self, X: tf.Tensor) -> tf.Tensor:
+        """
+        Computes the Mutual Information for the given input points `X`.
+        Args:
+            X (tf.Tensor): The input points (e.g., sensing locations) for which
+                           MI is to be computed. Shape: (M, D).
+        Returns:
+            tf.Tensor: The computed Mutual Information value.
+        Usage:
+            ```python
+            import gpflow
+            import numpy as np
+            # Assume X_objective and kernel are defined
+            # X_objective = np.random.rand(100, 2)
+            # kernel = gpflow.kernels.SquaredExponential()
+            # noise_variance = 0.1
+            mi_objective = MI(X_objective=X_objective, kernel=kernel, noise_variance=noise_variance)
+            X_sensing = tf.constant(np.random.rand(10, 2), dtype=tf.float64)
+            mi_value = mi_objective(X_sensing)
+            ```
+        """
+        # K(X_objective, X_objective)
+        K_obj_obj = self.kernel(self.X_objective)
+        # K(X, X)
+        K_X_X = self.kernel(X)
+        # K(X_objective U X, X_objective U X)
+        K_combined = self.kernel(tf.concat([self.X_objective, X], axis=0))
+        # Compute log determinants
+        logdet_K_obj_obj = tf.math.log(tf.linalg.det(
+            self.jitter_fn(K_obj_obj)))
+        logdet_K_X_X = tf.math.log(tf.linalg.det(self.jitter_fn(K_X_X)))
+        logdet_K_combined = tf.math.log(
+            tf.linalg.det(self.jitter_fn(K_combined)))
+        # MI formula
+        mi = logdet_K_obj_obj + logdet_K_X_X - logdet_K_combined
+        return mi
+    def update(self, kernel: gpflow.kernels.Kernel,
+               noise_variance: float) -> None:
+        """
+        Updates the kernel and noise variance for the MI objective.
+        This method is crucial for optimizing the GP hyperparameters externally
+        and having the objective function reflect those changes.
+        Args:
+            kernel (gpflow.kernels.Kernel): The updated GPflow kernel function.
+            noise_variance (float): The updated data noise variance.
+        """
+        # Update kernel's trainable variables (e.g., lengthscales, variance)
+        for self_var, var in zip(self.kernel.trainable_variables,
+                                 kernel.trainable_variables):
+            self_var.assign(var)
+        self.noise_variance = noise_variance
+        # Update the jitter function to reflect the new noise variance
+        self.jitter_fn = lambda cov: jitter_fn(
+            cov, jitter=self._base_jitter + self.noise_variance)
+class SLogMI(MI):
+    """
+    Computes the Mutual Information (MI) using `tf.linalg.slogdet` for numerical stability,
+    especially for large or ill-conditioned covariance matrices.
+    The slogdet (sign and log determinant) method computes the sign and the natural
+    logarithm of the absolute value of the determinant of a square matrix.
+    This is more numerically stable than computing the determinant directly and then
+    taking the logarithm, as `tf.linalg.det` can return very small or very large
+    numbers that lead to underflow/overflow when `tf.math.log` is applied.
+    Jitter is also added to the diagonal for additional numerical stability.
+    """
+    def __call__(self, X: tf.Tensor) -> tf.Tensor:
+        """
+        Computes the Mutual Information for the given input points `X` using `tf.linalg.slogdet`.
+        Args:
+            X (tf.Tensor): The input points (e.g., sensing locations) for which
+                           MI is to be computed. Shape: (M, D).
+        Returns:
+            tf.Tensor: The computed Mutual Information value.
+        Usage:
+            ```python
+            import gpflow
+            import numpy as np
+            # Assume X_objective and kernel are defined
+            # X_objective = np.random.rand(100, 2)
+            # kernel = gpflow.kernels.SquaredExponential()
+            # noise_variance = 0.1
+            slogmi_objective = SLogMI(X_objective=X_objective, kernel=kernel, noise_variance=noise_variance)
+            X_sensing = tf.constant(np.random.rand(10, 2), dtype=tf.float64)
+            mi_value = slogmi_objective(X_sensing)
+            ```
+        """
+        # K(X_objective, X_objective)
+        K_obj_obj = self.kernel(self.X_objective)
+        # K(X, X)
+        K_X_X = self.kernel(X)
+        # K(X_objective U X, X_objective U X)
+        K_combined = self.kernel(tf.concat([self.X_objective, X], axis=0))
+        # Compute log determinants using slogdet for numerical stability
+        _, logdet_K_obj_obj = tf.linalg.slogdet(self.jitter_fn(K_obj_obj))
+        _, logdet_K_X_X = tf.linalg.slogdet(self.jitter_fn(K_X_X))
+        _, logdet_K_combined = tf.linalg.slogdet(self.jitter_fn(K_combined))
+        # MI formula
+        mi = logdet_K_obj_obj + logdet_K_X_X - logdet_K_combined
+        return mi
+OBJECTIVES: Dict[str, Type[Objective]] = {
+    'MI': MI,
+    'SLogMI': SLogMI,
+}
+def get_objective(objective_name: str) -> Type[Objective]:
+    """
+    Retrieves an objective function class by its string name.
+    Args:
+        objective_name (str): The name of the objective function (e.g., 'MI', 'SLogMI').
+    Returns:
+        Type[Objective]: The class of the requested objective function.
+    Raises:
+        KeyError: If the objective name is not found in the registered OBJECTIVES.
+    Usage:
+        ```python
+        # Get the Mutual Information objective class
+        MIObjectiveClass = get_objective('MI')
+        # You can then instantiate it:
+        # mi_instance = MIObjectiveClass(X_objective=..., kernel=..., noise_variance=...)
+        ```
+    """
+    return OBJECTIVES[objective_name]

sgptools/utils/__init__.py CHANGED Viewed

@@ -1,10 +1 @@
 # sgptools/utils/__init__.py
-"""General utilities to support the functionalities of this package:
-- `data`: Provides utilities to preprocess datasets
-- `gpflow`: Provides utilities to interface with GPflow
-- `metrics`: Provides utilities to quantify the solution quality
-- `misc`: Provides miscellaneous helper functions
-- `tsp`: Provides utilities to run TSP/VRP solver
-"""

sgptools 1.2.0__py3-none-any.whl → 2.0.0__py3-none-any.whl

sgptools 1.2.0py3-none-any.whl → 2.0.0py3-none-any.whl