PyPI - ennbo - Versions diffs - 0.1.0__py3-none-any.whl → 0.1.2__py3-none-any.whl - Mend

ennbo 0.1.0__py3-none-any.whl → 0.1.2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (24)

enn/enn/enn.py +71 -31
enn/enn/enn_fit.py +26 -24
enn/enn/enn_normal.py +3 -2
enn/enn/enn_params.py +13 -0
enn/enn/enn_util.py +40 -12
enn/turbo/base_turbo_impl.py +53 -7
enn/turbo/lhd_only_impl.py +7 -0
enn/turbo/morbo_trust_region.py +189 -0
enn/turbo/no_trust_region.py +65 -0
enn/turbo/proposal.py +11 -2
enn/turbo/turbo_config.py +48 -4
enn/turbo/turbo_enn_impl.py +46 -21
enn/turbo/turbo_gp.py +9 -1
enn/turbo/turbo_mode_impl.py +11 -2
enn/turbo/turbo_one_impl.py +163 -24
enn/turbo/turbo_optimizer.py +246 -58
enn/turbo/turbo_trust_region.py +8 -10
enn/turbo/turbo_utils.py +116 -26
enn/turbo/turbo_zero_impl.py +5 -0
{ennbo-0.1.0.dist-info → ennbo-0.1.2.dist-info}/METADATA +5 -4
ennbo-0.1.2.dist-info/RECORD +29 -0
ennbo-0.1.0.dist-info/RECORD +0 -27
{ennbo-0.1.0.dist-info → ennbo-0.1.2.dist-info}/WHEEL +0 -0
{ennbo-0.1.0.dist-info → ennbo-0.1.2.dist-info}/licenses/LICENSE +0 -0

enn/turbo/turbo_one_impl.py CHANGED Viewed

@@ -7,33 +7,85 @@ if TYPE_CHECKING:
     from numpy.random import Generator
 from .base_turbo_impl import BaseTurboImpl
-from .turbo_config import TurboConfig
+from .turbo_config import TurboOneConfig
 from .turbo_utils import gp_thompson_sample
 class TurboOneImpl(BaseTurboImpl):
-    def __init__(self, config: TurboConfig) -> None:
+    def __init__(self, config: TurboOneConfig) -> None:
         super().__init__(config)
         self._gp_model: Any | None = None
-        self._gp_y_mean: float = 0.0
-        self._gp_y_std: float = 1.0
+        self._gp_y_mean: float | Any = 0.0
+        self._gp_y_std: float | Any = 1.0
         self._fitted_n_obs: int = 0
+    def _as_2d(self, a: np.ndarray) -> np.ndarray:
+        import numpy as np
+        a = np.asarray(a, dtype=float)
+        if a.ndim == 1:
+            return a.reshape(-1, 1)
+        if a.ndim == 2:
+            return a.T
+        raise ValueError(a.shape)
+    def _broadcast_gp_mean_std(self, num_metrics: int) -> tuple[np.ndarray, np.ndarray]:
+        import numpy as np
+        num_metrics = int(num_metrics)
+        if num_metrics <= 0:
+            raise ValueError(num_metrics)
+        gp_y_mean = np.asarray(self._gp_y_mean, dtype=float).reshape(-1)
+        gp_y_std = np.asarray(self._gp_y_std, dtype=float).reshape(-1)
+        if gp_y_mean.size == 1 and num_metrics != 1:
+            gp_y_mean = np.full(num_metrics, float(gp_y_mean[0]), dtype=float)
+        if gp_y_std.size == 1 and num_metrics != 1:
+            gp_y_std = np.full(num_metrics, float(gp_y_std[0]), dtype=float)
+        if gp_y_mean.shape != (num_metrics,) or gp_y_std.shape != (num_metrics,):
+            raise ValueError((gp_y_mean.shape, gp_y_std.shape, num_metrics))
+        return gp_y_mean, gp_y_std
+    def _unstandardize(self, y_std_2d: np.ndarray) -> np.ndarray:
+        import numpy as np
+        y_std_2d = np.asarray(y_std_2d, dtype=float)
+        if y_std_2d.ndim != 2:
+            raise ValueError(y_std_2d.shape)
+        num_metrics = int(y_std_2d.shape[1])
+        gp_y_mean, gp_y_std = self._broadcast_gp_mean_std(num_metrics)
+        return gp_y_mean.reshape(1, -1) + gp_y_std.reshape(1, -1) * y_std_2d
     def get_x_center(
         self,
         x_obs_list: list,
         y_obs_list: list,
         rng: Generator,
+        tr_state: Any = None,
     ) -> np.ndarray | None:
         import numpy as np
         import torch
+        import warnings
         from .turbo_utils import argmax_random_tie
         if len(y_obs_list) == 0:
             return None
         if self._gp_model is None:
-            return super().get_x_center(x_obs_list, y_obs_list, rng)
+            if len(y_obs_list) <= 1:
+                x_array = np.asarray(x_obs_list, dtype=float)
+                y_array = np.asarray(y_obs_list, dtype=float)
+                if y_array.ndim == 2:
+                    if self._config.tr_type == "morbo" and tr_state is not None:
+                        scores = tr_state.scalarize(y_array, clip=True)
+                    else:
+                        scores = y_array[:, 0]
+                    best_idx = argmax_random_tie(scores, rng=rng)
+                    return x_array[best_idx]
+                return super().get_x_center(x_obs_list, y_obs_list, rng, tr_state)
+            raise RuntimeError(
+                "TurboOneImpl.get_x_center requires a fitted GP model for 2+ observations; "
+                "call prepare_ask() first."
+            )
         if self._fitted_n_obs != len(x_obs_list):
             raise RuntimeError(
                 f"GP fitted on {self._fitted_n_obs} obs but get_x_center called with {len(x_obs_list)}"
@@ -41,11 +93,38 @@ class TurboOneImpl(BaseTurboImpl):
         x_array = np.asarray(x_obs_list, dtype=float)
         x_torch = torch.as_tensor(x_array, dtype=torch.float64)
+        try:
+            from gpytorch.utils.warnings import GPInputWarning
+        except Exception:  # pragma: no cover
+            GPInputWarning = None
         with torch.no_grad():
-            posterior = self._gp_model.posterior(x_torch)
-            mu = posterior.mean.cpu().numpy().ravel()
+            if GPInputWarning is None:
+                posterior = self._gp_model.posterior(x_torch)
+            else:
+                # We intentionally evaluate the GP posterior at the training inputs
+                # (observed points) when choosing the center. GPyTorch warns about this
+                # in debug mode, but it's expected for our usage.
+                with warnings.catch_warnings():
+                    warnings.filterwarnings(
+                        "ignore",
+                        message=r"The input matches the stored training data\..*",
+                        category=GPInputWarning,
+                    )
+                    posterior = self._gp_model.posterior(x_torch)
+            mu_std = posterior.mean.cpu().numpy()
+        mu = self._unstandardize(self._as_2d(mu_std))
+        # For morbo: scalarize mu values
+        if self._config.tr_type == "morbo" and tr_state is not None:
+            scalarized = tr_state.scalarize(mu, clip=False)
+            best_idx = argmax_random_tie(scalarized, rng=rng)
+        else:
+            if mu.shape[1] != 1:
+                raise ValueError(mu.shape)
+            best_idx = argmax_random_tie(mu[:, 0], rng=rng)
-        best_idx = argmax_random_tie(mu, rng=rng)
         return x_array[best_idx]
     def needs_tr_list(self) -> bool:
@@ -56,7 +135,7 @@ class TurboOneImpl(BaseTurboImpl):
         num_arms: int,
         x_obs_list: list,
         draw_initial_fn: Callable[[int], np.ndarray],
-        get_init_lhd_points_fn: Callable[[int], np.ndarray | None],
+        get_init_lhd_points_fn: Callable[[int], np.ndarray],
     ) -> np.ndarray | None:
         if len(x_obs_list) == 0:
             return get_init_lhd_points_fn(num_arms)
@@ -102,18 +181,22 @@ class TurboOneImpl(BaseTurboImpl):
             self._gp_y_mean = gp_y_mean_fitted
         if gp_y_std_fitted is not None:
             self._gp_y_std = gp_y_std_fitted
-        weights = None
+        lengthscales = None
         if self._gp_model is not None:
-            weights = (
+            lengthscale = (
                 self._gp_model.covar_module.base_kernel.lengthscale.cpu()
                 .detach()
                 .numpy()
-                .ravel()
             )
+            if lengthscale.ndim == 3:
+                lengthscale = lengthscale.mean(axis=0)
+            lengthscales = lengthscale.ravel()
             # First line helps stabilize second line.
-            weights = weights / weights.mean()
-            weights = weights / np.prod(np.power(weights, 1.0 / len(weights)))
-        return self._gp_model, gp_y_mean_fitted, gp_y_std_fitted, weights
+            lengthscales = lengthscales / lengthscales.mean()
+            lengthscales = lengthscales / np.prod(
+                np.power(lengthscales, 1.0 / len(lengthscales))
+            )
+        return self._gp_model, gp_y_mean_fitted, gp_y_std_fitted, lengthscales
     def select_candidates(
         self,
@@ -123,17 +206,63 @@ class TurboOneImpl(BaseTurboImpl):
         rng: Generator,
         fallback_fn: Callable[[np.ndarray, int], np.ndarray],
         from_unit_fn: Callable[[np.ndarray], np.ndarray],
+        tr_state: Any = None,
     ) -> np.ndarray:
+        import numpy as np
         if self._gp_model is None:
+            if self._fitted_n_obs >= 2:
+                raise RuntimeError(
+                    "TurboOneImpl.select_candidates requires a fitted GP model for 2+ observations; "
+                    "call prepare_ask() first."
+                )
             return fallback_fn(x_cand, num_arms)
+        if self._config.tr_type == "morbo" and tr_state is not None:
+            import gpytorch
+            import torch
+            from .turbo_utils import torch_seed_context
+            x_torch = torch.as_tensor(x_cand, dtype=torch.float64)
+            seed = int(rng.integers(2**31 - 1))
+            with (
+                torch.no_grad(),
+                gpytorch.settings.fast_pred_var(),
+                torch_seed_context(seed, device=x_torch.device),
+            ):
+                posterior = self._gp_model.posterior(x_torch)
+                samples = posterior.sample(sample_shape=torch.Size([1]))
+            if samples.ndim == 2:
+                samples_std = samples[0].detach().cpu().numpy().reshape(-1, 1)
+            elif samples.ndim == 3:
+                samples_std = samples[0].detach().cpu().numpy().T
+            else:
+                raise ValueError(samples.shape)
+            y_samples = self._unstandardize(samples_std)
+            scores = tr_state.scalarize(y_samples, clip=False)
+            shuffled_indices = rng.permutation(len(scores))
+            shuffled_scores = scores[shuffled_indices]
+            top_k_in_shuffled = np.argpartition(-shuffled_scores, num_arms - 1)[
+                :num_arms
+            ]
+            idx = shuffled_indices[top_k_in_shuffled]
+            return from_unit_fn(x_cand[idx])
+        if (
+            np.asarray(self._gp_y_mean).ndim != 0
+            or np.asarray(self._gp_y_std).ndim != 0
+        ):
+            raise ValueError("multi-output GP requires tr_type='morbo'")
         idx = gp_thompson_sample(
             self._gp_model,
             x_cand,
             num_arms,
             rng,
-            self._gp_y_mean,
-            self._gp_y_std,
+            float(self._gp_y_mean),
+            float(self._gp_y_std),
         )
         return from_unit_fn(x_cand[idx])
@@ -141,12 +270,18 @@ class TurboOneImpl(BaseTurboImpl):
         import torch
         if self._gp_model is None:
-            return y_observed
+            raise RuntimeError(
+                "TurboOneImpl.estimate_y requires a fitted GP model; call prepare_ask() first."
+            )
         x_torch = torch.as_tensor(x_unit, dtype=torch.float64)
         with torch.no_grad():
             posterior = self._gp_model.posterior(x_torch)
-            mu = posterior.mean.cpu().numpy().ravel()
-        return self._gp_y_mean + self._gp_y_std * mu
+            mu_std = posterior.mean.cpu().numpy()
+        mu = self._unstandardize(self._as_2d(mu_std))
+        if mu.shape[1] == 1:
+            return mu[:, 0]
+        return mu
     def get_mu_sigma(self, x_unit: np.ndarray) -> tuple[np.ndarray, np.ndarray] | None:
         import torch
@@ -156,8 +291,12 @@ class TurboOneImpl(BaseTurboImpl):
         x_torch = torch.as_tensor(x_unit, dtype=torch.float64)
         with torch.no_grad():
             posterior = self._gp_model.posterior(x_torch)
-            mu_std = posterior.mean.cpu().numpy().ravel()
-            sigma_std = posterior.variance.cpu().numpy().ravel() ** 0.5
-        mu = self._gp_y_mean + self._gp_y_std * mu_std
-        sigma = self._gp_y_std * sigma_std
+            mu_std = posterior.mean.cpu().numpy()
+            sigma_std = posterior.variance.cpu().numpy() ** 0.5
+        mu_std_2d = self._as_2d(mu_std)
+        sigma_std_2d = self._as_2d(sigma_std)
+        mu = self._unstandardize(mu_std_2d)
+        _gp_y_mean, gp_y_std = self._broadcast_gp_mean_std(int(mu_std_2d.shape[1]))
+        sigma = gp_y_std.reshape(1, -1) * sigma_std_2d
         return mu, sigma

ennbo 0.1.0__py3-none-any.whl → 0.1.2__py3-none-any.whl

ennbo 0.1.0__py3-none-any.whl → 0.1.2__py3-none-any.whl