aspire-inference 0.1.0a9__py3-none-any.whl → 0.1.0a11__py3-none-any.whl
This diff compares publicly available package versions as released to a supported registry. It is provided for informational purposes only and reflects the packages as they appear in their respective public registries.
- aspire/aspire.py +356 -4
- aspire/flows/torch/flows.py +1 -1
- aspire/samplers/base.py +149 -5
- aspire/samplers/smc/base.py +133 -48
- aspire/samplers/smc/blackjax.py +8 -0
- aspire/samplers/smc/emcee.py +8 -0
- aspire/samplers/smc/minipcn.py +26 -6
- aspire/samples.py +21 -15
- aspire/utils.py +157 -4
- {aspire_inference-0.1.0a9.dist-info → aspire_inference-0.1.0a11.dist-info}/METADATA +23 -4
- aspire_inference-0.1.0a11.dist-info/RECORD +28 -0
- aspire_inference-0.1.0a9.dist-info/RECORD +0 -28
- {aspire_inference-0.1.0a9.dist-info → aspire_inference-0.1.0a11.dist-info}/WHEEL +0 -0
- {aspire_inference-0.1.0a9.dist-info → aspire_inference-0.1.0a11.dist-info}/licenses/LICENSE +0 -0
- {aspire_inference-0.1.0a9.dist-info → aspire_inference-0.1.0a11.dist-info}/top_level.txt +0 -0
aspire/aspire.py
CHANGED
@@ -1,5 +1,8 @@
+import copy
 import logging
 import multiprocessing as mp
+import pickle
+from contextlib import contextmanager
 from inspect import signature
 from typing import Any, Callable
 
@@ -8,13 +11,19 @@ import h5py
 from .flows import get_flow_wrapper
 from .flows.base import Flow
 from .history import History
+from .samplers.base import Sampler
 from .samples import Samples
 from .transforms import (
     CompositeTransform,
     FlowPreconditioningTransform,
     FlowTransform,
 )
-from .utils import
+from .utils import (
+    AspireFile,
+    load_from_h5_file,
+    recursively_save_to_h5_file,
+    resolve_xp,
+)
 
 logger = logging.getLogger(__name__)
 
@@ -102,6 +111,7 @@ class Aspire:
         self.dtype = dtype
 
         self._flow = flow
+        self._sampler = None
 
     @property
     def flow(self):
@@ -114,7 +124,7 @@ class Aspire:
         self._flow = flow
 
     @property
-    def sampler(self):
+    def sampler(self) -> Sampler | None:
         """The sampler object."""
         return self._sampler
 
@@ -192,7 +202,29 @@ class Aspire:
             **self.flow_kwargs,
         )
 
-    def fit(
+    def fit(
+        self,
+        samples: Samples,
+        checkpoint_path: str | None = None,
+        checkpoint_save_config: bool = True,
+        overwrite: bool = False,
+        **kwargs,
+    ) -> History:
+        """Fit the normalizing flow to the provided samples.
+
+        Parameters
+        ----------
+        samples : Samples
+            The samples to fit the flow to.
+        checkpoint_path : str | None
+            Path to save the checkpoint. If None, no checkpoint is saved.
+        checkpoint_save_config : bool
+            Whether to save the Aspire configuration to the checkpoint.
+        overwrite : bool
+            Whether to overwrite an existing flow in the checkpoint file.
+        kwargs : dict
+            Keyword arguments to pass to the flow's fit method.
+        """
         if self.xp is None:
             self.xp = samples.xp
 
@@ -202,6 +234,28 @@ class Aspire:
         self.training_samples = samples
         logger.info(f"Training with {len(samples.x)} samples")
         history = self.flow.fit(samples.x, **kwargs)
+        defaults = getattr(self, "_checkpoint_defaults", None)
+        if checkpoint_path is None and defaults:
+            checkpoint_path = defaults["path"]
+            checkpoint_save_config = defaults["save_config"]
+        saved_config = (
+            defaults.get("saved_config", False) if defaults else False
+        )
+        if checkpoint_path is not None:
+            with AspireFile(checkpoint_path, "a") as h5_file:
+                if checkpoint_save_config and not saved_config:
+                    if "aspire_config" in h5_file:
+                        del h5_file["aspire_config"]
+                    self.save_config(h5_file, include_sampler_config=False)
+                    if defaults is not None:
+                        defaults["saved_config"] = True
+                # Save flow only if missing or overwrite=True
+                if "flow" in h5_file:
+                    if overwrite:
+                        del h5_file["flow"]
+                        self.save_flow(h5_file)
+                else:
+                    self.save_flow(h5_file)
         return history
 
     def get_sampler_class(self, sampler_type: str) -> Callable:
@@ -241,6 +295,13 @@ class Aspire:
         ----------
         sampler_type : str
             The type of sampler to use. Options are 'importance', 'emcee', or 'smc'.
+        preconditioning: str
+            Type of preconditioning to apply in the sampler. Options are
+            'default', 'flow', or 'none'.
+        preconditioning_kwargs: dict
+            Keyword arguments to pass to the preconditioning transform.
+        kwargs : dict
+            Keyword arguments to pass to the sampler.
         """
         SamplerClass = self.get_sampler_class(sampler_type)
 
@@ -304,6 +365,9 @@ class Aspire:
         return_history: bool = False,
         preconditioning: str | None = None,
         preconditioning_kwargs: dict | None = None,
+        checkpoint_path: str | None = None,
+        checkpoint_every: int = 1,
+        checkpoint_save_config: bool = True,
         **kwargs,
     ) -> Samples:
         """Draw samples from the posterior distribution.
@@ -342,6 +406,14 @@
             will default to 'none' and the other samplers to 'default'
         preconditioning_kwargs: dict
             Keyword arguments to pass to the preconditioning transform.
+        checkpoint_path : str | None
+            Path to save the checkpoint. If None, no checkpoint is saved unless
+            within an :py:meth:`auto_checkpoint` context or a custom callback
+            is provided.
+        checkpoint_every : int
+            Frequency (in number of sampler iterations) to save the checkpoint.
+        checkpoint_save_config : bool
+            Whether to save the Aspire configuration to the checkpoint.
         kwargs : dict
             Keyword arguments to pass to the sampler. These are passed
             automatically to the init method of the sampler or to the sample
@@ -352,6 +424,22 @@
         samples : Samples
             Samples object contain samples and their corresponding weights.
         """
+        if (
+            sampler == "importance"
+            and hasattr(self, "_resume_sampler_type")
+            and self._resume_sampler_type
+        ):
+            sampler = self._resume_sampler_type
+
+        if "resume_from" not in kwargs and hasattr(
+            self, "_resume_from_default"
+        ):
+            kwargs["resume_from"] = self._resume_from_default
+        if hasattr(self, "_resume_overrides"):
+            kwargs.update(self._resume_overrides)
+        if hasattr(self, "_resume_n_samples") and n_samples == 1000:
+            n_samples = self._resume_n_samples
+
         SamplerClass = self.get_sampler_class(sampler)
         # Determine sampler initialization parameters
         # and remove them from kwargs
@@ -373,7 +461,73 @@
             preconditioning_kwargs=preconditioning_kwargs,
             **sampler_kwargs,
         )
+        self._last_sampler_type = sampler
+        # Auto-checkpoint convenience: set defaults for checkpointing to a single file
+        defaults = getattr(self, "_checkpoint_defaults", None)
+        if checkpoint_path is None and defaults:
+            checkpoint_path = defaults["path"]
+            checkpoint_every = defaults["every"]
+            checkpoint_save_config = defaults["save_config"]
+        saved_flow = defaults.get("saved_flow", False) if defaults else False
+        saved_config = (
+            defaults.get("saved_config", False) if defaults else False
+        )
+        if checkpoint_path is not None:
+            kwargs.setdefault("checkpoint_file_path", checkpoint_path)
+            kwargs.setdefault("checkpoint_every", checkpoint_every)
+            with AspireFile(checkpoint_path, "a") as h5_file:
+                if checkpoint_save_config:
+                    if "aspire_config" in h5_file:
+                        del h5_file["aspire_config"]
+                    self.save_config(
+                        h5_file,
+                        include_sampler_config=True,
+                        include_sample_calls=False,
+                    )
+                    saved_config = True
+                    if defaults is not None:
+                        defaults["saved_config"] = True
+                if (
+                    self.flow is not None
+                    and not saved_flow
+                    and "flow" not in h5_file
+                ):
+                    self.save_flow(h5_file)
+                    saved_flow = True
+                    if defaults is not None:
+                        defaults["saved_flow"] = True
+
         samples = self._sampler.sample(n_samples, **kwargs)
+        self._last_sample_posterior_kwargs = {
+            "n_samples": n_samples,
+            "sampler": sampler,
+            "xp": xp,
+            "return_history": return_history,
+            "preconditioning": preconditioning,
+            "preconditioning_kwargs": preconditioning_kwargs,
+            "sampler_init_kwargs": sampler_kwargs,
+            "sample_kwargs": copy.deepcopy(kwargs),
+        }
+        if checkpoint_path is not None:
+            with AspireFile(checkpoint_path, "a") as h5_file:
+                if checkpoint_save_config and not saved_config:
+                    if "aspire_config" in h5_file:
+                        del h5_file["aspire_config"]
+                    self.save_config(
+                        h5_file,
+                        include_sampler_config=True,
+                        include_sample_calls=False,
+                    )
+                    if defaults is not None:
+                        defaults["saved_config"] = True
+                if (
+                    self.flow is not None
+                    and not saved_flow
+                    and "flow" not in h5_file
+                ):
+                    self.save_flow(h5_file)
+                    if defaults is not None:
+                        defaults["saved_flow"] = True
         if xp is not None:
             samples = samples.to_namespace(xp)
         samples.parameters = self.parameters
@@ -388,6 +542,122 @@ class Aspire:
         else:
             return samples
 
+    @classmethod
+    def resume_from_file(
+        cls,
+        file_path: str,
+        *,
+        log_likelihood: Callable,
+        log_prior: Callable,
+        sampler: str | None = None,
+        checkpoint_path: str = "checkpoint",
+        checkpoint_dset: str = "state",
+        flow_path: str = "flow",
+        config_path: str = "aspire_config",
+        resume_kwargs: dict | None = None,
+    ):
+        """
+        Recreate an Aspire object from a single file and prepare to resume sampling.
+
+        Parameters
+        ----------
+        file_path : str
+            Path to the HDF5 file containing config, flow, and checkpoint.
+        log_likelihood : Callable
+            Log-likelihood function (required, not pickled).
+        log_prior : Callable
+            Log-prior function (required, not pickled).
+        sampler : str
+            Sampler type to use (e.g., 'smc', 'minipcn_smc', 'emcee_smc'). If None,
+            will attempt to infer from saved config or checkpoint metadata.
+        checkpoint_path : str
+            HDF5 group path where the checkpoint is stored.
+        checkpoint_dset : str
+            Dataset name within the checkpoint group.
+        flow_path : str
+            HDF5 path to the saved flow.
+        config_path : str
+            HDF5 path to the saved Aspire config.
+        resume_kwargs : dict | None
+            Optional overrides to apply when resuming (e.g., checkpoint_every).
+        """
+        (
+            aspire,
+            checkpoint_bytes,
+            checkpoint_state,
+            sampler_config,
+            saved_sampler_type,
+            n_samples,
+        ) = cls._build_aspire_from_file(
+            file_path=file_path,
+            log_likelihood=log_likelihood,
+            log_prior=log_prior,
+            checkpoint_path=checkpoint_path,
+            checkpoint_dset=checkpoint_dset,
+            flow_path=flow_path,
+            config_path=config_path,
+        )
+
+        sampler_config = sampler_config or {}
+        sampler_config.pop("sampler_class", None)
+
+        if checkpoint_bytes is not None:
+            aspire._resume_from_default = checkpoint_bytes
+        aspire._resume_sampler_type = (
+            sampler
+            or saved_sampler_type
+            or (
+                checkpoint_state.get("sampler")
+                if checkpoint_state
+                else None
+            )
+        )
+        aspire._resume_n_samples = n_samples
+        aspire._resume_overrides = resume_kwargs or {}
+        aspire._resume_sampler_config = sampler_config
+        aspire._checkpoint_defaults = {
+            "path": file_path,
+            "every": 1,
+            "save_config": False,
+            "save_flow": False,
+            "saved_config": False,
+            "saved_flow": False,
+        }
+        return aspire
+
+    @contextmanager
+    def auto_checkpoint(
+        self,
+        path: str,
+        every: int = 1,
+        save_config: bool = True,
+        save_flow: bool = True,
+    ):
+        """
+        Context manager to auto-save checkpoints, config, and flow to a file.
+
+        Within the context, sample_posterior will default to writing checkpoints
+        to the given path with the specified frequency, and will append config/flow
+        after sampling.
+        """
+        prev = getattr(self, "_checkpoint_defaults", None)
+        self._checkpoint_defaults = {
+            "path": path,
+            "every": every,
+            "save_config": save_config,
+            "save_flow": save_flow,
+            "saved_config": False,
+            "saved_flow": False,
+        }
+        try:
+            yield self
+        finally:
+            if prev is None:
+                if hasattr(self, "_checkpoint_defaults"):
+                    delattr(self, "_checkpoint_defaults")
+            else:
+                self._checkpoint_defaults = prev
+
     def enable_pool(self, pool: mp.Pool, **kwargs):
         """Context manager to temporarily replace the log_likelihood method
         with a version that uses a multiprocessing pool to parallelize
@@ -432,12 +702,16 @@ class Aspire:
             "flow_kwargs": self.flow_kwargs,
             "eps": self.eps,
         }
+        if hasattr(self, "_last_sampler_type"):
+            config["sampler_type"] = self._last_sampler_type
         if include_sampler_config:
+            if self.sampler is None:
+                raise ValueError("Sampler has not been initialized.")
             config["sampler_config"] = self.sampler.config_dict(**kwargs)
         return config
 
     def save_config(
-        self, h5_file: h5py.File, path="aspire_config", **kwargs
+        self, h5_file: h5py.File | AspireFile, path="aspire_config", **kwargs
     ) -> None:
         """Save the configuration to an HDF5 file.
 
@@ -484,6 +758,7 @@ class Aspire:
         FlowClass, xp = get_flow_wrapper(
             backend=self.flow_backend, flow_matching=self.flow_matching
         )
+        logger.debug(f"Loading flow of type {FlowClass} from {path}")
        self._flow = FlowClass.load(h5_file, path=path)
 
     def save_config_to_json(self, filename: str) -> None:
@@ -504,3 +779,80 @@ class Aspire:
         x, log_q = self.flow.sample_and_log_prob(n_samples)
         samples = Samples(x=x, log_q=log_q, xp=xp, parameters=self.parameters)
         return samples
+
+    # --- Resume helpers ---
+    @staticmethod
+    def _build_aspire_from_file(
+        file_path: str,
+        log_likelihood: Callable,
+        log_prior: Callable,
+        checkpoint_path: str,
+        checkpoint_dset: str,
+        flow_path: str,
+        config_path: str,
+    ):
+        """Construct an Aspire instance, load flow, and gather checkpoint metadata from file."""
+        with AspireFile(file_path, "r") as h5_file:
+            if config_path not in h5_file:
+                raise ValueError(
+                    f"Config path '{config_path}' not found in {file_path}"
+                )
+            config_dict = load_from_h5_file(h5_file, config_path)
+            try:
+                checkpoint_bytes = h5_file[checkpoint_path][checkpoint_dset][
+                    ...
+                ].tobytes()
+            except Exception:
+                logger.warning(
+                    "Checkpoint not found at %s/%s in %s; will resume without a checkpoint.",
+                    checkpoint_path,
+                    checkpoint_dset,
+                    file_path,
+                )
+                checkpoint_bytes = None
+
+        sampler_config = config_dict.pop("sampler_config", None)
+        saved_sampler_type = config_dict.pop("sampler_type", None)
+        if isinstance(config_dict.get("xp"), str):
+            config_dict["xp"] = resolve_xp(config_dict["xp"])
+        config_dict["log_likelihood"] = log_likelihood
+        config_dict["log_prior"] = log_prior
+
+        aspire = Aspire(**config_dict)
+
+        with AspireFile(file_path, "r") as h5_file:
+            if flow_path in h5_file:
+                logger.info(f"Loading flow from {flow_path} in {file_path}")
+                aspire.load_flow(h5_file, path=flow_path)
+            else:
+                raise ValueError(
+                    f"Flow path '{flow_path}' not found in {file_path}"
+                )
+
+        n_samples = None
+        checkpoint_state = None
+        if checkpoint_bytes is not None:
+            try:
+                checkpoint_state = pickle.loads(checkpoint_bytes)
+                samples_saved = (
+                    checkpoint_state.get("samples")
+                    if checkpoint_state
+                    else None
+                )
+                if samples_saved is not None:
+                    n_samples = len(samples_saved)
+                    if aspire.xp is None and hasattr(samples_saved, "xp"):
+                        aspire.xp = samples_saved.xp
+            except Exception:
+                logger.warning(
+                    "Failed to decode checkpoint; proceeding without resume state."
+                )
+
+        return (
+            aspire,
+            checkpoint_bytes,
+            checkpoint_state,
+            sampler_config,
+            saved_sampler_type,
+            n_samples,
+        )
aspire/flows/torch/flows.py
CHANGED
@@ -92,7 +92,7 @@ class BaseTorchFlow(Flow):
         config = load_from_h5_file(flow_grp, "config")
         config["dtype"] = decode_dtype(torch, config.get("dtype"))
         if "data_transform" in flow_grp:
-            from
+            from ...transforms import BaseTransform
 
             data_transform = BaseTransform.load(
                 flow_grp,
aspire/samplers/base.py
CHANGED
@@ -1,10 +1,12 @@
 import logging
+import pickle
+from pathlib import Path
 from typing import Any, Callable
 
 from ..flows.base import Flow
 from ..samples import Samples
 from ..transforms import IdentityTransform
-from ..utils import track_calls
+from ..utils import AspireFile, asarray, dump_state, track_calls
 
 logger = logging.getLogger(__name__)
 
@@ -49,6 +51,8 @@ class Sampler:
         self.parameters = parameters
         self.history = None
         self.n_likelihood_evaluations = 0
+        self._last_checkpoint_state: dict | None = None
+        self._last_checkpoint_bytes: bytes | None = None
         if preconditioning_transform is None:
             self.preconditioning_transform = IdentityTransform(xp=self.xp)
         else:
@@ -56,7 +60,11 @@ class Sampler:
 
     def fit_preconditioning_transform(self, x):
         """Fit the data transform to the data."""
-        x =
+        x = asarray(
+            x,
+            xp=self.preconditioning_transform.xp,
+            dtype=self.preconditioning_transform.dtype,
+        )
         return self.preconditioning_transform.fit(x)
 
     @track_calls
@@ -71,7 +79,7 @@ class Sampler:
         self.n_likelihood_evaluations += len(samples)
         return self._log_likelihood(samples)
 
-    def config_dict(self, include_sample_calls: bool =
+    def config_dict(self, include_sample_calls: bool = False) -> dict:
         """
         Returns a dictionary with the configuration of the sampler.
 
@@ -79,9 +87,9 @@ class Sampler:
         ----------
         include_sample_calls : bool
             Whether to include the sample calls in the configuration.
-            Default is
+            Default is False.
         """
-        config = {}
+        config = {"sampler_class": self.__class__.__name__}
         if include_sample_calls:
             if hasattr(self, "sample") and hasattr(self.sample, "calls"):
                 config["sample_calls"] = self.sample.calls.to_dict(
@@ -92,3 +100,139 @@ class Sampler:
                 "Sampler does not have a sample method with calls attribute."
             )
         return config
+
+    # --- Checkpointing helpers shared across samplers ---
+    def _checkpoint_extra_state(self) -> dict:
+        """Sampler-specific extras for checkpointing (override in subclasses)."""
+        return {}
+
+    def _restore_extra_state(self, state: dict) -> None:
+        """Restore sampler-specific extras (override in subclasses)."""
+        _ = state  # no-op for base
+
+    def build_checkpoint_state(
+        self,
+        samples: Samples,
+        iteration: int | None = None,
+        meta: dict | None = None,
+    ) -> dict:
+        """Prepare a serializable checkpoint payload for the sampler state."""
+        checkpoint_samples = samples
+        base_state = {
+            "sampler": self.__class__.__name__,
+            "iteration": iteration,
+            "samples": checkpoint_samples,
+            "config": self.config_dict(include_sample_calls=False),
+            "parameters": self.parameters,
+            "meta": meta or {},
+        }
+        base_state.update(self._checkpoint_extra_state())
+        return base_state
+
+    def serialize_checkpoint(
+        self, state: dict, protocol: int | None = None
+    ) -> bytes:
+        """Serialize a checkpoint state to bytes with pickle."""
+        protocol = (
+            pickle.HIGHEST_PROTOCOL if protocol is None else int(protocol)
+        )
+        return pickle.dumps(state, protocol=protocol)
+
+    def default_checkpoint_callback(self, state: dict) -> None:
+        """Store the latest checkpoint (state + pickled bytes) on the sampler."""
+        self._last_checkpoint_state = state
+        self._last_checkpoint_bytes = self.serialize_checkpoint(state)
+
+    def default_file_checkpoint_callback(
+        self, file_path: str | Path | None
+    ) -> Callable[[dict], None]:
+        """Return a simple default callback that overwrites an HDF5 file."""
+        if file_path is None:
+            return self.default_checkpoint_callback
+        file_path = Path(file_path)
+        lower_path = file_path.name.lower()
+        if not lower_path.endswith((".h5", ".hdf5")):
+            raise ValueError(
+                "Checkpoint file must be an HDF5 file (.h5 or .hdf5)."
+            )
+
+        def _callback(state: dict) -> None:
+            with AspireFile(file_path, "a") as h5_file:
+                self.save_checkpoint_to_hdf(
+                    state, h5_file, path="checkpoint", dsetname="state"
+                )
+            self.default_checkpoint_callback(state)
+
+        return _callback
+
+    def save_checkpoint_to_hdf(
+        self,
+        state: dict,
+        h5_file,
+        path: str = "sampler_checkpoints",
+        dsetname: str | None = None,
+        protocol: int | None = None,
+    ) -> None:
+        """Save a checkpoint state into an HDF5 file as a pickled blob."""
+        if dsetname is None:
+            iter_str = state.get("iteration", "unknown")
+            dsetname = f"iter_{iter_str}"
+        dump_state(
+            state,
+            h5_file,
+            path=path,
+            dsetname=dsetname,
+            protocol=protocol or pickle.HIGHEST_PROTOCOL,
+        )
+
+    def load_checkpoint_from_file(
+        self,
+        file_path: str | Path,
+        h5_path: str = "checkpoint",
+        dsetname: str = "state",
+    ) -> dict:
+        """Load a checkpoint dictionary from .pkl or .hdf5 file."""
+        file_path = Path(file_path)
+        lower_path = file_path.name.lower()
+        if lower_path.endswith((".h5", ".hdf5")):
+            with AspireFile(file_path, "r") as h5_file:
+                data = h5_file[h5_path][dsetname][...]
+                checkpoint_bytes = data.tobytes()
+        else:
+            with open(file_path, "rb") as f:
+                checkpoint_bytes = f.read()
+        return pickle.loads(checkpoint_bytes)
+
+    def restore_from_checkpoint(
+        self, source: str | bytes | dict
+    ) -> tuple[Samples, dict]:
+        """Restore sampler state from a checkpoint source."""
+        if isinstance(source, str):
+            state = self.load_checkpoint_from_file(source)
+        elif isinstance(source, bytes):
+            state = pickle.loads(source)
+        elif isinstance(source, dict):
+            state = source
+        else:
+            raise TypeError("Unsupported checkpoint source type.")
+
+        samples_saved = state.get("samples")
+        if samples_saved is None:
+            raise ValueError("Checkpoint missing samples.")
+
+        samples = Samples.from_samples(
+            samples_saved, xp=self.xp, dtype=self.dtype
+        )
+        # Allow subclasses to restore sampler-specific components
+        self._restore_extra_state(state)
+        return samples, state
+
+    @property
+    def last_checkpoint_state(self) -> dict | None:
+        """Return the most recent checkpoint state stored by the default callback."""
+        return self._last_checkpoint_state
+
+    @property
+    def last_checkpoint_bytes(self) -> bytes | None:
+        """Return the most recent pickled checkpoint produced by the default callback."""
+        return self._last_checkpoint_bytes