jaxspec 0.0.4__py3-none-any.whl → 0.0.6__py3-none-any.whl

This diff shows the changes between two publicly released versions of the package, as published to a supported public registry. It is provided for informational purposes only and reflects the package contents exactly as they appear in that registry.
jaxspec/fit.py CHANGED
@@ -4,11 +4,12 @@ import numpyro
4
4
  import arviz as az
5
5
  import jax
6
6
  from typing import Callable, TypeVar
7
- from abc import ABC
7
+ from abc import ABC, abstractmethod
8
8
  from jax import random
9
9
  from jax.tree_util import tree_map
10
+ from jax.flatten_util import ravel_pytree
10
11
  from jax.experimental.sparse import BCSR
11
- from .analysis.results import ChainResult
12
+ from .analysis.results import FitResult
12
13
  from .model.abc import SpectralModel
13
14
  from .data import ObsConfiguration
14
15
  from .model.background import BackgroundModel
@@ -17,13 +18,15 @@ from numpyro.distributions import Distribution, TransformedDistribution
17
18
  from numpyro.distributions import Poisson
18
19
  from jax.typing import ArrayLike
19
20
  from numpyro.infer.reparam import TransformReparam
21
+ from numpyro.infer.util import initialize_model
22
+ from jax.random import PRNGKey
23
+ import jaxopt
20
24
 
21
25
 
22
26
  T = TypeVar("T")
23
27
 
24
28
 
25
- class HaikuDict(dict[str, dict[str, T]]):
26
- ...
29
+ class HaikuDict(dict[str, dict[str, T]]): ...
27
30
 
28
31
 
29
32
  def build_prior(prior: HaikuDict[Distribution | ArrayLike], expand_shape: tuple = ()):
@@ -32,7 +35,8 @@ def build_prior(prior: HaikuDict[Distribution | ArrayLike], expand_shape: tuple
32
35
  for i, (m, n, sample) in enumerate(hk.data_structures.traverse(prior)):
33
36
  match sample:
34
37
  case Distribution():
35
- parameters[m][n] = numpyro.sample(f"{m}_{n}", sample.expand(expand_shape))
38
+ parameters[m][n] = jnp.ones(expand_shape) * numpyro.sample(f"{m}_{n}", sample)
39
+ # parameters[m][n] = numpyro.sample(f"{m}_{n}", sample.expand(expand_shape)) build a free parameter for each obs
36
40
  case float() | ArrayLike():
37
41
  parameters[m][n] = jnp.ones(expand_shape) * sample
38
42
  case _:
@@ -54,7 +58,7 @@ def build_numpyro_model(
54
58
 
55
59
  if (getattr(obs, "folded_background", None) is not None) and (background_model is not None):
56
60
  bkg_countrate = background_model.numpyro_model(
57
- obs.out_energies, obs.folded_background.data, name=name + "bkg", observed=observed
61
+ obs.out_energies, obs.folded_background.data, name="bkg_" + name, observed=observed
58
62
  )
59
63
  elif (getattr(obs, "folded_background", None) is None) and (background_model is not None):
60
64
  raise ValueError("Trying to fit a background model but no background is linked to this observation")
@@ -66,9 +70,9 @@ def build_numpyro_model(
66
70
  countrate = obs_model(prior_params)
67
71
 
68
72
  # This is the case where we fit a model to a TOTAL spectrum as defined in OGIP standard
69
- with numpyro.plate(name + "obs_plate", len(obs.folded_counts)):
73
+ with numpyro.plate("obs_plate_" + name, len(obs.folded_counts)):
70
74
  numpyro.sample(
71
- name + "obs",
75
+ "obs_" + name,
72
76
  Poisson(countrate + bkg_countrate / obs.folded_backratio.data),
73
77
  obs=obs.folded_counts.data if observed else None,
74
78
  )
@@ -76,6 +80,25 @@ def build_numpyro_model(
76
80
  return numpro_model
77
81
 
78
82
 
83
+ def filter_inference_data(inference_data, observation_container, background_model=None) -> az.InferenceData:
84
+ predictive_parameters = []
85
+
86
+ for key, value in observation_container.items():
87
+ if background_model is not None:
88
+ predictive_parameters.append(f"obs_{key}")
89
+ predictive_parameters.append(f"bkg_{key}")
90
+ else:
91
+ predictive_parameters.append(f"obs_{key}")
92
+
93
+ inference_data.posterior_predictive = inference_data.posterior_predictive[predictive_parameters]
94
+
95
+ parameters = [x for x in inference_data.posterior.keys() if not x.endswith("_base")]
96
+ inference_data.posterior = inference_data.posterior[parameters]
97
+ inference_data.prior = inference_data.prior[parameters]
98
+
99
+ return inference_data
100
+
101
+
79
102
  class CountForwardModel(hk.Module):
80
103
  """
81
104
  A haiku module which allows to build the function that simulates the measured counts
@@ -97,27 +120,87 @@ class CountForwardModel(hk.Module):
97
120
  Compute the count functions for a given observation.
98
121
  """
99
122
 
100
- expected_counts = self.transfer_matrix @ self.model(parameters, *self.energies)
123
+ expected_counts = self.transfer_matrix @ self.model.photon_flux(parameters, *self.energies)
101
124
 
102
125
  return jnp.clip(expected_counts, a_min=1e-6)
103
126
 
104
127
 
105
- class BayesianModelAbstract(ABC):
128
+ class ModelFitter(ABC):
106
129
  """
107
130
  Abstract class to fit a model to a given set of observation.
108
131
  """
109
132
 
110
- model: SpectralModel
111
- """The model to fit to the data."""
112
- numpyro_model: Callable
113
- """The numpyro model defining the likelihood."""
114
- background_model: BackgroundModel
115
- """The background model."""
116
- pars: dict
133
+ def __init__(
134
+ self,
135
+ model: SpectralModel,
136
+ observations: ObsConfiguration | list[ObsConfiguration] | dict[str, ObsConfiguration],
137
+ background_model: BackgroundModel = None,
138
+ sparsify_matrix: bool = False,
139
+ ):
140
+ """
141
+ Initialize the fitter.
117
142
 
118
- def __init__(self, model: SpectralModel):
143
+ Parameters:
144
+ model: the spectral model to fit.
145
+ observations: the observations to fit the model to.
146
+ background_model: the background model to fit.
147
+ sparsify_matrix: whether to sparsify the transfer matrix.
148
+ """
119
149
  self.model = model
150
+ self._observations = observations
151
+ self.background_model = background_model
120
152
  self.pars = tree_map(lambda x: jnp.float64(x), self.model.params)
153
+ self.sparse = sparsify_matrix
154
+
155
+ @property
156
+ def _observation_container(self) -> dict[str, ObsConfiguration]:
157
+ """
158
+ The observations used in the fit as a dictionary of observations.
159
+ """
160
+
161
+ if isinstance(self._observations, dict):
162
+ return self._observations
163
+
164
+ elif isinstance(self._observations, list):
165
+ return {f"data_{i}": obs for i, obs in enumerate(self._observations)}
166
+
167
+ elif isinstance(self._observations, ObsConfiguration):
168
+ return {"data": self._observations}
169
+
170
+ else:
171
+ raise ValueError(f"Invalid type for observations : {type(self._observations)}")
172
+
173
+ def numpyro_model(self, prior_distributions: HaikuDict[Distribution]) -> Callable:
174
+ """
175
+ Build the numpyro model using the observed data, the prior distributions and the spectral model.
176
+
177
+ Parameters:
178
+ prior_distributions: a nested dictionary containing the prior distributions for the model parameters.
179
+
180
+ Returns:
181
+ A model function that can be used with numpyro.
182
+ """
183
+
184
+ def model(observed=True):
185
+ prior_params = build_prior(prior_distributions, expand_shape=(len(self._observation_container),))
186
+
187
+ for i, (key, observation) in enumerate(self._observation_container.items()):
188
+ params = tree_map(lambda x: x[i], prior_params)
189
+
190
+ obs_model = build_numpyro_model(observation, self.model, self.background_model, name=key, sparse=self.sparse)
191
+ obs_model(params, observed=observed)
192
+
193
+ return model
194
+
195
+ @abstractmethod
196
+ def fit(self, prior_distributions: HaikuDict[Distribution], **kwargs) -> FitResult: ...
197
+
198
+
199
+ class BayesianFitter(ModelFitter):
200
+ """
201
+ A class to fit a model to a given set of observation using a Bayesian approach. This class uses the NUTS sampler
202
+ from numpyro to perform the inference on the model parameters.
203
+ """
121
204
 
122
205
  def fit(
123
206
  self,
@@ -128,11 +211,11 @@ class BayesianModelAbstract(ABC):
128
211
  num_samples: int = 1000,
129
212
  max_tree_depth: int = 10,
130
213
  target_accept_prob: float = 0.8,
131
- dense_mass=False,
214
+ dense_mass: bool = False,
132
215
  mcmc_kwargs: dict = {},
133
- ) -> ChainResult:
216
+ ) -> FitResult:
134
217
  """
135
- Fit the model to the data using NUTS sampler from numpyro. This is the default sampler in jaxspec.
218
+ Fit the model to the data using NUTS sampler from numpyro.
136
219
 
137
220
  Parameters:
138
221
  prior_distributions: a nested dictionary containing the prior distributions for the model parameters.
@@ -146,7 +229,7 @@ class BayesianModelAbstract(ABC):
146
229
  mcmc_kwargs: additional arguments to pass to the MCMC sampler. See [`MCMC`][numpyro.infer.mcmc.MCMC] for more details.
147
230
 
148
231
  Returns:
149
- A [`ChainResult`][jaxspec.analysis.results.ChainResult] instance containing the results of the fit.
232
+ A [`FitResult`][jaxspec.analysis.results.FitResult] instance containing the results of the fit.
150
233
  """
151
234
 
152
235
  transform_dict = {}
@@ -174,80 +257,91 @@ class BayesianModelAbstract(ABC):
174
257
  prior = Predictive(bayesian_model, num_samples=num_samples)(keys[2], observed=False)
175
258
  inference_data = az.from_numpyro(mcmc, prior=prior, posterior_predictive=posterior_predictive)
176
259
 
177
- predictive_parameters = ["obs", "bkg"] if self.background_model is not None else ["obs"]
178
- inference_data.posterior_predictive = inference_data.posterior_predictive[predictive_parameters]
179
-
180
- parameters = [x for x in inference_data.posterior.keys() if not x.endswith("_base")]
181
- inference_data.posterior = inference_data.posterior[parameters]
182
- inference_data.prior = inference_data.prior[parameters]
260
+ inference_data = filter_inference_data(inference_data, self._observation_container, self.background_model)
183
261
 
184
- return ChainResult(
262
+ return FitResult(
185
263
  self.model,
186
- self.observation,
264
+ self._observation_container,
187
265
  inference_data,
188
- mcmc.get_samples(),
189
266
  self.model.params,
190
267
  background_model=self.background_model,
191
268
  )
192
269
 
193
270
 
194
- class BayesianModel(BayesianModelAbstract):
271
+ class MinimizationFitter(ModelFitter):
195
272
  """
196
- Class to fit a model to a given observation using a Bayesian approach.
273
+ A class to fit a model to a given set of observation using a minimization algorithm. This class uses the L-BFGS
274
+ algorithm from jaxopt to perform the minimization on the model parameters. The uncertainties are computed using the
275
+ Hessian of the log-likelihood, assuming that it is a multivariate Gaussian in the unbounded space defined by
276
+ numpyro.
197
277
  """
198
278
 
199
- def __init__(self, model, observation, background_model: BackgroundModel = None, sparsify_matrix: bool = False):
200
- super().__init__(model)
201
- self.observation = observation
202
- self.pars = tree_map(lambda x: jnp.float64(x), self.model.params)
203
- self.sparse = sparsify_matrix
204
- self.background_model = background_model
205
-
206
- def numpyro_model(self, prior_distributions: HaikuDict[Distribution]) -> Callable:
279
+ def fit(
280
+ self,
281
+ prior_distributions: HaikuDict[Distribution],
282
+ rng_key: int = 0,
283
+ num_iter_max: int = 10_000,
284
+ num_samples: int = 1_000,
285
+ ) -> FitResult:
207
286
  """
208
- Build the numpyro model for the Bayesian fit. It returns a callable which can be used
209
- to fit the model using numpyro's various samplers.
287
+ Fit the model to the data using L-BFGS algorithm.
210
288
 
211
289
  Parameters:
212
290
  prior_distributions: a nested dictionary containing the prior distributions for the model parameters.
213
- """
214
-
215
- def model(observed=True):
216
- prior_params = build_prior(prior_distributions)
217
- obs_model = build_numpyro_model(self.observation, self.model, self.background_model, sparse=self.sparse)
218
- obs_model(prior_params, observed=observed)
219
-
220
- return model
291
+ rng_key: the random key used to initialize the sampler.
292
+ num_iter_max: the maximum number of iteration in the minimization algorithm.
293
+ num_samples: the number of sample to draw from the best-fit covariance.
221
294
 
295
+ Returns:
296
+ A [`FitResult`][jaxspec.analysis.results.FitResult] instance containing the results of the fit.
297
+ """
222
298
 
223
- """
224
- class MultipleObservationMCMC(BayesianModelAbstract):
299
+ bayesian_model = self.numpyro_model(prior_distributions)
225
300
 
226
- def __init__(self, model, observations, background_model: BackgroundModel = None):
301
+ param_info, potential_fn, postprocess_fn, *_ = initialize_model(
302
+ PRNGKey(0),
303
+ bayesian_model,
304
+ model_args=tuple(),
305
+ dynamic_args=True, # <- this is important!
306
+ )
227
307
 
228
- super().__init__(model)
229
- self.observations = observations
230
- self.pars = tree_map(lambda x: jnp.float64(x), self.model.params)
231
- self.background_model = background_model
308
+ # get negative log-density from the potential function
309
+ @jax.jit
310
+ def nll_fn(position):
311
+ func = potential_fn()
312
+ return func(position)
232
313
 
233
- def numpyro_model(self, prior_distributions: HaikuDict[Distribution]) -> Callable:
314
+ solver = jaxopt.LBFGS(fun=nll_fn, maxiter=10_000)
315
+ params, state = solver.run(param_info.z)
316
+ keys = random.split(random.PRNGKey(rng_key), 3)
234
317
 
235
- def model(observed=True):
318
+ value_flat, unflatten_fun = ravel_pytree(params)
319
+ covariance = jnp.linalg.inv(jax.hessian(lambda p: nll_fn(unflatten_fun(p)))(value_flat))
236
320
 
237
- prior_params = build_prior(prior_distributions, expand_shape=(len(self.observations),))
321
+ samples_flat = jax.random.multivariate_normal(keys[0], value_flat, covariance, shape=(num_samples,))
322
+ samples = jax.vmap(unflatten_fun)(samples_flat.block_until_ready())
323
+ posterior_samples = postprocess_fn()(samples)
238
324
 
239
- for i, (key, observation) in enumerate(self.observations.items()):
325
+ posterior_predictive = Predictive(bayesian_model, posterior_samples)(keys[1], observed=False)
326
+ prior = Predictive(bayesian_model, num_samples=num_samples)(keys[2], observed=False)
327
+ log_likelihood = numpyro.infer.log_likelihood(bayesian_model, posterior_samples)
240
328
 
241
- params = tree_map(lambda x: x[i], prior_params)
329
+ def sanitize_chain(chain):
330
+ return tree_map(lambda x: x[None, ...], chain)
242
331
 
243
- obs_model = build_numpyro_model(
244
- observation,
245
- self.model,
246
- self.background_model,
247
- name=key + '_'
248
- )
332
+ inference_data = az.from_dict(
333
+ sanitize_chain(posterior_samples),
334
+ prior=sanitize_chain(prior),
335
+ posterior_predictive=sanitize_chain(posterior_predictive),
336
+ log_likelihood=sanitize_chain(log_likelihood),
337
+ )
249
338
 
250
- obs_model(params, observed=observed)
339
+ inference_data = filter_inference_data(inference_data, self._observation_container, self.background_model)
251
340
 
252
- return model
253
- """
341
+ return FitResult(
342
+ self.model,
343
+ self._observation_container,
344
+ inference_data,
345
+ self.model.params,
346
+ background_model=self.background_model,
347
+ )
File without changes