reflectorch 1.3.0__py3-none-any.whl → 1.5.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of reflectorch might be problematic.

Files changed (96)
  1. reflectorch/__init__.py +17 -17
  2. reflectorch/data_generation/__init__.py +128 -126
  3. reflectorch/data_generation/dataset.py +210 -210
  4. reflectorch/data_generation/likelihoods.py +80 -80
  5. reflectorch/data_generation/noise.py +470 -470
  6. reflectorch/data_generation/priors/__init__.py +60 -60
  7. reflectorch/data_generation/priors/base.py +55 -55
  8. reflectorch/data_generation/priors/exp_subprior_sampler.py +298 -298
  9. reflectorch/data_generation/priors/independent_priors.py +195 -195
  10. reflectorch/data_generation/priors/multilayer_models.py +311 -311
  11. reflectorch/data_generation/priors/multilayer_structures.py +104 -104
  12. reflectorch/data_generation/priors/no_constraints.py +206 -206
  13. reflectorch/data_generation/priors/parametric_models.py +841 -841
  14. reflectorch/data_generation/priors/parametric_subpriors.py +369 -369
  15. reflectorch/data_generation/priors/params.py +252 -252
  16. reflectorch/data_generation/priors/sampler_strategies.py +369 -369
  17. reflectorch/data_generation/priors/scaler_mixin.py +65 -65
  18. reflectorch/data_generation/priors/subprior_sampler.py +371 -371
  19. reflectorch/data_generation/priors/utils.py +118 -118
  20. reflectorch/data_generation/process_data.py +41 -41
  21. reflectorch/data_generation/q_generator.py +280 -246
  22. reflectorch/data_generation/reflectivity/__init__.py +102 -102
  23. reflectorch/data_generation/reflectivity/abeles.py +97 -97
  24. reflectorch/data_generation/reflectivity/kinematical.py +70 -70
  25. reflectorch/data_generation/reflectivity/memory_eff.py +105 -105
  26. reflectorch/data_generation/reflectivity/numpy_implementations.py +120 -120
  27. reflectorch/data_generation/reflectivity/smearing.py +138 -138
  28. reflectorch/data_generation/reflectivity/smearing_pointwise.py +109 -109
  29. reflectorch/data_generation/scale_curves.py +112 -112
  30. reflectorch/data_generation/smearing.py +98 -98
  31. reflectorch/data_generation/utils.py +223 -222
  32. reflectorch/extensions/jupyter/__init__.py +11 -6
  33. reflectorch/extensions/jupyter/api.py +85 -0
  34. reflectorch/extensions/jupyter/callbacks.py +34 -34
  35. reflectorch/extensions/jupyter/components.py +758 -0
  36. reflectorch/extensions/jupyter/custom_select.py +268 -0
  37. reflectorch/extensions/jupyter/log_widget.py +241 -0
  38. reflectorch/extensions/jupyter/model_selection.py +495 -0
  39. reflectorch/extensions/jupyter/plotly_plot_manager.py +329 -0
  40. reflectorch/extensions/jupyter/widget.py +625 -0
  41. reflectorch/extensions/matplotlib/__init__.py +5 -5
  42. reflectorch/extensions/matplotlib/losses.py +32 -32
  43. reflectorch/extensions/refnx/refnx_conversion.py +76 -76
  44. reflectorch/inference/__init__.py +28 -24
  45. reflectorch/inference/inference_model.py +847 -851
  46. reflectorch/inference/input_interface.py +239 -0
  47. reflectorch/inference/loading_data.py +37 -0
  48. reflectorch/inference/multilayer_fitter.py +171 -171
  49. reflectorch/inference/multilayer_inference_model.py +193 -193
  50. reflectorch/inference/plotting.py +524 -98
  51. reflectorch/inference/preprocess_exp/__init__.py +6 -6
  52. reflectorch/inference/preprocess_exp/attenuation.py +36 -36
  53. reflectorch/inference/preprocess_exp/cut_with_q_ratio.py +31 -31
  54. reflectorch/inference/preprocess_exp/footprint.py +81 -81
  55. reflectorch/inference/preprocess_exp/interpolation.py +19 -16
  56. reflectorch/inference/preprocess_exp/normalize.py +21 -21
  57. reflectorch/inference/preprocess_exp/preprocess.py +121 -121
  58. reflectorch/inference/query_matcher.py +81 -81
  59. reflectorch/inference/record_time.py +43 -43
  60. reflectorch/inference/sampler_solution.py +56 -56
  61. reflectorch/inference/scipy_fitter.py +272 -248
  62. reflectorch/inference/torch_fitter.py +87 -87
  63. reflectorch/ml/__init__.py +32 -32
  64. reflectorch/ml/basic_trainer.py +292 -292
  65. reflectorch/ml/callbacks.py +80 -80
  66. reflectorch/ml/dataloaders.py +26 -26
  67. reflectorch/ml/loggers.py +55 -55
  68. reflectorch/ml/schedulers.py +355 -355
  69. reflectorch/ml/trainers.py +200 -191
  70. reflectorch/ml/utils.py +2 -2
  71. reflectorch/models/__init__.py +15 -14
  72. reflectorch/models/activations.py +50 -50
  73. reflectorch/models/encoders/__init__.py +19 -17
  74. reflectorch/models/encoders/conv_encoder.py +218 -218
  75. reflectorch/models/encoders/conv_res_net.py +115 -115
  76. reflectorch/models/encoders/fno.py +133 -133
  77. reflectorch/models/encoders/integral_kernel_embedding.py +390 -0
  78. reflectorch/models/networks/__init__.py +14 -14
  79. reflectorch/models/networks/mlp_networks.py +434 -428
  80. reflectorch/models/networks/residual_net.py +156 -156
  81. reflectorch/paths.py +29 -27
  82. reflectorch/runs/__init__.py +31 -31
  83. reflectorch/runs/config.py +25 -25
  84. reflectorch/runs/slurm_utils.py +93 -93
  85. reflectorch/runs/train.py +78 -78
  86. reflectorch/runs/utils.py +404 -401
  87. reflectorch/test_config.py +4 -4
  88. reflectorch/train.py +4 -4
  89. reflectorch/train_on_cluster.py +4 -4
  90. reflectorch/utils.py +98 -68
  91. {reflectorch-1.3.0.dist-info → reflectorch-1.5.0.dist-info}/METADATA +129 -125
  92. reflectorch-1.5.0.dist-info/RECORD +96 -0
  93. {reflectorch-1.3.0.dist-info → reflectorch-1.5.0.dist-info}/WHEEL +1 -1
  94. {reflectorch-1.3.0.dist-info → reflectorch-1.5.0.dist-info}/licenses/LICENSE.txt +20 -20
  95. reflectorch-1.3.0.dist-info/RECORD +0 -86
  96. {reflectorch-1.3.0.dist-info → reflectorch-1.5.0.dist-info}/top_level.txt +0 -0
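The bulk of the diff below is the rewrite of reflectorch/inference/inference_model.py: the 1.3.0 `EasyInferenceModel` class (and the older `InferenceModel` wrapper) is replaced in 1.5.0 by a single `InferenceModel` class that keeps the same constructor signature and adds a combined `preprocess_and_predict` entry point. As orientation, here is a hedged usage sketch assembled only from the constructor defaults and docstrings visible in the diff; the config name, q grid, reflectivity values, and prior bounds are illustrative placeholders, not values shipped with the package:

import numpy as np
from reflectorch.inference.inference_model import InferenceModel

# Constructor signature as shown in the diff below; per the docstring, configs
# and weights are fetched from the Huggingface repo if not found locally.
model = InferenceModel(
    config_name="some_config",                   # placeholder config name
    repo_id="valentinsingularity/reflectivity",  # default per the docstring
    device="cuda",
)

# Placeholder experimental data: q in inverse angstroms, one (min, max) prior
# bound per predicted parameter, per the preprocess_and_predict docstring.
q = np.linspace(0.02, 0.15, 128)
refl = np.exp(-q * 50)                           # synthetic stand-in curve
prior_bounds = [(0.0, 300.0), (0.0, 20.0), (0.0, 25.0)]  # placeholder ranges

result = model.preprocess_and_predict(
    reflectivity_curve=refl,
    q_values=q,
    prior_bounds=prior_bounds,
    polish_prediction=True,  # optional SciPy least-squares refinement
)
print(sorted(result))        # dict of predictions, per the docstring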
@@ -1,852 +1,848 @@
- import asyncio
- import logging
- from pathlib import Path
- import time
-
- import numpy as np
- import torch
- from torch import Tensor
- from typing import List, Tuple, Union
- import ipywidgets as widgets
- from IPython.display import display
- from huggingface_hub import hf_hub_download
-
- from reflectorch.data_generation.priors import Params, BasicParams, ExpUniformSubPriorSampler, UniformSubPriorParams
- from reflectorch.data_generation.priors.parametric_models import NuisanceParamsWrapper
- from reflectorch.data_generation.q_generator import ConstantQ, VariableQ
- from reflectorch.data_generation.utils import get_density_profiles, get_param_labels
- from reflectorch.inference.plotting import plot_prediction_results
- from reflectorch.inference.preprocess_exp.interpolation import interp_reflectivity
- from reflectorch.paths import CONFIG_DIR, ROOT_DIR, SAVED_MODELS_DIR
- from reflectorch.runs.utils import (
- get_trainer_by_name, train_from_config
- )
- from reflectorch.runs.config import load_config
- from reflectorch.ml.trainers import PointEstimatorTrainer
- from reflectorch.data_generation.likelihoods import LogLikelihood
-
- from reflectorch.inference.preprocess_exp import StandardPreprocessing
- from reflectorch.inference.scipy_fitter import standard_refl_fit, refl_fit, get_fit_with_growth
- from reflectorch.inference.sampler_solution import simple_sampler_solution, get_best_mse_param
- from reflectorch.inference.record_time import print_time
- from reflectorch.utils import to_t
-
- class EasyInferenceModel(object):
- """Facilitates the inference process using pretrained models
-
- Args:
- config_name (str, optional): the name of the configuration file used to initialize the model (either with or without the '.yaml' extension). Defaults to None.
- model_name (str, optional): the name of the file containing the weights of the model (either with or without the '.pt' extension), only required if different than: `'model_' + config_name + '.pt'`. Defaults to None
- root_dir (str, optional): path to root directory containing the 'configs' and 'saved_models' subdirectories, if different from the package root directory (ROOT_DIR). Defaults to None.
- weights_format (str, optional): format (extension) of the weights file, either 'pt' or 'safetensors'. Defaults to 'safetensors'.
- repo_id (str, optional): the id of the Huggingface repository from which the configuration files and model weights should be downloaded automatically if not found locally (in the 'configs' and 'saved_models' subdirectories of the root directory). Defaults to 'valentinsingularity/reflectivity'.
- trainer (PointEstimatorTrainer, optional): if provided, this trainer instance is used directly instead of being initialized from the configuration file. Defaults to None.
- device (str, optional): the Pytorch device ('cuda' or 'cpu'). Defaults to 'cuda'.
- """
- def __init__(self, config_name: str = None, model_name: str = None, root_dir:str = None, weights_format: str = 'safetensors',
- repo_id: str = 'valentinsingularity/reflectivity', trainer: PointEstimatorTrainer = None, device='cuda'):
- self.config_name = config_name
- self.model_name = model_name
- self.root_dir = root_dir
- self.weights_format = weights_format
- self.repo_id = repo_id
- self.trainer = trainer
- self.device = device
-
- if trainer is None and self.config_name is not None:
- self.load_model(self.config_name, self.model_name, self.root_dir)
-
- self.prediction_result = None
-
- def load_model(self, config_name: str, model_name: str, root_dir: str) -> None:
- """Loads a model for inference
-
- Args:
- config_name (str): the name of the configuration file used to initialize the model (either with or without the '.yaml' extension).
- model_name (str): the name of the file containing the weights of the model (either with or without the '.pt' or '.safetensors' extension), only required if different than: `'model_' + config_name + extension`.
- root_dir (str): path to root directory containing the 'configs' and 'saved_models' subdirectories, if different from the package root directory (ROOT_DIR).
- """
- if self.config_name == config_name and self.trainer is not None:
- return
-
- if not config_name.endswith('.yaml'):
- config_name_no_extension = config_name
- self.config_name = config_name_no_extension + '.yaml'
- else:
- config_name_no_extension = config_name[:-5]
- self.config_name = config_name
-
- self.config_dir = Path(root_dir) / 'configs' if root_dir else CONFIG_DIR
- weights_extension = '.' + self.weights_format
- self.model_name = model_name or 'model_' + config_name_no_extension + weights_extension
- if not self.model_name.endswith(weights_extension):
- self.model_name += weights_extension
- self.model_dir = Path(root_dir) / 'saved_models' if root_dir else SAVED_MODELS_DIR
-
- config_path = Path(self.config_dir) / self.config_name
- if config_path.exists():
- print(f"Configuration file `{config_path}` found locally.")
- else:
- print(f"Configuration file `{config_path}` not found locally.")
- if self.repo_id is None:
- raise ValueError("repo_id must be provided to download files from Huggingface.")
- print("Downloading from Huggingface...")
- hf_hub_download(repo_id=self.repo_id, subfolder='configs', filename=self.config_name, local_dir=config_path.parents[1])
-
- model_path = Path(self.model_dir) / self.model_name
- if model_path.exists():
- print(f"Weights file `{model_path}` found locally.")
- else:
- print(f"Weights file `{model_path}` not found locally.")
- if self.repo_id is None:
- raise ValueError("repo_id must be provided to download files from Huggingface.")
- print("Downloading from Huggingface...")
- hf_hub_download(repo_id=self.repo_id, subfolder='saved_models', filename=self.model_name, local_dir=model_path.parents[1])
-
- self.trainer = get_trainer_by_name(config_name=config_name, config_dir=self.config_dir, model_path=model_path, load_weights=True, inference_device = self.device)
- self.trainer.model.eval()
-
- param_model = self.trainer.loader.prior_sampler.param_model
- param_model_name = param_model.base_model.NAME if isinstance(param_model, NuisanceParamsWrapper) else param_model.NAME
- print(f'The model corresponds to a `{param_model_name}` parameterization with {self.trainer.loader.prior_sampler.max_num_layers} layers ({self.trainer.loader.prior_sampler.param_dim} predicted parameters)')
- print("Parameter types and total ranges:")
- for param, range_ in self.trainer.loader.prior_sampler.param_ranges.items():
- print(f"- {param}: {range_}")
- print("Allowed widths of the prior bound intervals (max-min):")
- for param, range_ in self.trainer.loader.prior_sampler.bound_width_ranges.items():
- print(f"- {param}: {range_}")
-
- if isinstance(self.trainer.loader.q_generator, ConstantQ):
- q_min = self.trainer.loader.q_generator.q[0].item()
- q_max = self.trainer.loader.q_generator.q[-1].item()
- n_q = self.trainer.loader.q_generator.q.shape[0]
- print(f'The model was trained on curves discretized at {n_q} uniform points between q_min={q_min} and q_max={q_max}')
- elif isinstance(self.trainer.loader.q_generator, VariableQ):
- q_min_range = self.trainer.loader.q_generator.q_min_range
- q_max_range = self.trainer.loader.q_generator.q_max_range
- n_q_range = self.trainer.loader.q_generator.n_q_range
- if n_q_range[0] == n_q_range[1]:
- n_q_fixed = n_q_range[0]
- print(f'The model was trained on curves discretized at exactly {n_q_fixed} uniform points, '
- f'between q_min in [{q_min_range[0]}, {q_min_range[1]}] and q_max in [{q_max_range[0]}, {q_max_range[1]}]')
- else:
- print(f'The model was trained on curves discretized at a number between {n_q_range[0]} and {n_q_range[1]} '
- f'of uniform points between q_min in [{q_min_range[0]}, {q_min_range[1]}] and q_max in [{q_max_range[0]}, {q_max_range[1]}]')
-
- if self.trainer.loader.smearing is not None:
- q_res_min = self.trainer.loader.smearing.sigma_min
- q_res_max = self.trainer.loader.smearing.sigma_max
- if self.trainer.loader.smearing.constant_dq == False:
- print(f"The model was trained with linear resolution smearing (dq/q) in the range [{q_res_min}, {q_res_max}]")
- elif self.trainer.loader.smearing.constant_dq == True:
- print(f"The model was trained with constant resolution smearing in the range [{q_res_min}, {q_res_max}]")
-
- additional_inputs = ["prior bounds"]
- if self.trainer.train_with_q_input:
- additional_inputs.append("q values")
- if self.trainer.condition_on_q_resolutions:
- additional_inputs.append("the resolution dq/q")
- if additional_inputs:
- inputs_str = ", ".join(additional_inputs)
- print(f"The following quantities are additional inputs to the network: {inputs_str}.")
-
- def predict(self,
- reflectivity_curve: Union[np.ndarray, Tensor],
- q_values: Union[np.ndarray, Tensor] = None,
- prior_bounds: Union[np.ndarray, List[Tuple]] = None,
- q_resolution: Union[float, np.ndarray] = None,
- ambient_sld: float = None,
- clip_prediction: bool = False,
- polish_prediction: bool = False,
- polishing_kwargs_reflectivity: dict = None,
- fit_growth: bool = False,
- max_d_change: float = 5.,
- use_q_shift: bool = False,
- calc_pred_curve: bool = True,
- calc_pred_sld_profile: bool = False,
- calc_polished_sld_profile: bool = False,
- ):
- """Predict the thin film parameters
-
- Args:
- reflectivity_curve (Union[np.ndarray, Tensor]): The reflectivity curve (which has been already preprocessed, normalized and interpolated).
- q_values (Union[np.ndarray, Tensor], optional): The momentum transfer (q) values for the reflectivity curve (in units of inverse angstroms).
- prior_bounds (Union[np.ndarray, List[Tuple]], optional): the prior bounds for the thin film parameters.
- q_resolution (Union[float, np.ndarray], optional): the instrumental resolution. Either as a float with meaning dq/q for linear smearing or as a numpy array with meaning dq for pointwise smearing.
- ambient_sld (float, optional): the SLD of the ambient medium (fronting), if different from air.
- clip_prediction (bool, optional): If ``True``, the values of the predicted parameters are clipped to not be outside the interval set by the prior bounds. Defaults to False.
- polish_prediction (bool, optional): If ``True``, the neural network predictions are further polished using a simple least mean squares (LMS) fit. Only for the standard box-model parameterization. Defaults to False.
- polishing_kwargs_reflectivity (dict): extra arguments for the reflectivity function used during polishing.
- fit_growth (bool, optional): If ``True``, an additional parameters is introduced during the LMS polishing to account for the change in the thickness of the upper layer during the in-situ measurement of the reflectivity curve (a linear growth is assumed). Defaults to False.
- max_d_change (float): The maximum possible change in the thickness of the upper layer during the in-situ measurement, relevant when polish_prediction and fit_growth are True. Defaults to 5.
- use_q_shift: If ``True``, the prediction is performed for a batch of slightly shifted versions of the input curve and the best result is returned, which is meant to mitigate the influence of imperfect sample alignment, as introduced in Greco et al. (only for models with fixed q-discretization). Defaults to False.
- calc_pred_curve (bool, optional): Whether to calculate the curve corresponding to the predicted parameters. Defaults to True.
- calc_pred_sld_profile (bool, optional): Whether to calculate the SLD profile corresponding to the predicted parameters. Defaults to False.
- calc_polished_sld_profile (bool, optional): Whether to calculate the SLD profile corresponding to the polished parameters. Defaults to False.
-
- Returns:
- dict: dictionary containing the predictions
- """
-
- scaled_curve = self._scale_curve(reflectivity_curve)
- prior_bounds = np.array(prior_bounds)
-
- if ambient_sld:
- n_layers = self.trainer.loader.prior_sampler.max_num_layers
- sld_indices = slice(2*n_layers+1, 3*n_layers+2)
- prior_bounds[sld_indices, ...] -= ambient_sld
- training_min_bounds = self.trainer.loader.prior_sampler.min_bounds.squeeze().cpu().numpy()
- training_max_bounds = self.trainer.loader.prior_sampler.max_bounds.squeeze().cpu().numpy()
- lower_bound_check = (prior_bounds[sld_indices, 0] >= training_min_bounds[sld_indices]).all()
- upper_bound_check = (prior_bounds[sld_indices, 1] <= training_max_bounds[sld_indices]).all()
- assert lower_bound_check and upper_bound_check, "Shifting the layer SLDs by the ambient SLD exceeded the training ranges."
-
- try:
- scaled_prior_bounds = self._scale_prior_bounds(prior_bounds)
- except ValueError as e:
- print(str(e))
- return None
-
- if not self.trainer.train_with_q_input:
- q_values = self.trainer.loader.q_generator.q
- else:
- q_values = torch.atleast_2d(to_t(q_values)).to(scaled_curve)
-
- if use_q_shift and not self.trainer.train_with_q_input:
- predicted_params = self._qshift_prediction(reflectivity_curve, scaled_prior_bounds, num = 1024, dq_coef = 1.)
-
- else:
- with torch.no_grad():
- self.trainer.model.eval()
-
- scaled_q_values = self.trainer.loader.q_generator.scale_q(q_values).to(torch.float32) if self.trainer.train_with_q_input else None
-
- if q_resolution is not None:
- q_resolution_tensor = torch.atleast_2d(torch.as_tensor(q_resolution)).to(scaled_curve)
- if isinstance(q_resolution, float):
- unscaled_q_resolutions = q_resolution_tensor
- else:
- unscaled_q_resolutions = (q_resolution_tensor / q_values).mean(dim=-1, keepdim=True)
- scaled_q_resolutions = self.trainer.loader.smearing.scale_resolutions(unscaled_q_resolutions) if self.trainer.condition_on_q_resolutions else None
- scaled_conditioning_params = scaled_q_resolutions
- if polishing_kwargs_reflectivity is None:
- polishing_kwargs_reflectivity = {'dq': q_resolution}
- else:
- q_resolution_tensor = None
- scaled_conditioning_params = None
-
- scaled_predicted_params = self.trainer.model(
- curves=scaled_curve,
- bounds=scaled_prior_bounds,
- q_values=scaled_q_values,
- conditioning_params = scaled_conditioning_params,
- )
-
- predicted_params = self.trainer.loader.prior_sampler.restore_params(torch.cat([scaled_predicted_params, scaled_prior_bounds], dim=-1))
-
- if clip_prediction:
- predicted_params = self.trainer.loader.prior_sampler.clamp_params(predicted_params)
-
- prediction_dict = {
- "predicted_params_object": predicted_params,
- "predicted_params_array": predicted_params.parameters.squeeze().cpu().numpy(),
- "param_names" : self.trainer.loader.prior_sampler.param_model.get_param_labels()
- }
-
- if calc_pred_curve:
- predicted_curve = predicted_params.reflectivity(q=q_values, dq=q_resolution_tensor).squeeze().cpu().numpy()
- prediction_dict[ "predicted_curve"] = predicted_curve
-
- ambient_sld_tensor = torch.atleast_2d(torch.as_tensor(ambient_sld)).to(predicted_params.thicknesses.device) if ambient_sld is not None else None
- if calc_pred_sld_profile:
- predicted_sld_xaxis, predicted_sld_profile, _ = get_density_profiles(
- predicted_params.thicknesses, predicted_params.roughnesses, predicted_params.slds, ambient_sld_tensor, num=1024,
- )
- prediction_dict['predicted_sld_profile'] = predicted_sld_profile.squeeze().cpu().numpy()
- prediction_dict['predicted_sld_xaxis'] = predicted_sld_xaxis.squeeze().cpu().numpy()
- else:
- predicted_sld_xaxis = None
-
- if polish_prediction:
- if ambient_sld_tensor:
- ambient_sld_tensor = ambient_sld_tensor.cpu()
- polished_dict = self._polish_prediction(q = q_values.squeeze().cpu().numpy(),
- curve = reflectivity_curve,
- predicted_params = predicted_params,
- priors = np.array(prior_bounds),
- fit_growth = fit_growth,
- max_d_change = max_d_change,
- calc_polished_curve = calc_pred_curve,
- calc_polished_sld_profile = calc_polished_sld_profile,
- ambient_sld_tensor=ambient_sld_tensor,
- sld_x_axis = predicted_sld_xaxis,
- polishing_kwargs_reflectivity=polishing_kwargs_reflectivity,
- )
- prediction_dict.update(polished_dict)
-
- if fit_growth and "polished_params_array" in prediction_dict:
- prediction_dict["param_names"].append("max_d_change")
-
- if ambient_sld: #Note: the SLD shift will only be reflected in predicted_params_array but not in predicted_params_object
- prediction_dict["predicted_params_array"][sld_indices] += ambient_sld
- if "polished_params_array" in prediction_dict:
- prediction_dict["polished_params_array"][sld_indices] += ambient_sld
-
- return prediction_dict
-
- def predict_using_widget(self, reflectivity_curve, **kwargs):
- """
- """
-
- NUM_INTERVALS = self.trainer.loader.prior_sampler.param_dim
- param_labels = self.trainer.loader.prior_sampler.param_model.get_param_labels()
- min_bounds = self.trainer.loader.prior_sampler.min_bounds.cpu().numpy().flatten()
- max_bounds = self.trainer.loader.prior_sampler.max_bounds.cpu().numpy().flatten()
- max_deltas = self.trainer.loader.prior_sampler.max_delta.cpu().numpy().flatten()
-
- print(f'Adjust the sliders for each parameter and press "Predict". Repeat as desired. Press "Close Widget" to finish.')
-
- interval_widgets = []
- for i in range(NUM_INTERVALS):
- label = widgets.Label(value=f'{param_labels[i]}')
- initial_max = min(max_bounds[i], min_bounds[i] + max_deltas[i])
- slider = widgets.FloatRangeSlider(
- value=[min_bounds[i], initial_max],
- min=min_bounds[i],
- max=max_bounds[i],
- step=0.01,
- layout=widgets.Layout(width='400px'),
- style={'description_width': '60px'}
- )
-
- def validate_range(change, slider=slider, max_width=max_deltas[i]):
- min_val, max_val = change['new']
- if max_val - min_val > max_width:
- old_min_val, old_max_val = change['old']
- if abs(old_min_val - min_val) > abs(old_max_val - max_val):
- max_val = min_val + max_width
- else:
- min_val = max_val - max_width
- slider.value = [min_val, max_val]
-
- slider.observe(validate_range, names='value')
- interval_widgets.append((slider, widgets.HBox([label, slider])))
-
- sliders_box = widgets.VBox([iw[1] for iw in interval_widgets])
-
- output = widgets.Output()
- predict_button = widgets.Button(description="Predict")
- close_button = widgets.Button(description="Close Widget")
-
- container = widgets.VBox([sliders_box, widgets.HBox([predict_button, close_button]), output])
- display(container)
-
- @output.capture(clear_output=True)
- def on_predict_click(_):
- if 'prior_bounds' in kwargs:
- array_values = kwargs.pop('prior_bounds')
- for i, (s, _) in enumerate(interval_widgets):
- s.value = tuple(array_values[i])
- else:
- values = [(s.value[0], s.value[1]) for s, _ in interval_widgets]
- array_values = np.array(values)
-
- prediction_result = self.predict(reflectivity_curve=reflectivity_curve,
- prior_bounds=array_values,
- **kwargs)
- param_names = self.trainer.loader.prior_sampler.param_model.get_param_labels()
- for param_name, pred_param_val in zip(param_names, prediction_result["predicted_params_array"]):
- print(f'{param_name.ljust(14)} : {pred_param_val:.2f}')
-
- plot_prediction_results(
- prediction_result,
- q_exp=kwargs['q_values'],
- curve_exp=reflectivity_curve,
- q_model=kwargs['q_values'],
- )
- self.prediction_result = prediction_result
-
- def on_close_click(_):
- container.close()
- print("Widget closed.")
-
- predict_button.on_click(on_predict_click)
- close_button.on_click(on_close_click)
-
-
- def _qshift_prediction(self, curve, scaled_bounds, num: int = 1000, dq_coef: float = 1.) -> BasicParams:
- assert isinstance(self.trainer.loader.q_generator, ConstantQ), "Prediction with q shifts available only for models with fixed discretization"
- q = self.trainer.loader.q_generator.q.squeeze().float()
- dq_max = (q[1] - q[0]) * dq_coef
- q_shifts = torch.linspace(-dq_max, dq_max, num).to(q)
-
- curve = to_t(curve).to(scaled_bounds)
- shifted_curves = _qshift_interp(q.squeeze(), curve, q_shifts)
-
- assert shifted_curves.shape == (num, q.shape[0])
-
- scaled_curves = self.trainer.loader.curves_scaler.scale(shifted_curves)
- scaled_prior_bounds = torch.atleast_2d(scaled_bounds).expand(scaled_curves.shape[0], -1)
-
- with torch.no_grad():
- self.trainer.model.eval()
- scaled_predicted_params = self.trainer.model(scaled_curves, scaled_prior_bounds)
- restored_params = self.trainer.loader.prior_sampler.restore_params(torch.cat([scaled_predicted_params, scaled_prior_bounds], dim=-1))
-
- best_param = get_best_mse_param(
- restored_params,
- self._get_likelihood(q=self.trainer.loader.q_generator.q, curve=curve),
- )
- return best_param
-
- def _polish_prediction(self,
- q: np.ndarray,
- curve: np.ndarray,
- predicted_params: BasicParams,
- priors: np.ndarray,
- sld_x_axis,
- ambient_sld_tensor: Tensor = None,
- fit_growth: bool = False,
- max_d_change: float = 5.,
- calc_polished_curve: bool = True,
- calc_polished_sld_profile: bool = False,
- polishing_kwargs_reflectivity: dict = None,
- ) -> dict:
- params = predicted_params.parameters.squeeze().cpu().numpy()
-
- polished_params_dict = {}
- polishing_kwargs_reflectivity = polishing_kwargs_reflectivity or {}
-
- try:
- if fit_growth:
- polished_params_arr, curve_polished = get_fit_with_growth(
- q = q,
- curve = curve,
- init_params = params,
- bounds = priors.T,
- max_d_change = max_d_change,
- )
- polished_params = BasicParams(
- torch.from_numpy(polished_params_arr[:-1][None]),
- torch.from_numpy(priors.T[0][None]),
- torch.from_numpy(priors.T[1][None]),
- self.trainer.loader.prior_sampler.max_num_layers,
- self.trainer.loader.prior_sampler.param_model
- )
- else:
- polished_params_arr, curve_polished = refl_fit(
- q = q,
- curve = curve,
- init_params = params,
- bounds=priors.T,
- prior_sampler=self.trainer.loader.prior_sampler,
- reflectivity_kwargs=polishing_kwargs_reflectivity,
- )
- polished_params = BasicParams(
- torch.from_numpy(polished_params_arr[None]),
- torch.from_numpy(priors.T[0][None]),
- torch.from_numpy(priors.T[1][None]),
- self.trainer.loader.prior_sampler.max_num_layers,
- self.trainer.loader.prior_sampler.param_model
- )
- except Exception as err:
- polished_params = predicted_params
- polished_params_arr = get_prediction_array(polished_params)
- curve_polished = np.zeros_like(q)
-
- polished_params_dict['polished_params_array'] = polished_params_arr
- if calc_polished_curve:
- polished_params_dict['polished_curve'] = curve_polished
-
- if calc_polished_sld_profile:
- _, sld_profile_polished, _ = get_density_profiles(
- polished_params.thicknesses, polished_params.roughnesses, polished_params.slds, ambient_sld_tensor, z_axis=sld_x_axis.cpu(),
- )
- polished_params_dict['sld_profile_polished'] = sld_profile_polished.squeeze().numpy()
-
- return polished_params_dict
-
- def _scale_curve(self, curve: Union[np.ndarray, Tensor]):
- if not isinstance(curve, Tensor):
- curve = torch.from_numpy(curve).float()
- curve = torch.atleast_2d(curve).to(self.device)
- scaled_curve = self.trainer.loader.curves_scaler.scale(curve)
- return scaled_curve
-
- def _scale_prior_bounds(self, prior_bounds: List[Tuple]):
- try:
- prior_bounds = torch.tensor(prior_bounds)
- prior_bounds = prior_bounds.to(self.device).T
- min_bounds, max_bounds = prior_bounds[:, None]
-
- scaled_bounds = torch.cat([
- self.trainer.loader.prior_sampler.scale_bounds(min_bounds),
- self.trainer.loader.prior_sampler.scale_bounds(max_bounds)
- ], -1)
-
- return scaled_bounds.float()
-
- except RuntimeError as e:
- expected_param_dim = self.trainer.loader.prior_sampler.param_dim
- actual_param_dim = prior_bounds.shape[1] if prior_bounds.ndim == 2 else len(prior_bounds)
-
- msg = (
- f"\n **Parameter dimension mismatch during inference!**\n"
- f"- Model expects **{expected_param_dim}** parameters.\n"
- f"- You provided **{actual_param_dim}** prior bounds.\n\n"
- f"💡This often occurs when:\n"
- f"- The model was trained with additional nuisance parameters like `r_scale`, `q_shift`, or `log10_background`,\n"
- f" but they were not included in the `prior_bounds` passed to `.predict()`.\n"
- f"- The number of layers or parameterization type differs from the one used during training.\n\n"
- f" Check the configuration or the summary of expected parameters."
- )
- raise ValueError(msg) from e
-
- def interpolate_data_to_model_q(self, q_exp, curve_exp):
- if isinstance(self.trainer.loader.q_generator, ConstantQ):
- q_model = self.trainer.loader.q_generator.q.cpu().numpy()
- elif isinstance(self.trainer.loader.q_generator, VariableQ):
- if self.trainer.loader.q_generator.n_q_range[0] == self.trainer.loader.q_generator.n_q_range[1]:
- n_q_model = self.trainer.loader.q_generator.n_q_range[0]
- q_model_min = max(q_exp.min(), self.trainer.loader.q_generator.q_min_range[0])
- q_model_max = min(q_exp.max(), self.trainer.loader.q_generator.q_max_range[1])
- q_model = np.linspace(q_model_min, q_model_max, n_q_model)
- else:
- q_model = q_exp
- exp_curve_interp = curve_exp
-
- exp_curve_interp = interp_reflectivity(q_model, q_exp, curve_exp)
-
- return q_model, exp_curve_interp
-
- def _get_likelihood(self, q, curve, rel_err: float = 0.1, abs_err: float = 1e-12):
- return LogLikelihood(
- q, curve, self.trainer.loader.prior_sampler, curve * rel_err + abs_err
- )
-
- class InferenceModel(object):
- def __init__(self, name: str = None, trainer: PointEstimatorTrainer = None, preprocessing_parameters: dict = None,
- num_sampling: int = 2 ** 13):
- self.log = logging.getLogger(__name__)
- self.model_name = name
- self.trainer = trainer
- self.q = None
- self.preprocessing = StandardPreprocessing(**(preprocessing_parameters or {}))
- self._sampling_num = num_sampling
-
- if trainer is None and self.model_name is not None:
- self.load_model(self.model_name)
- elif trainer is not None:
- self._set_trainer(trainer, preprocessing_parameters)
-
- ### API methods ###
-
- def load_model(self, name: str) -> None:
- self.log.debug(f"loading model {name}")
- if self.model_name == name and self.trainer is not None:
- return
- self.model_name = name
- self._set_trainer(get_trainer_by_name(name))
- self.log.info(f"Model {name} is loaded.")
-
- def train_model(self, name: str):
- self.model_name = name
- self.trainer = train_from_config(load_config(name))
-
- def set_preprocessing_parameters(self, **kwargs) -> None:
- self.preprocessing.set_parameters(**kwargs)
-
- def preprocess(self,
- intensity: np.ndarray,
- scattering_angle: np.ndarray,
- attenuation: np.ndarray,
- update_params: bool = False,
- **kwargs) -> dict:
- if update_params:
- self.preprocessing.set_parameters(**kwargs)
- preprocessed_dict = self.preprocessing(intensity, scattering_angle, attenuation, **kwargs)
- return preprocessed_dict
-
- def predict(self,
- intensity: np.ndarray,
- scattering_angle: np.ndarray,
- attenuation: np.ndarray,
- priors: np.ndarray,
- preprocessing_parameters: dict = None,
- polish: bool = True,
- use_sampler: bool = False,
- use_q_shift: bool = True,
- max_d_change: float = 5.,
- fit_growth: bool = True,
- ) -> dict:
-
- with print_time("everything"):
- with print_time("preprocess"):
- preprocessed_dict = self.preprocess(
- intensity, scattering_angle, attenuation, **(preprocessing_parameters or {})
- )
-
- preprocessed_curve = preprocessed_dict["curve_interp"]
- raw_curve, raw_q = preprocessed_dict["curve"], preprocessed_dict["q_values"]
- q_ratio = preprocessed_dict["q_ratio"]
-
- with print_time("predict_from_preprocessed_curve"):
- preprocessed_dict.update(self.predict_from_preprocessed_curve(
- preprocessed_curve, priors, raw_curve=raw_curve, raw_q=raw_q, polish=polish, q_ratio=q_ratio,
- use_sampler=use_sampler, use_q_shift=use_q_shift, max_d_change=max_d_change,
- fit_growth=fit_growth,
- ))
-
- return preprocessed_dict
-
- def predict_from_preprocessed_curve(self,
- curve: np.ndarray,
- priors: np.ndarray, *,
- polish: bool = True,
- raw_curve: np.ndarray = None,
- raw_q: np.ndarray = None,
- clip_prediction: bool = True,
- q_ratio: float = 1.,
- use_sampler: bool = False,
- use_q_shift: bool = True,
- max_d_change: float = 5.,
- fit_growth: bool = True,
- ) -> dict:
-
- scaled_curve = self._scale_curve(curve)
- scaled_bounds, min_bounds, max_bounds = self._scale_priors(priors, q_ratio)
-
- if not use_q_shift:
- predicted_params: UniformSubPriorParams = self._simple_prediction(scaled_curve, scaled_bounds)
- else:
- predicted_params: UniformSubPriorParams = self._qshift_prediction(curve, scaled_bounds)
-
- if use_sampler:
- predicted_params: UniformSubPriorParams = self._sampler_solution(
- curve, predicted_params,
- )
-
- if clip_prediction:
- predicted_params = self._prior_sampler.clamp_params(predicted_params)
-
- if raw_curve is None:
- raw_curve = curve
- if raw_q is None:
- raw_q = self.q.squeeze().cpu().numpy()
- raw_q_t = self.q
- else:
- raw_q_t = torch.from_numpy(raw_q).to(self.q)
-
- if q_ratio != 1.:
- predicted_params.scale_with_q(q_ratio)
- raw_q = raw_q * q_ratio
- raw_q_t = raw_q_t * q_ratio
-
- prediction_dict = {
- "params": get_prediction_array(predicted_params),
- "param_names": get_param_labels(
- predicted_params.max_layer_num,
- thickness_name='d',
- roughness_name='sigma',
- sld_name='rho',
- ),
- "curve_predicted": predicted_params.reflectivity(raw_q_t).squeeze().cpu().numpy()
- }
-
- sld_x_axis, sld_profile, _ = get_density_profiles(
- predicted_params.thicknesses, predicted_params.roughnesses, predicted_params.slds, num=1024,
- )
-
- prediction_dict['sld_profile'] = sld_profile.squeeze().cpu().numpy()
- prediction_dict['sld_x_axis'] = sld_x_axis.squeeze().cpu().numpy()
-
- if polish:
- prediction_dict.update(self._polish_prediction(
- raw_q, raw_curve, predicted_params, priors, sld_x_axis,
- max_d_change=max_d_change, fit_growth=fit_growth,
- ))
-
- if fit_growth and "params_polished" in prediction_dict:
- prediction_dict["param_names"].append("max_d_change")
-
- return prediction_dict
-
- ### some shortcut methods for data processing ###
-
- def _simple_prediction(self, scaled_curve, scaled_bounds) -> UniformSubPriorParams:
- context = torch.cat([scaled_curve, scaled_bounds], -1)
-
- with torch.no_grad():
- self.trainer.model.eval()
- scaled_params = self.trainer.model(context)
-
- predicted_params: UniformSubPriorParams = self._restore_predicted_params(scaled_params, context)
- return predicted_params
-
- @print_time
- def _qshift_prediction(self, curve, scaled_bounds, num: int = 1000, dq_coef: float = 1.) -> UniformSubPriorParams:
- q = self.q.squeeze().float()
- curve = to_t(curve).to(q)
- dq_max = (q[1] - q[0]) * dq_coef
- q_shifts = torch.linspace(-dq_max, dq_max, num).to(q)
- shifted_curves = _qshift_interp(q.squeeze(), curve, q_shifts)
-
- assert shifted_curves.shape == (num, q.shape[0])
-
- scaled_curves = self.trainer.loader.curves_scaler.scale(shifted_curves)
- context = torch.cat([scaled_curves, torch.atleast_2d(scaled_bounds).expand(scaled_curves.shape[0], -1)], -1)
-
- with torch.no_grad():
- self.trainer.model.eval()
- scaled_params = self.trainer.model(context)
- restored_params = self._restore_predicted_params(scaled_params, context)
-
- best_param = get_best_mse_param(
- restored_params,
- self._get_likelihood(curve),
- )
- return best_param
-
- @print_time
- def _polish_prediction(self,
- q: np.ndarray,
- curve: np.ndarray,
- predicted_params: Params,
- priors: np.ndarray,
- sld_x_axis,
- fit_growth: bool = True,
- max_d_change: float = 5.,
- ) -> dict:
- params = torch.cat([
- predicted_params.thicknesses.squeeze(),
- predicted_params.roughnesses.squeeze(),
- predicted_params.slds.squeeze()
- ]).cpu().numpy()
-
- polished_params_dict = {}
-
- try:
- if fit_growth:
- polished_params_arr, curve_polished = get_fit_with_growth(
- q, curve, params, bounds=priors.T,
- max_d_change=max_d_change,
- )
- polished_params = Params.from_tensor(torch.from_numpy(polished_params_arr[:-1][None]).to(self.q))
- else:
- polished_params_arr, curve_polished = standard_refl_fit(q, curve, params, bounds=priors.T)
- polished_params = Params.from_tensor(torch.from_numpy(polished_params_arr[None]).to(self.q))
- except Exception as err:
- self.log.exception(err)
- polished_params = predicted_params
- polished_params_arr = get_prediction_array(polished_params)
- curve_polished = np.zeros_like(q)
-
- polished_params_dict['params_polished'] = polished_params_arr
- polished_params_dict['curve_polished'] = curve_polished
-
- sld_x_axis_polished, sld_profile_polished, _ = get_density_profiles(
- polished_params.thicknesses, polished_params.roughnesses, polished_params.slds, z_axis=sld_x_axis,
- )
-
- polished_params_dict['sld_profile_polished'] = sld_profile_polished.squeeze().cpu().numpy()
-
- return polished_params_dict
-
- def _restore_predicted_params(self, scaled_params: Tensor, context: Tensor) -> UniformSubPriorParams:
- predicted_params: UniformSubPriorParams = self.trainer.loader.prior_sampler.restore_params(
- self.trainer.loader.prior_sampler.PARAM_CLS.restore_params_from_context(scaled_params, context)
- )
- return predicted_params
-
- def _input2context(self, curve: np.ndarray, priors: np.ndarray, q_ratio: float = 1.):
- scaled_curve = self._scale_curve(curve)
- scaled_bounds, min_bounds, max_bounds = self._scale_priors(priors, q_ratio)
- scaled_input = torch.cat([scaled_curve, scaled_bounds], -1)
- return scaled_input, min_bounds, max_bounds
-
- def _scale_curve(self, curve: np.ndarray or Tensor):
- if not isinstance(curve, Tensor):
- curve = torch.from_numpy(curve).float()
- curve = torch.atleast_2d(curve).to(self.q)
- scaled_curve = self.trainer.loader.curves_scaler.scale(curve)
- return scaled_curve.float()
-
- def _scale_priors(self, priors: np.ndarray or Tensor, q_ratio: float = 1.):
- if not isinstance(priors, Tensor):
- priors = torch.from_numpy(priors)
-
- priors = priors.float().clone()
-
- priors = priors.to(self.q).T
- priors = self._prior_sampler.scale_bounds_with_q(priors, 1 / q_ratio)
- priors = self._prior_sampler.clamp_bounds(priors)
-
- min_bounds, max_bounds = priors[:, None].to(self.q)
- prior_sampler = self._prior_sampler
- scaled_bounds = torch.cat([
- prior_sampler.scale_bounds(min_bounds), prior_sampler.scale_bounds(max_bounds)
- ], -1)
- return scaled_bounds.float(), min_bounds, max_bounds
-
- @property
- def _prior_sampler(self) -> ExpUniformSubPriorSampler:
- return self.trainer.loader.prior_sampler
-
- def _set_trainer(self, trainer, preprocessing_parameters: dict = None):
- self.trainer = trainer
- self.trainer.model.eval()
- self._update_preprocessing(preprocessing_parameters)
-
- def _update_preprocessing(self, preprocessing_parameters: dict = None):
- self.log.debug(f"setting preprocessing_parameters {preprocessing_parameters}.")
- self.q = self.trainer.loader.q_generator.q
- self.preprocessing = StandardPreprocessing(
- self.q.cpu().squeeze().numpy(),
- **(preprocessing_parameters or {})
- )
- self.log.info(f"preprocessing params are set: {preprocessing_parameters}.")
-
- @print_time
- def _sampler_solution(
- self,
- curve: Tensor or np.ndarray,
- predicted_params: UniformSubPriorParams,
- ) -> UniformSubPriorParams:
-
- if not isinstance(curve, Tensor):
- curve = torch.from_numpy(curve).float()
- curve = curve.to(self.q)
-
- refined_params = simple_sampler_solution(
- self._get_likelihood(curve),
- predicted_params,
- self._prior_sampler.min_bounds,
- self._prior_sampler.max_bounds,
- num=self._sampling_num, coef=0.1,
- )
-
- return refined_params
-
- def _get_likelihood(self, curve, rel_err: float = 0.1, abs_err: float = 1e-12):
- return LogLikelihood(
- self.q, curve, self._prior_sampler, curve * rel_err + abs_err
- )
-
-
- def get_prediction_array(params: BasicParams) -> np.ndarray:
- predict_arr = torch.cat([
- params.thicknesses.squeeze(),
- params.roughnesses.squeeze(),
- params.slds.squeeze(),
- ]).cpu().numpy()
-
- return predict_arr
-
-
- def _qshift_interp(q, r, q_shifts):
- qs = q[None] + q_shifts[:, None]
- eps = torch.finfo(r.dtype).eps
- ind = torch.searchsorted(q[None].expand_as(qs).contiguous(), qs.contiguous())
- ind = torch.clamp(ind - 1, 0, q.shape[0] - 2)
- slopes = (r[1:] - r[:-1]) / (eps + (q[1:] - q[:-1]))
1
+ from pathlib import Path
2
+
3
+ import numpy as np
4
+ import torch
5
+ from torch import Tensor
6
+ from typing import List, Tuple, Union
7
+ from huggingface_hub import hf_hub_download
8
+
9
+ from reflectorch.data_generation.priors import BasicParams
10
+ from reflectorch.data_generation.priors.parametric_models import NuisanceParamsWrapper
11
+ from reflectorch.data_generation.q_generator import ConstantQ, VariableQ, MaskedVariableQ
12
+ from reflectorch.data_generation.utils import get_density_profiles
13
+ from reflectorch.inference.preprocess_exp.interpolation import interp_reflectivity
14
+ from reflectorch.paths import CONFIG_DIR, SAVED_MODELS_DIR
15
+ from reflectorch.runs.utils import (
16
+ get_trainer_by_name
17
+ )
18
+ from reflectorch.ml.trainers import PointEstimatorTrainer
19
+ from reflectorch.data_generation.likelihoods import LogLikelihood
20
+
21
+ from reflectorch.inference.scipy_fitter import refl_fit, get_fit_with_growth
22
+ from reflectorch.inference.sampler_solution import get_best_mse_param
23
+ from reflectorch.utils import get_filtering_mask, to_t
24
+
25
+ from huggingface_hub.utils import disable_progress_bars
26
+
27
+ # that causes some Rust related errors when downloading models from Huggingface
28
+ disable_progress_bars()
29
+
30
+
31
+ class InferenceModel(object):
32
+ """Facilitates the inference process using pretrained models
33
+
34
+ Args:
35
+ config_name (str, optional): the name of the configuration file used to initialize the model (either with or without the '.yaml' extension). Defaults to None.
36
+ model_name (str, optional): the name of the file containing the weights of the model (either with or without the '.pt' extension), only required if different than: `'model_' + config_name + '.pt'`. Defaults to None
37
+ root_dir (str, optional): path to root directory containing the 'configs' and 'saved_models' subdirectories, if different from the package root directory (ROOT_DIR). Defaults to None.
38
+ weights_format (str, optional): format (extension) of the weights file, either 'pt' or 'safetensors'. Defaults to 'safetensors'.
39
+ repo_id (str, optional): the id of the Huggingface repository from which the configuration files and model weights should be downloaded automatically if not found locally (in the 'configs' and 'saved_models' subdirectories of the root directory). Defaults to 'valentinsingularity/reflectivity'.
40
+ trainer (PointEstimatorTrainer, optional): if provided, this trainer instance is used directly instead of being initialized from the configuration file. Defaults to None.
41
+ device (str, optional): the Pytorch device ('cuda' or 'cpu'). Defaults to 'cuda'.
42
+ """
43
+ def __init__(self, config_name: str = None, model_name: str = None, root_dir:str = None, weights_format: str = 'safetensors',
44
+ repo_id: str = 'valentinsingularity/reflectivity', trainer: PointEstimatorTrainer = None, device='cuda'):
45
+ self.config_name = config_name
46
+ self.model_name = model_name
47
+ self.root_dir = root_dir
48
+ self.weights_format = weights_format
49
+ self.repo_id = repo_id
50
+ self.trainer = trainer
51
+ self.device = device
52
+
53
+ if trainer is None and self.config_name is not None:
54
+ self.load_model(self.config_name, self.model_name, self.root_dir)
55
+
56
+ self.prediction_result = None
57
+
58
+ def load_model(self, config_name: str, model_name: str, root_dir: str) -> None:
59
+ """Loads a model for inference
60
+
61
+ Args:
62
+ config_name (str): the name of the configuration file used to initialize the model (either with or without the '.yaml' extension).
63
+ model_name (str): the name of the file containing the weights of the model (either with or without the '.pt' or '.safetensors' extension), only required if different than: `'model_' + config_name + extension`.
64
+ root_dir (str): path to root directory containing the 'configs' and 'saved_models' subdirectories, if different from the package root directory (ROOT_DIR).
65
+ """
66
+ if self.config_name == config_name and self.trainer is not None:
67
+ return
68
+
69
+ if not config_name.endswith('.yaml'):
70
+ config_name_no_extension = config_name
71
+ self.config_name = config_name_no_extension + '.yaml'
72
+ else:
73
+ config_name_no_extension = config_name[:-5]
74
+ self.config_name = config_name
75
+
76
+ self.config_dir = Path(root_dir) / 'configs' if root_dir else CONFIG_DIR
77
+ weights_extension = '.' + self.weights_format
78
+ self.model_name = model_name or 'model_' + config_name_no_extension + weights_extension
79
+ if not self.model_name.endswith(weights_extension):
80
+ self.model_name += weights_extension
81
+ self.model_dir = Path(root_dir) / 'saved_models' if root_dir else SAVED_MODELS_DIR
82
+
83
+ def _download_with_fallback(filename: str, local_target_dir: Path, legacy_subfolder: str):
84
+ """Try to download from repo root (new layout). If not found, retry with legacy `subfolder=legacy_subfolder`. Place result under local_target_dir using `local_dir`.
85
+ """
86
+ try: # new layout: files at repo root (same level as README.md)
87
+ hf_hub_download(repo_id=self.repo_id + '/' + config_name, filename=filename, local_dir=str(local_target_dir))
88
+ except Exception : # legacy layout fallback: e.g. subfolder='configs' or 'saved_models'
89
+ hf_hub_download(repo_id=self.repo_id, filename=filename, subfolder=legacy_subfolder, local_dir=str(local_target_dir.parent))
90
+
91
+ config_path = Path(self.config_dir) / self.config_name
92
+ if config_path.exists():
93
+ print(f"Configuration file `{config_path}` found locally.")
94
+ else:
95
+ print(f"Configuration file `{config_path}` not found locally.")
96
+ if self.repo_id is None:
97
+ raise ValueError("repo_id must be provided to download files from Huggingface.")
98
+ print("Downloading from Huggingface...")
99
+ _download_with_fallback(self.config_name, self.config_dir, legacy_subfolder='configs')
100
+
101
+ model_path = Path(self.model_dir) / self.model_name
102
+ if model_path.exists():
103
+ print(f"Weights file `{model_path}` found locally.")
104
+ else:
105
+ print(f"Weights file `{model_path}` not found locally.")
106
+ if self.repo_id is None:
107
+ raise ValueError("repo_id must be provided to download files from Huggingface.")
108
+ print("Downloading from Huggingface...")
109
+ _download_with_fallback(self.model_name, self.model_dir, legacy_subfolder='saved_models')
110
+
111
+ self.trainer = get_trainer_by_name(config_name=config_name, config_dir=self.config_dir, model_path=model_path, load_weights=True, inference_device = self.device)
112
+ self.trainer.model.eval()
113
+
114
+ param_model = self.trainer.loader.prior_sampler.param_model
115
+ param_model_name = param_model.base_model.NAME if isinstance(param_model, NuisanceParamsWrapper) else param_model.NAME
116
+ print(f'The model corresponds to a `{param_model_name}` parameterization with {self.trainer.loader.prior_sampler.max_num_layers} layers ({self.trainer.loader.prior_sampler.param_dim} predicted parameters)')
117
+ print("Parameter types and total ranges:")
118
+ for param, range_ in self.trainer.loader.prior_sampler.param_ranges.items():
119
+ print(f"- {param}: {range_}")
120
+ print("Allowed widths of the prior bound intervals (max-min):")
121
+ for param, range_ in self.trainer.loader.prior_sampler.bound_width_ranges.items():
122
+ print(f"- {param}: {range_}")
123
+
124
+ if isinstance(self.trainer.loader.q_generator, ConstantQ):
125
+ q_min = self.trainer.loader.q_generator.q[0].item()
126
+ q_max = self.trainer.loader.q_generator.q[-1].item()
127
+ n_q = self.trainer.loader.q_generator.q.shape[0]
128
+ print(f'The model was trained on curves discretized at {n_q} uniform points between q_min={q_min} and q_max={q_max}')
129
+ elif isinstance(self.trainer.loader.q_generator, VariableQ):
130
+ q_min_range = self.trainer.loader.q_generator.q_min_range
131
+ q_max_range = self.trainer.loader.q_generator.q_max_range
132
+ n_q_range = self.trainer.loader.q_generator.n_q_range
133
+ if n_q_range[0] == n_q_range[1]:
134
+ n_q_fixed = n_q_range[0]
135
+ print(f'The model was trained on curves discretized at exactly {n_q_fixed} uniform points, '
136
+ f'between q_min in [{q_min_range[0]}, {q_min_range[1]}] and q_max in [{q_max_range[0]}, {q_max_range[1]}]')
137
+ else:
138
+ print(f'The model was trained on curves discretized at a number between {n_q_range[0]} and {n_q_range[1]} '
139
+ f'of uniform points between q_min in [{q_min_range[0]}, {q_min_range[1]}] and q_max in [{q_max_range[0]}, {q_max_range[1]}]')
140
+
141
+ if self.trainer.loader.smearing is not None:
142
+ q_res_min = self.trainer.loader.smearing.sigma_min
143
+ q_res_max = self.trainer.loader.smearing.sigma_max
144
+ if self.trainer.loader.smearing.constant_dq == False:
145
+ print(f"The model was trained with linear resolution smearing (dq/q) in the range [{q_res_min}, {q_res_max}]")
146
+ elif self.trainer.loader.smearing.constant_dq == True:
147
+ print(f"The model was trained with constant resolution smearing in the range [{q_res_min}, {q_res_max}]")
148
+
149
+ additional_inputs = ["prior bounds"]
150
+ if self.trainer.train_with_q_input:
151
+ additional_inputs.append("q values")
152
+ if self.trainer.condition_on_q_resolutions:
153
+ additional_inputs.append("the resolution dq/q")
154
+ if additional_inputs:
155
+ inputs_str = ", ".join(additional_inputs)
156
+ print(f"The following quantities are additional inputs to the network: {inputs_str}.")
157
+
158
+ def preprocess_and_predict(self,
159
+ reflectivity_curve: np.ndarray,
160
+ q_values: np.ndarray = None,
161
+ prior_bounds: Union[np.ndarray, List[Tuple]] = None,
162
+ sigmas: np.ndarray = None,
163
+ q_resolution: Union[float, np.ndarray] = None,
164
+ ambient_sld: float = None,
165
+ clip_prediction: bool = True,
166
+ polish_prediction: bool = False,
167
+ polishing_method: str = 'trf',
168
+ polishing_kwargs_reflectivity: dict = None,
169
+ use_sigmas_for_polishing: bool = False,
170
+ polishing_max_steps: int = None,
171
+ fit_growth: bool = False,
172
+ max_d_change: float = 5.,
173
+ calc_pred_curve: bool = True,
174
+ calc_pred_sld_profile: bool = False,
175
+ calc_polished_sld_profile: bool = False,
176
+ sld_profile_padding_left: float = 0.2,
177
+ sld_profile_padding_right: float = 1.1,
178
+ kwargs_param_labels: dict = {},
179
+
180
+ truncate_index_left: int = None,
181
+ truncate_index_right: int = None,
182
+ enable_error_bars_filtering: bool = True,
183
+ filter_threshold=0.3,
184
+ filter_remove_singles=True,
185
+ filter_remove_consecutives=True,
186
+ filter_consecutive=3,
187
+ filter_q_start_trunc=0.1,
188
+ ):
+ """Preprocess experimental data (clean, truncate, filter, interpolate) and run prediction. This wrapper prepares inputs according to the model's Q generator, calls `predict(...)` on the interpolated/padded data, and (optionally) performs a polishing step on the original (pre-interpolation) data.
+
+ Args:
+ reflectivity_curve (Union[np.ndarray, Tensor]): 1D array of experimental reflectivity values.
+ q_values (Union[np.ndarray, Tensor]): 1D array of momentum transfer values for the reflectivity curve (in units of inverse angstroms).
+ prior_bounds (Union[np.ndarray, List[Tuple]]): Prior bounds for all parameters, shape ``(num_params, 2)`` as ``[(min, max), …]``.
+ sigmas (Union[np.ndarray, Tensor], optional): 1D array of experimental uncertainties (same length as `reflectivity_curve`). Used for error-bar filtering (if enabled) and for polishing (if requested).
+ q_resolution (Union[float, np.ndarray], optional): The q resolution for neutron reflectometry models. Can be either a float (dq/q) for linear resolution smearing (e.g. 0.05 meaning 5% resolution smearing) or an array of dq values for pointwise resolution smearing.
+ ambient_sld (float, optional): The SLD of the fronting (i.e. ambient) medium, for structures whose fronting medium is not air.
+ clip_prediction (bool, optional): If ``True``, the values of the predicted parameters are clipped so they do not fall outside the interval set by the prior bounds. Defaults to True.
+ polish_prediction (bool, optional): If ``True``, the neural network predictions are further polished using a least-squares fit. Defaults to False.
+ polishing_method (str): {'trf', 'dogbox', 'lm'} SciPy least-squares method used for polishing.
+ polishing_kwargs_reflectivity (dict, optional): Extra keyword arguments forwarded to the reflectivity computation during polishing.
+ use_sigmas_for_polishing (bool): If ``True``, weigh residuals by `sigmas` during polishing.
+ polishing_max_steps (int, optional): Maximum number of function evaluations for the SciPy optimizer.
+ fit_growth (bool, optional): (Deprecated) If ``True``, an additional parameter is introduced during the polishing to account for the change in the thickness of the upper layer during the in-situ measurement of the reflectivity curve (a linear growth is assumed). Defaults to False.
+ max_d_change (float): The maximum possible change in the thickness of the upper layer during the in-situ measurement, relevant when polish_prediction and fit_growth are True. Defaults to 5.
+ calc_pred_curve (bool, optional): Whether to calculate the curve corresponding to the predicted parameters. Defaults to True.
+ calc_pred_sld_profile (bool, optional): Whether to calculate the SLD profile corresponding to the predicted parameters. Defaults to False.
+ calc_polished_sld_profile (bool, optional): Whether to calculate the SLD profile corresponding to the polished parameters. Defaults to False.
+ sld_profile_padding_left (float, optional): Controls the amount of padding applied to the left side of the computed SLD profiles.
+ sld_profile_padding_right (float, optional): Controls the amount of padding applied to the right side of the computed SLD profiles.
+ kwargs_param_labels (dict, optional): Keyword arguments forwarded to ``get_param_labels``.
+ truncate_index_left (int, optional): Left index for truncating the input data; the data provided to the neural network is sliced to [truncate_index_left, truncate_index_right].
+ truncate_index_right (int, optional): Right index for truncating the input data (see ``truncate_index_left``).
+ enable_error_bars_filtering (bool, optional): If ``True``, data points with high error bars (above a threshold) are removed before constructing the input to the neural network (they are still used in the polishing step). Defaults to True.
+ filter_threshold (float, optional): The relative threshold (dR/R) for error-bar filtering. Defaults to 0.3.
+ filter_remove_singles (bool, optional): If ``True``, all isolated points exceeding the filtering threshold are eliminated. Defaults to True.
+ filter_remove_consecutives (bool, optional): If ``True``, when ``filter_consecutive`` consecutive points exceeding the filtering threshold are detected at a q position higher than ``filter_q_start_trunc``, all subsequent points in the curve are eliminated. Defaults to True.
+ filter_consecutive (int, optional): Number of consecutive above-threshold points that triggers the truncation described above. Defaults to 3.
+ filter_q_start_trunc (float, optional): The q value above which the consecutive-point truncation is applied. Defaults to 0.1.
+
+ Returns:
+ dict: dictionary containing the predictions
+ """
+
+ ## Preprocess the data for inference (remove negative intensities, truncate, filter out points with high error bars)
+ (q_values, reflectivity_curve, sigmas, q_resolution,
+ q_values_original, reflectivity_curve_original, sigmas_original, q_resolution_original) = self._preprocess_input_data(
+ reflectivity_curve=reflectivity_curve,
+ q_values=q_values,
+ sigmas=sigmas,
+ q_resolution=q_resolution,
+ truncate_index_left=truncate_index_left,
+ truncate_index_right=truncate_index_right,
+ enable_error_bars_filtering=enable_error_bars_filtering,
+ filter_threshold=filter_threshold,
+ filter_remove_singles=filter_remove_singles,
+ filter_remove_consecutives=filter_remove_consecutives,
+ filter_consecutive=filter_consecutive,
+ filter_q_start_trunc=filter_q_start_trunc,
+ )
+
+ ### Interpolate the experimental data if needed by the embedding network
+ interp_data = self.interpolate_data_to_model_q(
+ q_exp=q_values,
+ refl_exp=reflectivity_curve,
+ sigmas_exp=sigmas,
+ q_res_exp=q_resolution,
+ as_dict=True
+ )
+
+ q_model = interp_data["q_model"]
+ reflectivity_curve_interp = interp_data["reflectivity"]
+ sigmas_interp = interp_data.get("sigmas")
+ q_resolution_interp = interp_data.get("q_resolution")
+ key_padding_mask = interp_data.get("key_padding_mask")
+
+ ### Make the prediction
+ prediction_dict = self.predict(
+ reflectivity_curve=reflectivity_curve_interp,
+ q_values=q_model,
+ sigmas=sigmas_interp,
+ q_resolution=q_resolution_interp,
+ key_padding_mask=key_padding_mask,
+ prior_bounds=prior_bounds,
+ ambient_sld=ambient_sld,
+ clip_prediction=clip_prediction,
+ polish_prediction=False,  ### do the polishing outside the predict method, on the full data
+ supress_sld_amb_back_shift=True,  ### do not shift the slds back by the ambient yet
+ calc_pred_curve=calc_pred_curve,
+ calc_pred_sld_profile=calc_pred_sld_profile,
+ sld_profile_padding_left=sld_profile_padding_left,
+ sld_profile_padding_right=sld_profile_padding_right,
+ kwargs_param_labels=kwargs_param_labels,
+ )
+
+ ### Save interpolated data
+ prediction_dict['q_model'] = q_model
+ prediction_dict['reflectivity_curve_interp'] = reflectivity_curve_interp
+ if q_resolution_interp is not None:
+ prediction_dict['q_resolution_interp'] = q_resolution_interp
+ if sigmas_interp is not None:
+ prediction_dict['sigmas_interp'] = sigmas_interp
+ if key_padding_mask is not None:
+ prediction_dict['key_padding_mask'] = key_padding_mask
+
+ ### Shift the slds for nonzero ambient
+ prior_bounds = np.array(prior_bounds)
+ if ambient_sld:
+ sld_indices = self._shift_slds_by_ambient(prior_bounds, ambient_sld)
+
+ ### Perform polishing on the original data
+ if polish_prediction:
+ polishing_kwargs = polishing_kwargs_reflectivity or {}
+ polishing_kwargs.setdefault('dq', q_resolution_original)
+
+ polished_dict = self._polish_prediction(
+ q=q_values_original,
+ curve=reflectivity_curve_original,
+ predicted_params=prediction_dict['predicted_params_object'],
+ priors=prior_bounds,
+ ambient_sld_tensor=torch.atleast_2d(torch.as_tensor(ambient_sld)) if ambient_sld is not None else None,
+ calc_polished_sld_profile=calc_polished_sld_profile,
+ sld_x_axis=torch.from_numpy(prediction_dict['predicted_sld_xaxis']),
+ polishing_kwargs_reflectivity=polishing_kwargs,
+ error_bars=sigmas_original if use_sigmas_for_polishing else None,
+ polishing_method=polishing_method,
+ polishing_max_steps=polishing_max_steps,
+ fit_growth=fit_growth,
+ max_d_change=max_d_change,
+ )
+
+ prediction_dict.update(polished_dict)
+ if fit_growth and "polished_params_array" in prediction_dict:
+ prediction_dict["param_names"].append("max_d_change")
+
+ ### Shift back the slds for nonzero ambient
+ if ambient_sld:
+ self._restore_slds_after_ambient_shift(prediction_dict, sld_indices, ambient_sld)
+
+ return prediction_dict
+
+
+ def predict(self,
+ reflectivity_curve: Union[np.ndarray, Tensor],
+ q_values: Union[np.ndarray, Tensor] = None,
+ prior_bounds: Union[np.ndarray, List[Tuple]] = None,
+ sigmas: Union[np.ndarray, Tensor] = None,
+ key_padding_mask: Union[np.ndarray, Tensor] = None,
+ q_resolution: Union[float, np.ndarray] = None,
+ ambient_sld: float = None,
+ clip_prediction: bool = True,
+ polish_prediction: bool = False,
+ polishing_method: str = 'trf',
+ polishing_kwargs_reflectivity: dict = None,
+ polishing_max_steps: int = None,
+ fit_growth: bool = False,
+ max_d_change: float = 5.,
+ use_q_shift: bool = False,
+ calc_pred_curve: bool = True,
+ calc_pred_sld_profile: bool = False,
+ calc_polished_sld_profile: bool = False,
+ sld_profile_padding_left: float = 0.2,
+ sld_profile_padding_right: float = 1.1,
+ supress_sld_amb_back_shift: bool = False,
+ kwargs_param_labels: dict = {},
+ ):
+ """Predict the thin film parameters
+
+ Args:
+ reflectivity_curve (Union[np.ndarray, Tensor]): The reflectivity curve (already preprocessed, normalized and interpolated).
+ q_values (Union[np.ndarray, Tensor], optional): The momentum transfer (q) values for the reflectivity curve (in units of inverse angstroms).
+ prior_bounds (Union[np.ndarray, List[Tuple]]): The prior bounds for the predicted parameters.
+ sigmas (Union[np.ndarray, Tensor], optional): The error bars of the reflectivity curve, if available; they are used to weigh the residuals during the polishing step.
+ key_padding_mask (Union[np.ndarray, Tensor], optional): The key padding mask required for some embedding networks.
+ q_resolution (Union[float, np.ndarray], optional): The q resolution for neutron reflectometry models. Can be either a float dq/q for linear resolution smearing (e.g. 0.05 meaning 5% resolution smearing) or an array of dq values for pointwise resolution smearing.
+ ambient_sld (float, optional): The SLD of the fronting (i.e. ambient) medium, for structures whose fronting medium is not air.
+ clip_prediction (bool, optional): If ``True``, the values of the predicted parameters are clipped so they do not fall outside the interval set by the prior bounds. Defaults to True.
+ polish_prediction (bool, optional): If ``True``, the neural network predictions are further polished using a least-squares fit. Defaults to False.
+ polishing_method (str): {'trf', 'dogbox', 'lm'} SciPy least-squares method used for polishing.
+ polishing_kwargs_reflectivity (dict, optional): Extra keyword arguments forwarded to the reflectivity computation during polishing.
+ polishing_max_steps (int, optional): Maximum number of function evaluations for the SciPy optimizer.
+ fit_growth (bool, optional): (Deprecated) If ``True``, an additional parameter is introduced during the polishing to account for the change in the thickness of the upper layer during the in-situ measurement of the reflectivity curve (a linear growth is assumed). Defaults to False.
+ max_d_change (float): The maximum possible change in the thickness of the upper layer during the in-situ measurement, relevant when polish_prediction and fit_growth are True. Defaults to 5.
+ use_q_shift (bool, optional): (Deprecated) If ``True``, the prediction is performed for a batch of slightly shifted versions of the input curve and the best result is returned, which is meant to mitigate the influence of imperfect sample alignment, as introduced in Greco et al. (only for models with fixed q-discretization). Defaults to False.
+ calc_pred_curve (bool, optional): Whether to calculate the curve corresponding to the predicted parameters. Defaults to True.
+ calc_pred_sld_profile (bool, optional): Whether to calculate the SLD profile corresponding to the predicted parameters. Defaults to False.
+ calc_polished_sld_profile (bool, optional): Whether to calculate the SLD profile corresponding to the polished parameters. Defaults to False.
+ sld_profile_padding_left (float, optional): Controls the amount of padding applied to the left side of the computed SLD profiles.
+ sld_profile_padding_right (float, optional): Controls the amount of padding applied to the right side of the computed SLD profiles.
+ supress_sld_amb_back_shift (bool, optional): If ``True``, the predicted SLDs are not shifted back by the ambient SLD (used internally by ``preprocess_and_predict``). Defaults to False.
+ kwargs_param_labels (dict, optional): Keyword arguments forwarded to ``get_param_labels``.
+
+ Returns:
+ dict: dictionary containing the predictions
+ """
+
+ scaled_curve = self._scale_curve(reflectivity_curve)
+ if prior_bounds is None:
+ raise ValueError('Prior bounds were not provided')
+ prior_bounds = np.array(prior_bounds)
+
+ if ambient_sld:
+ sld_indices = self._shift_slds_by_ambient(prior_bounds, ambient_sld)
+
+ scaled_prior_bounds = self._scale_prior_bounds(prior_bounds)
+
+ if isinstance(self.trainer.loader.q_generator, ConstantQ):
+ q_values = self.trainer.loader.q_generator.q
+ else:
+ if q_values is None:
+ raise ValueError('The q values were not provided')
+ q_values = torch.atleast_2d(to_t(q_values)).to(scaled_curve)
+
+ scaled_q_values = self.trainer.loader.q_generator.scale_q(q_values).to(torch.float32) if self.trainer.train_with_q_input else None
+
+ if q_resolution is None and self.trainer.loader.smearing is not None:
+ raise ValueError('The q resolution must be provided for NR models')
+
+ if q_resolution is not None:
+ q_resolution_tensor = torch.atleast_2d(torch.as_tensor(q_resolution)).to(scaled_curve)
+ if isinstance(q_resolution, float):
+ unscaled_q_resolutions = q_resolution_tensor
+ else:
+ unscaled_q_resolutions = (q_resolution_tensor / q_values).nanmean(dim=-1, keepdim=True)  ## when q_values is padded with 0s, there will be nan at the padded positions
+ scaled_q_resolutions = self.trainer.loader.smearing.scale_resolutions(unscaled_q_resolutions) if self.trainer.condition_on_q_resolutions else None
+ scaled_conditioning_params = scaled_q_resolutions
+ if polishing_kwargs_reflectivity is None:
+ polishing_kwargs_reflectivity = {'dq': q_resolution}
+ else:
+ q_resolution_tensor = None
+ scaled_conditioning_params = None
+
+ if key_padding_mask is not None:
+ key_padding_mask = torch.as_tensor(key_padding_mask, device=self.device)
+ key_padding_mask = key_padding_mask.unsqueeze(0) if key_padding_mask.dim() == 1 else key_padding_mask
+
+ if use_q_shift and not self.trainer.train_with_q_input:
+ predicted_params = self._qshift_prediction(reflectivity_curve, scaled_prior_bounds, num=1024, dq_coef=1.)
+ else:
+ with torch.no_grad():
+ self.trainer.model.eval()
+
+ scaled_predicted_params = self.trainer.model(
+ curves=scaled_curve,
+ bounds=scaled_prior_bounds,
+ q_values=scaled_q_values,
+ conditioning_params=scaled_conditioning_params,
+ key_padding_mask=key_padding_mask,
+ unscaled_q_values=q_values,
+ )
+
+ predicted_params = self.trainer.loader.prior_sampler.restore_params(torch.cat([scaled_predicted_params, scaled_prior_bounds], dim=-1))
+
+ if clip_prediction:
+ predicted_params = self.trainer.loader.prior_sampler.clamp_params(predicted_params)
+
+ prediction_dict = {
+ "predicted_params_object": predicted_params,
+ "predicted_params_array": predicted_params.parameters.squeeze().cpu().numpy(),
+ "param_names": self.trainer.loader.prior_sampler.param_model.get_param_labels(**kwargs_param_labels)
+ }
+
+ key_padding_mask = None if key_padding_mask is None else key_padding_mask.squeeze().cpu().numpy()
+
+ if calc_pred_curve:
+ predicted_curve = predicted_params.reflectivity(q=q_values, dq=q_resolution_tensor).squeeze().cpu().numpy()
+ prediction_dict["predicted_curve"] = predicted_curve if key_padding_mask is None else predicted_curve[key_padding_mask]
+
+ ambient_sld_tensor = torch.atleast_2d(torch.as_tensor(ambient_sld, device=self.device)) if ambient_sld is not None else None
+ if calc_pred_sld_profile:
+ predicted_sld_xaxis, predicted_sld_profile, _ = get_density_profiles(
+ predicted_params.thicknesses, predicted_params.roughnesses, predicted_params.slds + (ambient_sld_tensor or 0), ambient_sld_tensor,
+ num=1024, padding_left=sld_profile_padding_left, padding_right=sld_profile_padding_right,
+ )
+ prediction_dict['predicted_sld_profile'] = predicted_sld_profile.squeeze().cpu().numpy()
+ prediction_dict['predicted_sld_xaxis'] = predicted_sld_xaxis.squeeze().cpu().numpy()
+ else:
+ predicted_sld_xaxis = None
+
+ refl_curve_polish = reflectivity_curve if key_padding_mask is None else reflectivity_curve[key_padding_mask]
+ q_plot = q_values.squeeze().cpu().numpy()
+ q_polish = q_plot if key_padding_mask is None else q_plot[key_padding_mask]
+ prediction_dict['q_plot_pred'] = q_polish
+
+ if polish_prediction:
+ if ambient_sld_tensor is not None:
+ ambient_sld_tensor = ambient_sld_tensor.cpu()
+
+ polished_dict = self._polish_prediction(
+ q=q_polish,
+ curve=refl_curve_polish,
+ predicted_params=predicted_params,
+ priors=np.array(prior_bounds),
+ error_bars=sigmas,
+ fit_growth=fit_growth,
+ max_d_change=max_d_change,
+ calc_polished_curve=calc_pred_curve,
+ calc_polished_sld_profile=calc_polished_sld_profile,
+ ambient_sld_tensor=ambient_sld_tensor,
+ sld_x_axis=predicted_sld_xaxis,
+ polishing_method=polishing_method,
+ polishing_max_steps=polishing_max_steps,
+ polishing_kwargs_reflectivity=polishing_kwargs_reflectivity,
+ )
+ prediction_dict.update(polished_dict)
+
+ if fit_growth and "polished_params_array" in prediction_dict:
+ prediction_dict["param_names"].append("max_d_change")
+
+ if ambient_sld and not supress_sld_amb_back_shift:  # Note: the SLD shift will only be reflected in predicted_params_array but not in predicted_params_object; supress_sld_amb_back_shift is required for the 'preprocess_and_predict' method
+ self._restore_slds_after_ambient_shift(prediction_dict, sld_indices, ambient_sld)
+
+ return prediction_dict
+
+ def _polish_prediction(self,
+ q: np.ndarray,
+ curve: np.ndarray,
+ predicted_params: BasicParams,
+ priors: np.ndarray,
+ sld_x_axis,
+ ambient_sld_tensor: Tensor = None,
+ fit_growth: bool = False,
+ max_d_change: float = 5.,
+ calc_polished_curve: bool = True,
+ calc_polished_sld_profile: bool = False,
+ error_bars: np.ndarray = None,
+ polishing_method: str = 'trf',
+ polishing_max_steps: int = None,
+ polishing_kwargs_reflectivity: dict = None,
+ ) -> dict:
+ params = predicted_params.parameters.squeeze().cpu().numpy()
+
+ polished_params_dict = {}
+ polishing_kwargs_reflectivity = polishing_kwargs_reflectivity or {}
+ polished_params_err = None  # refl_fit provides errors; the growth fit does not
+
+ try:
+ if fit_growth:
+ polished_params_arr, curve_polished = get_fit_with_growth(
+ q=q,
+ curve=curve,
+ init_params=params,
+ bounds=priors.T,
+ max_d_change=max_d_change,
+ )
+ polished_params = BasicParams(
+ torch.from_numpy(polished_params_arr[:-1][None]),
+ torch.from_numpy(priors.T[0][None]),
+ torch.from_numpy(priors.T[1][None]),
+ self.trainer.loader.prior_sampler.max_num_layers,
+ self.trainer.loader.prior_sampler.param_model
+ )
+ else:
+ polished_params_arr, polished_params_err, curve_polished = refl_fit(
+ q=q,
+ curve=curve,
+ init_params=params,
+ bounds=priors.T,
+ prior_sampler=self.trainer.loader.prior_sampler,
+ error_bars=error_bars,
+ method=polishing_method,
+ polishing_max_steps=polishing_max_steps,
+ reflectivity_kwargs=polishing_kwargs_reflectivity,
+ )
+ polished_params = BasicParams(
+ torch.from_numpy(polished_params_arr[None]),
+ torch.from_numpy(priors.T[0][None]),
+ torch.from_numpy(priors.T[1][None]),
+ self.trainer.loader.prior_sampler.max_num_layers,
+ self.trainer.loader.prior_sampler.param_model
+ )
+ except Exception:  # fall back to the unpolished prediction if the fit fails
+ polished_params = predicted_params
+ polished_params_arr = get_prediction_array(polished_params)
+ curve_polished = np.zeros_like(q)
+ polished_params_err = None
+
+ polished_params_dict['polished_params_array'] = polished_params_arr
+
+ polished_params_dict['polished_params_error_array'] = (
+ np.array(polished_params_err)
+ if polished_params_err is not None
+ else np.full_like(polished_params_arr, np.nan, dtype=np.float64)
+ )
+ if calc_polished_curve:
+ polished_params_dict['polished_curve'] = curve_polished
+
+ if ambient_sld_tensor is not None:
+ ambient_sld_tensor = ambient_sld_tensor.to(polished_params.slds.device)
+
+ if calc_polished_sld_profile:
+ _, sld_profile_polished, _ = get_density_profiles(
+ polished_params.thicknesses, polished_params.roughnesses, polished_params.slds + (ambient_sld_tensor or 0), ambient_sld_tensor,
+ z_axis=sld_x_axis.to(polished_params.slds.device),
+ )
+ polished_params_dict['sld_profile_polished'] = sld_profile_polished.squeeze().cpu().numpy()
+
+ return polished_params_dict
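+ # Conceptually, the polishing performed by `refl_fit` resembles this simplified
+ # sketch (editor's illustration; `simulate_reflectivity` is a hypothetical
+ # stand-in for the package's reflectivity simulator):
+ #
+ #     from scipy.optimize import least_squares
+ #     weights = error_bars if error_bars is not None else 1.0
+ #     res = least_squares(
+ #         lambda p: (simulate_reflectivity(q, p) - curve) / weights,
+ #         x0=params,
+ #         bounds=(priors.T[0], priors.T[1]),  # bounds apply to 'trf'/'dogbox'
+ #         method='trf',
+ #     )
+ #     polished = res.x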
+
+ def _scale_curve(self, curve: Union[np.ndarray, Tensor]):
+ if not isinstance(curve, Tensor):
+ curve = torch.from_numpy(curve).float()
+ curve = curve.unsqueeze(0).to(self.device)
+ scaled_curve = self.trainer.loader.curves_scaler.scale(curve)
+ return scaled_curve
+
+ def _scale_prior_bounds(self, prior_bounds: List[Tuple]):
+ try:
+ prior_bounds = torch.tensor(prior_bounds)
+ prior_bounds = prior_bounds.to(self.device).T
+ min_bounds, max_bounds = prior_bounds[:, None]
+
+ scaled_bounds = torch.cat([
+ self.trainer.loader.prior_sampler.scale_bounds(min_bounds),
+ self.trainer.loader.prior_sampler.scale_bounds(max_bounds)
+ ], -1)
+
+ return scaled_bounds.float()
+
+ except RuntimeError as e:
+ expected_param_dim = self.trainer.loader.prior_sampler.param_dim
+ actual_param_dim = prior_bounds.shape[1] if prior_bounds.ndim == 2 else len(prior_bounds)
+
+ msg = (
+ f"\n **Parameter dimension mismatch during inference!**\n"
+ f"- Model expects **{expected_param_dim}** parameters.\n"
+ f"- You provided **{actual_param_dim}** prior bounds.\n\n"
+ f"💡This often occurs when:\n"
+ f"- The model was trained with additional nuisance parameters like `r_scale`, `q_shift`, or `log10_background`,\n"
+ f"  but they were not included in the `prior_bounds` passed to `.predict()`.\n"
+ f"- The number of layers or parameterization type differs from the one used during training.\n\n"
+ f" Check the configuration or the summary of expected parameters."
+ )
+ raise ValueError(msg) from e
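+ # Example of the mismatch described above (editor's illustration with assumed
+ # numbers): a model whose param_dim is 4 because it was trained with an extra
+ # `log10_background` nuisance parameter needs four (min, max) pairs, not three:
+ #
+ #     model.predict(curve, q, prior_bounds=[(0., 300.), (0., 20.), (0., 30.)])                # raises ValueError
+ #     model.predict(curve, q, prior_bounds=[(0., 300.), (0., 20.), (0., 30.), (-10., -4.)])   # matches param_dim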
+
+ def _shift_slds_by_ambient(self, prior_bounds: np.ndarray, ambient_sld: float):
+ n_layers = self.trainer.loader.prior_sampler.max_num_layers
+ sld_indices = slice(2*n_layers+1, 3*n_layers+2)
+ prior_bounds[sld_indices, ...] -= ambient_sld
+
+ training_min_bounds = self.trainer.loader.prior_sampler.min_bounds.squeeze().cpu().numpy()
+ training_max_bounds = self.trainer.loader.prior_sampler.max_bounds.squeeze().cpu().numpy()
+ lower_bound_check = (prior_bounds[sld_indices, 0] >= training_min_bounds[sld_indices]).all()
+ upper_bound_check = (prior_bounds[sld_indices, 1] <= training_max_bounds[sld_indices]).all()
+ assert lower_bound_check and upper_bound_check, "Shifting the layer SLDs by the ambient SLD exceeded the training ranges."
+
+ return sld_indices
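+ # The slice above assumes the standard parameter layout (editor's sketch, for
+ # n = max_num_layers): n thicknesses, n+1 roughnesses, n+1 SLDs, so the SLDs
+ # occupy indices 2n+1 .. 3n+1, i.e. slice(2*n+1, 3*n+2). For n = 2:
+ #     params      = [d1, d2, r1, r2, r_sub, sld1, sld2, sld_sub]
+ #     sld_indices = slice(5, 8)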
+
+ def _restore_slds_after_ambient_shift(self, prediction_dict, sld_indices, ambient_sld):
+ prediction_dict["predicted_params_array"][sld_indices] += ambient_sld
+ if "polished_params_array" in prediction_dict:
+ prediction_dict["polished_params_array"][sld_indices] += ambient_sld
+
+ def _get_likelihood(self, q, curve, rel_err: float = 0.1, abs_err: float = 1e-12):
+ return LogLikelihood(
+ q, curve, self.trainer.loader.prior_sampler, curve * rel_err + abs_err
+ )
+
+ def get_param_labels(self, **kwargs):
+ return self.trainer.loader.prior_sampler.param_model.get_param_labels(**kwargs)
+
+ @staticmethod
+ def _preprocess_input_data(
+ reflectivity_curve,
+ q_values,
+ sigmas=None,
+ q_resolution=None,
+ truncate_index_left=None,
+ truncate_index_right=None,
+ enable_error_bars_filtering=True,
+ filter_threshold=0.3,
+ filter_remove_singles=True,
+ filter_remove_consecutives=True,
+ filter_consecutive=3,
+ filter_q_start_trunc=0.1):
+
+ # Save originals for polishing
+ reflectivity_curve_original = reflectivity_curve.copy()
+ q_values_original = q_values.copy() if q_values is not None else None
+ q_resolution_original = q_resolution.copy() if isinstance(q_resolution, np.ndarray) else q_resolution
+ sigmas_original = sigmas.copy() if sigmas is not None else None
+
+ # Remove points with non-positive intensities
+ positive_mask = reflectivity_curve > 0.0
+ reflectivity_curve = reflectivity_curve[positive_mask]
+ q_values = q_values[positive_mask]
+ if sigmas is not None:
+ sigmas = sigmas[positive_mask]
+ if isinstance(q_resolution, np.ndarray):
+ q_resolution = q_resolution[positive_mask]
+
+ # Truncate arrays
+ if truncate_index_left is not None or truncate_index_right is not None:
+ slice_obj = slice(truncate_index_left, truncate_index_right)
+ reflectivity_curve = reflectivity_curve[slice_obj]
+ q_values = q_values[slice_obj]
+ if sigmas is not None:
+ sigmas = sigmas[slice_obj]
+ if isinstance(q_resolution, np.ndarray):
+ q_resolution = q_resolution[slice_obj]
+
+ # Filter high-error points
+ if enable_error_bars_filtering and sigmas is not None:
+ valid_mask = get_filtering_mask(
+ q_values,
+ reflectivity_curve,
+ sigmas,
+ threshold=filter_threshold,
+ consecutive=filter_consecutive,
+ remove_singles=filter_remove_singles,
+ remove_consecutives=filter_remove_consecutives,
+ q_start_trunc=filter_q_start_trunc
+ )
+ reflectivity_curve = reflectivity_curve[valid_mask]
+ q_values = q_values[valid_mask]
+ sigmas = sigmas[valid_mask]
+ if isinstance(q_resolution, np.ndarray):
+ q_resolution = q_resolution[valid_mask]
+
+ return (q_values, reflectivity_curve, sigmas, q_resolution,
+ q_values_original, reflectivity_curve_original,
+ sigmas_original, q_resolution_original)
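+ # Sketch of the relative-error criterion behind `get_filtering_mask`
+ # (editor's illustration of the dR/R threshold documented above):
+ #     too_noisy = sigmas / reflectivity_curve > filter_threshold   # e.g. dR/R > 0.3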
+
+ def interpolate_data_to_model_q(
+ self,
+ q_exp,
+ refl_exp,
+ sigmas_exp=None,
+ q_res_exp=None,
+ as_dict=False
+ ):
+ q_generator = self.trainer.loader.q_generator
+
+ def _pad(arr, pad_to, value=0.0):
+ if arr is None:
+ return None
+ return np.pad(arr, (0, pad_to - len(arr)), constant_values=value)
+
+ def _interp_or_keep(q_model, q_exp, arr):
+ """Interpolate arrays, keep floats or None unchanged."""
+ if arr is None:
+ return None
+ return np.interp(q_model, q_exp, arr) if isinstance(arr, np.ndarray) else arr
+
+ def _pad_or_keep(arr, max_n):
+ """Pad arrays, keep floats or None unchanged."""
+ if arr is None:
+ return None
+ return _pad(arr, max_n, 0.0) if isinstance(arr, np.ndarray) else arr
+
+ def _prepare_return(q, refl, sigmas=None, q_res=None, mask=None, as_dict=False):
+ if as_dict:
+ result = {"q_model": q, "reflectivity": refl}
+ if sigmas is not None: result["sigmas"] = sigmas
+ if q_res is not None: result["q_resolution"] = q_res
+ if mask is not None: result["key_padding_mask"] = mask
+ return result
+ result = [q, refl]
+ if sigmas is not None: result.append(sigmas)
+ if q_res is not None: result.append(q_res)
+ if mask is not None: result.append(mask)
+ return tuple(result)
+
+ # ConstantQ
+ if isinstance(q_generator, ConstantQ):
+ q_model = q_generator.q.cpu().numpy()
+ refl_out = interp_reflectivity(q_model, q_exp, refl_exp)
+ sigmas_out = _interp_or_keep(q_model, q_exp, sigmas_exp)
+ q_res_out = _interp_or_keep(q_model, q_exp, q_res_exp)
+ return _prepare_return(q_model, refl_out, sigmas_out, q_res_out, None, as_dict)
+
+ # VariableQ
+ elif isinstance(q_generator, VariableQ):
+ if q_generator.n_q_range[0] == q_generator.n_q_range[1]:
+ n_q_model = q_generator.n_q_range[0]
+ q_min = max(q_exp.min(), q_generator.q_min_range[0])
+ q_max = min(q_exp.max(), q_generator.q_max_range[1])
+ if q_generator.mode == 'logspace':
+ q_model = torch.logspace(start=torch.log10(torch.tensor(q_min, device=self.device)),
+ end=torch.log10(torch.tensor(q_max, device=self.device)),
+ steps=n_q_model, device=self.device).to('cpu')
+ logspace = True
+ else:
+ q_model = np.linspace(q_min, q_max, n_q_model)
+ logspace = False
+ else:
+ return _prepare_return(q_exp, refl_exp, sigmas_exp, q_res_exp, None, as_dict)
+
+ refl_out = interp_reflectivity(q_model, q_exp, refl_exp, logspace=logspace)
+ sigmas_out = _interp_or_keep(q_model, q_exp, sigmas_exp)
+ q_res_out = _interp_or_keep(q_model, q_exp, q_res_exp)
+ return _prepare_return(q_model, refl_out, sigmas_out, q_res_out, None, as_dict)
+
+ # MaskedVariableQ
+ elif isinstance(q_generator, MaskedVariableQ):
+ min_n, max_n = q_generator.n_q_range
+ n_exp = len(q_exp)
+
+ if min_n <= n_exp <= max_n:
+ # Pad only
+ q_model = _pad(q_exp, max_n, 0.0)
+ refl_out = _pad(refl_exp, max_n, 0.0)
+ sigmas_out = _pad_or_keep(sigmas_exp, max_n)
+ q_res_out = _pad_or_keep(q_res_exp, max_n)
+ key_padding_mask = np.zeros(max_n, dtype=bool)
+ key_padding_mask[:n_exp] = True
+
+ else:
+ # Interpolate + pad
+ n_interp = min(max(n_exp, min_n), max_n)
+ q_min = max(q_exp.min(), q_generator.q_min_range[0])
+ q_max = min(q_exp.max(), q_generator.q_max_range[1])
+ q_interp = np.linspace(q_min, q_max, n_interp)
+
+ refl_interp = interp_reflectivity(q_interp, q_exp, refl_exp)
+ sigmas_interp = _interp_or_keep(q_interp, q_exp, sigmas_exp)
+ q_res_interp = _interp_or_keep(q_interp, q_exp, q_res_exp)
+
+ q_model = _pad(q_interp, max_n, 0.0)
+ refl_out = _pad(refl_interp, max_n, 0.0)
+ sigmas_out = _pad_or_keep(sigmas_interp, max_n)
+ q_res_out = _pad_or_keep(q_res_interp, max_n)
+ key_padding_mask = np.zeros(max_n, dtype=bool)
+ key_padding_mask[:n_interp] = True
+
+ return _prepare_return(q_model, refl_out, sigmas_out, q_res_out, key_padding_mask, as_dict)
+
+ else:
+ raise TypeError(f"Unsupported QGenerator type: {type(q_generator)}")
+
+ def _qshift_prediction(self, curve, scaled_bounds, num: int = 1000, dq_coef: float = 1.) -> BasicParams:
+ assert isinstance(self.trainer.loader.q_generator, ConstantQ), "Prediction with q shifts available only for models with fixed discretization"
+ q = self.trainer.loader.q_generator.q.squeeze().float()
+ dq_max = (q[1] - q[0]) * dq_coef
+ q_shifts = torch.linspace(-dq_max, dq_max, num).to(q)
+
+ curve = to_t(curve).to(scaled_bounds)
+ shifted_curves = _qshift_interp(q.squeeze(), curve, q_shifts)
+
+ assert shifted_curves.shape == (num, q.shape[0])
+
+ scaled_curves = self.trainer.loader.curves_scaler.scale(shifted_curves)
+ scaled_prior_bounds = torch.atleast_2d(scaled_bounds).expand(scaled_curves.shape[0], -1)
+
+ with torch.no_grad():
+ self.trainer.model.eval()
+ scaled_predicted_params = self.trainer.model(scaled_curves, scaled_prior_bounds)
+ restored_params = self.trainer.loader.prior_sampler.restore_params(torch.cat([scaled_predicted_params, scaled_prior_bounds], dim=-1))
+
+ best_param = get_best_mse_param(
+ restored_params,
+ self._get_likelihood(q=self.trainer.loader.q_generator.q, curve=curve),
+ )
+ return best_param
+
+
+
+ EasyInferenceModel = InferenceModel
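+ # Backward-compatible alias (assumed intent): the previous class name remains importable.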
+
+ def get_prediction_array(params: BasicParams) -> np.ndarray:
+ predict_arr = torch.cat([
+ params.thicknesses.squeeze(),
+ params.roughnesses.squeeze(),
+ params.slds.squeeze(),
+ ]).cpu().numpy()
+
+ return predict_arr
+
+
+ def _qshift_interp(q, r, q_shifts):
+ qs = q[None] + q_shifts[:, None]
+ eps = torch.finfo(r.dtype).eps
+ ind = torch.searchsorted(q[None].expand_as(qs).contiguous(), qs.contiguous())
+ ind = torch.clamp(ind - 1, 0, q.shape[0] - 2)
+ slopes = (r[1:] - r[:-1]) / (eps + (q[1:] - q[:-1]))
  return r[ind] + slopes[ind] * (qs - q[ind])
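+ # Tiny worked example of the linear shift-interpolation above (editor's sketch):
+ #     q = torch.tensor([0.1, 0.2, 0.3]); r = torch.tensor([1.0, 0.5, 0.25])
+ #     _qshift_interp(q, r, torch.tensor([0.0, 0.05]))
+ #     # row 0 reproduces r exactly; row 1 evaluates r at q + 0.05,
+ #     # e.g. 0.75 at q = 0.15 (halfway between 1.0 and 0.5)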