PyPI - reflectorch - Versions diffs - 1.5.1__py3-none-any.whl - Mend

reflectorch 1.5.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (96) hide show

reflectorch/__init__.py +17 -0
reflectorch/data_generation/__init__.py +128 -0
reflectorch/data_generation/dataset.py +216 -0
reflectorch/data_generation/likelihoods.py +80 -0
reflectorch/data_generation/noise.py +471 -0
reflectorch/data_generation/priors/__init__.py +60 -0
reflectorch/data_generation/priors/base.py +55 -0
reflectorch/data_generation/priors/exp_subprior_sampler.py +298 -0
reflectorch/data_generation/priors/independent_priors.py +195 -0
reflectorch/data_generation/priors/multilayer_models.py +311 -0
reflectorch/data_generation/priors/multilayer_structures.py +104 -0
reflectorch/data_generation/priors/no_constraints.py +206 -0
reflectorch/data_generation/priors/parametric_models.py +842 -0
reflectorch/data_generation/priors/parametric_subpriors.py +369 -0
reflectorch/data_generation/priors/params.py +252 -0
reflectorch/data_generation/priors/sampler_strategies.py +370 -0
reflectorch/data_generation/priors/scaler_mixin.py +65 -0
reflectorch/data_generation/priors/subprior_sampler.py +371 -0
reflectorch/data_generation/priors/utils.py +118 -0
reflectorch/data_generation/process_data.py +41 -0
reflectorch/data_generation/q_generator.py +280 -0
reflectorch/data_generation/reflectivity/__init__.py +102 -0
reflectorch/data_generation/reflectivity/abeles.py +97 -0
reflectorch/data_generation/reflectivity/kinematical.py +71 -0
reflectorch/data_generation/reflectivity/memory_eff.py +105 -0
reflectorch/data_generation/reflectivity/numpy_implementations.py +120 -0
reflectorch/data_generation/reflectivity/smearing.py +138 -0
reflectorch/data_generation/reflectivity/smearing_pointwise.py +110 -0
reflectorch/data_generation/scale_curves.py +112 -0
reflectorch/data_generation/smearing.py +99 -0
reflectorch/data_generation/utils.py +223 -0
reflectorch/extensions/__init__.py +0 -0
reflectorch/extensions/jupyter/__init__.py +11 -0
reflectorch/extensions/jupyter/api.py +85 -0
reflectorch/extensions/jupyter/callbacks.py +34 -0
reflectorch/extensions/jupyter/components.py +758 -0
reflectorch/extensions/jupyter/custom_select.py +268 -0
reflectorch/extensions/jupyter/log_widget.py +241 -0
reflectorch/extensions/jupyter/model_selection.py +495 -0
reflectorch/extensions/jupyter/plotly_plot_manager.py +329 -0
reflectorch/extensions/jupyter/widget.py +625 -0
reflectorch/extensions/matplotlib/__init__.py +5 -0
reflectorch/extensions/matplotlib/losses.py +32 -0
reflectorch/extensions/refnx/refnx_conversion.py +77 -0
reflectorch/inference/__init__.py +28 -0
reflectorch/inference/inference_model.py +848 -0
reflectorch/inference/input_interface.py +239 -0
reflectorch/inference/loading_data.py +55 -0
reflectorch/inference/multilayer_fitter.py +171 -0
reflectorch/inference/multilayer_inference_model.py +193 -0
reflectorch/inference/plotting.py +524 -0
reflectorch/inference/preprocess_exp/__init__.py +7 -0
reflectorch/inference/preprocess_exp/attenuation.py +36 -0
reflectorch/inference/preprocess_exp/cut_with_q_ratio.py +31 -0
reflectorch/inference/preprocess_exp/footprint.py +81 -0
reflectorch/inference/preprocess_exp/interpolation.py +19 -0
reflectorch/inference/preprocess_exp/normalize.py +21 -0
reflectorch/inference/preprocess_exp/preprocess.py +121 -0
reflectorch/inference/query_matcher.py +82 -0
reflectorch/inference/record_time.py +43 -0
reflectorch/inference/sampler_solution.py +56 -0
reflectorch/inference/scipy_fitter.py +364 -0
reflectorch/inference/torch_fitter.py +87 -0
reflectorch/ml/__init__.py +32 -0
reflectorch/ml/basic_trainer.py +292 -0
reflectorch/ml/callbacks.py +81 -0
reflectorch/ml/dataloaders.py +27 -0
reflectorch/ml/loggers.py +56 -0
reflectorch/ml/schedulers.py +356 -0
reflectorch/ml/trainers.py +201 -0
reflectorch/ml/utils.py +2 -0
reflectorch/models/__init__.py +16 -0
reflectorch/models/activations.py +50 -0
reflectorch/models/encoders/__init__.py +19 -0
reflectorch/models/encoders/conv_encoder.py +219 -0
reflectorch/models/encoders/conv_res_net.py +115 -0
reflectorch/models/encoders/fno.py +134 -0
reflectorch/models/encoders/integral_kernel_embedding.py +390 -0
reflectorch/models/networks/__init__.py +14 -0
reflectorch/models/networks/mlp_networks.py +434 -0
reflectorch/models/networks/residual_net.py +157 -0
reflectorch/paths.py +29 -0
reflectorch/runs/__init__.py +31 -0
reflectorch/runs/config.py +25 -0
reflectorch/runs/slurm_utils.py +93 -0
reflectorch/runs/train.py +78 -0
reflectorch/runs/utils.py +405 -0
reflectorch/test_config.py +4 -0
reflectorch/train.py +4 -0
reflectorch/train_on_cluster.py +4 -0
reflectorch/utils.py +98 -0
reflectorch-1.5.1.dist-info/METADATA +151 -0
reflectorch-1.5.1.dist-info/RECORD +96 -0
reflectorch-1.5.1.dist-info/WHEEL +5 -0
reflectorch-1.5.1.dist-info/licenses/LICENSE.txt +21 -0
reflectorch-1.5.1.dist-info/top_level.txt +1 -0

reflectorch/ml/basic_trainer.py ADDED Viewed

@@ -0,0 +1,292 @@
+from typing import Optional, Tuple, Iterable, Any, Union, Type
+from collections import defaultdict
+from tqdm import tqdm as standard_tqdm
+from tqdm.notebook import tqdm as notebook_tqdm
+import numpy as np
+import torch
+from torch.nn import Module
+from reflectorch.ml.loggers import Logger, Loggers
+from .utils import is_divisor
+__all__ = [
+    'Trainer',
+    'TrainerCallback',
+    'DataLoader',
+    'PeriodicTrainerCallback',
+]
+class Trainer(object):
+    """Base trainer which runs the optimization loop for a model.
+    Subclasses must implement ``get_batch_by_idx`` and ``get_loss_dict``; ``init`` can be overridden
+    to perform additional set-up at the end of construction.
+    Args:
+        model (nn.Module): neural network
+        loader (DataLoader): data loader; it is also appended to the callbacks used by ``train``
+        lr (float): learning rate
+        batch_size (int): batch size
+        clip_grad_norm_max (int, optional): maximum norm for gradient clipping if it is not ``None``. Defaults to None.
+        logger (Union[Logger, Tuple[Logger, ...], Loggers], optional): logger. Defaults to None.
+        optim_cls (Type[torch.optim.Optimizer], optional): Pytorch optimizer. Defaults to torch.optim.Adam.
+        optim_kwargs (dict, optional): optimizer arguments. Defaults to None.
+        **kwargs: additional keyword arguments; each one is stored as an attribute of the trainer
+    """
+    # key under which the accumulated loss of every iteration is stored in ``self.losses``
+    TOTAL_LOSS_KEY: str = 'total_loss'
+    def __init__(self,
+                 model: Module,
+                 loader: 'DataLoader',
+                 lr: float,
+                 batch_size: int,
+                 clip_grad_norm_max: Optional[int] = None,
+                 logger: Optional[Union[Logger, Tuple[Logger, ...], Loggers]] = None,
+                 optim_cls: Type[torch.optim.Optimizer] = torch.optim.Adam,
+                 optim_kwargs: Optional[dict] = None,
+                 **kwargs
+                 ):
+        self.model = model
+        self.loader = loader
+        self.batch_size = batch_size
+        self.clip_grad_norm_max = clip_grad_norm_max
+        self.optim = self.configure_optimizer(optim_cls, lr=lr, **(optim_kwargs or {}))
+        # history of the learning rate and of every loss term, one entry per iteration
+        self.lrs = []
+        self.losses = defaultdict(list)
+        self.logger = _init_logger(logger)
+        # free-form storage shared between callbacks
+        self.callback_params = {}
+        for k, v in kwargs.items():
+            setattr(self, k, v)
+        self.init()
+    def init(self):
+        """hook called at the end of ``__init__``; does nothing by default"""
+        pass
+    def log(self, name: str, data):
+        """log data"""
+        self.logger.log(name, data)
+    def train(self,
+                    num_batches: int,
+                    callbacks: Union[Tuple['TrainerCallback', ...], 'TrainerCallback'] = (),
+                    disable_tqdm: bool = False,
+                    use_notebook_tqdm: bool = False,
+                    update_tqdm_freq: int = 1,
+                    grad_accumulation_steps: int = 1,
+                    ):
+        """starts the training process
+        Args:
+            num_batches (int): total number of training iterations
+            callbacks (Union[Tuple['TrainerCallback'], 'TrainerCallback']): the trainer callbacks. Defaults to ().
+            disable_tqdm (bool, optional): if ``True``, the progress bar is disabled. Defaults to False.
+            use_notebook_tqdm (bool, optional): should be set to ``True`` when used in a Jupyter Notebook. Defaults to False.
+            update_tqdm_freq (int, optional): frequency for updating the progress bar. Defaults to 1.
+            grad_accumulation_steps (int, optional): number of gradient accumulation steps. Defaults to 1.
+        Raises:
+            ValueError: if the loss of an accumulation step is not finite
+        """
+        if isinstance(callbacks, TrainerCallback):
+            callbacks = (callbacks,)
+        # the data loader is itself a callback and is always notified last
+        callbacks = _StackedTrainerCallbacks(list(callbacks) + [self.loader])
+        tqdm_class = notebook_tqdm if use_notebook_tqdm else standard_tqdm
+        pbar = tqdm_class(range(num_batches), disable=disable_tqdm)
+        callbacks.start_training(self)
+        for batch_num in pbar:
+            self.model.train()
+            self.optim.zero_grad()
+            total_loss, avr_loss_dict = 0, defaultdict(list)
+            for _ in range(grad_accumulation_steps):
+                # the same iteration index is passed for every accumulation step
+                batch_data = self.get_batch_by_idx(batch_num)
+                loss_dict = self.get_loss_dict(batch_data)
+                loss = loss_dict['loss'] / grad_accumulation_steps
+                # read the scalar only once and reuse it for the check and the accumulation
+                loss_value = loss.item()
+                if not np.isfinite(loss_value):
+                    raise ValueError('Loss is not finite!')
+                total_loss += loss_value
+                _update_loss_dict(avr_loss_dict, loss_dict)
+                loss.backward()
+            if self.clip_grad_norm_max is not None:
+                torch.nn.utils.clip_grad_norm_(self.model.parameters(), max_norm=self.clip_grad_norm_max)
+            self.optim.step()
+            # average every loss term over the accumulation steps of this iteration
+            avr_loss_dict = {k: np.mean(v) for k, v in avr_loss_dict.items()}
+            self._update_losses(avr_loss_dict, total_loss)
+            if not disable_tqdm:
+                self._update_tqdm(pbar, batch_num, update_tqdm_freq)
+            # a truthy value returned by any callback stops the training loop
+            break_epoch = callbacks.end_batch(self, batch_num)
+            if break_epoch:
+                break
+        callbacks.end_training(self)
+    def _update_tqdm(self, pbar, batch_num: int, update_tqdm_freq: int):
+        """refresh the progress bar with the recent losses and the current learning rate"""
+        if is_divisor(batch_num, update_tqdm_freq):
+            # the description shows the mean of the (up to) 10 most recent total losses
+            last_loss = np.mean(self.losses[self.TOTAL_LOSS_KEY][-10:])
+            pbar.set_description(f'Loss = {last_loss:.2e}')
+            postfix = {}
+            for key in self.losses.keys():
+                if key != self.TOTAL_LOSS_KEY:
+                    last_value = self.losses[key][-1]
+                    postfix[key] = f'{last_value:.4f}'
+            postfix['lr'] = f'{self.lr():.2e}'
+            pbar.set_postfix(postfix)
+    def get_batch_by_idx(self, batch_num: int) -> Any:
+        """return the batch data for the given iteration; must be implemented by subclasses"""
+        raise NotImplementedError
+    def get_loss_dict(self, batch_data) -> dict:
+        """return the dictionary of losses for a batch; ``train`` reads the ``'loss'`` entry
+        for backpropagation. Must be implemented by subclasses"""
+        raise NotImplementedError
+    def _update_losses(self, loss_dict: dict, loss: float) -> None:
+        """append the losses of the finished iteration and the current learning rate to the histories"""
+        _update_loss_dict(self.losses, loss_dict)
+        self.losses[self.TOTAL_LOSS_KEY].append(loss)
+        self.lrs.append(self.lr())
+    def configure_optimizer(self, optim_cls, lr: float, **kwargs) -> torch.optim.Optimizer:
+        """configure the optimizer based on the optimizer class, the learning rate and the optimizer keyword arguments
+        Args:
+            optim_cls: the class of the optimizer
+            lr (float): the learning rate
+            **kwargs: additional keyword arguments forwarded to the optimizer constructor
+        Returns:
+            torch.optim.Optimizer: the optimizer created for the parameters of ``self.model``
+        """
+        optim = optim_cls(self.model.parameters(), lr,  **kwargs)
+        return optim
+    def lr(self, param_group: int = 0) -> float:
+        """get the learning rate"""
+        return self.optim.param_groups[param_group]['lr']
+    def set_lr(self, lr: float, param_group: int = 0) -> None:
+        """set the learning rate"""
+        self.optim.param_groups[param_group]['lr'] = lr
+class TrainerCallback(object):
+    """Interface for objects which hook into the training loop.
+    Every hook defined here is a no-op; subclasses override the ones they need.
+    """
+    def start_training(self, trainer: Trainer) -> None:
+        """add functionality at the start of training
+        Args:
+            trainer (Trainer): the trainer object
+        """
+        return None
+    def end_training(self, trainer: Trainer) -> None:
+        """add functionality at the end of training
+        Args:
+            trainer (Trainer): the trainer object
+        """
+        return None
+    def end_batch(self, trainer: Trainer, batch_num: int) -> Union[bool, None]:
+        """add functionality at the end of the iteration / batch
+        Args:
+            trainer (Trainer): the trainer object
+            batch_num (int): the index of the current iteration / batch
+        Returns:
+            Union[bool, None]: always ``None`` in this base implementation
+        """
+        return None
+    def __repr__(self):
+        return type(self).__name__ + '()'
+class DataLoader(TrainerCallback):
+    """Base class for data loaders; adds nothing to the ``TrainerCallback`` interface it inherits"""
+class PeriodicTrainerCallback(TrainerCallback):
+    """Base class for trainer callbacks which perform an action periodically after a number of iterations
+    Subclasses implement the action in ``_end_batch``.
+    Args:
+        step (int, optional): Number of iterations after which the action is repeated. Defaults to 1.
+        last_epoch (int, optional): iteration index from which the action is no longer performed
+            (only iterations strictly below it trigger the action); ``-1`` disables this limit. Defaults to -1.
+    """
+    def __init__(self, step: int = 1, last_epoch: int = -1):
+        self.last_epoch = last_epoch
+        self.step = step
+    def end_batch(self, trainer: Trainer, batch_num: int) -> Union[bool, None]:
+        """run ``_end_batch`` if the current iteration is due, otherwise do nothing
+        Args:
+            trainer (Trainer): the trainer object
+            batch_num (int): the index of the current iteration / batch
+        Returns:
+            Union[bool, None]: the result of ``_end_batch`` when the action is performed, else ``None``
+        """
+        # not a scheduled iteration
+        if not is_divisor(batch_num, self.step):
+            return None
+        # the limit is active and has been reached
+        if self.last_epoch != -1 and batch_num >= self.last_epoch:
+            return None
+        return self._end_batch(trainer, batch_num)
+    def _end_batch(self, trainer: Trainer, batch_num: int) -> Union[bool, None]:
+        """the periodic action; a no-op in this base class"""
+        return None
+class _StackedTrainerCallbacks(TrainerCallback):
+    """Callback which forwards every hook to a fixed sequence of callbacks, in order
+    Args:
+        callbacks (Iterable[TrainerCallback]): the callbacks to be notified
+    """
+    def __init__(self, callbacks: Iterable[TrainerCallback]):
+        self.callbacks = tuple(callbacks)
+    def start_training(self, trainer: Trainer) -> None:
+        for c in self.callbacks:
+            c.start_training(trainer)
+    def end_training(self, trainer: Trainer) -> None:
+        for c in self.callbacks:
+            c.end_training(trainer)
+    def end_batch(self, trainer: Trainer, batch_num: int) -> bool:
+        """notify all callbacks about the end of the iteration / batch
+        Args:
+            trainer (Trainer): the trainer object
+            batch_num (int): the index of the current iteration / batch
+        Returns:
+            bool: ``True`` if at least one callback returned a truthy value
+        """
+        # build the full list first so that every callback runs even after one has requested a stop
+        stop_requests = [bool(c.end_batch(trainer, batch_num)) for c in self.callbacks]
+        return any(stop_requests)
+    def __repr__(self):
+        callbacks = ", ".join(repr(c) for c in self.callbacks)
+        return f'StackedTrainerCallbacks({callbacks})'
+def _init_logger(logger: Union[Logger, Tuple[Logger, ...], Loggers] = None):
+    """Normalize the ``logger`` argument into a single logger object.
+    A falsy value gives a plain ``Logger``, a ``Logger`` instance is returned unchanged and
+    anything else is unpacked into a ``Loggers`` container.
+    """
+    if logger:
+        return logger if isinstance(logger, Logger) else Loggers(*logger)
+    return Logger()
+def _update_loss_dict(loss_dict: dict, new_values: dict):
+    """Append every value of ``new_values`` to the list stored under the same key in ``loss_dict``.
+    Args:
+        loss_dict (dict): mapping from loss name to a list of values; it is modified in place and
+            must provide a list for every key of ``new_values`` (e.g. a ``defaultdict(list)``)
+        new_values (dict): mapping from loss name to the new value; objects with an ``item``
+            method (such as tensors) are converted with it, other values are stored as they are
+    """
+    for k, v in new_values.items():
+        # plain Python numbers have no ``item`` method and are appended unchanged
+        loss_dict[k].append(v.item() if hasattr(v, 'item') else v)

reflectorch/ml/callbacks.py ADDED Viewed

@@ -0,0 +1,81 @@
+import torch
+import numpy as np
+from reflectorch.ml.basic_trainer import (
+    TrainerCallback,
+    Trainer,
+)
+from reflectorch.ml.utils import is_divisor
+__all__ = [
+    'SaveBestModel',
+    'LogLosses',
+]
+class SaveBestModel(TrainerCallback):
+    """Callback for periodically saving the best model weights
+    Args:
+        path (str): path for saving the model weights
+        freq (int, optional): frequency in iterations at which the current average loss is evaluated. Defaults to 50.
+        average (int, optional): number of recent iterations over which the average loss is computed. Defaults to 10.
+    """
+    def __init__(self, path: str, freq: int = 50, average: int = 10):
+        self.path = path
+        self.average = average
+        # lowest average loss seen so far; any finite loss improves on the initial value
+        self._best_loss = np.inf
+        self.freq = freq
+    def end_batch(self, trainer: Trainer, batch_num: int) -> None:
+        """checks if the current average loss has improved from the previous save, if true the model is saved
+        Args:
+            trainer (Trainer): the trainer object
+            batch_num (int): the current iteration / batch
+        """
+        if not is_divisor(batch_num, self.freq):
+            return
+        # use the key under which the trainer stores the total loss, falling back to its default name
+        loss_key = getattr(trainer, 'TOTAL_LOSS_KEY', 'total_loss')
+        recent_losses = trainer.losses[loss_key][-self.average:]
+        if len(recent_losses) == 0:
+            # nothing recorded yet: there is no average to compare
+            return
+        loss = np.mean(recent_losses)
+        if loss < self._best_loss:
+            self._best_loss = loss
+            self.save(trainer, batch_num)
+    def save(self, trainer: Trainer, batch_num: int):
+        """saves a dictionary containing the network weights, the learning rates, the losses and the current \
+            best loss with its corresponding iteration to the disk
+        Args:
+            trainer (Trainer): the trainer object
+            batch_num (int): the current iteration / batch
+        """
+        # iteration of the previous save (0 if there was none), replaced by the current iteration
+        prev_save = trainer.callback_params.pop('saved_iteration', 0)
+        trainer.callback_params['saved_iteration'] = batch_num
+        save_dict = {
+            'model': trainer.model.state_dict(),
+            'lrs': trainer.lrs,
+            'losses': trainer.losses,
+            'prev_save': prev_save,
+            'batch_num': batch_num,
+            'best_loss': self._best_loss
+        }
+        torch.save(save_dict, self.path)
+class LogLosses(TrainerCallback):
+    """Callback for logging the training losses"""
+    def end_batch(self, trainer: Trainer, batch_num: int) -> None:
+        """log the most recent value of every loss at the current iteration
+        Args:
+            trainer (Trainer): the trainer object
+            batch_num (int): the index of the current iteration / batch
+        """
+        for loss_name, loss_values in trainer.losses.items():
+            # skip losses without recorded values explicitly, so that an IndexError raised
+            # inside a logger is not silently swallowed
+            if len(loss_values) == 0:
+                continue
+            trainer.log(f'train/{loss_name}', loss_values[-1])

reflectorch/ml/dataloaders.py ADDED Viewed

@@ -0,0 +1,27 @@
+from torch import Tensor
+from reflectorch.data_generation import BasicDataset
+from reflectorch.data_generation.reflectivity import kinematical_approximation
+from reflectorch.data_generation.priors import BasicParams
+from reflectorch.ml.basic_trainer import DataLoader
+__all__ = [
+    "ReflectivityDataLoader",
+    "MultilayerDataLoader",
+]
+class ReflectivityDataLoader(BasicDataset, DataLoader):
+    """Data loader for reflectivity data.
+    It defines no members of its own: it only combines ``BasicDataset`` (the basic dataset class for reflectivity)
+    with ``DataLoader`` (which inherits from ``TrainerCallback``).
+    """
+class MultilayerDataLoader(ReflectivityDataLoader):
+    """Reflectivity data loader whose curves are computed with ``kinematical_approximation``"""
+    def _sample_from_prior(self, batch_size: int):
+        """draw ``batch_size`` samples with the ``optimized_sample`` method of the prior sampler"""
+        sampler = self.prior_sampler
+        return sampler.optimized_sample(batch_size)
+    def _calc_curves(self, q_values: Tensor, params: BasicParams):
+        """compute the curves at ``q_values`` from the thicknesses, roughnesses and SLDs of ``params``"""
+        thicknesses, roughnesses, slds = params.thicknesses, params.roughnesses, params.slds
+        return kinematical_approximation(q_values, thicknesses, roughnesses, slds)

reflectorch/ml/loggers.py ADDED Viewed

@@ -0,0 +1,56 @@
+from torch.utils.tensorboard import SummaryWriter
+__all__ = [
+    'Logger',
+    'Loggers',
+    'PrintLogger',
+    'TensorBoardLogger',
+]
+class Logger(object):
+    """Base class defining a common interface for logging; ``log`` does nothing here"""
+    def log(self, name: str, data):
+        """Log ``data`` under ``name``; meant to be overridden by subclasses."""
+        return None
+    def __setitem__(self, key, value):
+        """Make ``logger[key] = value`` equivalent to ``logger.log(key, value)``."""
+        self.log(key, value)
+class Loggers(Logger):
+    """Logger which forwards every record to several loggers, in the order they were given"""
+    def __init__(self, *loggers):
+        self._loggers = (*loggers,)
+    def log(self, name: str, data):
+        """Pass ``name`` and ``data`` on to the ``log`` method of each wrapped logger."""
+        for target in self._loggers:
+            target.log(name, data)
+class PrintLogger(Logger):
+    """Logger which writes every record to the console with ``print``"""
+    def log(self, name: str, data):
+        """Print the name, a ``': '`` separator and the data as three ``print`` arguments."""
+        fields = (name, ': ', data)
+        print(*fields)
+class TensorBoardLogger(Logger):
+    """Logger which writes scalar values to TensorBoard through a ``SummaryWriter``
+    A single step counter, starting at 1, is shared by all names: it is advanced on every call
+    of ``log``, regardless of the name being logged. Call ``close`` once logging is finished.
+    """
+    def __init__(self, log_dir: str):
+        """
+        Args:
+            log_dir (str): Directory where TensorBoard logs will be written
+        """
+        super().__init__()
+        self.writer = SummaryWriter(log_dir=log_dir)
+        self.step = 1
+    def log(self, name: str, data):
+        """Log scalar data to TensorBoard
+        Args:
+            name (str): Name/tag for the data
+            data: Scalar value to log
+        """
+        # objects exposing ``item`` (e.g. tensors) are converted with it first
+        if hasattr(data, 'item'):
+            data = data.item()
+        self.writer.add_scalar(name, data, self.step)
+        self.step += 1
+    def close(self):
+        """Close the underlying ``SummaryWriter`` so that pending events are written and the file is released"""
+        self.writer.close()