autogluon.timeseries 1.2.1b20250224__py3-none-any.whl → 1.4.1b20251215__py3-none-any.whl

This diff compares the contents of two publicly released versions of the package, as they appear in their public registry, and is provided for informational purposes only.

Potentially problematic release: this version of autogluon.timeseries might be problematic.

Files changed (108)
  1. autogluon/timeseries/configs/__init__.py +3 -2
  2. autogluon/timeseries/configs/hyperparameter_presets.py +62 -0
  3. autogluon/timeseries/configs/predictor_presets.py +106 -0
  4. autogluon/timeseries/dataset/ts_dataframe.py +256 -141
  5. autogluon/timeseries/learner.py +86 -52
  6. autogluon/timeseries/metrics/__init__.py +42 -8
  7. autogluon/timeseries/metrics/abstract.py +89 -19
  8. autogluon/timeseries/metrics/point.py +142 -53
  9. autogluon/timeseries/metrics/quantile.py +46 -21
  10. autogluon/timeseries/metrics/utils.py +4 -4
  11. autogluon/timeseries/models/__init__.py +8 -2
  12. autogluon/timeseries/models/abstract/__init__.py +2 -2
  13. autogluon/timeseries/models/abstract/abstract_timeseries_model.py +361 -592
  14. autogluon/timeseries/models/abstract/model_trial.py +2 -1
  15. autogluon/timeseries/models/abstract/tunable.py +189 -0
  16. autogluon/timeseries/models/autogluon_tabular/__init__.py +2 -0
  17. autogluon/timeseries/models/autogluon_tabular/mlforecast.py +282 -194
  18. autogluon/timeseries/models/autogluon_tabular/per_step.py +513 -0
  19. autogluon/timeseries/models/autogluon_tabular/transforms.py +25 -18
  20. autogluon/timeseries/models/chronos/__init__.py +2 -1
  21. autogluon/timeseries/models/chronos/chronos2.py +361 -0
  22. autogluon/timeseries/models/chronos/model.py +219 -138
  23. autogluon/timeseries/models/chronos/{pipeline/utils.py → utils.py} +81 -50
  24. autogluon/timeseries/models/ensemble/__init__.py +37 -2
  25. autogluon/timeseries/models/ensemble/abstract.py +107 -0
  26. autogluon/timeseries/models/ensemble/array_based/__init__.py +3 -0
  27. autogluon/timeseries/models/ensemble/array_based/abstract.py +240 -0
  28. autogluon/timeseries/models/ensemble/array_based/models.py +185 -0
  29. autogluon/timeseries/models/ensemble/array_based/regressor/__init__.py +12 -0
  30. autogluon/timeseries/models/ensemble/array_based/regressor/abstract.py +88 -0
  31. autogluon/timeseries/models/ensemble/array_based/regressor/linear_stacker.py +186 -0
  32. autogluon/timeseries/models/ensemble/array_based/regressor/per_quantile_tabular.py +94 -0
  33. autogluon/timeseries/models/ensemble/array_based/regressor/tabular.py +107 -0
  34. autogluon/timeseries/models/ensemble/ensemble_selection.py +167 -0
  35. autogluon/timeseries/models/ensemble/per_item_greedy.py +172 -0
  36. autogluon/timeseries/models/ensemble/weighted/__init__.py +8 -0
  37. autogluon/timeseries/models/ensemble/weighted/abstract.py +45 -0
  38. autogluon/timeseries/models/ensemble/weighted/basic.py +91 -0
  39. autogluon/timeseries/models/ensemble/weighted/greedy.py +62 -0
  40. autogluon/timeseries/models/gluonts/__init__.py +1 -1
  41. autogluon/timeseries/models/gluonts/{abstract_gluonts.py → abstract.py} +148 -208
  42. autogluon/timeseries/models/gluonts/dataset.py +109 -0
  43. autogluon/timeseries/models/gluonts/{torch/models.py → models.py} +38 -22
  44. autogluon/timeseries/models/local/__init__.py +0 -7
  45. autogluon/timeseries/models/local/abstract_local_model.py +71 -74
  46. autogluon/timeseries/models/local/naive.py +13 -9
  47. autogluon/timeseries/models/local/npts.py +9 -2
  48. autogluon/timeseries/models/local/statsforecast.py +52 -36
  49. autogluon/timeseries/models/multi_window/multi_window_model.py +65 -45
  50. autogluon/timeseries/models/registry.py +64 -0
  51. autogluon/timeseries/models/toto/__init__.py +3 -0
  52. autogluon/timeseries/models/toto/_internal/__init__.py +9 -0
  53. autogluon/timeseries/models/toto/_internal/backbone/__init__.py +3 -0
  54. autogluon/timeseries/models/toto/_internal/backbone/attention.py +196 -0
  55. autogluon/timeseries/models/toto/_internal/backbone/backbone.py +262 -0
  56. autogluon/timeseries/models/toto/_internal/backbone/distribution.py +70 -0
  57. autogluon/timeseries/models/toto/_internal/backbone/kvcache.py +136 -0
  58. autogluon/timeseries/models/toto/_internal/backbone/rope.py +89 -0
  59. autogluon/timeseries/models/toto/_internal/backbone/rotary_embedding_torch.py +342 -0
  60. autogluon/timeseries/models/toto/_internal/backbone/scaler.py +305 -0
  61. autogluon/timeseries/models/toto/_internal/backbone/transformer.py +333 -0
  62. autogluon/timeseries/models/toto/_internal/dataset.py +165 -0
  63. autogluon/timeseries/models/toto/_internal/forecaster.py +423 -0
  64. autogluon/timeseries/models/toto/dataloader.py +108 -0
  65. autogluon/timeseries/models/toto/hf_pretrained_model.py +200 -0
  66. autogluon/timeseries/models/toto/model.py +249 -0
  67. autogluon/timeseries/predictor.py +685 -297
  68. autogluon/timeseries/regressor.py +94 -44
  69. autogluon/timeseries/splitter.py +8 -32
  70. autogluon/timeseries/trainer/__init__.py +3 -0
  71. autogluon/timeseries/trainer/ensemble_composer.py +444 -0
  72. autogluon/timeseries/trainer/model_set_builder.py +256 -0
  73. autogluon/timeseries/trainer/prediction_cache.py +149 -0
  74. autogluon/timeseries/{trainer.py → trainer/trainer.py} +387 -390
  75. autogluon/timeseries/trainer/utils.py +17 -0
  76. autogluon/timeseries/transforms/__init__.py +2 -13
  77. autogluon/timeseries/transforms/covariate_scaler.py +34 -40
  78. autogluon/timeseries/transforms/target_scaler.py +37 -20
  79. autogluon/timeseries/utils/constants.py +10 -0
  80. autogluon/timeseries/utils/datetime/lags.py +3 -5
  81. autogluon/timeseries/utils/datetime/seasonality.py +1 -3
  82. autogluon/timeseries/utils/datetime/time_features.py +2 -2
  83. autogluon/timeseries/utils/features.py +70 -47
  84. autogluon/timeseries/utils/forecast.py +19 -14
  85. autogluon/timeseries/utils/timer.py +173 -0
  86. autogluon/timeseries/utils/warning_filters.py +4 -2
  87. autogluon/timeseries/version.py +1 -1
  88. autogluon.timeseries-1.4.1b20251215-py3.11-nspkg.pth +1 -0
  89. {autogluon.timeseries-1.2.1b20250224.dist-info → autogluon_timeseries-1.4.1b20251215.dist-info}/METADATA +49 -36
  90. autogluon_timeseries-1.4.1b20251215.dist-info/RECORD +103 -0
  91. {autogluon.timeseries-1.2.1b20250224.dist-info → autogluon_timeseries-1.4.1b20251215.dist-info}/WHEEL +1 -1
  92. autogluon/timeseries/configs/presets_configs.py +0 -79
  93. autogluon/timeseries/evaluator.py +0 -6
  94. autogluon/timeseries/models/chronos/pipeline/__init__.py +0 -11
  95. autogluon/timeseries/models/chronos/pipeline/base.py +0 -160
  96. autogluon/timeseries/models/chronos/pipeline/chronos.py +0 -585
  97. autogluon/timeseries/models/chronos/pipeline/chronos_bolt.py +0 -518
  98. autogluon/timeseries/models/ensemble/abstract_timeseries_ensemble.py +0 -78
  99. autogluon/timeseries/models/ensemble/greedy_ensemble.py +0 -170
  100. autogluon/timeseries/models/gluonts/torch/__init__.py +0 -0
  101. autogluon/timeseries/models/presets.py +0 -360
  102. autogluon.timeseries-1.2.1b20250224-py3.9-nspkg.pth +0 -1
  103. autogluon.timeseries-1.2.1b20250224.dist-info/RECORD +0 -68
  104. {autogluon.timeseries-1.2.1b20250224.dist-info → autogluon_timeseries-1.4.1b20251215.dist-info/licenses}/LICENSE +0 -0
  105. {autogluon.timeseries-1.2.1b20250224.dist-info → autogluon_timeseries-1.4.1b20251215.dist-info/licenses}/NOTICE +0 -0
  106. {autogluon.timeseries-1.2.1b20250224.dist-info → autogluon_timeseries-1.4.1b20251215.dist-info}/namespace_packages.txt +0 -0
  107. {autogluon.timeseries-1.2.1b20250224.dist-info → autogluon_timeseries-1.4.1b20251215.dist-info}/top_level.txt +0 -0
  108. {autogluon.timeseries-1.2.1b20250224.dist-info → autogluon_timeseries-1.4.1b20251215.dist-info}/zip-safe +0 -0
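
The remainder of this diff reproduces the single largest deletion in full: the legacy Chronos pipeline module autogluon/timeseries/models/chronos/pipeline/chronos.py (entry 96 above), removed together with the rest of the chronos/pipeline package (entries 94-97) as part of the Chronos model restructuring.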
autogluon/timeseries/models/chronos/pipeline/chronos.py (removed)
@@ -1,585 +0,0 @@
- # Copyright Amazon.com, Inc. or its affiliates. All Rights Reserved.
- # SPDX-License-Identifier: Apache-2.0
-
- # Original Source: https://github.com/amazon-science/chronos-forecasting
- # Authors: Lorenzo Stella <stellalo@amazon.com>, Abdul Fatir Ansari <ansarnd@amazon.com>
-
- import logging
- import warnings
- from dataclasses import dataclass
- from typing import Any, Dict, List, Literal, Optional, Tuple, Union
-
- import torch
- import torch.nn as nn
- from transformers import AutoConfig, AutoModelForSeq2SeqLM, GenerationConfig, PreTrainedModel
-
- from autogluon.timeseries.utils.warning_filters import set_loggers_level
-
- from .base import BaseChronosPipeline, ForecastType
-
- logger = logging.getLogger("autogluon.timeseries.models.chronos")
-
-
- __all__ = ["ChronosConfig", "ChronosPipeline"]
-
-
- @dataclass
- class ChronosConfig:
-     """
-     This class holds all the configuration parameters to be used
-     by ``ChronosTokenizer`` and ``ChronosPretrainedModel``.
-     """
-
-     tokenizer_class: str
-     tokenizer_kwargs: Dict[str, Any]
-     n_tokens: int
-     n_special_tokens: int
-     pad_token_id: int
-     eos_token_id: int
-     use_eos_token: bool
-     model_type: Literal["seq2seq"]
-     context_length: int
-     prediction_length: int
-     num_samples: int
-     temperature: float
-     top_k: int
-     top_p: float
-
-     def __post_init__(self):
-         assert self.pad_token_id < self.n_special_tokens and self.eos_token_id < self.n_special_tokens, (
-             f"Special token id's must be smaller than {self.n_special_tokens=}"
-         )
-
-     def create_tokenizer(self) -> "ChronosTokenizer":
-         if self.tokenizer_class == "MeanScaleUniformBins":
-             return MeanScaleUniformBins(**self.tokenizer_kwargs, config=self)
-         raise ValueError
-
-
- class ChronosTokenizer:
-     """
-     A ``ChronosTokenizer`` defines how time series are mapped into token IDs
-     and back.
-
-     For details, see the ``input_transform`` and ``output_transform`` methods,
-     which concrete classes must implement.
-     """
-
-     def context_input_transform(
-         self,
-         context: torch.Tensor,
-     ) -> Tuple:
-         """
-         Turn a batch of time series into token IDs, attention mask, and tokenizer_state.
-
-         Parameters
-         ----------
-         context
-             A tensor shaped (batch_size, time_length), containing the
-             timeseries to forecast. Use left-padding with ``torch.nan``
-             to align time series of different lengths.
-
-         Returns
-         -------
-         token_ids
-             A tensor of integers, shaped (batch_size, time_length + 1)
-             if ``config.use_eos_token`` and (batch_size, time_length)
-             otherwise, containing token IDs for the input series.
-         attention_mask
-             A boolean tensor, same shape as ``token_ids``, indicating
-             which input observations are not ``torch.nan`` (i.e. not
-             missing nor padding).
-         tokenizer_state
-             An object that can be passed to ``label_input_transform``
-             and ``output_transform``. Contains the relevant information
-             to decode output samples into real values,
-             such as location and scale parameters.
-         """
-         raise NotImplementedError()
-
-     def label_input_transform(self, label: torch.Tensor, tokenizer_state: Any) -> Tuple:
-         """
-         Turn a batch of label slices of time series into token IDs and attention mask
-         using the ``tokenizer_state`` provided by ``context_input_transform``.
-
-         Parameters
-         ----------
-         label
-             A tensor shaped (batch_size, time_length), containing the
-             timeseries label, i.e., the ground-truth future values.
-         tokenizer_state
-             An object returned by ``context_input_transform`` containing
-             relevant information to preprocess data, such as location and
-             scale. The nature of this depends on the specific tokenizer.
-             This is used for tokenizing the label, in order to use the same
-             scaling used to tokenize the context.
-
-         Returns
-         -------
-         token_ids
-             A tensor of integers, shaped (batch_size, time_length + 1)
-             if ``config.use_eos_token`` and (batch_size, time_length)
-             otherwise, containing token IDs for the input series.
-         attention_mask
-             A boolean tensor, same shape as ``token_ids``, indicating
-             which input observations are not ``torch.nan`` (i.e. not
-             missing nor padding).
-         """
-         raise NotImplementedError()
-
-     def output_transform(self, samples: torch.Tensor, tokenizer_state: Any) -> torch.Tensor:
-         """
-         Turn a batch of sample token IDs into real values.
-
-         Parameters
-         ----------
-         samples
-             A tensor of integers, shaped (batch_size, num_samples, time_length),
-             containing token IDs of sample trajectories.
-         tokenizer_state
-             An object returned by ``input_transform`` containing
-             relevant context to decode samples, such as location and scale.
-             The nature of this depends on the specific tokenizer.
-
-         Returns
-         -------
-         forecasts
-             A real tensor, shaped (batch_size, num_samples, time_length),
-             containing forecasted sample paths.
-         """
-         raise NotImplementedError()
-
-
- class MeanScaleUniformBins(ChronosTokenizer):
-     """
-     A tokenizer that performs mean scaling and then quantizes the scaled time series into
-     uniformly-spaced bins between some bounds on the real line.
-     """
-
-     def __init__(self, low_limit: float, high_limit: float, config: ChronosConfig) -> None:
-         self.config = config
-         self.centers = torch.linspace(
-             low_limit,
-             high_limit,
-             config.n_tokens - config.n_special_tokens - 1,
-         )
-         self.boundaries = torch.concat(
-             (
-                 torch.tensor([-1e20], device=self.centers.device),
-                 (self.centers[1:] + self.centers[:-1]) / 2,
-                 torch.tensor([1e20], device=self.centers.device),
-             )
-         )
-
-     def _input_transform(
-         self, context: torch.Tensor, scale: Optional[torch.Tensor] = None
-     ) -> Tuple[torch.Tensor, torch.Tensor, torch.Tensor]:
-         attention_mask = ~torch.isnan(context)
-
-         if scale is None:
-             scale = torch.nansum(torch.abs(context) * attention_mask, dim=-1) / torch.nansum(attention_mask, dim=-1)
-             scale[~(scale > 0)] = 1.0
-
-         scaled_context = context / scale.unsqueeze(dim=-1)
-         token_ids = (
-             torch.bucketize(
-                 input=scaled_context,
-                 boundaries=self.boundaries,
-                 # buckets are open to the right, see:
-                 # https://pytorch.org/docs/2.1/generated/torch.bucketize.html#torch-bucketize
-                 right=True,
-             )
-             + self.config.n_special_tokens
-         )
-         token_ids[~attention_mask] = self.config.pad_token_id
-         token_ids.clamp_(0, self.config.n_tokens - 1)
-
-         return token_ids, attention_mask, scale
-
-     def _append_eos_token(
-         self, token_ids: torch.Tensor, attention_mask: torch.Tensor
-     ) -> Tuple[torch.Tensor, torch.Tensor]:
-         batch_size = token_ids.shape[0]
-         eos_tokens = torch.full((batch_size, 1), fill_value=self.config.eos_token_id)
-         token_ids = torch.concat((token_ids, eos_tokens), dim=1)
-         eos_mask = torch.full((batch_size, 1), fill_value=True)
-         attention_mask = torch.concat((attention_mask, eos_mask), dim=1)
-
-         return token_ids, attention_mask
-
-     def context_input_transform(self, context: torch.Tensor) -> Tuple[torch.Tensor, torch.Tensor, torch.Tensor]:
-         length = context.shape[-1]
-
-         if length > self.config.context_length:
-             context = context[..., -self.config.context_length :]
-
-         token_ids, attention_mask, scale = self._input_transform(context=context)
-
-         if self.config.use_eos_token and self.config.model_type == "seq2seq":
-             token_ids, attention_mask = self._append_eos_token(token_ids=token_ids, attention_mask=attention_mask)
-
-         return token_ids, attention_mask, scale
-
-     def label_input_transform(self, label: torch.Tensor, scale: torch.Tensor) -> Tuple[torch.Tensor, torch.Tensor]:
-         token_ids, attention_mask, _ = self._input_transform(context=label, scale=scale)
-
-         if self.config.use_eos_token:
-             token_ids, attention_mask = self._append_eos_token(token_ids=token_ids, attention_mask=attention_mask)
-
-         return token_ids, attention_mask
-
-     def output_transform(self, samples: torch.Tensor, scale: torch.Tensor) -> torch.Tensor:
-         scale_unsqueezed = scale.unsqueeze(-1).unsqueeze(-1)
-         indices = torch.clamp(
-             samples - self.config.n_special_tokens - 1,
-             min=0,
-             max=len(self.centers) - 1,
-         )
-         return self.centers[indices] * scale_unsqueezed
-
-
- class ChronosPretrainedModel(nn.Module):
-     """
-     A ``ChronosPretrainedModel`` wraps a ``PreTrainedModel`` object from ``transformers``
-     and uses it to predict sample paths for time series tokens.
-
-     Parameters
-     ----------
-     config
-         The configuration to use.
-     model
-         The pre-trained model to use.
-     """
-
-     def __init__(self, config: ChronosConfig, model: PreTrainedModel) -> None:
-         super().__init__()
-         self.config = config
-         self.model = model
-
-     @property
-     def device(self):
-         return self.model.device
-
-     def encode(
-         self,
-         input_ids: torch.Tensor,
-         attention_mask: torch.Tensor,
-     ):
-         """
-         Extract the encoder embedding for the given token sequences.
-
-         Parameters
-         ----------
-         input_ids
-             Tensor of indices of input sequence tokens in the vocabulary
-             with shape (batch_size, sequence_length).
-         attention_mask
-             A mask tensor of the same shape as input_ids to avoid attending
-             on padding or missing tokens.
-
-         Returns
-         -------
-         embedding
-             A tensor of encoder embeddings with shape
-             (batch_size, sequence_length, d_model).
-         """
-         assert self.config.model_type == "seq2seq", "Encoder embeddings are only supported for encoder-decoder models"
-         return self.model.encoder(input_ids=input_ids, attention_mask=attention_mask).last_hidden_state
-
-     def forward(
-         self,
-         input_ids: torch.Tensor,
-         attention_mask: torch.Tensor,
-         prediction_length: Optional[int] = None,
-         num_samples: Optional[int] = None,
-         temperature: Optional[float] = None,
-         top_k: Optional[int] = None,
-         top_p: Optional[float] = None,
-     ) -> torch.Tensor:
-         """
-         Predict future sample tokens for the given token sequences.
-
-         Arguments ``prediction_length``, ``num_samples``, ``temperature``,
-         ``top_k``, ``top_p`` can be used to customize the model inference,
-         and default to the corresponding attributes in ``self.config`` if
-         not provided.
-
-         Returns
-         -------
-         samples
-             A tensor of integers, shaped (batch_size, num_samples, time_length),
-             containing forecasted sample paths.
-         """
-         if prediction_length is None:
-             prediction_length = self.config.prediction_length
-         if num_samples is None:
-             num_samples = self.config.num_samples
-         if temperature is None:
-             temperature = self.config.temperature
-         if top_k is None:
-             top_k = self.config.top_k
-         if top_p is None:
-             top_p = self.config.top_p
-
-         preds = self.model.generate(
-             input_ids=input_ids,
-             attention_mask=attention_mask.long(),  # int64 (long) type conversion needed for ONNX
-             generation_config=GenerationConfig(
-                 min_new_tokens=prediction_length,
-                 max_new_tokens=prediction_length,
-                 do_sample=True,
-                 num_return_sequences=num_samples,
-                 eos_token_id=self.config.eos_token_id,
-                 pad_token_id=self.config.pad_token_id,
-                 temperature=temperature,
-                 top_k=top_k,
-                 top_p=top_p,
-             ),
-         )
-
-         if self.config.model_type == "seq2seq":
-             preds = preds[..., 1:]  # remove the decoder start token
-         else:
-             assert self.config.model_type == "causal"
-             assert preds.size(-1) == input_ids.size(-1) + prediction_length
-             preds = preds[..., -prediction_length:]
-
-         return preds.reshape(input_ids.size(0), num_samples, -1)
-
-
- class ChronosPipeline(BaseChronosPipeline):
-     """
-     A ``ChronosPipeline`` uses the given tokenizer and model to forecast
-     input time series.
-
-     Use the ``from_pretrained`` class method to load serialized models.
-     Use the ``predict`` method to get forecasts.
-
-     Parameters
-     ----------
-     tokenizer
-         The tokenizer object to use.
-     model
-         The model to use.
-     """
-
-     tokenizer: ChronosTokenizer
-     model: ChronosPretrainedModel
-     forecast_type: ForecastType = ForecastType.SAMPLES
-
-     def __init__(self, tokenizer, model):
-         super().__init__(inner_model=model.model)
-         self.tokenizer = tokenizer
-         self.model = model
-
-     @torch.no_grad()
-     def embed(self, context: Union[torch.Tensor, List[torch.Tensor]]) -> Tuple[torch.Tensor, Any]:
-         """
-         Get encoder embeddings for the given time series.
-
-         Parameters
-         ----------
-         context
-             Input series. This is either a 1D tensor, or a list
-             of 1D tensors, or a 2D tensor whose first dimension
-             is batch. In the latter case, use left-padding with
-             ``torch.nan`` to align series of different lengths.
-
-         Returns
-         -------
-         embeddings, tokenizer_state
-             A tuple of two tensors: the encoder embeddings and the tokenizer_state,
-             e.g., the scale of the time series in the case of mean scaling.
-             The encoder embeddings are shaped (batch_size, context_length, d_model)
-             or (batch_size, context_length + 1, d_model), where context_length
-             is the size of the context along the time axis if a 2D tensor was provided
-             or the length of the longest time series, if a list of 1D tensors was
-             provided, and the extra 1 is for EOS.
-         """
-         context_tensor = self._prepare_and_validate_context(context=context)
-         token_ids, attention_mask, tokenizer_state = self.tokenizer.context_input_transform(context_tensor)
-         embeddings = self.model.encode(
-             input_ids=token_ids.to(self.model.device),
-             attention_mask=attention_mask.to(self.model.device),
-         ).cpu()
-         return embeddings, tokenizer_state
-
-     def predict(
-         self,
-         context: Union[torch.Tensor, List[torch.Tensor]],
-         prediction_length: Optional[int] = None,
-         num_samples: Optional[int] = None,
-         temperature: Optional[float] = None,
-         top_k: Optional[int] = None,
-         top_p: Optional[float] = None,
-         limit_prediction_length: bool = False,
-         **kwargs,
-     ) -> torch.Tensor:
-         """
-         Get forecasts for the given time series.
-
-         Parameters
-         ----------
-         context
-             Input series. This is either a 1D tensor, or a list
-             of 1D tensors, or a 2D tensor whose first dimension
-             is batch. In the latter case, use left-padding with
-             ``torch.nan`` to align series of different lengths.
-         prediction_length
-             Time steps to predict. Defaults to what specified
-             in ``self.model.config``.
-         num_samples
-             Number of sample paths to predict. Defaults to what
-             specified in ``self.model.config``.
-         temperature
-             Temperature to use for generating sample tokens.
-             Defaults to what specified in ``self.model.config``.
-         top_k
-             Top-k parameter to use for generating sample tokens.
-             Defaults to what specified in ``self.model.config``.
-         top_p
-             Top-p parameter to use for generating sample tokens.
-             Defaults to what specified in ``self.model.config``.
-         limit_prediction_length
-             Force prediction length smaller or equal than the
-             built-in prediction length from the model. True by
-             default. When true, fail loudly if longer predictions
-             are requested, otherwise longer predictions are allowed.
-
-         Returns
-         -------
-         samples
-             Tensor of sample forecasts, of shape
-             (batch_size, num_samples, prediction_length).
-         """
-         context_tensor = self._prepare_and_validate_context(context=context)
-         if prediction_length is None:
-             prediction_length = self.model.config.prediction_length
-
-         if prediction_length > self.model.config.prediction_length:
-             msg = (
-                 f"We recommend keeping prediction length <= {self.model.config.prediction_length}. "
-                 f"The quality of longer predictions may degrade since the model is not optimized for it. "
-             )
-             if limit_prediction_length:
-                 msg += "You can turn off this check by setting `limit_prediction_length=False`."
-                 raise ValueError(msg)
-             warnings.warn(msg, stacklevel=2)
-
-         predictions = []
-         remaining = prediction_length
-
-         while remaining > 0:
-             token_ids, attention_mask, scale = self.tokenizer.context_input_transform(context_tensor)
-             samples = self.model(
-                 token_ids.to(self.model.device),
-                 attention_mask.to(self.model.device),
-                 min(remaining, self.model.config.prediction_length),
-                 num_samples,
-                 temperature,
-                 top_k,
-                 top_p,
-             )
-             prediction = self.tokenizer.output_transform(samples.to(scale.device), scale)
-
-             predictions.append(prediction)
-             remaining -= prediction.shape[-1]
-
-             if remaining <= 0:
-                 break
-
-             context_tensor = torch.cat([context_tensor, prediction.median(dim=1).values], dim=-1)
-
-         return torch.cat(predictions, dim=-1)
-
-     def predict_quantiles(
-         self,
-         context: torch.Tensor,
-         prediction_length: int,
-         quantile_levels: List[float],
-         num_samples: Optional[int] = None,
-         **kwargs,
-     ) -> Tuple[torch.Tensor, torch.Tensor]:
-         num_samples = num_samples or self.model.config.num_samples
-         prediction_samples = (
-             self.predict(
-                 context,
-                 prediction_length=prediction_length,
-                 num_samples=num_samples,
-             )
-             .detach()
-             .cpu()
-             .swapaxes(1, 2)
-         )
-         mean = prediction_samples.mean(dim=-1, keepdim=True)
-         quantiles = torch.quantile(
-             prediction_samples,
-             q=torch.tensor(quantile_levels, dtype=prediction_samples.dtype),
-             dim=-1,
-         ).permute(1, 2, 0)
-
-         return quantiles, mean
-
-     @classmethod
-     def from_pretrained(cls, *args, **kwargs):
-         """
-         Load the model, either from a local path or from the HuggingFace Hub.
-         Supports the same arguments as ``AutoConfig`` and ``AutoModel``
-         from ``transformers``.
-         """
-         kwargs = kwargs.copy()
-
-         optimization_strategy = kwargs.pop("optimization_strategy", None)
-         context_length = kwargs.pop("context_length", None)
-
-         config = AutoConfig.from_pretrained(*args, **kwargs)
-         assert hasattr(config, "chronos_config"), "Not a Chronos config file"
-
-         if context_length is not None:
-             config.chronos_config["context_length"] = context_length
-         chronos_config = ChronosConfig(**config.chronos_config)
-
-         assert chronos_config.model_type == "seq2seq"
-         if optimization_strategy is None:
-             inner_model = AutoModelForSeq2SeqLM.from_pretrained(*args, **kwargs)
-         else:
-             assert optimization_strategy in [
-                 "onnx",
-                 "openvino",
-             ], "optimization_strategy not recognized. Please provide one of `onnx` or `openvino`"
-             kwargs.pop("resume_download", None)  # Optimized pipeline does not support 'resume_download' kwargs
-             torch_dtype = kwargs.pop("torch_dtype", "auto")
-             if torch_dtype != "auto":
-                 logger.warning(f"\t`torch_dtype` will be ignored for optimization_strategy {optimization_strategy}")
-
-             if optimization_strategy == "onnx":
-                 try:
-                     from optimum.onnxruntime import ORTModelForSeq2SeqLM
-                 except ImportError:
-                     raise ImportError(
-                         "Huggingface Optimum library must be installed with ONNX for using the `onnx` strategy. "
-                         "Please try running `pip install optimum[onnxruntime]` or use Chronos-Bolt models for "
-                         "faster performance on the CPU."
-                     )
-
-                 assert kwargs.pop("device_map", "cpu") in ["cpu", "auto"], "ONNX mode only available on the CPU"
-                 with set_loggers_level(regex=r"^optimum.*", level=logging.ERROR):
-                     inner_model = ORTModelForSeq2SeqLM.from_pretrained(*args, **{**kwargs, "export": True})
-             elif optimization_strategy == "openvino":
-                 try:
-                     from optimum.intel import OVModelForSeq2SeqLM
-                 except ImportError:
-                     raise ImportError(
-                         "Huggingface Optimum library must be installed with OpenVINO for using the `openvino` strategy. "
-                         "Please try running `pip install optimum-intel[openvino,nncf] optimum[openvino,nncf]` or use "
-                         "Chronos-Bolt models for faster performance on the CPU."
-                     )
-                 with set_loggers_level(regex=r"^optimum.*", level=logging.ERROR):
-                     inner_model = OVModelForSeq2SeqLM.from_pretrained(
-                         *args, **{**kwargs, "device_map": "cpu", "export": True}
-                     )
-
-         return cls(
-             tokenizer=chronos_config.create_tokenizer(),
-             model=ChronosPretrainedModel(config=chronos_config, model=inner_model),
-         )
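
For readers skimming the removal: the core of the deleted pipeline is the MeanScaleUniformBins tokenizer, which mean-scales each series and quantizes it into uniformly spaced bins, with the bottom of the vocabulary reserved for special tokens. Below is a minimal standalone sketch of that round trip, written against the removed code above; the constants (vocabulary size, bin limits, pad token ID) are illustrative stand-ins for a ChronosConfig, not values read from any released checkpoint.

    import torch

    # Illustrative constants standing in for a ChronosConfig (assumptions, not
    # values from any released model checkpoint).
    N_TOKENS = 4096          # config.n_tokens (vocabulary size)
    N_SPECIAL = 2            # config.n_special_tokens (e.g. pad and eos)
    PAD_TOKEN_ID = 0         # config.pad_token_id
    LOW, HIGH = -15.0, 15.0  # tokenizer_kwargs: low_limit, high_limit

    # Bin centers and boundaries, as in MeanScaleUniformBins.__init__.
    centers = torch.linspace(LOW, HIGH, N_TOKENS - N_SPECIAL - 1)
    boundaries = torch.cat(
        (torch.tensor([-1e20]), (centers[1:] + centers[:-1]) / 2, torch.tensor([1e20]))
    )

    # A toy batch of one series; NaN marks a missing (or padded) observation.
    context = torch.tensor([[1.0, 2.0, 3.0, float("nan"), 5.0]])
    attention_mask = ~torch.isnan(context)

    # Mean scaling: divide by the mean absolute value of the observed entries.
    scale = torch.nansum(torch.abs(context) * attention_mask, dim=-1) / attention_mask.sum(dim=-1)
    scale[~(scale > 0)] = 1.0
    scaled = context / scale.unsqueeze(-1)

    # Quantize into uniform bins; special tokens occupy the bottom of the vocabulary.
    token_ids = torch.bucketize(scaled, boundaries, right=True) + N_SPECIAL
    token_ids[~attention_mask] = PAD_TOKEN_ID
    token_ids.clamp_(0, N_TOKENS - 1)

    # Decoding (output_transform): map token IDs back to bin centers and rescale.
    indices = (token_ids - N_SPECIAL - 1).clamp(0, len(centers) - 1)
    decoded = centers[indices] * scale.unsqueeze(-1)

Forecasting then reduces to sampling token trajectories from the wrapped seq2seq model and decoding them with the same per-series scale; for horizons longer than the model's built-in prediction_length, the removed predict method loops autoregressively, appending the per-step median of the decoded samples to the context before generating the next chunk.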