tsagentkit-timesfm 1.0.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
timesfm/flax/util.py ADDED
@@ -0,0 +1,107 @@
1
+ # Copyright 2025 Google LLC
2
+ #
3
+ # Licensed under the Apache License, Version 2.0 (the "License");
4
+ # you may not use this file except in compliance with the License.
5
+ # You may obtain a copy of the License at
6
+ #
7
+ # http://www.apache.org/licenses/LICENSE-2.0
8
+ #
9
+ # Unless required by applicable law or agreed to in writing, software
10
+ # distributed under the License is distributed on an "AS IS" BASIS,
11
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12
+ # See the License for the specific language governing permissions and
13
+ # limitations under the License.
14
+
15
+ """Flax utility functions for TimesFM layers."""
16
+
17
+ import dataclasses
18
+ import functools
19
+ import jax
20
+ import jax.numpy as jnp
21
+ import jaxtyping
22
+
23
+ Float = jaxtyping.Float
24
+ Array = jaxtyping.Array
25
+ Bool = jaxtyping.Bool
26
+ Integer = jaxtyping.Integer
27
+
28
+ _TOLERANCE = 1e-6
29
+
30
+
31
@jax.tree_util.register_dataclass
@dataclasses.dataclass(frozen=False)
class DecodeCache:
  """Cache for decoding.

  Registered as a JAX dataclass pytree so instances can be passed through
  `jax.jit`/`lax.scan` transformations. Declared `frozen=False` so the decode
  loop can rebind fields between steps.
  """

  # Presumably the next cache slot to write per example — confirm at call
  # site. Shape: (batch,).
  next_index: Integer[Array, "b"]
  # Presumably the count of masked (padded) positions per example. Shape: (batch,).
  num_masked: Integer[Array, "b"]
  # Cached attention keys, shape (batch, seq, heads, head_dim).
  key: Float[Array, "b n h d"]
  # Cached attention values, shape (batch, seq, heads, head_dim).
  value: Float[Array, "b n h d"]
40
+
41
+
42
@jax.jit
def update_running_stats(
    n: Float[Array, "b"],
    mu: Float[Array, "b"],
    sigma: Float[Array, "b"],
    x: Float[Array, "b p"],
    mask: Bool[Array, "b p"],
) -> tuple[
    tuple[Float[Array, "b"], Float[Array, "b"], Float[Array, "b"]],
    tuple[Float[Array, "b"], Float[Array, "b"], Float[Array, "b"]],
]:
  """Updates the running stats.

  Folds one new patch `x` into per-example running (count, mean, std) using
  the standard parallel mean/variance combination. Positions where `mask` is
  True are excluded, and the `jnp.where` guards keep an all-masked patch (or
  an all-zero running count) from producing divisions by zero.

  Args:
    n: Running count of observed (unmasked) values, shape (batch,).
    mu: Running mean, shape (batch,).
    sigma: Running standard deviation, shape (batch,).
    x: New patch of values, shape (batch, patch).
    mask: True where `x` is padding to be ignored, shape (batch, patch).

  Returns:
    A pair `(stats, stats)` where `stats = (new_n, new_mu, new_sigma)`; the
    same tuple is returned twice, matching the `(carry, output)` convention
    expected by `jax.lax.scan`.
  """
  # Positions that actually contribute to the statistics.
  is_legit = jnp.logical_not(mask)
  # Count/mean/std of the new patch alone; the `where=` reductions are
  # ill-defined when no position is legit, hence the `inc_n == 0` guards.
  inc_n = jnp.sum(is_legit.astype(jnp.float32), axis=-1, keepdims=False)
  inc_mu = jnp.where(
      inc_n == 0, 0.0, jnp.mean(x, axis=-1, keepdims=False, where=is_legit)
  )
  inc_sigma = jnp.where(
      inc_n == 0, 0.0, jnp.std(x, axis=-1, keepdims=False, where=is_legit)
  )
  new_n = n + inc_n
  # Combined mean: count-weighted average of the old and patch means.
  new_mu = jnp.where(new_n == 0, 0.0, (n * mu + inc_mu * inc_n) / new_n)
  # Combined variance: count-weighted variances plus the between-group
  # shifts of each mean relative to the combined mean.
  new_sigma = jnp.sqrt(
      jnp.where(
          new_n == 0,
          0.0,
          (
              n * sigma * sigma
              + inc_n * inc_sigma * inc_sigma
              + n * (mu - new_mu) * (mu - new_mu)
              + inc_n * (inc_mu - new_mu) * (inc_mu - new_mu)
          )
          / new_n,
      )
  )
  # Return the new stats twice: once as the scan carry, once as the output.
  return (w := (new_n, new_mu, new_sigma), w)
78
+
79
+
80
def scan_along_axis(f, init, xs, axis: int, **kwargs):
  """Runs `jax.lax.scan` over an arbitrary axis of `xs`.

  `lax.scan` always iterates over the leading axis, so every leaf of the
  `xs` pytree is rotated to put `axis` first, scanned, and the stacked
  outputs are rotated back to the original layout.

  Args:
    f: Scan body, `(carry, slice) -> (carry, output)`.
    init: Initial carry.
    xs: Pytree of arrays to scan over.
    axis: Axis of each leaf to iterate along.
    **kwargs: Forwarded to `jax.lax.scan` (e.g. `length`, `reverse`).

  Returns:
    `(carry, ys)` with each leaf of `ys` moved back so the scanned axis
    sits at `axis`.
  """

  def to_front(leaf):
    return jnp.moveaxis(leaf, axis, 0)

  def from_front(leaf):
    return jnp.moveaxis(leaf, 0, axis)

  rotated = jax.tree_util.tree_map(to_front, xs)
  carry, stacked = jax.lax.scan(f, init, rotated, **kwargs)
  return carry, jax.tree_util.tree_map(from_front, stacked)
88
+
89
+
90
@functools.partial(jax.jit, static_argnames=("reverse",))
def revin(
    x: Float[Array, "b ..."],
    mu: Float[Array, "b ..."],
    sigma: Float[Array, "b ..."],
    reverse: bool = False,
):
  """Reversible per-instance normalization.

  Forward (`reverse=False`) normalizes `x` with per-instance statistics;
  reverse applies the inverse affine map. `mu`/`sigma` may trail `x` by one
  or two axes and are broadcast by appending singleton dimensions.
  """
  # Align the stats' rank with x by appending singleton axes.
  rank_gap = len(x.shape) - len(mu.shape)
  if rank_gap == 1:
    mu, sigma = mu[..., None], sigma[..., None]
  elif rank_gap == 2:
    mu, sigma = mu[..., None, None], sigma[..., None, None]
  if reverse:
    return x * sigma + mu
  # Forward direction only: clamp near-zero scales to 1 to avoid division
  # blow-ups (the reverse path intentionally uses the raw sigma).
  safe_sigma = jnp.where(sigma < _TOLERANCE, 1.0, sigma)
  return (x - mu) / safe_sigma
@@ -0,0 +1,422 @@
1
+ # Copyright 2025 Google LLC
2
+ #
3
+ # Licensed under the Apache License, Version 2.0 (the "License");
4
+ # you may not use this file except in compliance with the License.
5
+ # You may obtain a copy of the License at
6
+ #
7
+ # http://www.apache.org/licenses/LICENSE-2.0
8
+ #
9
+ # Unless required by applicable law or agreed to in writing, software
10
+ # distributed under the License is distributed on an "AS IS" BASIS,
11
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12
+ # See the License for the specific language governing permissions and
13
+ # limitations under the License.
14
+
15
+ """TimesFM 2p5 base implementation."""
16
+
17
+ import dataclasses
18
+ from typing import Any, Callable, Sequence
19
+
20
+ import collections
21
+ import numpy as np
22
+
23
+ from .. import configs
24
+
25
+ ResidualBlockConfig = configs.ResidualBlockConfig
26
+ StackedTransformersConfig = configs.StackedTransformersConfig
27
+ TransformerConfig = configs.TransformerConfig
28
+ ForecastConfig = configs.ForecastConfig
29
+ Category = int | str
30
+ XRegMode = str
31
+
32
+
33
def strip_leading_nans(arr):
  """Removes contiguous NaN values from the beginning of a NumPy array.

  Args:
    arr: The input 1D NumPy array.

  Returns:
    A NumPy array (a view of `arr`) with leading NaN values removed.
    If the array is all NaNs or empty, returns an empty array.
  """

  isnan = np.isnan(arr)
  # Bug fix: `np.argmax(~isnan)` returns 0 when there is no valid element
  # at all, which used to return the entire all-NaN array instead of the
  # empty array promised by the docstring.
  if isnan.all():
    return arr[:0]
  first_valid_index = np.argmax(~isnan)
  return arr[first_valid_index:]
47
+
48
+
49
def linear_interpolation(arr):
  """Performs linear interpolation to fill NaN values in a 1D numpy array.

  Args:
    arr: The 1D numpy array containing NaN values.

  Returns:
    A new numpy array with NaN values filled using linear interpolation
    (leading/trailing NaNs take the nearest valid value, per `np.interp`
    edge behavior), or the original array object unchanged if no NaNs are
    present. If the array contains no valid values at all, NaNs are
    replaced with 0.0.
  """

  nans = np.isnan(arr)
  if not np.any(nans):  # Fast path: nothing to fill.
    return arr

  # Bug fix: operate on a copy. The original wrote `arr[nans] = ...` into
  # the caller's buffer, contradicting the documented "new numpy array".
  arr = arr.copy()

  def indices_of(z):
    return z.nonzero()[0]

  nans_indices = indices_of(nans)
  non_nans_indices = indices_of(~nans)
  non_nans_values = arr[~nans]

  try:
    arr[nans] = np.interp(nans_indices, non_nans_indices, non_nans_values)
  except ValueError:
    # np.interp raises when the set of sample points is empty (all-NaN
    # input). Fall back to a constant fill. Bug fix: the original tested
    # `if non_nans_values:`, which raises ValueError for arrays with more
    # than one element; use `.size` for an unambiguous emptiness check.
    mu = np.nanmean(arr) if non_nans_values.size else 0.0
    arr = np.where(np.isfinite(arr), arr, mu)
  return arr
82
+
83
+
84
@dataclasses.dataclass(frozen=True)
class TimesFM_2p5_200M_Definition:
  """Framework-agnostic config of TimesFM 2.5.

  Architecture hyperparameters of the 200M-parameter TimesFM 2.5 model,
  consumed by the framework-specific (e.g. Flax) implementations.
  """

  # NOTE(review): no type annotation, so this is a plain class attribute,
  # not a dataclass field (it will not appear in __init__ / asdict).
  # Presumably intentional — confirm.
  context_limit = 16384
  # Length of each input patch.
  input_patch_len: int = 32
  # Length of each output patch (point forecast head).
  output_patch_len: int = 128
  # Length of the quantile output.
  output_quantile_len: int = 1024
  # Quantile levels predicted by the quantile head.
  quantiles: list[float] = dataclasses.field(
      default_factory=lambda: [0.1, 0.2, 0.3, 0.4, 0.5, 0.6, 0.7, 0.8, 0.9]
  )
  # Index used when decoding; exact semantics (which head/quantile it
  # selects) are not visible here — TODO confirm against the decoder.
  decode_index: int = 5
  # Residual-block tokenizer: 64 input dims -> 1280-dim embeddings.
  tokenizer: ResidualBlockConfig = ResidualBlockConfig(
      input_dims=64,
      hidden_dims=1280,
      output_dims=1280,
      use_bias=True,
      activation="swish",
  )
  # 20-layer transformer stack: 1280 model dims, 16 heads, RMS norms,
  # rotary position embeddings, fused QKV projections.
  stacked_transformers: StackedTransformersConfig = StackedTransformersConfig(
      num_layers=20,
      transformer=TransformerConfig(
          model_dims=1280,
          hidden_dims=1280,
          num_heads=16,
          attention_norm="rms",
          feedforward_norm="rms",
          qk_norm="rms",
          use_bias=False,
          use_rotary_position_embeddings=True,
          ff_activation="swish",
          fuse_qkv=True,
      ),
  )
  # Output projection for the point forecast (1280 -> 1280).
  output_projection_point: ResidualBlockConfig = ResidualBlockConfig(
      input_dims=1280,
      hidden_dims=1280,
      output_dims=1280,
      use_bias=False,
      activation="swish",
  )
  # Output projection for the quantile forecast (1280 -> 10240).
  output_projection_quantiles: ResidualBlockConfig = ResidualBlockConfig(
      input_dims=1280,
      hidden_dims=1280,
      output_dims=10240,
      use_bias=False,
      activation="swish",
  )
132
+
133
+
134
class TimesFM_2p5:
  """Abstract base class for TimesFM models.

  Subclasses implement `load_checkpoint` and `compile`; this base provides
  the batching/preprocessing driver (`forecast`) and the covariate-regression
  wrapper (`forecast_with_covariates`).

  Attributes:
    forecast_config: Configuration for forecasting flags; None until
      `compile()` has been called.
    compiled_decode: Compiled decode function taking
      `(horizon, values, masks)` and returning point and quantile forecasts;
      None until `compile()` has been called.
    global_batch_size: Global batch size used per compiled decode call.
  """

  forecast_config: ForecastConfig | None = None
  compiled_decode: Callable[..., Any] | None = None
  global_batch_size: int = 0

  def load_checkpoint(self, path: str):
    """Loads a TimesFM model from a checkpoint."""
    raise NotImplementedError()

  def compile(self, forecast_config: ForecastConfig | None = None):
    """Compiles the TimesFM model for fast decoding."""
    raise NotImplementedError()

  def forecast(
      self, horizon: int, inputs: list[np.ndarray]
  ) -> tuple[np.ndarray, np.ndarray]:
    """Forecasts the time series.

    Each series is preprocessed (leading NaNs stripped, interior NaNs
    linearly interpolated, then left-padded with zeros or truncated to
    `max_context`), grouped into batches of `global_batch_size`, and fed to
    the compiled decode function.

    Args:
      horizon: Number of future steps to forecast.
      inputs: List of 1D context arrays; may contain NaNs.

    Returns:
      A `(point_forecast, quantile_forecast)` pair whose leading dimension
      equals `len(inputs)`.

    Raises:
      RuntimeError: If the model has not been compiled.
    """
    if self.compiled_decode is None:
      raise RuntimeError("Model is not compiled. Please call compile() first.")

    assert self.global_batch_size > 0
    assert self.forecast_config is not None

    context = self.forecast_config.max_context
    num_inputs = len(inputs)
    # Pad with short dummy series so the total divides the batch size.
    # NOTE(review): `inputs +=` mutates the caller's list in place — confirm
    # this side effect is acceptable to callers.
    if (w := num_inputs % self.global_batch_size) != 0:
      inputs += [np.array([0.0] * 3)] * (self.global_batch_size - w)

    output_points = []
    output_quantiles = []
    values = []
    masks = []
    idx = 0
    for each_input in inputs:
      # Clean the series: drop leading NaNs, fill interior NaNs.
      value = linear_interpolation(strip_leading_nans(np.array(each_input)))
      if (w := len(value)) >= context:
        # Long series: keep only the most recent `context` points.
        value = value[-context:]
        mask = np.zeros_like(value, dtype=bool)
      else:
        # Short series: left-pad with zeros and mark the padding in the mask.
        mask = np.array([True] * (context - w) + [False] * w)
        value = np.pad(value, (context - w, 0), "constant", constant_values=0.0)
      values.append(value)
      masks.append(mask)
      idx += 1
      if idx == self.global_batch_size:
        # Full batch accumulated: run one compiled decode call.
        idx = 0
        point_forecast, quantile_forecast = self.compiled_decode(horizon, values, masks)
        output_points.append(point_forecast)
        output_quantiles.append(quantile_forecast)
        values = []
        masks = []

    output_points = np.concatenate(output_points, axis=0)
    output_quantiles = np.concatenate(output_quantiles, axis=0)
    # Drop the results for the dummy padding entries.
    return output_points[:num_inputs], output_quantiles[:num_inputs]

  def forecast_with_covariates(
      self,
      inputs: list[Sequence[float]],
      dynamic_numerical_covariates: dict[str, Sequence[Sequence[float]]] | None = None,
      dynamic_categorical_covariates: (
          dict[str, Sequence[Sequence[Category]]] | None
      ) = None,
      static_numerical_covariates: dict[str, Sequence[float]] | None = None,
      static_categorical_covariates: dict[str, Sequence[Category]] | None = None,
      xreg_mode: XRegMode = "xreg + timesfm",
      normalize_xreg_target_per_input: bool = True,
      ridge: float = 0.0,
      max_rows_per_col: int = 0,
      force_on_cpu: bool = False,
  ):
    """Forecasts on a list of time series with covariates.

    To optimize inference speed, avoid string valued categorical covariates.

    Args:
      inputs: A list of time series forecast contexts. Each context time series
        should be in a format convertible to JTensor by `jnp.array`.
      dynamic_numerical_covariates: A dict of dynamic numerical covariates.
      dynamic_categorical_covariates: A dict of dynamic categorical covariates.
      static_numerical_covariates: A dict of static numerical covariates.
      static_categorical_covariates: A dict of static categorical covariates.
      xreg_mode: one of "xreg + timesfm" or "timesfm + xreg". "xreg + timesfm"
        fits a model on the residuals of the TimesFM forecast. "timesfm + xreg"
        fits a model on the targets then forecasts on the residuals via TimesFM.
      normalize_xreg_target_per_input: whether to normalize the xreg target per
        input in the given batch.
      ridge: ridge penalty for the linear model.
      max_rows_per_col: max number of rows per column for the linear model.
      force_on_cpu: whether to force running on cpu for the linear model.

    Returns:
      A tuple of two lists. The first is the outputs of the model. The second is
      the outputs of the xreg.

    Raises:
      ValueError: If the model is not compiled, `return_backcast` is off, no
        covariates are given, the mode is unknown, or an inferred horizon
        exceeds `max_horizon`.
    """
    if self.forecast_config is None:
      raise ValueError("Model is not compiled. Please call compile() first.")
    elif not self.forecast_config.return_backcast:
      raise ValueError(
          "For XReg, `return_backcast` must be set to True in the forecast config. Please recompile the model."
      )

    # Imported lazily to avoid a hard dependency for plain forecasting.
    from ..utils import xreg_lib

    # Verify and bookkeep covariates.
    if not (
        dynamic_numerical_covariates
        or dynamic_categorical_covariates
        or static_numerical_covariates
        or static_categorical_covariates
    ):
      raise ValueError(
          "At least one of dynamic_numerical_covariates,"
          " dynamic_categorical_covariates, static_numerical_covariates,"
          " static_categorical_covariates must be set."
      )

    # Track the lengths of (1) each input, (2) the part that can be used in the
    # linear model, and (3) the horizon.
    input_lens, train_lens, test_lens = [], [], []

    for i, input_ts in enumerate(inputs):
      input_len = len(input_ts)
      input_lens.append(input_len)

      if xreg_mode == "timesfm + xreg":
        # For fitting residuals, no TimesFM forecast on the first patch.
        # NOTE(review): `self.model.p` is not defined anywhere in this base
        # class — presumably provided by a subclass; confirm.
        train_lens.append(max(0, input_len - self.model.p))
      elif xreg_mode == "xreg + timesfm":
        train_lens.append(input_len)
      else:
        raise ValueError(f"Unsupported mode: {xreg_mode}")

      # Horizon per series: inferred from dynamic covariate length when
      # available, otherwise the compiled max horizon.
      if dynamic_numerical_covariates:
        test_lens.append(
            len(list(dynamic_numerical_covariates.values())[0][i]) - input_len
        )
      elif dynamic_categorical_covariates:
        test_lens.append(
            len(list(dynamic_categorical_covariates.values())[0][i]) - input_len
        )
      else:
        test_lens.append(self.forecast_config.max_horizon)

      if test_lens[-1] > self.forecast_config.max_horizon:
        # NOTE(review): message has a typo ('covaraites') and the adjacent
        # string literals concatenate without a space ("themax_horizon");
        # left byte-identical here since this is runtime text.
        raise ValueError(
            "Forecast horizon length inferred from the dynamic covaraites is longer than the"
            f"max_horizon defined in the forecast config: {test_lens[-1]} > {self.forecast_config.max_horizon=}."
        )

    # Prepare the covariates into train and test.
    train_dynamic_numerical_covariates = collections.defaultdict(list)
    test_dynamic_numerical_covariates = collections.defaultdict(list)
    train_dynamic_categorical_covariates = collections.defaultdict(list)
    test_dynamic_categorical_covariates = collections.defaultdict(list)
    # Split each dynamic covariate at the input boundary: the in-context part
    # trains the linear model; the part past the context is the test horizon.
    for covariates, train_covariates, test_covariates in (
        (
            dynamic_numerical_covariates,
            train_dynamic_numerical_covariates,
            test_dynamic_numerical_covariates,
        ),
        (
            dynamic_categorical_covariates,
            train_dynamic_categorical_covariates,
            test_dynamic_categorical_covariates,
        ),
    ):
      if not covariates:
        continue
      for covariate_name, covariate_values in covariates.items():
        for input_len, train_len, covariate_value in zip(
            input_lens, train_lens, covariate_values
        ):
          train_covariates[covariate_name].append(
              covariate_value[(input_len - train_len) : input_len]
          )
          test_covariates[covariate_name].append(covariate_value[input_len:])

    # Fit models.
    if xreg_mode == "timesfm + xreg":
      # Forecast via TimesFM then fit a model on the residuals.
      point_outputs, quantile_outputs = self.forecast(
          horizon=self.forecast_config.max_horizon, inputs=inputs
      )
      # Residual targets: actuals minus the TimesFM backcast over the
      # trainable tail of each input.
      targets = [
          (
              np.array(input_ts)[-train_len:]
              - point_output[: -self.forecast_config.max_horizon][-train_len:]
          )
          for input_ts, point_output, train_len in zip(inputs, point_outputs, train_lens)
      ]
      per_instance_stats = None
      if normalize_xreg_target_per_input:
        targets, per_instance_stats = xreg_lib.normalize(targets)
      xregs = xreg_lib.BatchedInContextXRegLinear(
          targets=targets,
          train_lens=train_lens,
          test_lens=test_lens,
          train_dynamic_numerical_covariates=train_dynamic_numerical_covariates,
          test_dynamic_numerical_covariates=test_dynamic_numerical_covariates,
          train_dynamic_categorical_covariates=train_dynamic_categorical_covariates,
          test_dynamic_categorical_covariates=test_dynamic_categorical_covariates,
          static_numerical_covariates=static_numerical_covariates,
          static_categorical_covariates=static_categorical_covariates,
      ).fit(
          ridge=ridge,
          # Drop one one-hot column only for the unpenalized fit, to avoid
          # collinearity; ridge regularization handles it otherwise.
          one_hot_encoder_drop=None if ridge > 0 else "first",
          max_rows_per_col=max_rows_per_col,
          force_on_cpu=force_on_cpu,
          debug_info=False,
          assert_covariates=True,
          assert_covariate_shapes=True,
      )
      if normalize_xreg_target_per_input:
        xregs = xreg_lib.renormalize(xregs, per_instance_stats)
      xregs = np.array(xregs)
      # Final outputs: TimesFM horizon forecast plus the xreg correction,
      # truncated to each series' inferred horizon.
      new_point_outputs = [
          (point_output[-self.forecast_config.max_horizon :][:test_len] + xreg)
          for point_output, test_len, xreg in zip(point_outputs, test_lens, xregs)
      ]
      new_quantile_outputs = [
          (
              quantile_output[-self.forecast_config.max_horizon :][:test_len]
              + xreg[..., None]
          )
          for quantile_output, test_len, xreg in zip(quantile_outputs, test_lens, xregs)
      ]

    else:
      # Fit a model on the targets then forecast on the residuals via TimesFM.
      targets = [
          np.array(input_ts)[-train_len:]
          for input_ts, train_len in zip(inputs, train_lens)
      ]
      per_instance_stats = None
      if normalize_xreg_target_per_input:
        targets, per_instance_stats = xreg_lib.normalize(targets)
      # debug_info=True also returns the in-context xreg fit, needed below.
      xregs, xregs_on_context, _, _, _ = xreg_lib.BatchedInContextXRegLinear(
          targets=targets,
          train_lens=train_lens,
          test_lens=test_lens,
          train_dynamic_numerical_covariates=train_dynamic_numerical_covariates,
          test_dynamic_numerical_covariates=test_dynamic_numerical_covariates,
          train_dynamic_categorical_covariates=train_dynamic_categorical_covariates,
          test_dynamic_categorical_covariates=test_dynamic_categorical_covariates,
          static_numerical_covariates=static_numerical_covariates,
          static_categorical_covariates=static_categorical_covariates,
      ).fit(
          ridge=ridge,
          one_hot_encoder_drop=None if ridge > 0 else "first",
          max_rows_per_col=max_rows_per_col,
          force_on_cpu=force_on_cpu,
          debug_info=True,
          assert_covariates=True,
          assert_covariate_shapes=True,
      )
      # TimesFM forecasts the residuals left after the linear fit.
      point_outputs, quantile_outputs = self.forecast(
          horizon=self.forecast_config.max_horizon,
          inputs=[
              target - xreg_on_context
              for target, xreg_on_context in zip(targets, xregs_on_context)
          ],
      )
      new_point_outputs = [
          (point_output[-self.forecast_config.max_horizon :][:test_len] + xreg)
          for point_output, test_len, xreg in zip(point_outputs, test_lens, xregs)
      ]
      new_quantile_outputs = [
          (
              quantile_output[-self.forecast_config.max_horizon :][:test_len]
              + xreg[..., None]
          )
          for quantile_output, test_len, xreg in zip(quantile_outputs, test_lens, xregs)
      ]
      # Undo the per-instance normalization applied to the targets in this
      # branch (the other branch renormalized the xreg correction instead).
      if normalize_xreg_target_per_input:
        new_point_outputs = xreg_lib.renormalize(new_point_outputs, per_instance_stats)
        new_quantile_outputs = xreg_lib.renormalize(
            new_quantile_outputs, per_instance_stats
        )

    return new_point_outputs, new_quantile_outputs