PyPI - tabpfn-time-series - Versions diffs - 1.0.3__py3-none-any.whl → 1.0.5__py3-none-any.whl - Mend

tabpfn-time-series 1.0.3__py3-none-any.whl → 1.0.5__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (6) hide show

tabpfn_time_series/predictor.py CHANGED Viewed

@@ -2,8 +2,13 @@ import logging
 from enum import Enum
 from tabpfn_time_series.ts_dataframe import TimeSeriesDataFrame
-from tabpfn_time_series.tabpfn_worker import TabPFNClient, LocalTabPFN, MockTabPFN
+from tabpfn_time_series.tabpfn_worker import (
+    TabPFNClient,
+    LocalTabPFN,
+    MockTabPFN,
+)
 from tabpfn_time_series.defaults import TABPFN_TS_DEFAULT_CONFIG
+from tabpfn_common_utils.telemetry import set_extension
 logger = logging.getLogger(__name__)
@@ -14,6 +19,7 @@ class TabPFNMode(Enum):
     MOCK = "tabpfn-mock"
+@set_extension("time-series")
 class TabPFNTimeSeriesPredictor:
     """
     Given a TimeSeriesDataFrame (multiple time series), perform prediction on each time series individually.
@@ -29,6 +35,7 @@ class TabPFNTimeSeriesPredictor:
             TabPFNMode.LOCAL: lambda: LocalTabPFN(config),
             TabPFNMode.MOCK: lambda: MockTabPFN(config),
         }
+        self.tabpfn_mode = tabpfn_mode
         self.tabpfn_worker = worker_mapping[tabpfn_mode]()
     def predict(

tabpfn_time_series/tabpfn_worker.py CHANGED Viewed

@@ -1,6 +1,8 @@
+import contextvars
 import logging
 from abc import ABC, abstractmethod
-from joblib import Parallel, delayed
+from joblib import Parallel, delayed, parallel_config
+import backoff
 from tqdm import tqdm
 import pandas as pd
@@ -14,6 +16,9 @@ from tabpfn_time_series.defaults import TABPFN_TS_DEFAULT_QUANTILE_CONFIG
 logger = logging.getLogger(__name__)
+# Per-call attempt counter, isolated per thread & task
+_retry_attempts = contextvars.ContextVar("predict_attempts", default=0)
 class TabPFNWorker(ABC):
     def __init__(
@@ -29,24 +34,7 @@ class TabPFNWorker(ABC):
         train_tsdf: TimeSeriesDataFrame,
         test_tsdf: TimeSeriesDataFrame,
     ):
-        predictions = Parallel(
-            n_jobs=self.num_workers,
-            backend="loky",
-        )(
-            delayed(self._prediction_routine)(
-                item_id,
-                train_tsdf.loc[item_id],
-                test_tsdf.loc[item_id],
-            )
-            for item_id in tqdm(train_tsdf.item_ids, desc="Predicting time series")
-        )
-        predictions = pd.concat(predictions)
-        # Sort predictions according to original item_ids order (important for MASE and WQL calculation)
-        predictions = predictions.loc[train_tsdf.item_ids]
-        return TimeSeriesDataFrame(predictions)
+        raise NotImplementedError("Predict method must be implemented in subclass")
     def _prediction_routine(
         self,
@@ -54,8 +42,6 @@ class TabPFNWorker(ABC):
         single_train_tsdf: TimeSeriesDataFrame,
         single_test_tsdf: TimeSeriesDataFrame,
     ) -> pd.DataFrame:
-        # logger.debug(f"Predicting on item_id: {item_id}")
         test_index = single_test_tsdf.index
         train_X, train_y = split_time_series_to_X_y(single_train_tsdf.copy())
         test_X, _ = split_time_series_to_X_y(single_test_tsdf.copy())
@@ -116,6 +102,39 @@ class TabPFNWorker(ABC):
         return result
+def _reset_attempts(_details=None):
+    """Convenience function to reset the attempt counter."""
+    _retry_attempts.set(0)
+def _predict_giveup_mixed(exc: Exception) -> bool:
+    """Determine whether to give up on a prediction call or not.
+    Returns:
+        True if the prediction call should be given up on, False otherwise.
+    """
+    if _is_tabpfn_gcs_429(exc):
+        return False
+    # Stop after first retry for non-429
+    return _retry_attempts.get() >= 2
+def _is_tabpfn_gcs_429(err: Exception) -> bool:
+    """Determine if an error is a 429 error raised from TabPFN API
+    and relates to GCS 429 errors.
+    Returns:
+        True if the error is a 429 error raised from TabPFN API.
+    """
+    markers = (
+        "TooManyRequests: 429",
+        "rateLimitExceeded",
+        "cloud.google.com/storage/docs/gcs429",
+    )
+    return any(m in str(err) for m in markers)
 class TabPFNClient(TabPFNWorker):
     def __init__(
         self,
@@ -135,6 +154,53 @@ class TabPFNClient(TabPFNWorker):
         super().__init__(config, num_workers)
+    def predict(
+        self,
+        train_tsdf: TimeSeriesDataFrame,
+        test_tsdf: TimeSeriesDataFrame,
+    ):
+        # Run the predictions in parallel
+        with parallel_config(backend="threading"):
+            results = Parallel(
+                n_jobs=self.num_workers,
+            )(
+                delayed(self._prediction_routine)(
+                    item_id,
+                    train_tsdf.loc[item_id],
+                    test_tsdf.loc[item_id],
+                )
+                for item_id in tqdm(train_tsdf.item_ids, desc="Predicting time series")
+            )
+        # Convert list to DataFrame
+        predictions = pd.concat(results)
+        # Sort predictions according to original item_ids order (important for MASE and WQL calculation)
+        predictions = predictions.loc[train_tsdf.item_ids]
+        return TimeSeriesDataFrame(predictions)
+    @backoff.on_exception(
+        backoff.expo,
+        Exception,
+        base=1,
+        factor=2,
+        max_tries=5,
+        jitter=backoff.full_jitter,
+        giveup=_predict_giveup_mixed,
+        on_success=_reset_attempts,
+    )
+    def _prediction_routine(
+        self,
+        item_id: str,
+        single_train_tsdf: TimeSeriesDataFrame,
+        single_test_tsdf: TimeSeriesDataFrame,
+    ) -> pd.DataFrame:
+        # Increment attempt count at start of each try
+        _retry_attempts.set(_retry_attempts.get() + 1)
+        return super()._prediction_routine(item_id, single_train_tsdf, single_test_tsdf)
     def _get_tabpfn_engine(self):
         from tabpfn_client import TabPFNRegressor

{tabpfn_time_series-1.0.3.dist-info → tabpfn_time_series-1.0.5.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: tabpfn_time_series
-Version: 1.0.3
+Version: 1.0.5
 Summary: Zero-shot time series forecasting with TabPFNv2
 Project-URL: Homepage, https://github.com/liam-sbhoo/tabpfn-time-series
 Project-URL: Bug Tracker, https://github.com/liam-sbhoo/tabpfn-time-series/issues
@@ -10,6 +10,7 @@ Classifier: License :: OSI Approved :: Apache Software License
 Classifier: Operating System :: OS Independent
 Classifier: Programming Language :: Python :: 3
 Requires-Python: >=3.10
+Requires-Dist: backoff>=2.2.1
 Requires-Dist: datasets>=4.0
 Requires-Dist: gluonts>=0.16.0
 Requires-Dist: pandas<2.2.0,>=2.1.2
@@ -17,6 +18,7 @@ Requires-Dist: python-dotenv>=1.1.0
 Requires-Dist: pyyaml>=6.0.1
 Requires-Dist: statsmodels>=0.14.5
 Requires-Dist: tabpfn-client>=0.1.7
+Requires-Dist: tabpfn-common-utils[telemetry-interactive]>=0.2.2
 Requires-Dist: tabpfn>=2.0.9
 Requires-Dist: tqdm
 Provides-Extra: dev
@@ -97,3 +99,33 @@ uv pip install -e ".[dev]"
 [![colab](https://colab.research.google.com/assets/colab-badge.svg)](https://colab.research.google.com/github/PriorLabs/tabpfn-time-series/blob/main/demo.ipynb)
 The demo should explain it all. 😉
+## 📊 Anonymous Telemetry
+This project collects **anonymous usage telemetry** by default.
+The data is used exclusively to help us understand how the library is being used and to guide future improvements.
+- **No personal data is collected**
+- **No code, model inputs, or outputs are ever sent**
+- **Data is strictly anonymous and cannot be linked to individuals**
+### What we collect
+We only collect high-level, non-identifying information such as:
+- Package version
+- Python version
+- How often fit and inference are called, including simple metadata like the dimensionality of the input and the type of task (e.g., classification vs. regression) (:warning: never the data itself)
+See the [Telemetry documentation](https://github.com/priorlabs/tabpfn/blob/main/TELEMETRY.md) for the full details of events and metadata.
+This data is processed in compliance with the **General Data Protection Regulation (GDPR)** principles of data minimization and purpose limitation.
+For more details, please see our [Privacy Policy](https://priorlabs.ai/privacy_policy/).
+### How to opt out
+If you prefer not to send telemetry, you can disable it by setting the following environment variable:
+```bash
+export TABPFN_DISABLE_TELEMETRY=1
+```
+---

{tabpfn_time_series-1.0.3.dist-info → tabpfn_time_series-1.0.5.dist-info}/RECORD RENAMED Viewed

@@ -2,15 +2,15 @@ tabpfn_time_series/__init__.py,sha256=XJXSKqWp3AF9mAaWi-4KCgHQG7NzNTaBkLOYOMxvhS
 tabpfn_time_series/data_preparation.py,sha256=wWjSaKgV9KqKonMtSuDbYnW59ixflrScKIP_HSJ_MlA,5427
 tabpfn_time_series/defaults.py,sha256=ki1y38FR4zmbHWgRjcryA5T88GzNMwhlZC-sTRjuK2U,248
 tabpfn_time_series/plot.py,sha256=UXgLR2S94vi-vv1ArQKI6uYl_QwSAwAau5jFzGmQ7hw,6582
-tabpfn_time_series/predictor.py,sha256=UDhvH7reB3HAuxOyggE4yl2ntQXivvxgXCN_RhoddHc,1467
-tabpfn_time_series/tabpfn_worker.py,sha256=ZlJrU0O1dxfKh_As5Le4phm0P4RCDeXKpqp9X-h5bQs,9619
+tabpfn_time_series/predictor.py,sha256=6R9Pb-8jD2jZp0nw1VOQFudJ7i676hwcUh96NRQRhOI,1609
+tabpfn_time_series/tabpfn_worker.py,sha256=k6td4Ml0E3Xr1gERze-S0kyvBB6q_hbLMzvSurdaSp0,11589
 tabpfn_time_series/ts_dataframe.py,sha256=X94mssw_mSFedjplG55hjwTzKj8mM3VwWynveX3fegA,52834
 tabpfn_time_series/features/__init__.py,sha256=lzdZWkEfntfg3ZHqNNbfbg-3o_VIzju0tebdRu3AzF4,421
 tabpfn_time_series/features/auto_features.py,sha256=3OqqY2h7umcoLjLx4hOXypLTjwzrMtd6cQKTNi83vrU,11561
 tabpfn_time_series/features/basic_features.py,sha256=OV3B__S30-CX88vGjwYQDWqAbJajQw80PxcnvJVUbm4,2955
 tabpfn_time_series/features/feature_generator_base.py,sha256=jtySWLJyX4E31v6CbX44EHa8cdz7OMyauf4ltNEQeAQ,534
 tabpfn_time_series/features/feature_transformer.py,sha256=JzxswTGRGlt00QoYFyvAILlUVD68njdvoU3v-phnyi8,1774
-tabpfn_time_series-1.0.3.dist-info/METADATA,sha256=qp6gKaktKWsK3WiyyONpLI3r5pIoio2dEeFwWhYKjY8,4917
-tabpfn_time_series-1.0.3.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
-tabpfn_time_series-1.0.3.dist-info/licenses/LICENSE.txt,sha256=iwhPL7kIWQG6gyLZZwIMDItGrNgxMDIq9itxkUSMapY,11345
-tabpfn_time_series-1.0.3.dist-info/RECORD,,
+tabpfn_time_series-1.0.5.dist-info/METADATA,sha256=tYxI37YfTs2irkka6-LmSNMOAvoyR6llSTNVcnbh_A8,6254
+tabpfn_time_series-1.0.5.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
+tabpfn_time_series-1.0.5.dist-info/licenses/LICENSE.txt,sha256=iwhPL7kIWQG6gyLZZwIMDItGrNgxMDIq9itxkUSMapY,11345
+tabpfn_time_series-1.0.5.dist-info/RECORD,,

{tabpfn_time_series-1.0.3.dist-info → tabpfn_time_series-1.0.5.dist-info}/WHEEL RENAMED Viewed

File without changes

{tabpfn_time_series-1.0.3.dist-info → tabpfn_time_series-1.0.5.dist-info}/licenses/LICENSE.txt RENAMED Viewed

File without changes

tabpfn-time-series 1.0.3__py3-none-any.whl → 1.0.5__py3-none-any.whl

tabpfn-time-series 1.0.3__py3-none-any.whl → 1.0.5__py3-none-any.whl