zipline_polygon_bundle 0.2.0.dev1__tar.gz → 0.2.1__tar.gz
This diff shows the changes between two publicly released versions of the package, as they appear in the public registry, and is provided for informational purposes only.
- {zipline_polygon_bundle-0.2.0.dev1 → zipline_polygon_bundle-0.2.1}/PKG-INFO +8 -6
- {zipline_polygon_bundle-0.2.0.dev1 → zipline_polygon_bundle-0.2.1}/README.md +3 -0
- {zipline_polygon_bundle-0.2.0.dev1 → zipline_polygon_bundle-0.2.1}/pyproject.toml +11 -8
- {zipline_polygon_bundle-0.2.0.dev1 → zipline_polygon_bundle-0.2.1}/zipline_polygon_bundle/__init__.py +7 -9
- {zipline_polygon_bundle-0.2.0.dev1 → zipline_polygon_bundle-0.2.1}/zipline_polygon_bundle/adjustments.py +27 -32
- {zipline_polygon_bundle-0.2.0.dev1 → zipline_polygon_bundle-0.2.1}/zipline_polygon_bundle/bundle.py +157 -312
- zipline_polygon_bundle-0.2.1/zipline_polygon_bundle/compute_signals.py +261 -0
- {zipline_polygon_bundle-0.2.0.dev1 → zipline_polygon_bundle-0.2.1}/zipline_polygon_bundle/concat_all_aggs.py +130 -25
- {zipline_polygon_bundle-0.2.0.dev1 → zipline_polygon_bundle-0.2.1}/zipline_polygon_bundle/config.py +57 -32
- zipline_polygon_bundle-0.2.1/zipline_polygon_bundle/trades.py +533 -0
- zipline_polygon_bundle-0.2.0.dev1/zipline_polygon_bundle/trades.py +0 -944
- {zipline_polygon_bundle-0.2.0.dev1 → zipline_polygon_bundle-0.2.1}/LICENSE +0 -0
- {zipline_polygon_bundle-0.2.0.dev1 → zipline_polygon_bundle-0.2.1}/zipline_polygon_bundle/concat_all_aggs_partitioned.py +0 -0
- {zipline_polygon_bundle-0.2.0.dev1 → zipline_polygon_bundle-0.2.1}/zipline_polygon_bundle/nyse_all_hours_calendar.py +0 -0
- {zipline_polygon_bundle-0.2.0.dev1 → zipline_polygon_bundle-0.2.1}/zipline_polygon_bundle/polygon_file_reader.py +0 -0
- {zipline_polygon_bundle-0.2.0.dev1 → zipline_polygon_bundle-0.2.1}/zipline_polygon_bundle/process_all_aggs.py +0 -0
- {zipline_polygon_bundle-0.2.0.dev1 → zipline_polygon_bundle-0.2.1}/zipline_polygon_bundle/quotes.py +0 -0
- {zipline_polygon_bundle-0.2.0.dev1 → zipline_polygon_bundle-0.2.1}/zipline_polygon_bundle/split_aggs_by_ticker.py +0 -0
- {zipline_polygon_bundle-0.2.0.dev1 → zipline_polygon_bundle-0.2.1}/zipline_polygon_bundle/tickers_and_names.py +0 -0
@@ -1,6 +1,6 @@
 Metadata-Version: 2.3
 Name: zipline_polygon_bundle
-Version: 0.2.0.dev1
+Version: 0.2.1
 Summary: A zipline-reloaded data provider bundle for Polygon.io
 License: GNU AFFERO GENERAL PUBLIC LICENSE
         Version 3, 19 November 2007
@@ -666,22 +666,21 @@ License: GNU AFFERO GENERAL PUBLIC LICENSE
 Keywords: zipline,data-bundle,finance
 Author: Jim White
 Author-email: jim@fovi.com
-Requires-Python: >=3.
+Requires-Python: >=3.10,<4.0
 Classifier: Programming Language :: Python :: 3
 Classifier: License :: OSI Approved :: GNU Affero General Public License v3
 Classifier: Operating System :: OS Independent
 Requires-Dist: bcolz-zipline (>=1.2.11)
+Requires-Dist: filelock (>=3.16.0)
 Requires-Dist: fsspec (>=2024.10)
 Requires-Dist: numpy (<2)
 Requires-Dist: pandas (>=2.2,<3)
-Requires-Dist: pandas-market-calendars (>=4.4.2)
-Requires-Dist: pandas_ta (>=0.3)
 Requires-Dist: polygon-api-client (>=1.14.2)
 Requires-Dist: pyarrow (>=18.1.0,<19)
 Requires-Dist: pytz (>=2018.5)
 Requires-Dist: requests (>=2.9.1)
-Requires-Dist: toolz (>=
-Requires-Dist: zipline-
+Requires-Dist: toolz (>=1)
+Requires-Dist: zipline-arrow (>=3.2.2)
 Project-URL: Repository, https://github.com/fovi-llc/zipline-polygon-bundle
 Description-Content-Type: text/markdown
@@ -745,6 +744,9 @@ register_polygon_equities_bundle(
 ## Install the Zipline Polygon.io Bundle PyPi package and check that it works.
 Listing bundles will show if everything is working correctly.
 ```bash
+pip install -U git+https://github.com/fovi-llc/zipline-reloaded.git@calendar
+pip install -U git+https://github.com/fovi-llc/zipline-polygon-bundle.git
+
 pip install zipline_polygon_bundle
 zipline -e extension.py bundles
 ```
@@ -58,6 +58,9 @@ register_polygon_equities_bundle(
 ## Install the Zipline Polygon.io Bundle PyPi package and check that it works.
 Listing bundles will show if everything is working correctly.
 ```bash
+pip install -U git+https://github.com/fovi-llc/zipline-reloaded.git@calendar
+pip install -U git+https://github.com/fovi-llc/zipline-polygon-bundle.git
+
 pip install zipline_polygon_bundle
 zipline -e extension.py bundles
 ```
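The README snippet above ends with `zipline -e extension.py bundles`, which assumes a Zipline extension file that registers the bundle. A minimal, hypothetical `extension.py` sketch is shown below; the bundle name and the single-argument call are assumptions, not taken from this diff, so check the project README for the actual `register_polygon_equities_bundle` parameters.

```python
# extension.py -- hypothetical minimal sketch, not taken from this diff.
# register_polygon_equities_bundle is exported by zipline_polygon_bundle 0.2.1;
# the bundle name and argument list used here are assumptions.
from zipline_polygon_bundle import register_polygon_equities_bundle

# Register a bundle under an assumed name so that `zipline bundles` lists it.
register_polygon_equities_bundle("polygon")
```

With a file like that in place, `zipline -e extension.py bundles` should list the registered bundle alongside the built-ins.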
@@ -1,6 +1,6 @@
 [project]
 name = 'zipline_polygon_bundle'
-version = '0.2.0.dev1'
+version = '0.2.1'
 description = 'A zipline-reloaded data provider bundle for Polygon.io'
 authors = [
     { name = 'Jim White', email = 'jim@fovi.com' },
@@ -19,7 +19,7 @@ Repository = 'https://github.com/fovi-llc/zipline-polygon-bundle'
 
 [tool.poetry]
 name = 'zipline-polygon-bundle'
-version = '0.2.0.dev1'
+version = '0.2.1'
 description = 'A zipline-reloaded data provider bundle for Polygon.io'
 authors = ['Jim White <jim@fovi.com>']
 license = 'AGPL-3.0'
@@ -33,25 +33,28 @@ classifiers = [
 
 [tool.poetry.dependencies]
 fsspec = ">=2024.10"
-
+filelock = ">=3.16.0"
+python = ">=3.10,<4.0"
 polygon-api-client = ">=1.14.2"
 pandas = ">=2.2,<3"
-pandas-market-calendars = ">=4.4.2"
-
+# pandas-market-calendars = ">=4.4.2"
+# pandas-ta install doesn't work with poetry for some reason.
+# It is used in compute_signals.py which we're not using yet.
+# pandas-ta = ">=0.3"
 pytz = ">=2018.5"
 requests = ">=2.9.1"
 bcolz-zipline = ">=1.2.11"
 pyarrow = ">=18.1.0,<19"
 numpy = "<2"
-toolz = ">=
-zipline-
+toolz = ">=1"
+zipline-arrow = { version = ">=3.2.2" }
 
 [tool.poetry.dev-dependencies]
 pytest = "*"
 
 [build-system]
 build-backend = "poetry.core.masonry.api"
-requires = ["poetry_core>=1.0
+requires = ["poetry_core>=2.1.0"]
 
 [tool.pytest.ini_options]
 # https://docs.pytest.org/en/stable/how-to/capture-warnings.html#controlling-warnings
@@ -1,17 +1,17 @@
 from .bundle import (
     register_polygon_equities_bundle,
     symbol_to_upper,
-
-    polygon_equities_bundle_minute,
+    ingest_polygon_equities_bundle
 )
 
 from .config import PolygonConfig
 from .nyse_all_hours_calendar import NYSE_ALL_HOURS, register_nyse_all_hours_calendar
 from .concat_all_aggs import concat_all_aggs_from_csv, generate_csv_agg_tables
 from .adjustments import load_splits, load_dividends, load_conditions
-from .trades import trades_schema, trades_dataset, cast_trades
+from .trades import trades_schema, trades_dataset, cast_trades
 from .trades import custom_aggs_partitioning, custom_aggs_schema, trades_to_custom_aggs, convert_trades_to_custom_aggs
-from .trades import
+from .trades import get_aggs_dates, generate_csv_trades_tables
+# from .compute_signals import compute_signals_for_all_custom_aggs
 from .quotes import quotes_schema, quotes_dataset, cast_quotes
 # from .tickers_and_names import load_all_tickers, merge_tickers, ticker_names_from_merged_tickers, get_ticker_universe
 from .tickers_and_names import PolygonAssets, get_ticker_universe
@@ -22,8 +22,7 @@ __all__ = [
     "register_nyse_all_hours_calendar",
     "NYSE_ALL_HOURS",
     "symbol_to_upper",
-    "
-    "polygon_equities_bundle_minute",
+    "ingest_polygon_equities_bundle",
     "PolygonConfig",
     "concat_all_aggs_from_csv",
     "generate_csv_agg_tables",
@@ -33,14 +32,13 @@ __all__ = [
     "trades_schema",
     "trades_dataset",
     "cast_trades",
-    "
-    "get_custom_aggs_dates",
+    "get_aggs_dates",
     "generate_csv_trades_tables",
     "custom_aggs_partitioning",
     "custom_aggs_schema",
     "trades_to_custom_aggs",
     "convert_trades_to_custom_aggs",
-    "compute_signals_for_all_custom_aggs",
+    # "compute_signals_for_all_custom_aggs",
     "quotes_schema",
    "quotes_dataset",
    "cast_quotes",
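The net effect of the two `__init__.py` hunks is a renamed public surface: `ingest_polygon_equities_bundle` replaces the per-frequency bundle functions, `get_aggs_dates` replaces `get_custom_aggs_dates`, and the compute_signals export is commented out for now. A small sketch of imports that should resolve against 0.2.1; the names come from the export list above, but the call signatures are not part of this diff, so none are shown.

```python
# Names taken from the 0.2.1 __init__.py in the diff above; signatures are not
# shown in this diff, so this only demonstrates that the imports resolve.
from zipline_polygon_bundle import (
    register_polygon_equities_bundle,
    ingest_polygon_equities_bundle,   # replaces polygon_equities_bundle_minute et al.
    get_aggs_dates,                   # renamed from get_custom_aggs_dates
    trades_schema,
    cast_trades,
)
```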
@@ -10,19 +10,19 @@ from urllib3 import HTTPResponse


 def load_polygon_splits(
-    config: PolygonConfig,
+    config: PolygonConfig, first_day: pd.Timestamp, last_day: pd.Timestamp
 ) -> pd.DataFrame:
     # N.B. If the schema changes then the filename should change. We're on v3 now.
     splits_path = config.api_cache_path(
-
+        first_day=first_day, last_day=last_day, filename="list_splits"
     )
-    expected_split_count = (
+    expected_split_count = (last_day - first_day).days * 3
     if not os.path.exists(splits_path):
         client = polygon.RESTClient(api_key=config.api_key)
         splits = client.list_splits(
             limit=1000,
-            execution_date_gte=
-            execution_date_lt=
+            execution_date_gte=first_day.date(),
+            execution_date_lt=last_day.date() + datetime.timedelta(days=1),
         )
         if splits is HTTPResponse:
             raise ValueError(f"Polygon.list_splits bad HTTPResponse: {splits}")
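The new keyword arguments make the cache key and the API query share one inclusive [first_day, last_day] window; Polygon's `execution_date_lt` filter is exclusive, so the code adds one day to the inclusive last day. A standalone sketch of that arithmetic with made-up dates (nothing here calls the Polygon API):

```python
import datetime
import pandas as pd

# Hypothetical inclusive date window, mirroring the first_day/last_day arguments above.
first_day = pd.Timestamp("2024-01-02")
last_day = pd.Timestamp("2024-03-28")

# Inclusive last day -> exclusive upper bound for execution_date_lt.
execution_date_lt = last_day.date() + datetime.timedelta(days=1)
assert execution_date_lt == datetime.date(2024, 3, 29)

# Rough warning threshold used above: about 3 splits per calendar day in the range.
expected_split_count = (last_day - first_day).days * 3
print(execution_date_lt, expected_split_count)  # 2024-03-29 258
```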
@@ -32,7 +32,7 @@ def load_polygon_splits(
         splits.to_parquet(splits_path)
         if len(splits) < expected_split_count:
             logging.warning(
-                f"Only got {len(splits)=} from Polygon list_splits (
+                f"Only got {len(splits)=} from Polygon list_splits ({expected_split_count=}). "
                 "This is probably fine if your historical range is short."
             )
     # We will always load from the file to avoid any chance of weird errors.
@@ -41,7 +41,7 @@ def load_polygon_splits(
     print(f"Loaded {len(splits)=} from {splits_path}")
     if len(splits) < expected_split_count:
         logging.warning(
-            f"Only got {len(splits)=} from Polygon list_splits (
+            f"Only got {len(splits)=} from Polygon list_splits ({expected_split_count=}). "
             "This is probably fine if your historical range is short."
         )
     return splits
@@ -50,11 +50,11 @@ def load_polygon_splits(

 def load_splits(
     config: PolygonConfig,
-
-
+    first_day: pd.Timestamp,
+    last_day: pd.Timestamp,
     ticker_to_sid: dict[str, int],
 ) -> pd.DataFrame:
-    splits = load_polygon_splits(config,
+    splits = load_polygon_splits(config, first_day=first_day, last_day=last_day)
     splits["sid"] = splits["ticker"].apply(lambda t: ticker_to_sid.get(t, pd.NA))
     splits.dropna(inplace=True)
     splits["sid"] = splits["sid"].astype("int64")
@@ -70,18 +70,18 @@ def load_splits(


 def load_polygon_dividends(
-    config: PolygonConfig,
+    config: PolygonConfig, first_day: pd.Timestamp, last_day: pd.Timestamp
 ) -> pd.DataFrame:
     # N.B. If the schema changes then the filename should change. We're on v3 now.
     dividends_path = config.api_cache_path(
-
+        first_day=first_day, last_day=last_day, filename="list_dividends"
     )
     if not os.path.exists(dividends_path):
         client = polygon.RESTClient(api_key=config.api_key)
         dividends = client.list_dividends(
             limit=1000,
-            record_date_gte=
-            pay_date_lt=
+            record_date_gte=first_day.date(),
+            pay_date_lt=last_day.date() + datetime.timedelta(days=1),
         )
         if dividends is HTTPResponse:
             raise ValueError(f"Polygon.list_dividends bad HTTPResponse: {dividends}")
@@ -104,35 +104,30 @@ def load_polygon_dividends(


 def load_chunked_polygon_dividends(
-    config: PolygonConfig,
+    config: PolygonConfig, first_day: pd.Timestamp,
+    last_day: pd.Timestamp
 ) -> pd.DataFrame:
     dividends_list = []
-    next_start_end =
-    while next_start_end <
+    next_start_end = first_day
+    while next_start_end < last_day:
         # We want at most a month of dividends at a time. They should end on the last day of the month.
-
-
-
-            (next_start_end.month % 12) + 1,
-            1,
-        )
-        next_end_date = first_of_next_month - datetime.timedelta(days=1)
-        if next_end_date > last_end_date:
-            next_end_date = last_end_date
+        next_end_date = next_start_end + pd.offsets.MonthEnd()
+        if next_end_date > last_day:
+            next_end_date = last_day
         dividends_list.append(
-            load_polygon_dividends(config, next_start_end, next_end_date)
+            load_polygon_dividends(config, first_day=next_start_end, last_day=next_end_date)
         )
-        next_start_end = next_end_date +
+        next_start_end = next_end_date + pd.Timedelta(days=1)
     return pd.concat(dividends_list)


 def load_dividends(
     config: PolygonConfig,
-
-
+    first_day: pd.Timestamp,
+    last_day: pd.Timestamp,
     ticker_to_sid: dict[str, int],
 ) -> pd.DataFrame:
-    dividends = load_chunked_polygon_dividends(config,
+    dividends = load_chunked_polygon_dividends(config, first_day=first_day, last_day=last_day)
     dividends["sid"] = dividends["ticker"].apply(lambda t: ticker_to_sid.get(t, pd.NA))
     dividends.dropna(how="any", inplace=True)
     dividends["sid"] = dividends["sid"].astype("int64")
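The rewritten chunking loop replaces the hand-rolled "first day of next month" computation with `pd.offsets.MonthEnd()` and steps with `pd.Timedelta(days=1)`. A self-contained sketch of just that windowing logic (made-up dates, no API calls), showing the month-end-aligned chunks it produces:

```python
import pandas as pd

def month_end_chunks(first_day: pd.Timestamp, last_day: pd.Timestamp):
    """Yield inclusive (start, end) windows of at most one month, ending on month ends."""
    next_start_end = first_day
    while next_start_end < last_day:
        # Roll forward to the end of the current month; the +1 day step below then
        # starts the next window on the 1st of the following month.
        next_end_date = next_start_end + pd.offsets.MonthEnd()
        if next_end_date > last_day:
            next_end_date = last_day
        yield next_start_end, next_end_date
        next_start_end = next_end_date + pd.Timedelta(days=1)

# Example: mid-January through early March comes out as three chunks.
print(list(month_end_chunks(pd.Timestamp("2024-01-15"), pd.Timestamp("2024-03-05"))))
# -> [(2024-01-15, 2024-01-31), (2024-02-01, 2024-02-29), (2024-03-01, 2024-03-05)]  (as Timestamps)
```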
@@ -159,7 +154,7 @@ def load_conditions(config: PolygonConfig) -> pd.DataFrame:
     # The API doesn't use dates for the condition codes but this is a way to provide control over caching.
     # Main thing is to get the current conditions list but we don't want to call more than once a day.
     conditions_path = config.api_cache_path(
-
+        first_day=config.start_timestamp, last_day=config.end_timestamp, filename="conditions"
     )
     expected_conditions_count = 100
     if not os.path.exists(conditions_path):