awx-zipline-ai 0.2.1__py3-none-any.whl → 0.3.1__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- agent/ttypes.py +6 -6
- ai/chronon/airflow_helpers.py +20 -23
- ai/chronon/cli/__init__.py +0 -0
- ai/chronon/cli/compile/__init__.py +0 -0
- ai/chronon/cli/compile/column_hashing.py +40 -17
- ai/chronon/cli/compile/compile_context.py +13 -17
- ai/chronon/cli/compile/compiler.py +59 -36
- ai/chronon/cli/compile/conf_validator.py +251 -99
- ai/chronon/cli/compile/display/__init__.py +0 -0
- ai/chronon/cli/compile/display/class_tracker.py +6 -16
- ai/chronon/cli/compile/display/compile_status.py +10 -10
- ai/chronon/cli/compile/display/diff_result.py +79 -14
- ai/chronon/cli/compile/fill_templates.py +3 -8
- ai/chronon/cli/compile/parse_configs.py +10 -17
- ai/chronon/cli/compile/parse_teams.py +38 -34
- ai/chronon/cli/compile/serializer.py +3 -9
- ai/chronon/cli/compile/version_utils.py +42 -0
- ai/chronon/cli/git_utils.py +2 -13
- ai/chronon/cli/logger.py +0 -2
- ai/chronon/constants.py +1 -1
- ai/chronon/group_by.py +47 -47
- ai/chronon/join.py +46 -32
- ai/chronon/logger.py +1 -2
- ai/chronon/model.py +9 -4
- ai/chronon/query.py +2 -2
- ai/chronon/repo/__init__.py +1 -2
- ai/chronon/repo/aws.py +17 -31
- ai/chronon/repo/cluster.py +121 -50
- ai/chronon/repo/compile.py +14 -8
- ai/chronon/repo/constants.py +1 -1
- ai/chronon/repo/default_runner.py +32 -54
- ai/chronon/repo/explore.py +70 -73
- ai/chronon/repo/extract_objects.py +6 -9
- ai/chronon/repo/gcp.py +89 -88
- ai/chronon/repo/gitpython_utils.py +3 -2
- ai/chronon/repo/hub_runner.py +145 -55
- ai/chronon/repo/hub_uploader.py +2 -1
- ai/chronon/repo/init.py +12 -5
- ai/chronon/repo/join_backfill.py +19 -5
- ai/chronon/repo/run.py +42 -39
- ai/chronon/repo/serializer.py +4 -12
- ai/chronon/repo/utils.py +72 -63
- ai/chronon/repo/zipline.py +3 -19
- ai/chronon/repo/zipline_hub.py +211 -39
- ai/chronon/resources/__init__.py +0 -0
- ai/chronon/resources/gcp/__init__.py +0 -0
- ai/chronon/resources/gcp/group_bys/__init__.py +0 -0
- ai/chronon/resources/gcp/group_bys/test/data.py +13 -17
- ai/chronon/resources/gcp/joins/__init__.py +0 -0
- ai/chronon/resources/gcp/joins/test/data.py +4 -8
- ai/chronon/resources/gcp/sources/__init__.py +0 -0
- ai/chronon/resources/gcp/sources/test/data.py +9 -6
- ai/chronon/resources/gcp/teams.py +9 -21
- ai/chronon/source.py +2 -4
- ai/chronon/staging_query.py +60 -19
- ai/chronon/types.py +3 -2
- ai/chronon/utils.py +21 -68
- ai/chronon/windows.py +2 -4
- {awx_zipline_ai-0.2.1.dist-info → awx_zipline_ai-0.3.1.dist-info}/METADATA +48 -24
- awx_zipline_ai-0.3.1.dist-info/RECORD +96 -0
- awx_zipline_ai-0.3.1.dist-info/top_level.txt +4 -0
- gen_thrift/__init__.py +0 -0
- {ai/chronon → gen_thrift}/api/ttypes.py +327 -197
- {ai/chronon/api → gen_thrift}/common/ttypes.py +9 -39
- gen_thrift/eval/ttypes.py +660 -0
- {ai/chronon → gen_thrift}/hub/ttypes.py +12 -131
- {ai/chronon → gen_thrift}/observability/ttypes.py +343 -180
- {ai/chronon → gen_thrift}/planner/ttypes.py +326 -45
- ai/chronon/eval/__init__.py +0 -122
- ai/chronon/eval/query_parsing.py +0 -19
- ai/chronon/eval/sample_tables.py +0 -100
- ai/chronon/eval/table_scan.py +0 -186
- ai/chronon/orchestration/ttypes.py +0 -4406
- ai/chronon/resources/gcp/README.md +0 -174
- ai/chronon/resources/gcp/zipline-cli-install.sh +0 -54
- awx_zipline_ai-0.2.1.dist-info/RECORD +0 -93
- awx_zipline_ai-0.2.1.dist-info/licenses/LICENSE +0 -202
- awx_zipline_ai-0.2.1.dist-info/top_level.txt +0 -3
- /jars/__init__.py → /__init__.py +0 -0
- {awx_zipline_ai-0.2.1.dist-info → awx_zipline_ai-0.3.1.dist-info}/WHEEL +0 -0
- {awx_zipline_ai-0.2.1.dist-info → awx_zipline_ai-0.3.1.dist-info}/entry_points.txt +0 -0
- {ai/chronon → gen_thrift}/api/__init__.py +0 -0
- {ai/chronon/api/common → gen_thrift/api}/constants.py +0 -0
- {ai/chronon/api → gen_thrift}/common/__init__.py +0 -0
- {ai/chronon/api → gen_thrift/common}/constants.py +0 -0
- {ai/chronon/fetcher → gen_thrift/eval}/__init__.py +0 -0
- {ai/chronon/fetcher → gen_thrift/eval}/constants.py +0 -0
- {ai/chronon/hub → gen_thrift/fetcher}/__init__.py +0 -0
- {ai/chronon/hub → gen_thrift/fetcher}/constants.py +0 -0
- {ai/chronon → gen_thrift}/fetcher/ttypes.py +0 -0
- {ai/chronon/observability → gen_thrift/hub}/__init__.py +0 -0
- {ai/chronon/observability → gen_thrift/hub}/constants.py +0 -0
- {ai/chronon/orchestration → gen_thrift/observability}/__init__.py +0 -0
- {ai/chronon/orchestration → gen_thrift/observability}/constants.py +0 -0
- {ai/chronon → gen_thrift}/planner/__init__.py +0 -0
- {ai/chronon → gen_thrift}/planner/constants.py +0 -0
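The most visible change in the file list above is that the Thrift-generated modules moved out of `ai/chronon/*` into a new top-level `gen_thrift` package (api, common, eval, fetcher, hub, observability, planner), while `ai/chronon/orchestration` and `ai/chronon/eval` were removed. Config code that imports the generated types directly needs the new paths. A minimal sketch of that import migration, based on the removed/added import lines in the diffs below (the alias names are illustrative, not prescribed by the package):

```python
# Old paths in 0.2.1, as seen in the removed lines of the diffs below:
#   from ai.chronon.api.ttypes import EventSource, Source
#   import ai.chronon.api.ttypes as ttypes

# New paths in 0.3.1:
from gen_thrift.api.ttypes import EventSource, Source, Team
import gen_thrift.api.ttypes as ttypes
import gen_thrift.common.ttypes as common

# Hand-written wrapper modules keep their ai.chronon.* locations:
from ai.chronon.join import Join, JoinPart
from ai.chronon.query import Query, selects
```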
ai/chronon/resources/gcp/group_bys/test/data.py CHANGED

@@ -1,34 +1,30 @@
-
 from sources.test.data import source_v1
 
 from ai.chronon.group_by import Aggregation, GroupBy, Operation, TimeUnit, Window
 
-window_sizes = [
+window_sizes = [
+    Window(length=day, time_unit=TimeUnit.DAYS) for day in [3, 14, 30]
+]  # Define some window sizes to use below
 
 group_by_v1 = GroupBy(
     backfill_start_date="2023-11-01",
     sources=[source_v1],
-    keys=["user_id"],
+    keys=["user_id"],  # We are aggregating by user
     online=True,
-    aggregations=[
-        input_column="purchase_price",
-        operation=Operation.SUM,
-        windows=window_sizes
-    ),  # The sum of purchases prices in various windows
+    aggregations=[
         Aggregation(
-            input_column="purchase_price",
-
-            windows=window_sizes
-        ),  # The count of purchases in various windows
+            input_column="purchase_price", operation=Operation.SUM, windows=window_sizes
+        ),  # The sum of purchases prices in various windows
         Aggregation(
-            input_column="purchase_price",
-
-
-
+            input_column="purchase_price", operation=Operation.COUNT, windows=window_sizes
+        ),  # The count of purchases in various windows
+        Aggregation(
+            input_column="purchase_price", operation=Operation.AVERAGE, windows=window_sizes
+        ),  # The average purchases by user in various windows
         Aggregation(
             input_column="purchase_price",
             operation=Operation.LAST_K(10),
         ),
     ],
     version=0,
-)
+)
ai/chronon/resources/gcp/joins/test/data.py CHANGED

@@ -1,6 +1,6 @@
+from gen_thrift.api.ttypes import EventSource, Source
 from group_bys.test.data import group_by_v1
 
-from ai.chronon.api.ttypes import EventSource, Source
 from ai.chronon.join import Join, JoinPart
 from ai.chronon.query import Query, selects
 
@@ -12,9 +12,7 @@ source = Source(
     events=EventSource(
         table="data.checkouts",
         query=Query(
-            selects=selects(
-                "user_id"
-            ),  # The primary key used to join various GroupBys together
+            selects=selects("user_id"),  # The primary key used to join various GroupBys together
             time_column="ts",
         ),  # The event time used to compute feature values as-of
     )
@@ -22,9 +20,7 @@ source = Source(
 
 v1 = Join(
     left=source,
-    right_parts=[
-        JoinPart(group_by=group_by_v1)
-    ],
+    right_parts=[JoinPart(group_by=group_by_v1)],
     row_ids="user_id",
     version=0,
-)
+)
ai/chronon/resources/gcp/sources/test/data.py CHANGED

@@ -1,4 +1,5 @@
-from
+from gen_thrift.api.ttypes import EventSource, Source
+
 from ai.chronon.query import Query, selects
 
 """
@@ -13,11 +14,13 @@ with a clear event time column and selected fields for downstream feature comput
 
 source_v1 = Source(
     events=EventSource(
-        table="data.purchases",
-        topic=None,
+        table="data.purchases",  # This points to the log table in the warehouse with historical purchase events, updated in batch daily
+        topic=None,  # See the 'returns' GroupBy for an example that has a streaming source configured. In this case, this would be the streaming source topic that can be listened to for realtime events
         query=Query(
-            selects=selects("user_id","purchase_price"),
-            time_column="ts"
-
+            selects=selects("user_id", "purchase_price"),  # Select the fields we care about
+            time_column="ts",
+        ),  # The event time
+    )
+)
 
 # The `source_v1` object can now be used in a Chronon join or pipeline definition
ai/chronon/resources/gcp/teams.py CHANGED

@@ -1,4 +1,5 @@
-from
+from gen_thrift.api.ttypes import Team
+
 from ai.chronon.repo.constants import RunMode
 from ai.chronon.types import ConfigProperties, EnvironmentVariables
 
@@ -10,34 +11,25 @@ default = Team(
         common={
             "spark.chronon.table.format_provider.class": "ai.chronon.integrations.cloud_gcp.GcpFormatProvider",
             "spark.chronon.table_write.format": "iceberg",
-
             "spark.sql.defaultCatalog": "bigquery_catalog",
-
             "spark.sql.catalog.bigquery_catalog": "ai.chronon.integrations.cloud_gcp.DelegatingBigQueryMetastoreCatalog",
             "spark.sql.catalog.bigquery_catalog.catalog-impl": "org.apache.iceberg.gcp.bigquery.BigQueryMetastoreCatalog",
             "spark.sql.catalog.bigquery_catalog.io-impl": "org.apache.iceberg.io.ResolvingFileIO",
-
             "spark.sql.defaultUrlStreamHandlerFactory.enabled": "false",
             "spark.kryo.registrator": "ai.chronon.integrations.cloud_gcp.ChrononIcebergKryoRegistrator",
-
             "spark.chronon.coalesce.factor": "10",
             "spark.default.parallelism": "10",
             "spark.sql.shuffle.partitions": "10",
-
             # TODO: Please fill in the following values
             "spark.sql.catalog.bigquery_catalog.warehouse": "gs://zipline-warehouse-<customer_id>/data/tables/",
-            "spark.sql.catalog.bigquery_catalog.
-            "spark.sql.catalog.bigquery_catalog.
-            "spark.chronon.partition.format": "<date-format>",
-            "spark.chronon.partition.column": "<partition-column-name>",
+            "spark.sql.catalog.bigquery_catalog.gcp.bigquery.location": "<region>",
+            "spark.sql.catalog.bigquery_catalog.gcp.bigquery.project-id": "<project-id>",
+            "spark.chronon.partition.format": "<date-format>",  # ex: "yyyy-MM-dd",
+            "spark.chronon.partition.column": "<partition-column-name>",  # ex: "ds",
         },
     ),
     env=EnvironmentVariables(
         common={
-            "JOB_MODE": "local[*]",
-            "CHRONON_ONLINE_CLASS": "[ONLINE-TODO]your.online.class",
-            "CHRONON_ONLINE_ARGS": "[ONLINE-TODO]args prefixed with -Z become constructor map for your implementation of ai.chronon.online.Api, -Zkv-host=<YOUR_HOST> -Zkv-port=<YOUR_PORT>",
-
             # TODO: Please fill in the following values
             "CUSTOMER_ID": "<customer_id>",
             "GCP_PROJECT_ID": "<project-id>",
@@ -45,7 +37,7 @@ default = Team(
             "GCP_DATAPROC_CLUSTER_NAME": "<dataproc-cluster-name>",
             "GCP_BIGTABLE_INSTANCE_ID": "<bigtable-instance-id>",
             "ARTIFACT_PREFIX": "<customer-artifact-bucket>",
-            "CLOUD_PROVIDER": "<gcp | aws>"
+            "CLOUD_PROVIDER": "<gcp | aws>",
         },
     ),
 )
@@ -54,11 +46,7 @@ default = Team(
 test = Team(
     outputNamespace="data",
     env=EnvironmentVariables(
-        common={},
-        modeEnvironments={
-            RunMode.BACKFILL: {},
-            RunMode.UPLOAD: {}
-        }
+        common={}, modeEnvironments={RunMode.BACKFILL: {}, RunMode.UPLOAD: {}}
     ),
 )
 
@@ -67,4 +55,4 @@ team_conf = Team(
     env=EnvironmentVariables(
         common={},
     ),
-)
+)
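The `teams.py` template above now names the two BigQuery catalog keys explicitly and annotates the partition keys with example formats. A hypothetical filled-in version of the TODO block for illustration only; the bucket, region, and project values below are placeholders, not defaults shipped with the package:

```python
common = {
    # ... the fixed Spark/Iceberg settings from the template above ...
    "spark.sql.catalog.bigquery_catalog.warehouse": "gs://zipline-warehouse-acme/data/tables/",  # placeholder bucket
    "spark.sql.catalog.bigquery_catalog.gcp.bigquery.location": "us-central1",                   # placeholder region
    "spark.sql.catalog.bigquery_catalog.gcp.bigquery.project-id": "acme-data-prod",              # placeholder project
    "spark.chronon.partition.format": "yyyy-MM-dd",  # example format given in the template
    "spark.chronon.partition.column": "ds",          # example column given in the template
}
```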
ai/chronon/source.py CHANGED

@@ -2,7 +2,7 @@
 Wrappers to directly create Source objects.
 """
 
-import
+import gen_thrift.api.ttypes as ttypes
 
 
 def EventSource(
@@ -29,9 +29,7 @@ def EventSource(
 
     """
     return ttypes.Source(
-        events=ttypes.EventSource(
-            table=table, topic=topic, query=query, isCumulative=is_cumulative
-        )
+        events=ttypes.EventSource(table=table, topic=topic, query=query, isCumulative=is_cumulative)
     )
ai/chronon/staging_query.py CHANGED

@@ -1,20 +1,28 @@
-
 import inspect
 import json
 from dataclasses import dataclass
 from typing import Dict, List, Optional, Union
 
+import gen_thrift.api.ttypes as ttypes
+import gen_thrift.common.ttypes as common
+
 import ai.chronon.airflow_helpers as airflow_helpers
-
-import ai.chronon.api.ttypes as ttypes
+from ai.chronon import utils
 from ai.chronon.constants import AIRFLOW_DEPENDENCIES_KEY
 
 
+def _get_output_table_name(staging_query: ttypes.StagingQuery, full_name: bool = False):
+    """generate output table name for staging query job"""
+    utils.__set_name(staging_query, ttypes.StagingQuery, "staging_queries")
+    return utils.output_table_name(staging_query, full_name=full_name)
+
+
 # Wrapper for EngineType
 class EngineType:
     SPARK = ttypes.EngineType.SPARK
     BIGQUERY = ttypes.EngineType.BIGQUERY
 
+
 @dataclass
 class TableDependency:
     table: str
@@ -26,26 +34,54 @@ class TableDependency:
     def to_thrift(self):
         if self.offset is None:
             raise ValueError(f"Dependency offset for table {self.table} must be specified.")
-        offset_window = common.Window(length
+        offset_window = common.Window(length=self.offset, timeUnit=common.TimeUnit.DAYS)
         return common.TableDependency(
             tableInfo=common.TableInfo(
-                table=self.table,
+                table=self.table,
                 partitionColumn=self.partition_column,
                 partitionFormat=self.partition_format,
-                partitionInterval=common.Window(1, common.TimeUnit.DAYS)
+                partitionInterval=common.Window(1, common.TimeUnit.DAYS),
             ),
             startOffset=offset_window,
            endOffset=offset_window,
             startCutOff=None,
-            endCutOff=None
+            endCutOff=None,
         )
 
+
+def Import(
+    query: str,
+    version: int,
+    output_namespace: Optional[str] = None,
+    engine_type: Optional[EngineType] = None,
+    dependencies: Optional[List[Union[TableDependency, Dict]]] = None,
+    conf: Optional[common.ConfigProperties] = None,
+    env_vars: Optional[common.EnvironmentVariables] = None,
+    offline_schedule: str = "@daily",
+):
+    assert dependencies is not None and len(dependencies) == 1, (
+        f"Import must specify exactly one table dependency. Got: {dependencies}"
+    )
+    assert dependencies[0].partition_column is not None, (
+        f"Import must specify a partition column for the table dependency. Got: {dependencies[0].partition_column}"
+    )
+
+    return StagingQuery(
+        query=query,
+        version=version,
+        output_namespace=output_namespace,
+        dependencies=dependencies,
+        conf=conf,
+        env_vars=env_vars,
+        engine_type=engine_type,
+        offline_schedule=offline_schedule,
+    )
+
+
 def StagingQuery(
-    name: str,
     query: str,
     version: int,
     output_namespace: Optional[str] = None,
-    start_partition: Optional[str] = None,
     table_properties: Optional[Dict[str, str]] = None,
     setups: Optional[List[str]] = None,
     engine_type: Optional[EngineType] = None,
@@ -58,23 +94,20 @@ def StagingQuery(
     cluster_conf: common.ClusterConfigProperties = None,
     step_days: Optional[int] = None,
     recompute_days: Optional[int] = None,
+    additional_partitions: List[str] = None,
 ) -> ttypes.StagingQuery:
     """
     Creates a StagingQuery object for executing arbitrary SQL queries with templated date parameters.
 
     :param query:
         Arbitrary spark query that should be written with template parameters:
-        - `{{ start_date }}`: Initial run uses
+        - `{{ start_date }}`: Initial run uses start_date, future runs use latest partition + 1 day
         - `{{ end_date }}`: The end partition of the computing range
         - `{{ latest_date }}`: End partition independent of the computing range (for cumulative sources)
         - `{{ max_date(table=namespace.my_table) }}`: Max partition available for a given table
         These parameters can be modified with offset and bounds:
         - `{{ start_date(offset=-10, lower_bound='2023-01-01', upper_bound='2024-01-01') }}`
     :type query: str
-    :param start_partition:
-        On the first run, `{{ start_date }}` will be set to this user provided start date,
-        future incremental runs will set it to the latest existing partition + 1 day.
-    :type start_partition: str
     :param setups:
         Spark SQL setup statements. Used typically to register UDFs.
     :type setups: List[str]
@@ -121,13 +154,17 @@ def StagingQuery(
     # Get caller's filename to assign team
     team = inspect.stack()[1].filename.split("/")[-2]
 
+    assert isinstance(version, int), (
+        f"Version must be an integer, but found {type(version).__name__}"
+    )
+
     # Create execution info
     exec_info = common.ExecutionInfo(
         scheduleCron=offline_schedule,
         conf=conf,
         env=env_vars,
         stepDays=step_days,
-        clusterConf=cluster_conf
+        clusterConf=cluster_conf,
     )
 
     airflow_dependencies = []
@@ -155,14 +192,14 @@ def StagingQuery(
 
     # Create metadata
     meta_data = ttypes.MetaData(
-        name=name,
         outputNamespace=output_namespace,
         team=team,
         executionInfo=exec_info,
         tags=tags,
         customJson=custom_json,
         tableProperties=table_properties,
-        version=str(version)
+        version=str(version),
+        additionalOutputPartitionColumns=additional_partitions,
     )
 
     thrift_deps = []
@@ -175,11 +212,15 @@ def StagingQuery(
     staging_query = ttypes.StagingQuery(
         metaData=meta_data,
         query=query,
-        startPartition=start_partition,
         setups=setups,
         engineType=engine_type,
         tableDependencies=thrift_deps,
         recomputeDays=recompute_days,
     )
 
-
+    # Add the table property that calls the private function
+    staging_query.__class__.table = property(
+        lambda self: _get_output_table_name(self, full_name=True)
+    )
+
+    return staging_query
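Summarizing the staging_query.py diff: 0.3.1 adds an `Import` wrapper (a `StagingQuery` constrained to exactly one table dependency that must declare its partition column), drops the `name` and `start_partition` parameters, adds `additional_partitions`, and attaches a `table` property that resolves the output table name. A usage sketch based only on the signature shown above; the query, table, and namespace values are placeholders:

```python
from ai.chronon.staging_query import Import, TableDependency

# Placeholder query and table names for illustration. Import requires exactly one
# dependency, and that dependency must set partition_column.
purchases_import = Import(
    query="SELECT user_id, purchase_price, ds FROM raw.purchases "
          "WHERE ds BETWEEN '{{ start_date }}' AND '{{ end_date }}'",
    version=0,
    output_namespace="data",
    dependencies=[TableDependency(table="raw.purchases", partition_column="ds", offset=0)],
)

# Within a Chronon config repo, the new property attached by StagingQuery() exposes
# the fully qualified output table name: purchases_import.table
```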
ai/chronon/types.py CHANGED

@@ -2,8 +2,9 @@
 importing ai.chronon.types will bring in all the api's needed to create any chronon object
 """
 
-import
-import
+import gen_thrift.api.ttypes as ttypes
+import gen_thrift.common.ttypes as common
+
 import ai.chronon.group_by as group_by
 import ai.chronon.join as join
 import ai.chronon.query as query
ai/chronon/utils.py CHANGED

@@ -23,9 +23,9 @@ import tempfile
 from collections.abc import Iterable
 from typing import List, Optional, Union, cast
 
-import
+import gen_thrift.api.ttypes as api
+
 import ai.chronon.repo.extract_objects as eo
-from ai.chronon.cli.compile import parse_teams
 from ai.chronon.repo import FOLDER_NAME_TO_CLASS
 
 ChrononJobTypes = Union[api.GroupBy, api.Join, api.StagingQuery]
@@ -56,21 +56,16 @@ class JsonDiffer:
         self.new_name = "new.json"
         self.old_name = "old.json"
 
-    def diff(
-        self, new_json_str: object, old_json_str: object, skipped_keys=None
-    ) -> str:
+    def diff(self, new_json_str: object, old_json_str: object, skipped_keys=None) -> str:
         if skipped_keys is None:
             skipped_keys = []
-        new_json = {
-
-
-
-
-
-
-        with open(os.path.join(self.temp_dir, self.old_name), mode="w") as old, open(
-            os.path.join(self.temp_dir, self.new_name), mode="w"
-        ) as new:
+        new_json = {k: v for k, v in json.loads(new_json_str).items() if k not in skipped_keys}
+        old_json = {k: v for k, v in json.loads(old_json_str).items() if k not in skipped_keys}
+
+        with (
+            open(os.path.join(self.temp_dir, self.old_name), mode="w") as old,
+            open(os.path.join(self.temp_dir, self.new_name), mode="w") as new,
+        ):
             old.write(json.dumps(old_json, sort_keys=True, indent=2))
             new.write(json.dumps(new_json, sort_keys=True, indent=2))
             diff_str = subprocess.run(
@@ -131,6 +126,7 @@ def _get_underlying_source(
     else:
         return source.joinSource
 
+
 def get_root_source(
     source: api.Source,
 ) -> Union[api.EventSource, api.EntitySource]:
@@ -141,6 +137,7 @@ def get_root_source(
     else:
         return get_root_source(source.joinSource.join.left)
 
+
 def get_query(source: api.Source) -> api.Query:
     return _get_underlying_source(source).query
 
@@ -151,7 +148,9 @@ def get_table(source: api.Source) -> str:
     elif source.events:
         table = source.events.table
     else:
-
+        from ai.chronon.join import _get_output_table_name
+
+        table = _get_output_table_name(source.joinSource.join, True)
     return table.split("/")[0]
 
 
@@ -229,11 +228,7 @@ def dict_to_bash_commands(d):
         return ""
     bash_commands = []
     for key, value in d.items():
-        cmd = (
-            f"--{key.replace('_', '-')}={value}"
-            if value
-            else f"--{key.replace('_', '-')}"
-        )
+        cmd = f"--{key.replace('_', '-')}={value}" if value else f"--{key.replace('_', '-')}"
         bash_commands.append(cmd)
     return " ".join(bash_commands)
 
@@ -259,9 +254,7 @@ def output_table_name(obj, full_name: bool):
 
 def join_part_name(jp):
     if jp.groupBy is None:
-        raise NotImplementedError(
-            "Join Part names for non group bys is not implemented."
-        )
+        raise NotImplementedError("Join Part names for non group bys is not implemented.")
     if not jp.groupBy.metaData.name and isinstance(jp.groupBy, api.GroupBy):
         __set_name(jp.groupBy, api.GroupBy, "group_bys")
     return "_".join(
@@ -296,51 +289,15 @@ def join_part_output_table_name(join, jp, full_name: bool = False):
     )
 
 
-def group_by_output_table_name(obj, full_name: bool = False):
-    """
-    Group by backfill output table name
-    To be synced with api.Extensions.scala
-    """
-    if not obj.metaData.name:
-        __set_name(obj, api.GroupBy, "group_bys")
-    return output_table_name(obj, full_name)
-
-
 def log_table_name(obj, full_name: bool = False):
     return output_table_name(obj, full_name=full_name) + "_logged"
 
 
-def get_staging_query_output_table_name(
-    staging_query: api.StagingQuery, full_name: bool = False
-):
-    """generate output table name for staging query job"""
-    __set_name(staging_query, api.StagingQuery, "staging_queries")
-    return output_table_name(staging_query, full_name=full_name)
-
-
 def get_team_conf_from_py(team, key):
     team_module = importlib.import_module(f"teams.{team}")
     return getattr(team_module, key)
 
 
-def get_join_output_table_name(join: api.Join, full_name: bool = False):
-    """generate output table name for join backfill job"""
-    # join sources could also be created inline alongside groupBy file
-    # so we specify fallback module as group_bys
-    if isinstance(join, api.Join):
-        __set_name(join, api.Join, "joins")
-    # set output namespace
-    if not join.metaData.outputNamespace:
-        team_name = join.metaData.name.split(".")[0]
-        namespace = (
-            parse_teams.load_teams(chronon_root_path, print=False)
-            .get(team_name)
-            .outputNamespace
-        )
-        join.metaData.outputNamespace = namespace
-    return output_table_name(join, full_name=full_name)
-
-
 def wait_for_simple_schema(table, lag, start, end):
     if not table:
         return None
@@ -348,9 +305,7 @@ def wait_for_simple_schema(table, lag, start, end):
     clean_name = table_tokens[0]
     subpartition_spec = "/".join(table_tokens[1:]) if len(table_tokens) > 1 else ""
     return {
-        "name": "wait_for_{}_ds{}".format(
-            clean_name, "" if lag == 0 else f"_minus_{lag}"
-        ),
+        "name": "wait_for_{}_ds{}".format(clean_name, "" if lag == 0 else f"_minus_{lag}"),
         "spec": "{}/ds={}{}".format(
             clean_name,
             "{{ ds }}" if lag == 0 else "{{{{ macros.ds_add(ds, -{}) }}}}".format(lag),
@@ -413,7 +368,6 @@ def get_applicable_modes(conf: ChrononJobTypes) -> List[str]:
         modes.append("streaming")
 
     elif isinstance(conf, api.Join):
-
         join = cast(api.Join, conf)
 
         if get_offline_schedule(conf) is not None:
@@ -483,9 +437,9 @@ def chronon_path(file_path: str) -> str:
     conf_types = FOLDER_NAME_TO_CLASS.keys()
     splits = file_path.split("/")
     conf_occurences = [splits.index(typ) for typ in conf_types if typ in splits]
-    assert (
-
-    )
+    assert len(conf_occurences) > 0, (
+        f"Path: {file_path} doesn't contain folder with name among {conf_types}"
+    )
 
     index = min([splits.index(typ) for typ in conf_types if typ in splits])
     rel_path = "/".join(splits[index:])
@@ -535,7 +489,6 @@ def compose(arg, *methods):
     result = [indent + arg]
 
     for method in methods:
-
         method_parts = method.split(" ", 1)
         method = method_parts[0]
 
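Note that the output-table-name helpers (`group_by_output_table_name`, `get_staging_query_output_table_name`, `get_join_output_table_name`) were removed from utils.py in this release; `get_table` now delegates join output names to a private helper in `ai.chronon.join`, and staging queries expose the `table` property attached in staging_query.py above. A sketch of the apparent replacements, inferred only from those imports; `my_join` and `my_staging_query` are placeholder objects:

```python
# Private helper that utils.get_table now uses for join output table names.
from ai.chronon.join import _get_output_table_name as join_output_table_name

full_join_table = join_output_table_name(my_join, True)  # my_join: a placeholder api.Join
staging_table = my_staging_query.table                   # property attached by StagingQuery()
```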
ai/chronon/windows.py CHANGED

@@ -1,4 +1,4 @@
-import
+import gen_thrift.common.ttypes as common
 
 
 def _days(length: int) -> common.Window:
@@ -40,9 +40,7 @@ def _from_str(s: str) -> common.Window:
         elif unit == "h":
             return _hours(length)
         else:
-            raise ValueError(
-                f"Invalid time unit '{unit}'. Must be 'd' for days or 'h' for hours"
-            )
+            raise ValueError(f"Invalid time unit '{unit}'. Must be 'd' for days or 'h' for hours")
 
     except ValueError as e:
         if "invalid literal for int()" in str(e):
{awx_zipline_ai-0.2.1.dist-info → awx_zipline_ai-0.3.1.dist-info}/METADATA CHANGED

@@ -1,33 +1,57 @@
 Metadata-Version: 2.4
 Name: awx-zipline-ai
-Version: 0.
-Summary: Zipline
-
+Version: 0.3.1
+Summary: CLI tool for the Zipline AI platform
+Author-email: Zipline AI <hello@zipline.ai>
+License: Apache License 2.0
+Project-URL: homepage, https://zipline.ai
+Project-URL: documentation, https://docs.zipline.ai
+Project-URL: github, https://github.com/zipline-ai/chronon/
 Requires-Python: >=3.11
 Description-Content-Type: text/markdown
-
-Requires-Dist:
-Requires-Dist:
-Requires-Dist:
-Requires-Dist:
+Requires-Dist: boto3==1.40.26
+Requires-Dist: botocore==1.40.26
+Requires-Dist: cachetools==5.5.2
+Requires-Dist: certifi==2025.8.3
+Requires-Dist: charset-normalizer==3.4.3
+Requires-Dist: click==8.2.1
 Requires-Dist: crcmod==1.7
-Requires-Dist:
-Requires-Dist:
-Requires-Dist:
-Requires-Dist:
+Requires-Dist: gitdb==4.0.12
+Requires-Dist: gitpython==3.1.45
+Requires-Dist: google-api-core[grpc]==2.25.1
+Requires-Dist: google-auth==2.40.3
+Requires-Dist: google-cloud-bigquery-storage==2.33.0
+Requires-Dist: google-cloud-core==2.4.3
+Requires-Dist: google-cloud-iam==2.19.1
 Requires-Dist: google-cloud-storage==2.19.0
-Requires-Dist: google-
-Requires-Dist:
-
-Requires-Dist:
-
-
-
-
-
-
-
+Requires-Dist: google-crc32c==1.7.1
+Requires-Dist: google-resumable-media==2.7.2
+Requires-Dist: googleapis-common-protos[grpc]==1.70.0
+Requires-Dist: grpc-google-iam-v1==0.14.2
+Requires-Dist: grpcio<=1.74.0,>=1.66.2
+Requires-Dist: grpcio-status<=1.74.0,>=1.62.3
+Requires-Dist: idna==3.10
+Requires-Dist: importlib-resources==6.5.2
+Requires-Dist: jmespath==1.0.1
+Requires-Dist: markdown-it-py==4.0.0
+Requires-Dist: mdurl==0.1.2
+Requires-Dist: proto-plus==1.26.1
+Requires-Dist: protobuf<=6.32.0,>=4.25.5
+Requires-Dist: py4j==0.10.9.7
+Requires-Dist: pyasn1==0.6.1
+Requires-Dist: pyasn1-modules==0.4.2
+Requires-Dist: pygments==2.19.2
+Requires-Dist: pyspark==3.5.4
+Requires-Dist: python-dateutil==2.9.0.post0
+Requires-Dist: requests==2.32.5
+Requires-Dist: rich==14.1.0
+Requires-Dist: rsa==4.9.1
+Requires-Dist: s3transfer==0.13.1
+Requires-Dist: six==1.17.0
+Requires-Dist: smmap==5.0.2
+Requires-Dist: thrift==0.20.0
+Requires-Dist: urllib3==2.5.0
+Requires-Dist: python-dotenv>=1.0.1
 
 ### Chronon Python API
 