dasl-client 1.0.13__tar.gz → 1.0.16__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release: this version of dasl-client might be problematic.

Files changed (43)
  1. {dasl_client-1.0.13 → dasl_client-1.0.16}/PKG-INFO +3 -3
  2. {dasl_client-1.0.13 → dasl_client-1.0.16}/dasl_client/client.py +60 -9
  3. {dasl_client-1.0.13 → dasl_client-1.0.16}/dasl_client/helpers.py +6 -3
  4. {dasl_client-1.0.13 → dasl_client-1.0.16}/dasl_client/preset_development/errors.py +4 -1
  5. {dasl_client-1.0.13 → dasl_client-1.0.16}/dasl_client/preset_development/preview_engine.py +23 -7
  6. {dasl_client-1.0.13 → dasl_client-1.0.16}/dasl_client/preset_development/preview_parameters.py +31 -6
  7. {dasl_client-1.0.13 → dasl_client-1.0.16}/dasl_client/preset_development/stage.py +87 -20
  8. {dasl_client-1.0.13 → dasl_client-1.0.16}/dasl_client/types/content.py +4 -0
  9. {dasl_client-1.0.13 → dasl_client-1.0.16}/dasl_client/types/dbui.py +87 -3
  10. {dasl_client-1.0.13 → dasl_client-1.0.16}/dasl_client.egg-info/PKG-INFO +3 -3
  11. {dasl_client-1.0.13 → dasl_client-1.0.16}/dasl_client.egg-info/SOURCES.txt +4 -0
  12. dasl_client-1.0.16/dasl_client.egg-info/requires.txt +4 -0
  13. {dasl_client-1.0.13 → dasl_client-1.0.16}/dasl_client.egg-info/top_level.txt +1 -0
  14. {dasl_client-1.0.13 → dasl_client-1.0.16}/pyproject.toml +3 -3
  15. dasl_client-1.0.16/test/__init__.py +0 -0
  16. dasl_client-1.0.16/test/conftest.py +18 -0
  17. dasl_client-1.0.16/test/constants.py +10 -0
  18. {dasl_client-1.0.13 → dasl_client-1.0.16}/test/test_api_surface.py +1 -24
  19. dasl_client-1.0.16/test/test_databricks_secret_auth.py +116 -0
  20. {dasl_client-1.0.13 → dasl_client-1.0.16}/test/test_marshaling.py +5 -6
  21. dasl_client-1.0.13/dasl_client.egg-info/requires.txt +0 -4
  22. {dasl_client-1.0.13 → dasl_client-1.0.16}/LICENSE +0 -0
  23. {dasl_client-1.0.13 → dasl_client-1.0.16}/README.md +0 -0
  24. {dasl_client-1.0.13 → dasl_client-1.0.16}/dasl_client/__init__.py +0 -0
  25. {dasl_client-1.0.13 → dasl_client-1.0.16}/dasl_client/auth/__init__.py +0 -0
  26. {dasl_client-1.0.13 → dasl_client-1.0.16}/dasl_client/auth/auth.py +0 -0
  27. {dasl_client-1.0.13 → dasl_client-1.0.16}/dasl_client/conn/__init__.py +0 -0
  28. {dasl_client-1.0.13 → dasl_client-1.0.16}/dasl_client/conn/client_identifier.py +0 -0
  29. {dasl_client-1.0.13 → dasl_client-1.0.16}/dasl_client/conn/conn.py +0 -0
  30. {dasl_client-1.0.13 → dasl_client-1.0.16}/dasl_client/errors/__init__.py +0 -0
  31. {dasl_client-1.0.13 → dasl_client-1.0.16}/dasl_client/errors/errors.py +0 -0
  32. {dasl_client-1.0.13 → dasl_client-1.0.16}/dasl_client/preset_development/__init__.py +0 -0
  33. {dasl_client-1.0.13 → dasl_client-1.0.16}/dasl_client/types/__init__.py +0 -0
  34. {dasl_client-1.0.13 → dasl_client-1.0.16}/dasl_client/types/admin_config.py +0 -0
  35. {dasl_client-1.0.13 → dasl_client-1.0.16}/dasl_client/types/datasource.py +0 -0
  36. {dasl_client-1.0.13 → dasl_client-1.0.16}/dasl_client/types/helpers.py +0 -0
  37. {dasl_client-1.0.13 → dasl_client-1.0.16}/dasl_client/types/rule.py +0 -0
  38. {dasl_client-1.0.13 → dasl_client-1.0.16}/dasl_client/types/types.py +0 -0
  39. {dasl_client-1.0.13 → dasl_client-1.0.16}/dasl_client/types/workspace_config.py +0 -0
  40. {dasl_client-1.0.13 → dasl_client-1.0.16}/dasl_client.egg-info/dependency_links.txt +0 -0
  41. {dasl_client-1.0.13 → dasl_client-1.0.16}/setup.cfg +0 -0
  42. {dasl_client-1.0.13 → dasl_client-1.0.16}/setup.py +0 -0
  43. {dasl_client-1.0.13 → dasl_client-1.0.16}/test/test_api_changes.py +0 -0

{dasl_client-1.0.13 → dasl_client-1.0.16}/PKG-INFO
@@ -1,6 +1,6 @@
  Metadata-Version: 2.1
  Name: dasl_client
- Version: 1.0.13
+ Version: 1.0.16
  Summary: The DASL client library used for interacting with the DASL workspace
  Home-page: https://github.com/antimatter/asl
  Author: Antimatter Team
@@ -8,10 +8,10 @@ Author-email: Antimatter Team <support@antimatter.io>
  Requires-Python: >=3.8
  Description-Content-Type: text/markdown
  License-File: LICENSE
- Requires-Dist: dasl_api==0.1.15
+ Requires-Dist: dasl_api==0.1.17
  Requires-Dist: databricks-sdk>=0.41.0
  Requires-Dist: pydantic>=2
- Requires-Dist: typing_extensions==4.10.0
+ Requires-Dist: typing_extensions>=4.10.0

  # DASL Client Library


{dasl_client-1.0.13 → dasl_client-1.0.16}/dasl_client/client.py
@@ -1,5 +1,9 @@
  from copy import deepcopy
- from typing import Any, Callable, Iterator, List, Optional, TypeVar
+ from datetime import datetime, timedelta
+ from time import sleep
+ from typing import Any, Callable, Iterator, List, Optional, Tuple, TypeVar
+ from pydantic import Field
+ from pyspark.sql import DataFrame

  from dasl_api import (
  CoreV1Api,
@@ -9,8 +13,6 @@ from dasl_api import (
  WorkspaceV1CreateWorkspaceRequest,
  api,
  )
- from pydantic import Field
-
  from dasl_client.auth.auth import (
  Authorization,
  DatabricksSecretAuth,
@@ -569,10 +571,46 @@ class Client:
  )
  return Rule.from_api_obj(result)

+ def exec_rule(
+ self, rule_in: Rule, df: DataFrame
+ ) -> Tuple[DataFrame, Optional[DataFrame]]:
+ """
+ Locally execute a Rule. Must be run from within a Databricks
+ notebook or else an exception will be raised. This is intended
+ to facilitate Rule development.
+
+ :param rule_in: The specification of the Rule to execute.
+ :param df: The DataFrame to use as the input to the Rule.
+ :returns Tuple[DataFrame, Optional[DataFrame]]: The first
+ element of the tuple contains the notables produced by
+ the rule, and the second element contains the observables
+ or None if no observables were produced.
+ """
+ Helpers.ensure_databricks()
+ with error_handler():
+ result = self._core_client().core_v1_render_rule(
+ self._workspace(),
+ rule_in.to_api_obj(),
+ )
+
+ try:
+ import notebook_utils
+ except ImportError as e:
+ raise ImportError(
+ "Package 'notebook_utils' not found. "
+ "Install it within this this notebook using "
+ f"%pip install {result.notebook_utils_path}"
+ )
+
+ namespace = {}
+ exec(result.content, namespace)
+ return namespace["generate"](df)
+
  def adhoc_transform(
  self,
  warehouse: str,
  request: TransformRequest,
+ timeout: timedelta = timedelta(minutes=5),
  ) -> TransformResponse:
  """
  Run a sequence of ADHOC transforms against a SQL warehouse to
@@ -583,16 +621,29 @@ class Client:
  :return: a TransformResponse object containing the results
  after running the transforms.
  :raises: NotFoundError if the rule does not exist
+ :raises: Exception for a server-side error or timeout
  """
  with error_handler():
- return TransformResponse.from_api_obj(
- self._dbui_client().dbui_v1_transform(
- self._workspace(),
- warehouse,
- request.to_api_obj(),
- )
+ status = self._dbui_client().dbui_v1_transform(
+ self._workspace(),
+ warehouse,
+ request.to_api_obj(),
  )

+ begin = datetime.now()
+ while datetime.now() - begin < timeout:
+ sleep(5)
+ status = self._dbui_client().dbui_v1_transform_status(
+ self._workspace(), status.id
+ )
+
+ if status.status == "failure":
+ raise Exception(f"adhoc transform failed with {status.error}")
+ elif status.status == "success":
+ return TransformResponse.from_api_obj(status.result)
+
+ raise Exception("timed out waiting for adhoc transform result")
+
  def get_observable_events(
  self,
  warehouse: str,
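
To make the client.py changes above concrete, here is a hedged usage sketch: exec_rule renders a Rule server-side and executes the generated code locally (Databricks notebook only, with the notebook_utils package %pip-installed first), while adhoc_transform now polls for a result and accepts an optional timeout. Client and TransformRequest are imported the way the tests in this diff do; the rule object, warehouse ID, and DataFrame are placeholders.

```python
from datetime import timedelta

from pyspark.sql import DataFrame

from dasl_client import Client, TransformRequest  # exported names used by the tests in this diff


def preview_rule_and_transform(client: Client, rule, input_df: DataFrame) -> None:
    """Hedged sketch of the new/changed Client calls in 1.0.16."""
    # exec_rule: Databricks notebook only; raises ImportError with a %pip hint
    # if the server-provided notebook_utils package is not installed.
    notables_df, observables_df = client.exec_rule(rule, input_df)
    notables_df.show(5)
    if observables_df is not None:
        observables_df.show(5)

    # adhoc_transform now polls every 5 seconds until success or failure,
    # or raises after the new optional timeout (default 5 minutes).
    response = client.adhoc_transform(
        warehouse="my-warehouse-id",              # SQL warehouse ID (placeholder)
        request=TransformRequest(transforms=[]),  # minimal request for illustration
        timeout=timedelta(minutes=2),
    )
    print(response)
```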

{dasl_client-1.0.13 → dasl_client-1.0.16}/dasl_client/helpers.py
@@ -6,15 +6,18 @@ class Helpers:
  default_dasl_host = "https://api.prod.sl.antimatter.io"

  @staticmethod
- def databricks_context():
- # This import raises an exception if outside a notebook context, so only
- # import if this method is called
+ def ensure_databricks():
  if "DATABRICKS_RUNTIME_VERSION" not in os.environ:
  raise Exception(
  "attempted to access databricks context outside "
  + "of databricks notebook"
  )

+ @staticmethod
+ def databricks_context():
+ # This import raises an exception if outside a notebook context, so only
+ # import if this method is called
+ Helpers.ensure_databricks()
  from databricks.sdk.runtime import dbutils

  return dbutils.notebook.entry_point.getDbutils().notebook().getContext()

{dasl_client-1.0.13 → dasl_client-1.0.16}/dasl_client/preset_development/errors.py
@@ -149,7 +149,10 @@ class AssertionFailedError(PresetError):
  def __init__(self, expr: str, assertion_message: str, df: DataFrame):
  # Get the Databricks built-in functions out the namespace.
  ipython = get_ipython()
- display = ipython.user_ns["display"]
+ if ipython is not None:
+ display = ipython.user_ns["display"]
+ else:
+ display = lambda x: x.show()

  self.expr = expr
  self.assertion_message = assertion_message

{dasl_client-1.0.13 → dasl_client-1.0.16}/dasl_client/preset_development/preview_engine.py
@@ -54,10 +54,13 @@ class PreviewEngine:
  self._preset.get("silver", None), self._pretransform_name
  )

+ self._bronze = None
  self._pre = None
  self._silver = []
  self._gold = []
- self._result_df_map = {}
+ self._result_df_map: Tuple[
+ DataFrame, Dict[str, DataFrame], Dict[str, DataFrame]
+ ] = (None, {}, {})

  def _validate_pretransform_name(
  self, silver: Dict[str, str], pretransform_name: str
@@ -181,8 +184,12 @@ class PreviewEngine:

  # Get the Databricks built-in functions out the namespace.
  ipython = get_ipython()
- displayHTML = ipython.user_ns["displayHTML"]
- display = ipython.user_ns["display"]
+ if ipython is not None:
+ displayHTML = ipython.user_ns["displayHTML"]
+ display = ipython.user_ns["display"]
+ else:
+ displayHTML = lambda x: print(x)
+ display = lambda x: x.show()

  def d(txt, lvl) -> None:
  displayHTML(
@@ -245,7 +252,7 @@ class PreviewEngine:
  raise UnknownGoldTableError(name, gold_table_schema)

  # Performs the type check.
- delta_df = self._spark.table(f"{gold_table_schema}.{name}").limit(0)
+ delta_df = self._spark.table(f"`{gold_table_schema}`.`{name}`").limit(0)
  unioned_df = delta_df.unionByName(df, allowMissingColumns=True)

  # Now we check no new columns.
@@ -286,7 +293,7 @@ class PreviewEngine:
  d("Resultant gold table preview", 3)
  display(unioned_df)

- def evaluate(self, gold_table_schema: str) -> None:
+ def evaluate(self, gold_table_schema: str, display: bool = True) -> None:
  """
  Evaluates the loaded preset YAML using the input datasource configuration to load
  records. Finally, checks that the output from the Gold stages is compatible with
@@ -303,7 +310,9 @@ class PreviewEngine:
  ):
  if not any(
  row.databaseName == schema_name
- for row in self._spark.sql(f"SHOW SCHEMAS IN {catalog_name}").collect()
+ for row in self._spark.sql(
+ f"SHOW SCHEMAS IN `{catalog_name}`"
+ ).collect()
  ):
  raise InvalidGoldTableSchemaError(
  gold_table_schema,
@@ -340,5 +349,12 @@ class PreviewEngine:
  self._compile_stages()

  with self._ds_params as df:
+ self._bronze = df
  self._result_df_map = self._run(df)
- self._render_output(df, self._result_df_map, gold_table_schema)
+ if display:
+ self._render_output(df, self._result_df_map, gold_table_schema)
+
+ def results(
+ self,
+ ) -> Tuple[DataFrame, DataFrame, Dict[str, DataFrame], Dict[str, DataFrame]]:
+ return self._bronze, *self._result_df_map
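
The evaluate(display=...) flag and the new results() accessor above suggest a programmatic preview flow roughly like the sketch below. The PreviewEngine constructor is not part of this diff, so the engine is taken as a parameter, and the dictionary keys are assumed to be silver/gold table names.

```python
from typing import Dict, Tuple

from pyspark.sql import DataFrame

from dasl_client.preset_development.preview_engine import PreviewEngine


def run_preview(
    engine: PreviewEngine, gold_table_schema: str
) -> Tuple[DataFrame, DataFrame, Dict[str, DataFrame], Dict[str, DataFrame]]:
    """Evaluate a preset without notebook rendering and return its DataFrames."""
    # display=False (new in this release) skips the displayHTML/display output path.
    engine.evaluate(gold_table_schema, display=False)
    # results() (also new) returns: bronze input, pretransform output,
    # plus the silver and gold DataFrame maps captured by the last run.
    return engine.results()
```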

{dasl_client-1.0.13 → dasl_client-1.0.16}/dasl_client/preset_development/preview_parameters.py
@@ -1,3 +1,5 @@
+ from typing import Optional
+
  from pyspark.sql import DataFrame, SparkSession
  from pyspark.sql.types import *
  from pyspark.sql.dataframe import DataFrame
@@ -115,6 +117,7 @@ class PreviewParameters:
  self._table = None

  self._pretransform_name = None
+ self._bronze_pre_transform: Optional[List[str]] = None

  self._df = None

@@ -166,10 +169,13 @@ class PreviewParameters:
  self._record_limit
  )

+ if self._bronze_pre_transform is not None:
+ stream_df = stream_df.selectExpr(*self._bronze_pre_transform)
+
  query = (
  stream_df.writeStream.format("memory")
  .queryName("batch_data")
- .trigger(once=True)
+ .trigger(availableNow=True)
  .start()
  )

@@ -193,12 +199,17 @@ class PreviewParameters:

  # Get the Databricks built-in functions out the namespace.
  ipython = get_ipython()
- dbutils = ipython.user_ns["dbutils"]
+ if ipython is not None:
+ dbutils = ipython.user_ns["dbutils"]

- dbutils.fs.rm(
- f"{self._autoloader_temp_schema_location}/{self._schema_uuid_str}",
- recurse=True,
- )
+ dbutils.fs.rm(
+ f"{self._autoloader_temp_schema_location}/{self._schema_uuid_str}",
+ recurse=True,
+ )
+ else:
+ print(
+ f"FYI, we are leaking temp data {self._autoloader_temp_schema_location}/{self._schema_uuid_str}"
+ )

  def from_input(self):
  """
@@ -286,6 +297,10 @@ class PreviewParameters:
  Returns:
  PreviewParameters: The current instance with updated configuration.
  """
+ if file_format.lower() == "jsonl":
+ self._autoloader_format = "json"
+ self.set_autoloader_multiline(False)
+ return self
  self._autoloader_format = file_format
  return self

@@ -350,6 +365,16 @@ class PreviewParameters:
  self._pretransform_name = pretransform_name
  return self

+ def set_bronze_pre_transform(self, expr: List[str]):
+ """
+ Sets a pre-transform expression that will run before data is written to bronze
+
+ Returns:
+ PreviewParameters: The current instance with updated configuration.
+ """
+ self._bronze_pre_transform = expr
+ return self
+
  def set_date_range(self, column: str, start_time: str, end_time: str):
  """
  Set the TIMESTAMP column and date range to use as the input data filter to
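
A hedged sketch of the new PreviewParameters pieces above: set_bronze_pre_transform stores SQL expressions applied via selectExpr before the stream is written to the in-memory bronze table, "jsonl" is now mapped to the json autoloader format with multiline disabled, and the memory sink uses trigger(availableNow=True). Only setters visible in this diff are used below; constructing the PreviewParameters instance itself is out of scope, and the column names are placeholders.

```python
from typing import List

from dasl_client.preset_development.preview_parameters import PreviewParameters


def with_bronze_pre_transform(params: PreviewParameters, exprs: List[str]) -> PreviewParameters:
    """Attach the new bronze pre-transform and a date-range filter (sketch)."""
    # New in this release: expressions run via selectExpr on the autoloader
    # stream before it is written to the in-memory "batch_data" table.
    params.set_bronze_pre_transform(exprs)
    # Existing setter (shown as context in this diff).
    params.set_date_range("event_time", "2024-01-01T00:00:00", "2024-01-31T00:00:00")
    return params


# Example expressions: keep every column and add a normalized timestamp column.
example_exprs = ["*", "to_timestamp(raw_time) AS event_time"]
```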

{dasl_client-1.0.13 → dasl_client-1.0.16}/dasl_client/preset_development/stage.py
@@ -150,17 +150,19 @@ class Stage:
  if target_col not in existing_columns:
  raise ReferencedColumnMissingError("jsonExtract", target_col)
  schema = self._spark.sql(
- f"SELECT schema_of_json_agg({target_col}) AS sc FROM {{df}}", df=df
+ f"SELECT schema_of_json_agg({self.auto_backtick(target_col)}) AS sc FROM {{df}}",
+ df=df,
  ).collect()[0][0]
  extract_df = self._spark.createDataFrame(data=[], schema=schema)
  columns = extract_df.columns
  columns = [
- f"extract.{col} AS {col}"
+ self.auto_backtick(f"extract.{col}") + f" AS {self.auto_backtick(col)}"
  for col in columns
  if col not in omit_fields and col not in existing_columns
  ]
  columns += [
- f"extract.{col} AS {duplicate_prefix}{col}"
+ self.auto_backtick(f"extract.{col}")
+ + f" AS {self.auto_backtick(duplicate_prefix + col)}"
  for col in columns
  if col not in omit_fields and col in existing_columns
  ]
@@ -176,7 +178,10 @@ class Stage:
  A DataFrame with the resultant operation's records.
  """
  return (
- df.selectExpr("*", f"from_json({target_col}, '{schema}') AS extract")
+ df.selectExpr(
+ "*",
+ f"from_json({self.auto_backtick(target_col)}, '{schema}') AS extract",
+ )
  .selectExpr("*", *columns)
  .drop("extract")
  )
@@ -198,7 +203,10 @@ class Stage:
  """
  extract_df = self._spark.createDataFrame(data=[], schema=schema)
  schema = extract_df.drop(omit_fields).schema.simpleString()
- return df.selectExpr("*", f"from_json({target_col}, '{schema}') AS {name}")
+ return df.selectExpr(
+ "*",
+ f"from_json({self.auto_backtick(target_col)}, '{schema}') AS {self.auto_backtick(name)}",
+ )

  def preserved_columns(
  self, df: DataFrame
@@ -224,7 +232,7 @@ class Stage:
  duplicate_prefix = self._duplicate_prefix()
  column_names = self._column_names()
  duplicate_renames = [
- f"{col} AS {duplicate_prefix}{col}"
+ f"{self.auto_backtick(col)} AS {self.auto_backtick(duplicate_prefix + col)}"
  for col in preserved_columns
  if col in column_names
  ]
@@ -296,14 +304,46 @@ class Stage:
  """
  if field.get("from", None):
  # check that the from column exists in the df?
- return f"{field['from']} AS {name}"
+ return f"{self.auto_backtick(field['from'])} AS {self.auto_backtick(name)}"
  elif field.get("literal", None):
- return f"'{field['literal']}' AS {name}"
- elif field.get("expr", None):
- return f"{field['expr']} AS {name}"
+ return f"'{field['literal']}' AS {self.auto_backtick(name)}"
+ elif field.get("expr", None) is not None:
+ return f"{field['expr']} AS {self.auto_backtick(name)}"
  else:
  return ""

+ def is_backtick_escaped(self, name: str) -> bool:
+ """
+ check if a given (column) name is backtick escaped or not
+ :param name: column name
+ :return: bool
+ """
+ return name.startswith("`") and name.endswith("`")
+
+ def auto_backtick(self, name: str) -> str:
+ """
+ auto-backtick given name in case it isn't already backtick escaped.
+ if the name contains dots it will get split and each component backticked individually.
+ Returns the name wrapped in backticks or the passed name if it already had backticks.
+ :param name: column name
+ :return: str
+ """
+ if self.is_backtick_escaped(name):
+ return name
+ parts = name.split(".")
+ return ".".join(list(map(lambda s: f"`{s}`", parts)))
+
+ def force_apply_backticks(self, name: str) -> str:
+ """
+ forces application of backticks to the given (column) name as a single unit
+ if it already has backticks this is a noop
+ :param name: column name
+ :return: str
+ """
+ if self.is_backtick_escaped(name):
+ return name
+ return f"`{name}`"
+
  def process_node(self, name: str, node: Node) -> str:
  """
  Processes a single node in a tree of nodes.
@@ -319,7 +359,7 @@ class Stage:
  child_expr = self.process_node(child_name, child_node)
  fields_list.append(f"{child_expr}")
  joined_fields = ",\n".join(fields_list)
- return f"struct(\n{joined_fields}\n) AS {name}"
+ return f"struct(\n{joined_fields}\n) AS {self.auto_backtick(name)}"
  else:
  return ""

@@ -341,12 +381,22 @@ class Stage:
  """
  Renders a list of field specifications containing both simple and
  STRUCT references into valid, STRUCT cognicient, SELECT expressions.
+ if a nested field is wrapped in backticks it will be treated as a simple field
+ for example field of name `col.with.dots` will NOT be treated as nested field.

  Returns:
  The SQL expression.
  """
- simple_fields = [f for f in fields if "." not in f["name"]]
- nested_fields = [f for f in fields if "." in f["name"]]
+ simple_fields = [
+ f
+ for f in fields
+ if "." not in f["name"] or self.is_backtick_escaped(f["name"])
+ ]
+ nested_fields = [
+ f
+ for f in fields
+ if "." in f["name"] and not self.is_backtick_escaped(f["name"])
+ ]

  result_parts = []
  for field in simple_fields:
@@ -358,7 +408,7 @@ class Stage:
  nested_str = self.parse_to_string(tree)
  result_parts.append(nested_str)

- return [p for p in result_parts if p]
+ return [p for p in result_parts if p is not None and len(p) > 0]

  def select_expr(self, df: DataFrame) -> str:
  """
@@ -379,8 +429,12 @@ class Stage:
  if should_preserve:
  if embed_col := preserve.get("embedColumn", None):
  preserved_columns = self.preserved_columns_embed_column(df)
+ # preserved_columns is obtained from df.columns
+ # applying backticks to all of them is OK here
+ # since they will never use "obj.key" to reference nested fields of structs
+ # so we just go ahead and apply backticks to all across the board
  select_fields += [
- f"struct({', '.join(preserved_columns)}) AS {embed_col}"
+ f"struct({', '.join(list(map(lambda x: self.force_apply_backticks(x), preserved_columns)))}) AS {self.auto_backtick(embed_col)}"
  ]
  else:
  (
@@ -388,8 +442,13 @@ class Stage:
  duplicate_renames,
  column_names,
  ) = self.preserved_columns(df)
- select_fields += preserved_columns
- select_fields += duplicate_renames
+ # see note above: same here - apply backticks to all columns across the board
+ select_fields += list(
+ map(lambda x: self.force_apply_backticks(x), preserved_columns)
+ )
+ select_fields += list(
+ map(lambda x: self.force_apply_backticks(x), duplicate_renames)
+ )

  return ["*"] + select_fields if self._stage == "temp_fields" else select_fields

@@ -475,7 +534,9 @@ class Stage:
  df = (
  df.alias("tmp")
  .join(df_joined, on=[df[lhs] == df_joined[rhs]], how="left")
- .selectExpr("tmp.*", f"{select} AS {field.get('name')}")
+ .selectExpr(
+ "tmp.*", f"{select} AS {self.auto_backtick(field.get('name'))}"
+ )
  )
  elif csv := join.get("withCSV", None):
  if path := csv.get("path", None):
@@ -485,7 +546,10 @@ class Stage:
  df = (
  df.alias("tmp")
  .join(df_joined, on=[df[lhs] == df_joined[rhs]], how="left")
- .selectExpr("tmp.*", f"{select} AS {field.get('name')}")
+ .selectExpr(
+ "tmp.*",
+ f"{select} AS {self.auto_backtick(field.get('name'))}",
+ )
  )
  else:
  raise MissingJoinFieldError("withTable or withCSV (please supply 1)")
@@ -500,7 +564,10 @@ class Stage:
  """
  for field in self._fields:
  if field.get("alias", None):
- df = df.selectExpr("*", f"{field.get('alias')} AS {field.get('name')}")
+ df = df.selectExpr(
+ "*",
+ f"{self.auto_backtick(field.get('alias'))} AS {self.auto_backtick(field.get('name'))}",
+ )
  return df

  def run_assertions(self, df: DataFrame) -> DataFrame:
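
The quoting rules introduced above are easiest to see in isolation. This standalone sketch mirrors the three new Stage helpers as plain string functions (the logic does not depend on self): already-escaped names pass through, auto_backtick quotes each dot-separated component, and force_apply_backticks quotes the whole name as a single unit.

```python
def is_backtick_escaped(name: str) -> bool:
    """True if the column name is already wrapped in backticks."""
    return name.startswith("`") and name.endswith("`")


def auto_backtick(name: str) -> str:
    """Quote each dot-separated component, unless the name is already escaped."""
    if is_backtick_escaped(name):
        return name
    return ".".join(f"`{part}`" for part in name.split("."))


def force_apply_backticks(name: str) -> str:
    """Quote the whole name as a single unit, unless it is already escaped."""
    if is_backtick_escaped(name):
        return name
    return f"`{name}`"


assert auto_backtick("user.name") == "`user`.`name`"          # nested struct reference
assert auto_backtick("`col.with.dots`") == "`col.with.dots`"  # left untouched
assert force_apply_backticks("col with spaces") == "`col with spaces`"
```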

{dasl_client-1.0.13 → dasl_client-1.0.16}/dasl_client/types/content.py
@@ -173,6 +173,8 @@ class DataSourcePreset(BaseModel):
  name: Optional[str] = None
  author: Optional[str] = None
  description: Optional[str] = None
+ title: Optional[str] = None
+ icon_url: Optional[str] = None
  autoloader: Optional[PresetAutoloader] = None
  silver: Optional[SilverPreset] = None
  gold: Optional[List[GoldPreset]] = None
@@ -188,6 +190,8 @@ class DataSourcePreset(BaseModel):
  name=obj.name,
  author=obj.author,
  description=obj.description,
+ title=obj.title,
+ icon_url=obj.icon_url,
  autoloader=PresetAutoloader.from_api_obj(obj.autoloader),
  silver=SilverPreset.from_api_obj(obj.silver),
  gold=[GoldPreset.from_api_obj(item) for item in obj.gold],

{dasl_client-1.0.13 → dasl_client-1.0.16}/dasl_client/types/dbui.py
@@ -12,6 +12,8 @@ from dasl_api import (
  DbuiV1TransformRequestTransformsInnerPresetOverrides,
  DbuiV1TransformResponse,
  DbuiV1TransformResponseStagesInner,
+ ContentV1DatasourcePresetAutoloaderCloudFiles,
+ DbuiV1TransformRequestAutoloaderInput,
  )

  from .datasource import DataSource, FieldSpec, FieldUtils
@@ -131,7 +133,7 @@ class TransformRequest(BaseModel):
  Attributes:
  input (TransformRequest.Input):
  The input block containing the columns metadata and data.
- autoloader_input (DataSource.Autoloader):
+ autoloader_input (Autoloader):
  The autoloader input configuration.
  use_preset (str):
  Indicates which preset to use for the transforms.
@@ -172,6 +174,86 @@ class TransformRequest(BaseModel):
  data=self.data,
  )

+ class Autoloader(BaseModel):
+ """
+ Autoloader configuration for the DataSource.
+
+ Attributes:
+ format (Optional[str]):
+ The format of the data (e.g., json, parquet, csv, etc.).
+ location (str):
+ External location for the volume in Unity Catalog.
+ schema_file (Optional[str]):
+ An optional file containing the schema of the data source.
+ cloud_files (Optional[Autoloader.CloudFiles]):
+ CloudFiles configuration.
+ """
+
+ class CloudFiles(BaseModel):
+ """
+ CloudFiles configuration for the Autoloader.
+
+ Attributes:
+ schema_hints_file (Optional[str]):
+ schema_hints (Optional[str]):
+ """
+
+ schema_hints_file: Optional[str] = None
+ schema_hints: Optional[str] = None
+
+ @staticmethod
+ def from_api_obj(
+ obj: Optional[ContentV1DatasourcePresetAutoloaderCloudFiles],
+ ) -> "TransformRequest.Autoloader.CloudFiles":
+ if obj is None:
+ return None
+ return TransformRequest.Autoloader.CloudFiles(
+ schema_hints_file=obj.schema_hints_file,
+ schema_hints=obj.schema_hints,
+ )
+
+ def to_api_obj(self) -> ContentV1DatasourcePresetAutoloaderCloudFiles:
+ return ContentV1DatasourcePresetAutoloaderCloudFiles(
+ schema_hints_file=self.schema_hints_file,
+ schema_hints=self.schema_hints,
+ )
+
+ format: Optional[str] = None
+ location: str
+ schema_file: Optional[str] = None
+ schema: Optional[str] = None
+ cloud_files: Optional["TransformRequest.Autoloader.CloudFiles"] = None
+ row_count: Optional[int] = None
+ row_offset: Optional[int] = None
+
+ @staticmethod
+ def from_api_obj(
+ obj: Optional[DbuiV1TransformRequestAutoloaderInput],
+ ) -> "Optional[TransformRequest.Autoloader]":
+ if obj is None:
+ return None
+ return TransformRequest.Autoloader(
+ format=obj.format,
+ location=obj.location,
+ schema_file=obj.schema_file,
+ cloud_files=TransformRequest.Autoloader.CloudFiles.from_api_obj(
+ obj.cloud_files
+ ),
+ row_count=obj.row_count,
+ row_offset=obj.row_offset,
+ )
+
+ def to_api_obj(self) -> DbuiV1TransformRequestAutoloaderInput:
+ return DbuiV1TransformRequestAutoloaderInput(
+ format=self.format,
+ location=self.location,
+ schemaFile=self.schema_file,
+ schema=self.schema_file,
+ cloudFiles=Helpers.maybe(lambda o: o.to_api_obj(), self.cloud_files),
+ rowCount=self.row_count,
+ rowOffset=self.row_offset,
+ )
+
  class Transform(BaseModel):
  """
  A transform configuration to apply to the data.
@@ -273,7 +355,7 @@ class TransformRequest(BaseModel):
  )

  input: Optional["TransformRequest.Input"] = None
- autoloader_input: Optional[DataSource.Autoloader] = None
+ autoloader_input: Optional["TransformRequest.Autoloader"] = None
  use_preset: Optional[str] = None
  transforms: List["TransformRequest.Transform"]

@@ -281,7 +363,9 @@ class TransformRequest(BaseModel):
  def from_api_obj(obj: DbuiV1TransformRequest) -> "TransformRequest":
  return TransformRequest(
  input=TransformRequest.Input.from_api_obj(obj.input),
- autoloader_input=DataSource.Autoloader.from_api_obj(obj.autoloader_input),
+ autoloader_input=TransformRequest.Autoloader.from_api_obj(
+ obj.autoloader_input
+ ),
  use_preset=obj.use_preset,
  transforms=[
  TransformRequest.Transform.from_api_obj(item) for item in obj.transforms
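
Tying the new model above together: autoloader_input now takes a TransformRequest.Autoloader (with the extra row_count/row_offset fields) instead of DataSource.Autoloader, which is exactly the substitution made in test_marshaling.py later in this diff. A hedged construction sketch with placeholder values; to_api_obj on the full request is assumed from the marshal/unmarshal test rather than shown in this hunk.

```python
from dasl_client import TransformRequest  # exported name used by the tests in this diff

request = TransformRequest(
    autoloader_input=TransformRequest.Autoloader(
        format="csv",
        location="s3://bucket/data",          # external location (placeholder)
        schema_file="schema.json",
        cloud_files=TransformRequest.Autoloader.CloudFiles(
            schema_hints_file="hints_file.csv",
            schema_hints="hint1, hint2",
        ),
        row_count=100,   # new optional field
        row_offset=0,    # new optional field
    ),
    use_preset="preset_value",
    transforms=[],       # real requests carry TransformRequest.Transform entries
)

api_obj = request.to_api_obj()  # assumed: DbuiV1TransformRequest ready for dbui_v1_transform
```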

{dasl_client-1.0.13 → dasl_client-1.0.16}/dasl_client.egg-info/PKG-INFO
@@ -1,6 +1,6 @@
  Metadata-Version: 2.1
  Name: dasl_client
- Version: 1.0.13
+ Version: 1.0.16
  Summary: The DASL client library used for interacting with the DASL workspace
  Home-page: https://github.com/antimatter/asl
  Author: Antimatter Team
@@ -8,10 +8,10 @@ Author-email: Antimatter Team <support@antimatter.io>
  Requires-Python: >=3.8
  Description-Content-Type: text/markdown
  License-File: LICENSE
- Requires-Dist: dasl_api==0.1.15
+ Requires-Dist: dasl_api==0.1.17
  Requires-Dist: databricks-sdk>=0.41.0
  Requires-Dist: pydantic>=2
- Requires-Dist: typing_extensions==4.10.0
+ Requires-Dist: typing_extensions>=4.10.0

  # DASL Client Library


{dasl_client-1.0.13 → dasl_client-1.0.16}/dasl_client.egg-info/SOURCES.txt
@@ -31,6 +31,10 @@ dasl_client/types/helpers.py
  dasl_client/types/rule.py
  dasl_client/types/types.py
  dasl_client/types/workspace_config.py
+ test/__init__.py
+ test/conftest.py
+ test/constants.py
  test/test_api_changes.py
  test/test_api_surface.py
+ test/test_databricks_secret_auth.py
  test/test_marshaling.py

dasl_client-1.0.16/dasl_client.egg-info/requires.txt
@@ -0,0 +1,4 @@
+ dasl_api==0.1.17
+ databricks-sdk>=0.41.0
+ pydantic>=2
+ typing_extensions>=4.10.0

{dasl_client-1.0.13 → dasl_client-1.0.16}/pyproject.toml
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"

  [project]
  name = "dasl_client"
- version = "1.0.13"
+ version = "1.0.16"
  description = "The DASL client library used for interacting with the DASL workspace"
  readme = "README.md"
  authors = [
@@ -13,8 +13,8 @@ authors = [
  requires-python = ">=3.8"

  dependencies = [
- "dasl_api==0.1.15",
+ "dasl_api==0.1.17",
  "databricks-sdk>=0.41.0",
  "pydantic>=2",
- "typing_extensions==4.10.0"
+ "typing_extensions>=4.10.0",
  ]
File without changes

dasl_client-1.0.16/test/conftest.py
@@ -0,0 +1,18 @@
+ import pytest
+
+ from dasl_client import Client
+
+ from .constants import *
+
+
+ @pytest.fixture(scope="session")
+ def api_client():
+ client = Client.new_workspace(
+ admin_email="test@antimatter.io",
+ app_client_id=app_client_id,
+ service_principal_id=databricks_client_id,
+ service_principal_secret=databricks_client_secret,
+ workspace_url=databricks_host,
+ dasl_host=dasl_host,
+ )
+ yield client

dasl_client-1.0.16/test/constants.py
@@ -0,0 +1,10 @@
+ import os
+ from urllib.parse import urlparse
+
+ dasl_host = os.environ["DASL_API_URL"]
+ databricks_host = os.environ["DASL_DATABRICKS_HOST"]
+ databricks_client_id = os.environ["DASL_DATABRICKS_CLIENT_ID"]
+ databricks_client_secret = os.environ["DASL_DATABRICKS_CLIENT_SECRET"]
+ workspace = urlparse(databricks_host).hostname
+ app_client_id = "22853b93-68ba-4ae2-8e41-976417f501dd"
+ alternate_app_client_id = "335ac0d3-e0ea-4732-ba93-0277423b5029"

{dasl_client-1.0.13 → dasl_client-1.0.16}/test/test_api_surface.py
@@ -1,29 +1,6 @@
- import os
- import pytest
- from urllib.parse import urlparse
-
  from dasl_client import *

- dasl_host = os.environ["DASL_API_URL"]
- databricks_host = os.environ["DATABRICKS_HOST"]
- databricks_client_id = os.environ["DATABRICKS_CLIENT_ID"]
- databricks_client_secret = os.environ["DATABRICKS_CLIENT_SECRET"]
- workspace = urlparse(databricks_host).hostname
- app_client_id = "22853b93-68ba-4ae2-8e41-976417f501dd"
- alternate_app_client_id = "335ac0d3-e0ea-4732-ba93-0277423b5029"
-
-
- @pytest.fixture(scope="session")
- def api_client():
- client = Client.new_workspace(
- admin_email="test@antimatter.io",
- app_client_id=app_client_id,
- service_principal_id=databricks_client_id,
- service_principal_secret=databricks_client_secret,
- workspace_url=databricks_host,
- dasl_host=dasl_host,
- )
- yield client
+ from .constants import *


  def test_admin_config(api_client):

dasl_client-1.0.16/test/test_databricks_secret_auth.py
@@ -0,0 +1,116 @@
+ import base64
+ import datetime
+ import os
+ import time
+
+ from databricks.sdk import WorkspaceClient
+ from databricks.sdk.service import jobs, workspace as dbworkspace
+
+ from .constants import *
+
+ pylib_volume_path = os.environ["PYLIB_VOLUME_PATH"]
+ pylib_wheel_path = os.environ["PYLIB_WHEEL_PATH"]
+
+
+ def test_secret_auth(api_client):
+ # making sure it's even possible to get a config
+ api_client.get_config()
+
+ # need to do an API operation using databricks secret auth.
+ notebook_data = f"""
+ %pip install {pylib_wheel_path}
+ dbutils.library.restartPython()
+ # COMMAND ----------
+ from dasl_client.client import Client
+
+ Client.for_workspace(
+ workspace_url="{databricks_host}",
+ dasl_host="{dasl_host}",
+ ).get_config()
+ # COMMAND ----------
+ dbutils.notebook.exit("SUCCESS")
+ """
+ print(f"notebook_data={notebook_data}")
+
+ wsc = WorkspaceClient()
+ wsc.workspace.mkdirs(path=pylib_volume_path)
+
+ notebook_path = f"{pylib_volume_path}/test_secret_auth_notebook"
+ wsc.workspace.import_(
+ path=notebook_path,
+ format=dbworkspace.ImportFormat.SOURCE,
+ language=dbworkspace.Language.PYTHON,
+ content=base64.b64encode(notebook_data.encode("utf-8")).decode("utf-8"),
+ overwrite=True,
+ )
+
+ job_id = None
+ try:
+ job_id = wsc.jobs.create(
+ name="run test_secret_auth notebook",
+ tasks=[
+ jobs.Task(
+ task_key="run_notebook",
+ notebook_task=jobs.NotebookTask(notebook_path=notebook_path),
+ ),
+ ],
+ ).job_id
+
+ wsc.jobs.run_now(job_id=job_id)
+
+ logs = []
+ start = datetime.datetime.now()
+ complete = False
+ while not complete:
+ elapsed = datetime.datetime.now() - start
+ if elapsed > datetime.timedelta(seconds=300):
+ raise Exception(f"timed out waiting for job")
+
+ time.sleep(5)
+
+ status, logs = fetch_latest_run_status_and_logs(wsc, job_id)
+ print(f"logs={logs}")
+
+ if status == jobs.TerminationCodeCode.RUN_EXECUTION_ERROR:
+ raise Exception(f"job terminated with error")
+
+ complete = status == jobs.TerminationCodeCode.SUCCESS
+
+ print(logs)
+ assert len(logs) == 1
+ assert logs[0] == "SUCCESS"
+ finally:
+ wsc.workspace.delete(pylib_volume_path, recursive=True)
+ if job_id is not None:
+ wsc.jobs.delete(job_id=job_id)
+
+
+ def fetch_latest_run_status_and_logs(
+ wsc: WorkspaceClient,
+ job_id: str,
+ ):
+ runs = list(wsc.jobs.list_runs(job_id=job_id, expand_tasks=True))
+ if not runs:
+ return "No runs found", None
+
+ # Find the latest run based on the start time
+ latest_run = max(runs, key=lambda r: r.start_time)
+ if latest_run.status.termination_details is None:
+ return "No runs found", None
+ status = latest_run.status.termination_details.code
+ logs = []
+ for task in latest_run.tasks:
+ output = wsc.jobs.get_run_output(task.run_id)
+ if output.error is not None:
+ logs.append(output.error)
+ elif output.logs is not None:
+ logs.append(output.logs)
+ elif output.notebook_output is not None:
+ logs.append(output.notebook_output.result)
+ elif output.run_job_output is not None:
+ raise Exception("Nested jobs are not supported")
+ elif output.sql_output is not None:
+ raise Exception("SQL jobs are unsupported")
+ else:
+ logs.append("")
+ return status, logs

{dasl_client-1.0.13 → dasl_client-1.0.16}/test/test_marshaling.py
@@ -1,9 +1,6 @@
- import os
-
  from dasl_client import *

- databricks_host = os.environ["DATABRICKS_HOST"]
- workspace = databricks_host.split("//")[1]
+ from .constants import *


  def test_workspace_config_marshal_unmarshal():
@@ -701,13 +698,15 @@ def test_transform_request_marshal_unmarshal():
  ],
  data=[{"col1": "1", "col2": "a"}, {"col1": "2", "col2": "b"}],
  ),
- autoloader_input=DataSource.Autoloader(
+ autoloader_input=TransformRequest.Autoloader(
  format="csv",
  location="s3://bucket/data",
  schema_file="schema.json",
- cloud_files=DataSource.Autoloader.CloudFiles(
+ cloud_files=TransformRequest.Autoloader.CloudFiles(
  schema_hints_file="hints_file.csv", schema_hints="hint1, hint2"
  ),
+ row_count=1,
+ row_offset=5,
  ),
  use_preset="preset_value",
  transforms=[

dasl_client-1.0.13/dasl_client.egg-info/requires.txt
@@ -1,4 +0,0 @@
- dasl_api==0.1.15
- databricks-sdk>=0.41.0
- pydantic>=2
- typing_extensions==4.10.0
File without changes
File without changes
File without changes
File without changes