tracdap-runtime 0.7.1__py3-none-any.whl → 0.8.0__py3-none-any.whl

This diff compares the contents of two publicly released versions of the package, as published to one of the supported registries. It is provided for informational purposes only and reflects the changes between the package versions as they appear in their respective public registries.
Files changed (88)
  1. tracdap/rt/_impl/core/__init__.py +14 -0
  2. tracdap/rt/_impl/{config_parser.py → core/config_parser.py} +36 -19
  3. tracdap/rt/_impl/{data.py → core/data.py} +136 -32
  4. tracdap/rt/_impl/core/logging.py +195 -0
  5. tracdap/rt/_impl/{models.py → core/models.py} +15 -12
  6. tracdap/rt/_impl/{repos.py → core/repos.py} +12 -3
  7. tracdap/rt/_impl/{schemas.py → core/schemas.py} +5 -5
  8. tracdap/rt/_impl/{shim.py → core/shim.py} +5 -4
  9. tracdap/rt/_impl/{storage.py → core/storage.py} +21 -10
  10. tracdap/rt/_impl/core/struct.py +547 -0
  11. tracdap/rt/_impl/{util.py → core/util.py} +1 -111
  12. tracdap/rt/_impl/{validation.py → core/validation.py} +99 -31
  13. tracdap/rt/_impl/exec/__init__.py +14 -0
  14. tracdap/rt/{_exec → _impl/exec}/actors.py +12 -14
  15. tracdap/rt/{_exec → _impl/exec}/context.py +228 -82
  16. tracdap/rt/{_exec → _impl/exec}/dev_mode.py +163 -81
  17. tracdap/rt/{_exec → _impl/exec}/engine.py +230 -105
  18. tracdap/rt/{_exec → _impl/exec}/functions.py +191 -100
  19. tracdap/rt/{_exec → _impl/exec}/graph.py +24 -36
  20. tracdap/rt/{_exec → _impl/exec}/graph_builder.py +252 -115
  21. tracdap/rt/_impl/grpc/codec.py +1 -1
  22. tracdap/rt/{_exec → _impl/grpc}/server.py +7 -6
  23. tracdap/rt/_impl/grpc/tracdap/api/internal/runtime_pb2.py +3 -3
  24. tracdap/rt/_impl/grpc/tracdap/api/internal/runtime_pb2_grpc.py +1 -1
  25. tracdap/rt/_impl/grpc/tracdap/metadata/common_pb2.py +1 -1
  26. tracdap/rt/_impl/grpc/tracdap/metadata/config_pb2.py +40 -0
  27. tracdap/rt/_impl/grpc/tracdap/metadata/config_pb2.pyi +62 -0
  28. tracdap/rt/_impl/grpc/tracdap/metadata/custom_pb2.py +1 -1
  29. tracdap/rt/_impl/grpc/tracdap/metadata/data_pb2.py +32 -20
  30. tracdap/rt/_impl/grpc/tracdap/metadata/data_pb2.pyi +48 -2
  31. tracdap/rt/_impl/grpc/tracdap/metadata/file_pb2.py +4 -2
  32. tracdap/rt/_impl/grpc/tracdap/metadata/file_pb2.pyi +8 -0
  33. tracdap/rt/_impl/grpc/tracdap/metadata/flow_pb2.py +1 -1
  34. tracdap/rt/_impl/grpc/tracdap/metadata/job_pb2.py +65 -63
  35. tracdap/rt/_impl/grpc/tracdap/metadata/job_pb2.pyi +16 -2
  36. tracdap/rt/_impl/grpc/tracdap/metadata/model_pb2.py +28 -26
  37. tracdap/rt/_impl/grpc/tracdap/metadata/model_pb2.pyi +14 -4
  38. tracdap/rt/_impl/grpc/tracdap/metadata/object_id_pb2.py +4 -4
  39. tracdap/rt/_impl/grpc/tracdap/metadata/object_id_pb2.pyi +6 -0
  40. tracdap/rt/_impl/grpc/tracdap/metadata/object_pb2.py +9 -7
  41. tracdap/rt/_impl/grpc/tracdap/metadata/object_pb2.pyi +12 -4
  42. tracdap/rt/_impl/grpc/tracdap/metadata/resource_pb2.py +18 -5
  43. tracdap/rt/_impl/grpc/tracdap/metadata/resource_pb2.pyi +42 -2
  44. tracdap/rt/_impl/grpc/tracdap/metadata/search_pb2.py +1 -1
  45. tracdap/rt/_impl/grpc/tracdap/metadata/{stoarge_pb2.py → storage_pb2.py} +4 -4
  46. tracdap/rt/_impl/grpc/tracdap/metadata/tag_pb2.py +1 -1
  47. tracdap/rt/_impl/grpc/tracdap/metadata/tag_update_pb2.py +1 -1
  48. tracdap/rt/_impl/grpc/tracdap/metadata/type_pb2.py +1 -1
  49. tracdap/rt/{_exec → _impl}/runtime.py +32 -18
  50. tracdap/rt/_impl/static_api.py +65 -37
  51. tracdap/rt/_plugins/format_csv.py +1 -1
  52. tracdap/rt/_plugins/repo_git.py +56 -11
  53. tracdap/rt/_plugins/storage_sql.py +1 -1
  54. tracdap/rt/_version.py +1 -1
  55. tracdap/rt/api/__init__.py +5 -24
  56. tracdap/rt/api/constants.py +57 -0
  57. tracdap/rt/api/experimental.py +32 -0
  58. tracdap/rt/api/hook.py +26 -7
  59. tracdap/rt/api/model_api.py +16 -0
  60. tracdap/rt/api/static_api.py +265 -127
  61. tracdap/rt/config/__init__.py +11 -11
  62. tracdap/rt/config/common.py +2 -26
  63. tracdap/rt/config/dynamic.py +28 -0
  64. tracdap/rt/config/platform.py +17 -31
  65. tracdap/rt/config/runtime.py +2 -0
  66. tracdap/rt/ext/embed.py +2 -2
  67. tracdap/rt/ext/plugins.py +3 -3
  68. tracdap/rt/launch/launch.py +12 -14
  69. tracdap/rt/metadata/__init__.py +28 -18
  70. tracdap/rt/metadata/config.py +95 -0
  71. tracdap/rt/metadata/data.py +40 -0
  72. tracdap/rt/metadata/file.py +10 -0
  73. tracdap/rt/metadata/job.py +16 -0
  74. tracdap/rt/metadata/model.py +12 -2
  75. tracdap/rt/metadata/object.py +9 -1
  76. tracdap/rt/metadata/object_id.py +6 -0
  77. tracdap/rt/metadata/resource.py +41 -1
  78. {tracdap_runtime-0.7.1.dist-info → tracdap_runtime-0.8.0.dist-info}/METADATA +23 -17
  79. tracdap_runtime-0.8.0.dist-info/RECORD +129 -0
  80. {tracdap_runtime-0.7.1.dist-info → tracdap_runtime-0.8.0.dist-info}/WHEEL +1 -1
  81. tracdap/rt/_exec/__init__.py +0 -0
  82. tracdap_runtime-0.7.1.dist-info/RECORD +0 -121
  83. /tracdap/rt/_impl/{guard_rails.py → core/guard_rails.py} +0 -0
  84. /tracdap/rt/_impl/{type_system.py → core/type_system.py} +0 -0
  85. /tracdap/rt/_impl/grpc/tracdap/metadata/{stoarge_pb2.pyi → storage_pb2.pyi} +0 -0
  86. /tracdap/rt/metadata/{stoarge.py → storage.py} +0 -0
  87. {tracdap_runtime-0.7.1.dist-info → tracdap_runtime-0.8.0.dist-info/licenses}/LICENSE +0 -0
  88. {tracdap_runtime-0.7.1.dist-info → tracdap_runtime-0.8.0.dist-info}/top_level.txt +0 -0
@@ -13,7 +13,9 @@
  # See the License for the specific language governing permissions and
  # limitations under the License.

+ import contextlib
  import copy
+ import io
  import logging
  import pathlib
  import typing as tp
@@ -24,11 +26,13 @@ import tracdap.rt.api as _api
  import tracdap.rt.api.experimental as _eapi
  import tracdap.rt.metadata as _meta
  import tracdap.rt.exceptions as _ex
- import tracdap.rt._impl.type_system as _types # noqa
- import tracdap.rt._impl.data as _data # noqa
- import tracdap.rt._impl.storage as _storage # noqa
- import tracdap.rt._impl.util as _util # noqa
- import tracdap.rt._impl.validation as _val # noqa
+ import tracdap.rt._impl.core.data as _data
+ import tracdap.rt._impl.core.logging as _logging
+ import tracdap.rt._impl.core.storage as _storage
+ import tracdap.rt._impl.core.struct as _struct
+ import tracdap.rt._impl.core.type_system as _types
+ import tracdap.rt._impl.core.util as _util
+ import tracdap.rt._impl.core.validation as _val


  class TracContextImpl(_api.TracContext):
@@ -61,10 +65,15 @@ class TracContextImpl(_api.TracContext):
  model_class: _api.TracModel.__class__,
  local_ctx: tp.Dict[str, tp.Any],
  dynamic_outputs: tp.List[str] = None,
- checkout_directory: pathlib.Path = None):
+ checkout_directory: pathlib.Path = None,
+ log_provider: _logging.LogProvider = None):

- self.__ctx_log = _util.logger_for_object(self)
- self.__model_log = _util.logger_for_class(model_class)
+ # If no log provider is supplied, use the default (system logs only)
+ if log_provider is None:
+ log_provider = _logging.LogProvider()
+
+ self.__ctx_log = log_provider.logger_for_object(self)
+ self.__model_log = log_provider.logger_for_class(model_class)

  self.__model_def = model_def
  self.__model_class = model_class
@@ -82,9 +91,9 @@ class TracContextImpl(_api.TracContext):

  _val.validate_signature(self.get_parameter, parameter_name)

- self.__val.check_param_valid_identifier(parameter_name)
- self.__val.check_param_defined_in_model(parameter_name)
- self.__val.check_param_available_in_context(parameter_name)
+ self.__val.check_item_valid_identifier(parameter_name, TracContextValidator.PARAMETER)
+ self.__val.check_item_defined_in_model(parameter_name, TracContextValidator.PARAMETER)
+ self.__val.check_item_available_in_context(parameter_name, TracContextValidator.PARAMETER)

  value: _meta.Value = self.__local_ctx.get(parameter_name)

@@ -96,8 +105,8 @@ class TracContextImpl(_api.TracContext):

  _val.validate_signature(self.has_dataset, dataset_name)

- self.__val.check_dataset_valid_identifier(dataset_name)
- self.__val.check_dataset_defined_in_model(dataset_name)
+ self.__val.check_item_valid_identifier(dataset_name, TracContextValidator.DATASET)
+ self.__val.check_item_defined_in_model(dataset_name, TracContextValidator.DATASET)

  data_view: _data.DataView = self.__local_ctx.get(dataset_name)

@@ -105,6 +114,7 @@ class TracContextImpl(_api.TracContext):
  return False

  self.__val.check_context_object_type(dataset_name, data_view, _data.DataView)
+ self.__val.check_context_data_view_type(dataset_name, data_view, _meta.ObjectType.DATA)

  return not data_view.is_empty()

@@ -112,9 +122,9 @@ class TracContextImpl(_api.TracContext):

  _val.validate_signature(self.get_schema, dataset_name)

- self.__val.check_dataset_valid_identifier(dataset_name)
- self.__val.check_dataset_defined_in_model(dataset_name)
- self.__val.check_dataset_available_in_context(dataset_name)
+ self.__val.check_item_valid_identifier(dataset_name, TracContextValidator.DATASET)
+ self.__val.check_item_defined_in_model(dataset_name, TracContextValidator.DATASET)
+ self.__val.check_item_available_in_context(dataset_name, TracContextValidator.DATASET)

  static_schema = self.__get_static_schema(self.__model_def, dataset_name)
  data_view: _data.DataView = self.__local_ctx.get(dataset_name)
@@ -123,6 +133,7 @@ class TracContextImpl(_api.TracContext):
  # This ensures errors are always reported and is consistent with get_pandas_table()

  self.__val.check_context_object_type(dataset_name, data_view, _data.DataView)
+ self.__val.check_context_data_view_type(dataset_name, data_view, _meta.ObjectType.DATA)
  self.__val.check_dataset_schema_defined(dataset_name, data_view)

  # If a static schema exists, that takes priority
@@ -138,9 +149,9 @@ class TracContextImpl(_api.TracContext):
  _val.validate_signature(self.get_table, dataset_name, framework)
  _val.require_package(framework.protocol_name, framework.api_type)

- self.__val.check_dataset_valid_identifier(dataset_name)
- self.__val.check_dataset_defined_in_model(dataset_name)
- self.__val.check_dataset_available_in_context(dataset_name)
+ self.__val.check_item_valid_identifier(dataset_name, TracContextValidator.DATASET)
+ self.__val.check_item_defined_in_model(dataset_name, TracContextValidator.DATASET)
+ self.__val.check_item_available_in_context(dataset_name, TracContextValidator.DATASET)
  self.__val.check_data_framework_args(framework, framework_args)

  static_schema = self.__get_static_schema(self.__model_def, dataset_name)
@@ -150,6 +161,7 @@ class TracContextImpl(_api.TracContext):
  converter = _data.DataConverter.for_framework(framework, **framework_args)

  self.__val.check_context_object_type(dataset_name, data_view, _data.DataView)
+ self.__val.check_context_data_view_type(dataset_name, data_view, _meta.ObjectType.DATA)
  self.__val.check_dataset_schema_defined(dataset_name, data_view)
  self.__val.check_dataset_part_present(dataset_name, data_view, part_key)

@@ -174,6 +186,45 @@ class TracContextImpl(_api.TracContext):

  return self.get_table(dataset_name, _eapi.POLARS)

+ def get_struct(self, struct_name: str, python_class: type[_eapi.STRUCT_TYPE] = None) -> _eapi.STRUCT_TYPE:
+
+ _val.validate_signature(self.get_struct, struct_name, python_class)
+
+ self.__val.check_item_valid_identifier(struct_name, TracContextValidator.DATASET)
+ self.__val.check_item_defined_in_model(struct_name, TracContextValidator.DATASET)
+ self.__val.check_item_available_in_context(struct_name, TracContextValidator.DATASET)
+
+ data_view: _data.DataView = self.__local_ctx.get(struct_name)
+ part_key = _data.DataPartKey.for_root()
+
+ self.__val.check_context_object_type(struct_name, data_view, _data.DataView)
+ self.__val.check_context_data_view_type(struct_name, data_view, _meta.ObjectType.DATA)
+ self.__val.check_dataset_schema_defined(struct_name, data_view)
+
+ struct_data: dict = data_view.parts[part_key][0].content
+ return _struct.StructProcessor.parse_struct(struct_data, None, python_class)
+
+ def get_file(self, file_name: str) -> bytes:
+
+ _val.validate_signature(self.get_file, file_name)
+
+ self.__val.check_item_valid_identifier(file_name, TracContextValidator.FILE)
+ self.__val.check_item_defined_in_model(file_name, TracContextValidator.FILE)
+ self.__val.check_item_available_in_context(file_name, TracContextValidator.FILE)
+
+ file_view: _data.DataView = self.__local_ctx.get(file_name)
+
+ self.__val.check_context_object_type(file_name, file_view, _data.DataView)
+ self.__val.check_context_data_view_type(file_name, file_view, _meta.ObjectType.FILE)
+ self.__val.check_file_content_present(file_name, file_view)
+
+ return file_view.file_item.content
+
+ def get_file_stream(self, file_name: str) -> tp.ContextManager[tp.BinaryIO]:
+
+ buffer = self.get_file(file_name)
+ return contextlib.closing(io.BytesIO(buffer))
+
  def put_schema(self, dataset_name: str, schema: _meta.SchemaDefinition):

  _val.validate_signature(self.get_schema, dataset_name, schema)
@@ -182,7 +233,7 @@ class TracContextImpl(_api.TracContext):
  # If field ordering is not assigned by the model, assign it here (model code will not see the numbers)
  schema_copy = self.__assign_field_order(copy.deepcopy(schema))

- self.__val.check_dataset_valid_identifier(dataset_name)
+ self.__val.check_item_valid_identifier(dataset_name, TracContextValidator.DATASET)
  self.__val.check_dataset_is_dynamic_output(dataset_name)
  self.__val.check_provided_schema_is_valid(dataset_name, schema_copy)

@@ -197,6 +248,7 @@ class TracContextImpl(_api.TracContext):

  # If there is a prior view it must contain nothing and will be replaced
  self.__val.check_context_object_type(dataset_name, data_view, _data.DataView)
+ self.__val.check_context_data_view_type(dataset_name, data_view, _meta.ObjectType.DATA)
  self.__val.check_dataset_schema_not_defined(dataset_name, data_view)
  self.__val.check_dataset_is_empty(dataset_name, data_view)

@@ -216,8 +268,8 @@ class TracContextImpl(_api.TracContext):

  _val.require_package(framework.protocol_name, framework.api_type)

- self.__val.check_dataset_valid_identifier(dataset_name)
- self.__val.check_dataset_is_model_output(dataset_name)
+ self.__val.check_item_valid_identifier(dataset_name, TracContextValidator.DATASET)
+ self.__val.check_item_is_model_output(dataset_name, TracContextValidator.DATASET)
  self.__val.check_provided_dataset_type(dataset, framework.api_type)
  self.__val.check_data_framework_args(framework, framework_args)

@@ -234,19 +286,22 @@ class TracContextImpl(_api.TracContext):
  data_view = _data.DataView.create_empty()

  self.__val.check_context_object_type(dataset_name, data_view, _data.DataView)
+ self.__val.check_context_data_view_type(dataset_name, data_view, _meta.ObjectType.DATA)
  self.__val.check_dataset_schema_defined(dataset_name, data_view)
  self.__val.check_dataset_part_not_present(dataset_name, data_view, part_key)

  # Prefer static schemas for data conformance

  if static_schema is not None:
- schema = _data.DataMapping.trac_to_arrow_schema(static_schema)
+ trac_schema = static_schema
+ native_schema = _data.DataMapping.trac_to_arrow_schema(static_schema)
  else:
- schema = data_view.arrow_schema
+ trac_schema = _data.DataMapping.arrow_to_trac_schema(data_view.arrow_schema)
+ native_schema = data_view.arrow_schema

  # Data conformance is applied automatically inside the converter, if schema != None
- table = converter.to_internal(dataset, schema)
- item = _data.DataItem(schema, table)
+ table = converter.to_internal(dataset, native_schema)
+ item = _data.DataItem.for_table(table, native_schema, trac_schema)

  updated_view = _data.DataMapping.add_item_to_view(data_view, part_key, item)

@@ -260,6 +315,73 @@ class TracContextImpl(_api.TracContext):

  self.put_table(dataset_name, dataset, _eapi.POLARS)

+ def put_struct(self, struct_name: str, struct: _eapi.STRUCT_TYPE):
+
+ _val.validate_signature(self.put_struct, struct_name, struct)
+
+ self.__val.check_item_valid_identifier(struct_name, TracContextValidator.DATASET)
+ self.__val.check_item_is_model_output(struct_name, TracContextValidator.DATASET)
+
+ static_schema = self.__get_static_schema(self.__model_def, struct_name)
+ data_view = self.__local_ctx.get(struct_name)
+ part_key = _data.DataPartKey.for_root()
+
+ if data_view is None:
+ if static_schema is not None:
+ data_view = _data.DataView.for_trac_schema(static_schema)
+ else:
+ data_view = _data.DataView.create_empty()
+
+ self.__val.check_context_object_type(struct_name, data_view, _data.DataView)
+ self.__val.check_context_data_view_type(struct_name, data_view, _meta.ObjectType.DATA)
+ self.__val.check_dataset_schema_defined(struct_name, data_view)
+ self.__val.check_dataset_part_not_present(struct_name, data_view, part_key)
+
+ data_item = _data.DataItem.for_struct(struct)
+ updated_view = _data.DataMapping.add_item_to_view(data_view, part_key, data_item)
+
+ self.__local_ctx[struct_name] = updated_view
+
+ def put_file(self, file_name: str, file_content: tp.Union[bytes, bytearray]):
+
+ _val.validate_signature(self.put_file, file_name, file_content)
+
+ self.__val.check_item_valid_identifier(file_name, TracContextValidator.FILE)
+ self.__val.check_item_is_model_output(file_name, TracContextValidator.FILE)
+
+ file_view: _data.DataView = self.__local_ctx.get(file_name)
+
+ if file_view is None:
+ file_view = _data.DataView.create_empty(_meta.ObjectType.FILE)
+
+ self.__val.check_context_object_type(file_name, file_view, _data.DataView)
+ self.__val.check_context_data_view_type(file_name, file_view, _meta.ObjectType.FILE)
+ self.__val.check_file_content_not_present(file_name, file_view)
+
+ if isinstance(file_content, bytearray):
+ file_content = bytes(bytearray)
+
+ file_item = _data.DataItem.for_file_content(file_content)
+ self.__local_ctx[file_name] = file_view.with_file_item(file_item)
+
+ def put_file_stream(self, file_name: str) -> tp.ContextManager[tp.BinaryIO]:
+
+ _val.validate_signature(self.put_file_stream, file_name)
+
+ self.__val.check_item_valid_identifier(file_name, TracContextValidator.FILE)
+ self.__val.check_item_is_model_output(file_name, TracContextValidator.FILE)
+
+ @contextlib.contextmanager
+ def memory_stream(stream: io.BytesIO):
+ try:
+ yield stream
+ buffer = stream.getbuffer().tobytes()
+ self.put_file(file_name, buffer)
+ finally:
+ stream.close()
+
+ return memory_stream(io.BytesIO())
+
  def log(self) -> logging.Logger:

  _val.validate_signature(self.log)
@@ -300,9 +422,9 @@ class TracDataContextImpl(TracContextImpl, _eapi.TracDataContext):
  self, model_def: _meta.ModelDefinition, model_class: _api.TracModel.__class__,
  local_ctx: tp.Dict[str, tp.Any], dynamic_outputs: tp.List[str],
  storage_map: tp.Dict[str, tp.Union[_eapi.TracFileStorage, _eapi.TracDataStorage]],
- checkout_directory: pathlib.Path = None):
+ checkout_directory: pathlib.Path = None, log_provider: _logging.LogProvider = None):

- super().__init__(model_def, model_class, local_ctx, dynamic_outputs, checkout_directory)
+ super().__init__(model_def, model_class, local_ctx, dynamic_outputs, checkout_directory, log_provider)

  self.__model_def = model_def
  self.__local_ctx = local_ctx
@@ -310,7 +432,7 @@ class TracDataContextImpl(TracContextImpl, _eapi.TracDataContext):
  self.__storage_map = storage_map
  self.__checkout_directory = checkout_directory

- self.__val = self._TracContextImpl__val # noqa
+ self.__val: TracContextValidator = self._TracContextImpl__val # noqa

  def get_file_storage(self, storage_key: str) -> _eapi.TracFileStorage:

@@ -348,9 +470,9 @@ class TracDataContextImpl(TracContextImpl, _eapi.TracDataContext):

  _val.validate_signature(self.add_data_import, dataset_name)

- self.__val.check_dataset_valid_identifier(dataset_name)
- self.__val.check_dataset_not_defined_in_model(dataset_name)
- self.__val.check_dataset_not_available_in_context(dataset_name)
+ self.__val.check_item_valid_identifier(dataset_name, TracContextValidator.DATASET)
+ self.__val.check_item_not_defined_in_model(dataset_name, TracContextValidator.DATASET)
+ self.__val.check_item_not_available_in_context(dataset_name, TracContextValidator.DATASET)

  self.__local_ctx[dataset_name] = _data.DataView.create_empty()
  self.__dynamic_outputs.append(dataset_name)
@@ -359,8 +481,8 @@ class TracDataContextImpl(TracContextImpl, _eapi.TracDataContext):

  _val.validate_signature(self.set_source_metadata, dataset_name, storage_key, source_info)

- self.__val.check_dataset_valid_identifier(dataset_name)
- self.__val.check_dataset_available_in_context(dataset_name)
+ self.__val.check_item_valid_identifier(dataset_name, TracContextValidator.DATASET)
+ self.__val.check_item_available_in_context(dataset_name, TracContextValidator.DATASET)
  self.__val.check_storage_valid_identifier(storage_key)
  self.__val.check_storage_available(self.__storage_map, storage_key)

@@ -368,11 +490,11 @@ class TracDataContextImpl(TracContextImpl, _eapi.TracDataContext):

  if isinstance(storage, _eapi.TracFileStorage):
  if not isinstance(source_info, _eapi.FileStat):
- self.__val.report_public_error(f"Expected storage_info to be a FileStat, [{storage_key}] refers to file storage")
+ self.__val.report_public_error(_ex.ERuntimeValidation(f"Expected storage_info to be a FileStat, [{storage_key}] refers to file storage"))

  if isinstance(storage, _eapi.TracDataStorage):
  if not isinstance(source_info, str):
- self.__val.report_public_error(f"Expected storage_info to be a table name, [{storage_key}] refers to dadta storage")
+ self.__val.report_public_error(_ex.ERuntimeValidation(f"Expected storage_info to be a table name, [{storage_key}] refers to dadta storage"))

  pass # Not implemented yet, only required when imports are sent back to the platform

@@ -392,7 +514,9 @@ class TracDataContextImpl(TracContextImpl, _eapi.TracDataContext):

  class TracFileStorageImpl(_eapi.TracFileStorage):

- def __init__(self, storage_key: str, storage_impl: _storage.IFileStorage, write_access: bool, checkout_directory):
+ def __init__(
+ self, storage_key: str, storage_impl: _storage.IFileStorage,
+ write_access: bool, checkout_directory, log_provider: _logging.LogProvider):

  self.__storage_key = storage_key

@@ -413,7 +537,11 @@ class TracFileStorageImpl(_eapi.TracFileStorage):
  self.__rmdir = None
  self.__write_byte_stream = None

- self.__log = _util.logger_for_object(self)
+ # If no log provider is supplied, use the default (system logs only)
+ if log_provider is None:
+ log_provider = _logging.LogProvider()
+
+ self.__log = log_provider.logger_for_object(self)
  self.__val = TracStorageValidator(self.__log, checkout_directory, self.__storage_key)

  def get_storage_key(self) -> str:
@@ -534,7 +662,7 @@ class TracDataStorageImpl(_eapi.TracDataStorage[_eapi.DATA_API]):
  def __init__(
  self, storage_key: str, storage_impl: _storage.IDataStorageBase[_data.T_INTERNAL_DATA, _data.T_INTERNAL_SCHEMA],
  data_converter: _data.DataConverter[_eapi.DATA_API, _data.T_INTERNAL_DATA, _data.T_INTERNAL_SCHEMA],
- write_access: bool, checkout_directory):
+ write_access: bool, checkout_directory, log_provider: _logging.LogProvider):

  self.__storage_key = storage_key
  self.__converter = data_converter
@@ -551,7 +679,11 @@ class TracDataStorageImpl(_eapi.TracDataStorage[_eapi.DATA_API]):
  self.__create_table = None
  self.__write_table = None

- self.__log = _util.logger_for_object(self)
+ # If no log provider is supplied, use the default (system logs only)
+ if log_provider is None:
+ log_provider = _logging.LogProvider()
+
+ self.__log = log_provider.logger_for_object(self)
  self.__val = TracStorageValidator(self.__log, checkout_directory, self.__storage_key)

  def has_table(self, table_name: str) -> bool:
@@ -684,6 +816,10 @@ class TracContextErrorReporter:

  class TracContextValidator(TracContextErrorReporter):

+ PARAMETER = "Parameter"
+ DATASET = "Dataset"
+ FILE = "File"
+
  def __init__(
  self, log: logging.Logger,
  model_def: _meta.ModelDefinition,
@@ -697,49 +833,45 @@ class TracContextValidator(TracContextErrorReporter):
  self.__local_ctx = local_ctx
  self.__dynamic_outputs = dynamic_outputs

- def check_param_valid_identifier(self, param_name: str):
+ def check_item_valid_identifier(self, item_name: str, item_type: str):

- if param_name is None:
- self._report_error(f"Parameter name is null")
+ if item_name is None:
+ self._report_error(f"{item_type} name is null")

- if not self._VALID_IDENTIFIER.match(param_name):
- self._report_error(f"Parameter name {param_name} is not a valid identifier")
+ if not self._VALID_IDENTIFIER.match(item_name):
+ self._report_error(f"{item_type} name {item_name} is not a valid identifier")

- def check_param_defined_in_model(self, param_name: str):
+ def check_item_defined_in_model(self, item_name: str, item_type: str):

- if param_name not in self.__model_def.parameters:
- self._report_error(f"Parameter {param_name} is not defined in the model")
-
- def check_param_available_in_context(self, param_name: str):
-
- if param_name not in self.__local_ctx:
- self._report_error(f"Parameter {param_name} is not available in the current context")
-
- def check_dataset_valid_identifier(self, dataset_name: str):
+ if item_type == self.PARAMETER:
+ if item_name not in self.__model_def.parameters:
+ self._report_error(f"{item_type} {item_name} is not defined in the model")
+ else:
+ if item_name not in self.__model_def.inputs and item_name not in self.__model_def.outputs:
+ self._report_error(f"{item_type} {item_name} is not defined in the model")

- if dataset_name is None:
- self._report_error(f"Dataset name is null")
+ def check_item_not_defined_in_model(self, item_name: str, item_type: str):

- if not self._VALID_IDENTIFIER.match(dataset_name):
- self._report_error(f"Dataset name {dataset_name} is not a valid identifier")
+ if item_name in self.__model_def.inputs or item_name in self.__model_def.outputs:
+ self._report_error(f"{item_type} {item_name} is already defined in the model")

- def check_dataset_not_defined_in_model(self, dataset_name: str):
+ if item_name in self.__model_def.parameters:
+ self._report_error(f"{item_name} name {item_name} is already in use as a model parameter")

- if dataset_name in self.__model_def.inputs or dataset_name in self.__model_def.outputs:
- self._report_error(f"Dataset {dataset_name} is already defined in the model")
+ def check_item_is_model_output(self, item_name: str, item_type: str):

- if dataset_name in self.__model_def.parameters:
- self._report_error(f"Dataset name {dataset_name} is already in use as a model parameter")
+ if item_name not in self.__model_def.outputs and item_name not in self.__dynamic_outputs:
+ self._report_error(f"{item_type} {item_name} is not defined as a model output")

- def check_dataset_defined_in_model(self, dataset_name: str):
+ def check_item_available_in_context(self, item_name: str, item_type: str):

- if dataset_name not in self.__model_def.inputs and dataset_name not in self.__model_def.outputs:
- self._report_error(f"Dataset {dataset_name} is not defined in the model")
+ if item_name not in self.__local_ctx:
+ self._report_error(f"{item_type} {item_name} is not available in the current context")

- def check_dataset_is_model_output(self, dataset_name: str):
+ def check_item_not_available_in_context(self, item_name: str, item_type: str):

- if dataset_name not in self.__model_def.outputs and dataset_name not in self.__dynamic_outputs:
- self._report_error(f"Dataset {dataset_name} is not defined as a model output")
+ if item_name in self.__local_ctx:
+ self._report_error(f"{item_type} {item_name} already exists in the current context")

  def check_dataset_is_dynamic_output(self, dataset_name: str):

@@ -752,21 +884,17 @@ class TracContextValidator(TracContextErrorReporter):
  if model_output and not model_output.dynamic:
  self._report_error(f"Model output {dataset_name} is not a dynamic output")

- def check_dataset_available_in_context(self, item_name: str):
-
- if item_name not in self.__local_ctx:
- self._report_error(f"Dataset {item_name} is not available in the current context")
-
- def check_dataset_not_available_in_context(self, item_name: str):
-
- if item_name in self.__local_ctx:
- self._report_error(f"Dataset {item_name} already exists in the current context")
-
  def check_dataset_schema_defined(self, dataset_name: str, data_view: _data.DataView):

  schema = data_view.trac_schema if data_view is not None else None

- if schema is None or schema.table is None or not schema.table.fields:
+ if schema is None:
+ self._report_error(f"Schema not defined for dataset {dataset_name} in the current context")
+
+ if schema.schemaType == _meta.SchemaType.TABLE and (schema.table is None or not schema.table.fields):
+ self._report_error(f"Schema not defined for dataset {dataset_name} in the current context")
+
+ if schema.schemaType == _meta.SchemaType.STRUCT and (schema.struct is None or not schema.struct.fields):
  self._report_error(f"Schema not defined for dataset {dataset_name} in the current context")

  def check_dataset_schema_not_defined(self, dataset_name: str, data_view: _data.DataView):
@@ -834,6 +962,14 @@ class TracContextValidator(TracContextErrorReporter):
  f"The object referenced by [{item_name}] in the current context has the wrong type" +
  f" (expected {expected_type_name}, got {actual_type_name})")

+ def check_context_data_view_type(self, item_name: str, data_vew: _data.DataView, expected_type: _meta.ObjectType):
+
+ if data_vew.object_type != expected_type:
+
+ self._report_error(
+ f"The object referenced by [{item_name}] in the current context has the wrong type" +
+ f" (expected {expected_type.name}, got {data_vew.object_type.name})")
+
  def check_data_framework_args(self, framework: _eapi.DataFramework, framework_args: tp.Dict[str, tp.Any]):

  expected_args = _data.DataConverter.get_framework_args(framework)
@@ -861,6 +997,16 @@ class TracContextValidator(TracContextErrorReporter):
  f"Using [{framework}], argument [{arg_name}] has the wrong type" +
  f" (expected {expected_type_name}, got {actual_type_name})")

+ def check_file_content_present(self, file_name: str, file_view: _data.DataView):
+
+ if file_view.file_item is None or file_view.file_item.content is None:
+ self._report_error(f"File content is missing or empty for [{file_name}] in the current context")
+
+ def check_file_content_not_present(self, file_name: str, file_view: _data.DataView):
+
+ if file_view.file_item is not None and file_view.file_item.content is not None:
+ self._report_error(f"File content is already present for [{file_name}] in the current context")
+
  def check_storage_valid_identifier(self, storage_key):

  if storage_key is None:
@@ -878,7 +1024,7 @@ class TracContextValidator(TracContextErrorReporter):

  def check_storage_type(
  self, storage_map: tp.Dict, storage_key: str,
- storage_type: tp.Union[_eapi.TracFileStorage.__class__]):
+ storage_type: tp.Union[_eapi.TracFileStorage.__class__, _eapi.TracDataStorage.__class__]):

  storage_instance = storage_map.get(storage_key)