tracdap-runtime 0.6.1.dev3__py3-none-any.whl → 0.6.2__py3-none-any.whl

This diff compares two publicly released versions of the package, as published to one of the supported registries. It is provided for informational purposes only and reflects the changes between those versions exactly as they appear in the public registry.
Files changed (98)
  1. tracdap/rt/_exec/context.py +25 -1
  2. tracdap/rt/_exec/dev_mode.py +277 -213
  3. tracdap/rt/_exec/functions.py +37 -8
  4. tracdap/rt/_exec/graph.py +2 -0
  5. tracdap/rt/_exec/graph_builder.py +118 -56
  6. tracdap/rt/_exec/runtime.py +28 -0
  7. tracdap/rt/_exec/server.py +68 -0
  8. tracdap/rt/_impl/data.py +14 -0
  9. tracdap/rt/_impl/grpc/__init__.py +13 -0
  10. tracdap/rt/_impl/grpc/codec.py +44 -0
  11. tracdap/rt/_impl/grpc/tracdap/api/internal/runtime_pb2.py +51 -0
  12. tracdap/rt/_impl/grpc/tracdap/api/internal/runtime_pb2.pyi +59 -0
  13. tracdap/rt/_impl/grpc/tracdap/api/internal/runtime_pb2_grpc.py +183 -0
  14. tracdap/rt/_impl/grpc/tracdap/config/common_pb2.py +55 -0
  15. tracdap/rt/_impl/grpc/tracdap/config/common_pb2.pyi +103 -0
  16. tracdap/rt/_impl/grpc/tracdap/config/job_pb2.py +42 -0
  17. tracdap/rt/_impl/grpc/tracdap/config/job_pb2.pyi +44 -0
  18. tracdap/rt/_impl/grpc/tracdap/config/platform_pb2.py +71 -0
  19. tracdap/rt/_impl/grpc/tracdap/config/platform_pb2.pyi +197 -0
  20. tracdap/rt/_impl/grpc/tracdap/config/result_pb2.py +37 -0
  21. tracdap/rt/_impl/grpc/tracdap/config/result_pb2.pyi +35 -0
  22. tracdap/rt/_impl/grpc/tracdap/config/runtime_pb2.py +42 -0
  23. tracdap/rt/_impl/grpc/tracdap/config/runtime_pb2.pyi +46 -0
  24. tracdap/rt/_impl/grpc/tracdap/metadata/common_pb2.py +33 -0
  25. tracdap/rt/_impl/grpc/tracdap/metadata/common_pb2.pyi +34 -0
  26. tracdap/rt/{metadata → _impl/grpc/tracdap/metadata}/custom_pb2.py +5 -5
  27. tracdap/rt/_impl/grpc/tracdap/metadata/custom_pb2.pyi +15 -0
  28. tracdap/rt/_impl/grpc/tracdap/metadata/data_pb2.py +51 -0
  29. tracdap/rt/_impl/grpc/tracdap/metadata/data_pb2.pyi +115 -0
  30. tracdap/rt/_impl/grpc/tracdap/metadata/file_pb2.py +28 -0
  31. tracdap/rt/_impl/grpc/tracdap/metadata/file_pb2.pyi +22 -0
  32. tracdap/rt/_impl/grpc/tracdap/metadata/flow_pb2.py +59 -0
  33. tracdap/rt/_impl/grpc/tracdap/metadata/flow_pb2.pyi +109 -0
  34. tracdap/rt/_impl/grpc/tracdap/metadata/job_pb2.py +76 -0
  35. tracdap/rt/_impl/grpc/tracdap/metadata/job_pb2.pyi +177 -0
  36. tracdap/rt/_impl/grpc/tracdap/metadata/model_pb2.py +51 -0
  37. tracdap/rt/_impl/grpc/tracdap/metadata/model_pb2.pyi +92 -0
  38. tracdap/rt/_impl/grpc/tracdap/metadata/object_id_pb2.py +32 -0
  39. tracdap/rt/_impl/grpc/tracdap/metadata/object_id_pb2.pyi +68 -0
  40. tracdap/rt/_impl/grpc/tracdap/metadata/object_pb2.py +35 -0
  41. tracdap/rt/_impl/grpc/tracdap/metadata/object_pb2.pyi +35 -0
  42. tracdap/rt/_impl/grpc/tracdap/metadata/search_pb2.py +39 -0
  43. tracdap/rt/_impl/grpc/tracdap/metadata/search_pb2.pyi +83 -0
  44. tracdap/rt/_impl/grpc/tracdap/metadata/stoarge_pb2.py +50 -0
  45. tracdap/rt/_impl/grpc/tracdap/metadata/stoarge_pb2.pyi +89 -0
  46. tracdap/rt/_impl/grpc/tracdap/metadata/tag_pb2.py +34 -0
  47. tracdap/rt/_impl/grpc/tracdap/metadata/tag_pb2.pyi +26 -0
  48. tracdap/rt/_impl/grpc/tracdap/metadata/tag_update_pb2.py +30 -0
  49. tracdap/rt/_impl/grpc/tracdap/metadata/tag_update_pb2.pyi +34 -0
  50. tracdap/rt/_impl/grpc/tracdap/metadata/type_pb2.py +47 -0
  51. tracdap/rt/_impl/grpc/tracdap/metadata/type_pb2.pyi +101 -0
  52. tracdap/rt/_impl/guard_rails.py +5 -6
  53. tracdap/rt/_impl/static_api.py +10 -6
  54. tracdap/rt/_version.py +1 -1
  55. tracdap/rt/api/hook.py +6 -2
  56. tracdap/rt/api/model_api.py +22 -0
  57. tracdap/rt/api/static_api.py +14 -4
  58. tracdap/rt/config/__init__.py +3 -3
  59. tracdap/rt/config/platform.py +9 -9
  60. tracdap/rt/launch/cli.py +3 -5
  61. tracdap/rt/launch/launch.py +15 -3
  62. tracdap/rt/metadata/__init__.py +15 -15
  63. tracdap/rt/metadata/common.py +7 -7
  64. tracdap/rt/metadata/custom.py +2 -0
  65. tracdap/rt/metadata/data.py +28 -5
  66. tracdap/rt/metadata/file.py +2 -0
  67. tracdap/rt/metadata/flow.py +66 -4
  68. tracdap/rt/metadata/job.py +56 -16
  69. tracdap/rt/metadata/model.py +4 -0
  70. tracdap/rt/metadata/object_id.py +9 -9
  71. tracdap/rt/metadata/search.py +35 -13
  72. tracdap/rt/metadata/stoarge.py +64 -6
  73. tracdap/rt/metadata/tag_update.py +21 -7
  74. tracdap/rt/metadata/type.py +28 -13
  75. {tracdap_runtime-0.6.1.dev3.dist-info → tracdap_runtime-0.6.2.dist-info}/METADATA +22 -19
  76. tracdap_runtime-0.6.2.dist-info/RECORD +121 -0
  77. {tracdap_runtime-0.6.1.dev3.dist-info → tracdap_runtime-0.6.2.dist-info}/WHEEL +1 -1
  78. tracdap/rt/config/common_pb2.py +0 -55
  79. tracdap/rt/config/job_pb2.py +0 -42
  80. tracdap/rt/config/platform_pb2.py +0 -71
  81. tracdap/rt/config/result_pb2.py +0 -37
  82. tracdap/rt/config/runtime_pb2.py +0 -42
  83. tracdap/rt/metadata/common_pb2.py +0 -33
  84. tracdap/rt/metadata/data_pb2.py +0 -51
  85. tracdap/rt/metadata/file_pb2.py +0 -28
  86. tracdap/rt/metadata/flow_pb2.py +0 -55
  87. tracdap/rt/metadata/job_pb2.py +0 -76
  88. tracdap/rt/metadata/model_pb2.py +0 -51
  89. tracdap/rt/metadata/object_id_pb2.py +0 -32
  90. tracdap/rt/metadata/object_pb2.py +0 -35
  91. tracdap/rt/metadata/search_pb2.py +0 -39
  92. tracdap/rt/metadata/stoarge_pb2.py +0 -50
  93. tracdap/rt/metadata/tag_pb2.py +0 -34
  94. tracdap/rt/metadata/tag_update_pb2.py +0 -30
  95. tracdap/rt/metadata/type_pb2.py +0 -48
  96. tracdap_runtime-0.6.1.dev3.dist-info/RECORD +0 -96
  97. {tracdap_runtime-0.6.1.dev3.dist-info → tracdap_runtime-0.6.2.dist-info}/LICENSE +0 -0
  98. {tracdap_runtime-0.6.1.dev3.dist-info → tracdap_runtime-0.6.2.dist-info}/top_level.txt +0 -0
tracdap/rt/_exec/functions.py CHANGED
@@ -248,6 +248,10 @@ class DataViewFunc(NodeFunction[_data.DataView]):
  root_item = _ctx_lookup(self.node.root_item, ctx)
  root_part_key = _data.DataPartKey.for_root()

+ # Map empty item -> empty view (for optional inputs not supplied)
+ if root_item.is_empty():
+     return _data.DataView.create_empty()
+
  data_view = _data.DataView.for_trac_schema(self.node.schema)
  data_view = _data.DataMapping.add_item_to_view(data_view, root_part_key, root_item)

@@ -263,6 +267,10 @@ class DataItemFunc(NodeFunction[_data.DataItem]):

  data_view = _ctx_lookup(self.node.data_view_id, ctx)

+ # Map empty view -> empty item (for optional outputs not supplied)
+ if data_view.is_empty():
+     return _data.DataItem.create_empty()
+
  # TODO: Support selecting data item described by self.node

  # Selecting data item for part-root, delta=0
@@ -280,6 +288,12 @@ class DataResultFunc(NodeFunction[ObjectBundle]):

  def _execute(self, ctx: NodeContext) -> ObjectBundle:

+     data_item = _ctx_lookup(self.node.data_item_id, ctx)
+
+     # Do not record output metadata for optional outputs that are empty
+     if data_item.is_empty():
+         return {}
+
      data_spec = _ctx_lookup(self.node.data_spec_id, ctx)

      # TODO: Check result of save operation
@@ -451,6 +465,13 @@ class SaveDataFunc(NodeFunction[None], _LoadSaveDataFunc):

  def _execute(self, ctx: NodeContext):

+     # Item to be saved should exist in the current context
+     data_item = _ctx_lookup(self.node.data_item_id, ctx)
+
+     # Do not save empty outputs (optional outputs that were not produced)
+     if data_item.is_empty():
+         return
+
      # This function assumes that metadata has already been generated as the data_spec
      # i.e. it is already known which incarnation / copy of the data will be created

@@ -458,9 +479,6 @@ class SaveDataFunc(NodeFunction[None], _LoadSaveDataFunc):
  data_copy = self._choose_copy(data_spec.data_item, data_spec.storage_def)
  data_storage = self.storage.get_data_storage(data_copy.storageKey)

- # Item to be saved should exist in the current context
- data_item = _ctx_lookup(self.node.data_item_id, ctx)
-
  # Current implementation will always put an Arrow table in the data item
  # Empty tables are allowed, so explicitly check if table is None
  # Testing "if not data_item.table" will fail for empty tables
@@ -567,12 +585,23 @@ class RunModelFunc(NodeFunction[Bundle[_data.DataView]]):
  msg = f"There was an unhandled error in the model: {str(e)}{details}"
  raise _ex.EModelExec(msg) from e

- # The node result is just the model outputs taken from the local context
- model_outputs: Bundle[_data.DataView] = {
-     name: obj for name, obj in local_ctx.items()
-     if name in self.node.model_def.outputs}
+ # Check required outputs are present and build the results bundle
+
+ results: Bundle[_data.DataView] = dict()
+
+ for output_name, output_schema in model_def.outputs.items():
+
+     result: _data.DataView = local_ctx.get(output_name)
+
+     if result is None or result.is_empty():
+         if not output_schema.optional:
+             model_name = self.model_class.__name__
+             raise _ex.ERuntimeValidation(f"Missing required output [{output_name}] from model [{model_name}]")
+
+     if result is not None:
+         results[output_name] = result

- return model_outputs
+ return results


  # ----------------------------------------------------------------------------------------------------------------------
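The new output check distinguishes required outputs (missing ones raise ERuntimeValidation) from optional outputs (missing ones are simply dropped from the results bundle). A minimal standalone sketch of the same pattern, using simplified stand-in types rather than the real Bundle[_data.DataView] machinery:

    # Sketch of the required-output check, with stand-in types (not the real TRAC classes)
    import dataclasses as dc
    import typing as tp

    @dc.dataclass
    class OutputSchema:
        optional: bool = False

    def collect_outputs(
            declared: tp.Dict[str, OutputSchema],
            local_ctx: tp.Dict[str, tp.Any]) -> tp.Dict[str, tp.Any]:

        results = {}

        for name, schema in declared.items():
            result = local_ctx.get(name)
            if result is None:
                # Required outputs must be present, optional outputs are simply dropped
                if not schema.optional:
                    raise RuntimeError(f"Missing required output [{name}]")
            else:
                results[name] = result

        return results

    # An optional output the model never produced is omitted without error
    outputs = collect_outputs(
        {"main_result": OutputSchema(), "debug_dump": OutputSchema(optional=True)},
        {"main_result": object()})

    assert "debug_dump" not in outputs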
tracdap/rt/_exec/graph.py CHANGED
@@ -297,6 +297,7 @@ class DataItemNode(MappingNode[_data.DataItem]):
  class DataResultNode(Node[ObjectBundle]):

      output_name: str
+     data_item_id: NodeId[_data.DataItem]
      data_spec_id: NodeId[_data.DataSpec]
      data_save_id: NodeId[type(None)]

@@ -306,6 +307,7 @@ class DataResultNode(Node[ObjectBundle]):
  def _node_dependencies(self) -> tp.Dict[NodeId, DependencyType]:

      return {
+         self.data_item_id: DependencyType.HARD,
          self.data_spec_id: DependencyType.HARD,
          self.data_save_id: DependencyType.HARD}

tracdap/rt/_exec/graph_builder.py CHANGED
@@ -14,9 +14,6 @@

  from __future__ import annotations

- import copy
- import dataclasses  # noqa
-
  import tracdap.rt.config as config
  import tracdap.rt.exceptions as _ex
  import tracdap.rt._impl.data as _data  # noqa
@@ -123,12 +120,14 @@ class GraphBuilder:
      job_namespace: NodeNamespace, job_push_id: NodeId) \
      -> GraphSection:

+     target_selector = job_config.job.runModel.model
+     target_obj = _util.get_job_resource(target_selector, job_config)
+     target_def = target_obj.model
+     job_def = job_config.job.runModel
+
      return cls.build_calculation_job(
          job_config, result_spec, job_namespace, job_push_id,
-         job_config.job.runModel.model,
-         job_config.job.runModel.parameters,
-         job_config.job.runModel.inputs,
-         job_config.job.runModel.outputs)
+         target_selector, target_def, job_def)

  @classmethod
  def build_run_flow_job(
@@ -136,40 +135,53 @@ class GraphBuilder:
      job_namespace: NodeNamespace, job_push_id: NodeId) \
      -> GraphSection:

+     target_selector = job_config.job.runFlow.flow
+     target_obj = _util.get_job_resource(target_selector, job_config)
+     target_def = target_obj.flow
+     job_def = job_config.job.runFlow
+
      return cls.build_calculation_job(
          job_config, result_spec, job_namespace, job_push_id,
-         job_config.job.runFlow.flow,
-         job_config.job.runFlow.parameters,
-         job_config.job.runFlow.inputs,
-         job_config.job.runFlow.outputs)
+         target_selector, target_def, job_def)

  @classmethod
  def build_calculation_job(
      cls, job_config: config.JobConfig, result_spec: JobResultSpec,
      job_namespace: NodeNamespace, job_push_id: NodeId,
-     target: meta.TagSelector, parameters: tp.Dict[str, meta.Value],
-     inputs: tp.Dict[str, meta.TagSelector], outputs: tp.Dict[str, meta.TagSelector]) \
+     target_selector: meta.TagSelector,
+     target_def: tp.Union[meta.ModelDefinition, meta.FlowDefinition],
+     job_def: tp.Union[meta.RunModelJob, meta.RunFlowJob]) \
      -> GraphSection:

      # The main execution graph can run directly in the job context, no need to do a context push
      # since inputs and outputs in this context line up with the top level execution task

+     # Required / provided items are the same for RUN_MODEL and RUN_FLOW jobs
+
+     required_params = target_def.parameters
+     required_inputs = target_def.inputs
+     required_outputs = target_def.outputs
+
+     provided_params = job_def.parameters
+     provided_inputs = job_def.inputs
+     provided_outputs = job_def.outputs
+
      params_section = cls.build_job_parameters(
-         job_namespace, parameters,
+         job_namespace, required_params, provided_params,
          explicit_deps=[job_push_id])

      input_section = cls.build_job_inputs(
-         job_config, job_namespace, inputs,
+         job_config, job_namespace, required_inputs, provided_inputs,
          explicit_deps=[job_push_id])

-     exec_obj = _util.get_job_resource(target, job_config)
+     exec_obj = _util.get_job_resource(target_selector, job_config)

      exec_section = cls.build_model_or_flow(
          job_config, job_namespace, exec_obj,
          explicit_deps=[job_push_id])

      output_section = cls.build_job_outputs(
-         job_config, job_namespace, outputs,
+         job_config, job_namespace, required_outputs, provided_outputs,
          explicit_deps=[job_push_id])

      main_section = cls._join_sections(params_section, input_section, exec_section, output_section)
@@ -190,13 +202,22 @@ class GraphBuilder:
  @classmethod
  def build_job_parameters(
      cls, job_namespace: NodeNamespace,
-     parameters: tp.Dict[str, meta.Value],
+     required_params: tp.Dict[str, meta.ModelParameter],
+     supplied_params: tp.Dict[str, meta.Value],
      explicit_deps: tp.Optional[tp.List[NodeId]] = None) \
      -> GraphSection:

      nodes = dict()

-     for param_name, param_def in parameters.items():
+     for param_name, param_schema in required_params.items():
+
+         param_def = supplied_params.get(param_name)
+
+         if param_def is None:
+             if param_schema.defaultValue is not None:
+                 param_def = param_schema.defaultValue
+             else:
+                 raise _ex.EJobValidation(f"Missing required parameter: [{param_name}]")

          param_id = NodeId(param_name, job_namespace, meta.Value)
          param_node = StaticValueNode(param_id, param_def, explicit_deps=explicit_deps)
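The loop above resolves each declared parameter in order of precedence: a supplied value wins, a schema default fills the gap, and anything else is a job validation failure. A self-contained sketch of the same rule, with a stand-in for meta.ModelParameter (the real code wraps each resolved value in a StaticValueNode rather than returning a dict):

    # Sketch of the parameter fallback rule, with a stand-in for meta.ModelParameter
    import dataclasses as dc
    import typing as tp

    @dc.dataclass
    class ParamSchema:
        defaultValue: tp.Optional[object] = None

    def resolve_params(
            required: tp.Dict[str, ParamSchema],
            supplied: tp.Dict[str, object]) -> tp.Dict[str, object]:

        resolved = {}

        for name, schema in required.items():
            value = supplied.get(name)
            if value is None:
                if schema.defaultValue is not None:
                    value = schema.defaultValue  # fall back to the model's default
                else:
                    raise ValueError(f"Missing required parameter: [{name}]")
            resolved[name] = value

        return resolved

    # A parameter with a default may be omitted, one without a default may not
    params = resolve_params(
        {"cutoff": ParamSchema(defaultValue=0.5), "region": ParamSchema()},
        {"region": "EU"})

    assert params == {"cutoff": 0.5, "region": "EU"}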
@@ -208,7 +229,8 @@ class GraphBuilder:
  @classmethod
  def build_job_inputs(
      cls, job_config: config.JobConfig, job_namespace: NodeNamespace,
-     inputs: tp.Dict[str, meta.TagSelector],
+     required_inputs: tp.Dict[str, meta.ModelInputSchema],
+     supplied_inputs: tp.Dict[str, meta.TagSelector],
      explicit_deps: tp.Optional[tp.List[NodeId]] = None) \
      -> GraphSection:

@@ -216,7 +238,18 @@ class GraphBuilder:
      outputs = set()
      must_run = list()

-     for input_name, data_selector in inputs.items():
+     for input_name, input_schema in required_inputs.items():
+
+         data_selector = supplied_inputs.get(input_name)
+
+         if data_selector is None:
+             if input_schema.optional:
+                 data_view_id = NodeId.of(input_name, job_namespace, _data.DataView)
+                 nodes[data_view_id] = StaticValueNode(data_view_id, _data.DataView.create_empty())
+                 outputs.add(data_view_id)
+                 continue
+             else:
+                 raise _ex.EJobValidation(f"Missing required input: [{input_name}]")

          # Build a data spec using metadata from the job config
          # For now we are always loading the root part, snap 0, delta 0
@@ -258,14 +291,24 @@ class GraphBuilder:
  @classmethod
  def build_job_outputs(
      cls, job_config: config.JobConfig, job_namespace: NodeNamespace,
-     outputs: tp.Dict[str, meta.TagSelector],
+     required_outputs: tp.Dict[str, meta.ModelOutputSchema],
+     supplied_outputs: tp.Dict[str, meta.TagSelector],
      explicit_deps: tp.Optional[tp.List[NodeId]] = None) \
      -> GraphSection:

      nodes = {}
      inputs = set()

-     for output_name, data_selector in outputs.items():
+     for output_name, output_schema in required_outputs.items():
+
+         data_selector = supplied_outputs.get(output_name)
+
+         if data_selector is None:
+             if output_schema.optional:
+                 optional_info = "(configuration is required for all optional outputs, in case they are produced)"
+                 raise _ex.EJobValidation(f"Missing optional output: [{output_name}] {optional_info}")
+             else:
+                 raise _ex.EJobValidation(f"Missing required output: [{output_name}]")

          # Output data view must already exist in the namespace
          data_view_id = NodeId.of(output_name, job_namespace, _data.DataView)
@@ -323,7 +366,8 @@ class GraphBuilder:

  data_result_id = NodeId.of(f"{output_name}:RESULT", job_namespace, ObjectBundle)
  data_result_node = DataResultNode(
-     data_result_id, output_name, data_spec_id, data_save_id,
+     data_result_id, output_name,
+     data_item_id, data_spec_id, data_save_id,
      output_data_key, output_storage_key)

  nodes[data_spec_id] = data_spec_node
@@ -458,10 +502,10 @@ class GraphBuilder:
      frozenset(parameter_ids), frozenset(input_ids),
      explicit_deps=explicit_deps, bundle=model_id.namespace)

- module_result_id = NodeId(f"{model_name}:RESULT", namespace)
- model_result_node = RunModelResultNode(module_result_id, model_id)
+ model_result_id = NodeId(f"{model_name}:RESULT", namespace)
+ model_result_node = RunModelResultNode(model_result_id, model_id)

- nodes = {model_id: model_node, module_result_id: model_result_node}
+ nodes = {model_id: model_node, model_result_id: model_result_node}

  # Create nodes for each model output
  # The model node itself outputs a bundle (dictionary of named outputs)
@@ -474,7 +518,7 @@ class GraphBuilder:
  nodes[output_id] = BundleItemNode(output_id, model_id, output_id.name)

  # Assemble a graph to include the model and its outputs
- return GraphSection(nodes, inputs={*parameter_ids, *input_ids}, outputs=output_ids, must_run=[module_result_id])
+ return GraphSection(nodes, inputs={*parameter_ids, *input_ids}, outputs=output_ids, must_run=[model_result_id])

  @classmethod
  def build_flow(
@@ -488,7 +532,7 @@ class GraphBuilder:

  # https://en.wikipedia.org/wiki/Topological_sorting#Kahn's_algorithm

- remaining_nodes = copy.copy(flow_def.nodes)
+ # Group edges by source and target node
  remaining_edges_by_target = {edge.target.node: [] for edge in flow_def.edges}
  remaining_edges_by_source = {edge.source.node: [] for edge in flow_def.edges}

@@ -496,16 +540,14 @@ class GraphBuilder:
  remaining_edges_by_target[edge.target.node].append(edge)
  remaining_edges_by_source[edge.source.node].append(edge)

- reachable_nodes = dict()
-
- # Initial set of reachable flow nodes is just the input nodes
- for node_name, node in list(remaining_nodes.items()):
-     if node.nodeType == meta.FlowNodeType.INPUT_NODE:
-         reachable_nodes[node_name] = node
-         del remaining_nodes[node_name]
-
+ # Group edges by target socket (only one edge per target in a consistent flow)
  target_edges = {socket_key(edge.target): edge for edge in flow_def.edges}

+ # Initially parameters and inputs are reachable, everything else is not
+ def is_input(n): return n[1].nodeType in [meta.FlowNodeType.PARAMETER_NODE, meta.FlowNodeType.INPUT_NODE]
+ reachable_nodes = dict(filter(is_input, flow_def.nodes.items()))
+ remaining_nodes = dict(filter(lambda n: not is_input(n), flow_def.nodes.items()))
+
  # Initial graph section for the flow is empty
  graph_section = GraphSection({}, must_run=explicit_deps)

@@ -559,10 +601,16 @@ class GraphBuilder:
      return NodeId(socket_name, namespace, result_type)

  def edge_mapping(node_: str, socket_: str = None, result_type=None):
-     socket = meta.FlowSocket(node_, socket_)
-     edge = target_edges.get(socket_key(socket))  # todo: inconsistent if missing
+     socket = socket_key(meta.FlowSocket(node_, socket_))
+     edge = target_edges.get(socket)
+     # Report missing edges as a job consistency error (this might happen sometimes in dev mode)
+     if edge is None:
+         raise _ex.EJobValidation(f"Inconsistent flow: Socket [{socket}] is not connected")
      return socket_id(edge.source.node, edge.source.socket, result_type)

+ if node.nodeType == meta.FlowNodeType.PARAMETER_NODE:
+     return GraphSection({}, inputs={NodeId(node_name, namespace, result_type=meta.Value)})
+
  if node.nodeType == meta.FlowNodeType.INPUT_NODE:
      return GraphSection({}, inputs={NodeId(node_name, namespace, result_type=_data.DataView)})

@@ -573,32 +621,46 @@ class GraphBuilder:

  if node.nodeType == meta.FlowNodeType.MODEL_NODE:

-     model_selector = flow_job.models.get(node_name)
-     model_obj = _util.get_job_resource(model_selector, job_config)
-
-     # TODO: Whether to use flow node or model_obj to build the push mapping?
+     param_mapping = {socket: edge_mapping(node_name, socket, meta.Value) for socket in node.parameters}
+     input_mapping = {socket: edge_mapping(node_name, socket, _data.DataView) for socket in node.inputs}
+     output_mapping = {socket: socket_id(node_name, socket, _data.DataView) for socket in node.outputs}

-     input_mapping_ = {
-         input_name: edge_mapping(node_name, input_name, _data.DataView)
-         for input_name in model_obj.model.inputs
-     }
+     push_mapping = {**input_mapping, **param_mapping}
+     pop_mapping = output_mapping

-     param_mapping_ = {
-         param_name: NodeId(param_name, namespace, meta.Value)
-         for param_name in model_obj.model.parameters
-     }
+     model_selector = flow_job.models.get(node_name)
+     model_obj = _util.get_job_resource(model_selector, job_config)

-     push_mapping = {**input_mapping_, **param_mapping_}
+     # A missing model in the job config is a job consistency error
+     if model_obj is None or model_obj.objectType != meta.ObjectType.MODEL:
+         raise _ex.EJobValidation(f"No model was provided for flow node [{node_name}]")

-     pop_mapping = {
-         output_: NodeId(f"{node_name}.{output_}", namespace, _data.DataView)
-         for output_ in model_obj.model.outputs}
+     # Explicit check for model compatibility - report an error now, do not try build_model()
+     cls.check_model_compatibility(model_selector, model_obj.model, node_name, node)

      return cls.build_model_or_flow_with_context(
          job_config, namespace, node_name, model_obj,
          push_mapping, pop_mapping, explicit_deps)

- raise _ex.ETracInternal()  # TODO: Invalid node type
+ # Missing / invalid node type - should be caught in static validation
+ raise _ex.ETracInternal(f"Flow node [{node_name}] has invalid node type [{node.nodeType}]")
+
+ @classmethod
+ def check_model_compatibility(
+     cls, model_selector: meta.TagSelector, model_def: meta.ModelDefinition,
+     node_name: str, flow_node: meta.FlowNode):
+
+     model_params = list(sorted(model_def.parameters.keys()))
+     model_inputs = list(sorted(model_def.inputs.keys()))
+     model_outputs = list(sorted(model_def.outputs.keys()))
+
+     node_params = list(sorted(flow_node.parameters))
+     node_inputs = list(sorted(flow_node.inputs))
+     node_outputs = list(sorted(flow_node.outputs))
+
+     if model_params != node_params or model_inputs != node_inputs or model_outputs != node_outputs:
+         model_key = _util.object_key(model_selector)
+         raise _ex.EJobValidation(f"Incompatible model for flow node [{node_name}] (Model: [{model_key}])")

  @staticmethod
  def build_context_push(
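The flow builder walks the graph with a Kahn-style traversal: parameter and input nodes start out reachable, and each remaining node becomes reachable once all of its incoming edges have been consumed. A self-contained sketch of that propagation, simplified to plain node names with no sockets or node types:

    # Simplified Kahn-style traversal, mirroring the reachability loop used to build flows
    def topological_order(nodes, edges):
        # edges is a list of (source, target) pairs between named nodes
        incoming = {n: 0 for n in nodes}
        outgoing = {n: [] for n in nodes}
        for src, tgt in edges:
            incoming[tgt] += 1
            outgoing[src].append(tgt)

        # Nodes with no incoming edges (parameters / inputs) are reachable immediately
        reachable = [n for n in nodes if incoming[n] == 0]
        ordered = []

        while reachable:
            node = reachable.pop()
            ordered.append(node)
            for tgt in outgoing[node]:
                incoming[tgt] -= 1
                if incoming[tgt] == 0:
                    reachable.append(tgt)

        # Leftover nodes mean a cycle or a disconnected section - a job consistency error
        if len(ordered) != len(nodes):
            raise ValueError("Inconsistent flow")

        return ordered

    assert topological_order(
        ["in", "model", "out"],
        [("in", "model"), ("model", "out")]) == ["in", "model", "out"]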
tracdap/rt/_exec/runtime.py CHANGED
@@ -90,6 +90,10 @@ class TracRuntime:
  self._scratch_dir_provided = True if scratch_dir is not None else False
  self._scratch_dir_persist = scratch_dir_persist
  self._dev_mode = dev_mode
+ self._server_enabled = False
+ self._server_port = 0
+
+ self._pre_start_complete = False

  # Top level resources
  self._models: tp.Optional[_models.ModelLoader] = None
@@ -100,6 +104,9 @@ class TracRuntime:
  self._engine: tp.Optional[_engine.TracEngine] = None
  self._engine_event = threading.Condition()

+ # Runtime API server
+ self._server = None
+
  self._jobs: tp.Dict[str, _RuntimeJobInfo] = dict()

  # ------------------------------------------------------------------------------------------------------------------
@@ -152,6 +159,8 @@ class TracRuntime:
      config_dir = self._sys_config_path.parent if self._sys_config_path is not None else None
      self._sys_config = _dev_mode.DevModeTranslator.translate_sys_config(self._sys_config, config_dir)

+     self._pre_start_complete = True
+
  except Exception as e:
      self._handle_startup_error(e)

@@ -159,6 +168,10 @@ class TracRuntime:

  try:

+     # Ensure pre-start has been run
+     if not self._pre_start_complete:
+         self.pre_start()
+
      self._log.info("Starting the engine...")

      self._models = _models.ModelLoader(self._sys_config, self._scratch_dir)
@@ -175,11 +188,26 @@ class TracRuntime:

      self._system.start(wait=wait)

+     # If the runtime server has been enabled, start it up
+     if self._server_enabled:
+
+         self._log.info("Starting the runtime API server...")
+
+         # The server module pulls in all the gRPC dependencies, don't import it unless we have to
+         import tracdap.rt._exec.server as _server
+
+         self._server = _server.RuntimeApiServer(self._server_port)
+         self._server.start()
+
  except Exception as e:
      self._handle_startup_error(e)

  def stop(self, due_to_error=False):

+     if self._server is not None:
+         self._log.info("Stopping the runtime API server...")
+         self._server.stop()
+
      if due_to_error:
          self._log.info("Shutting down the engine in response to an error")
      else:
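The new _pre_start_complete flag makes start() safe to call whether or not the caller invoked pre_start() first. A generic sketch of that guard pattern, using a stand-in class rather than the real TracRuntime (note the diff does not show how _server_enabled gets switched on):

    # Generic sketch of the idempotent pre-start guard added to TracRuntime.start()
    class Service:

        def __init__(self):
            self._pre_start_complete = False

        def pre_start(self):
            # One-time setup (config loading, dev-mode translation) would happen here
            self._pre_start_complete = True

        def start(self):
            # Ensure pre-start has been run, even if the caller skipped it
            if not self._pre_start_complete:
                self.pre_start()

    svc = Service()
    svc.start()  # pre_start() is triggered implicitly
    assert svc._pre_start_complete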
tracdap/rt/_exec/server.py ADDED
@@ -0,0 +1,68 @@
+ # Copyright 2024 Accenture Global Solutions Limited
+ #
+ # Licensed under the Apache License, Version 2.0 (the "License");
+ # you may not use this file except in compliance with the License.
+ # You may obtain a copy of the License at
+ #
+ # http://www.apache.org/licenses/LICENSE-2.0
+ #
+ # Unless required by applicable law or agreed to in writing, software
+ # distributed under the License is distributed on an "AS IS" BASIS,
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ # See the License for the specific language governing permissions and
+ # limitations under the License.
+
+ import typing as tp
+ import concurrent.futures as futures
+
+ # Imports for gRPC generated code, these are managed by build_runtime.py for distribution
+ import tracdap.rt._impl.grpc.tracdap.api.internal.runtime_pb2 as runtime_pb2
+ import tracdap.rt._impl.grpc.tracdap.api.internal.runtime_pb2_grpc as runtime_grpc
+ import grpc
+
+
+ class RuntimeApiServer(runtime_grpc.TracRuntimeApiServicer):
+
+     __THREAD_POOL_DEFAULT_SIZE = 2
+     __THREAD_NAME_PREFIX = "server-"
+     __DEFAULT_SHUTDOWN_TIMEOUT = 10.0  # seconds
+
+     def __init__(self, port: int, n_workers: int = None):
+         self.__port = port
+         self.__n_workers = n_workers or self.__THREAD_POOL_DEFAULT_SIZE
+         self.__server: tp.Optional[grpc.Server] = None
+         self.__thread_pool: tp.Optional[futures.ThreadPoolExecutor] = None
+
+     def listJobs(self, request, context):
+         return super().listJobs(request, context)
+
+     def getJobStatus(self, request: runtime_pb2.BatchJobStatusRequest, context: grpc.ServicerContext):
+         return super().getJobStatus(request, context)
+
+     def getJobDetails(self, request, context):
+         return super().getJobDetails(request, context)
+
+     def start(self):
+
+         self.__thread_pool = futures.ThreadPoolExecutor(
+             max_workers=self.__n_workers,
+             thread_name_prefix=self.__THREAD_NAME_PREFIX)
+
+         self.__server = grpc.server(self.__thread_pool)
+
+         socket = f"[::]:{self.__port}"
+         self.__server.add_insecure_port(socket)
+
+         runtime_grpc.add_TracRuntimeApiServicer_to_server(self, self.__server)
+
+         self.__server.start()
+
+     def stop(self, shutdown_timeout: float = None):
+
+         grace = shutdown_timeout or self.__DEFAULT_SHUTDOWN_TIMEOUT
+
+         if self.__server is not None:
+             self.__server.stop(grace)
+
+         if self.__thread_pool is not None:
+             self.__thread_pool.shutdown()
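A usage sketch for the new server, based only on the constructor and methods shown above. The port is illustrative, and the three service methods are still stubs that fall through to gRPC's default UNIMPLEMENTED behaviour:

    from tracdap.rt._exec.server import RuntimeApiServer

    server = RuntimeApiServer(port=9000)  # illustrative port; n_workers defaults to 2
    server.start()                        # binds [::]:9000 and starts serving

    # ... runtime handles jobs while the API server is up ...

    server.stop()  # graceful stop, default grace period of 10 seconds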
tracdap/rt/_impl/data.py CHANGED
@@ -58,6 +58,13 @@ class DataItem:
  pandas: tp.Optional[pd.DataFrame] = None
  pyspark: tp.Any = None

+ def is_empty(self) -> bool:
+     return self.table is None and (self.batches is None or len(self.batches) == 0)
+
+ @staticmethod
+ def create_empty() -> DataItem:
+     return DataItem(pa.schema([]))
+

  @dc.dataclass(frozen=True)
  class DataView:
@@ -72,6 +79,13 @@ class DataView:
  arrow_schema = DataMapping.trac_to_arrow_schema(trac_schema)
  return DataView(trac_schema, arrow_schema, dict())

+ def is_empty(self) -> bool:
+     return self.parts is None or len(self.parts) == 0
+
+ @staticmethod
+ def create_empty() -> DataView:
+     return DataView(_meta.SchemaDefinition(), pa.schema([]), dict())
+

  class _DataInternal:
      pass
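These two helper pairs are the hinge for the optional input/output handling in functions.py and graph_builder.py: a view with no parts, or an item with no table and no batches, reads as "not supplied". A quick usage sketch:

    import tracdap.rt._impl.data as _data

    view = _data.DataView.create_empty()
    assert view.is_empty()  # no parts -> optional input treated as not supplied

    item = _data.DataItem.create_empty()
    assert item.is_empty()  # no table or batches -> nothing is saved or recorded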
tracdap/rt/_impl/grpc/__init__.py ADDED
@@ -0,0 +1,13 @@
+ # Copyright 2024 Accenture Global Solutions Limited
+ #
+ # Licensed under the Apache License, Version 2.0 (the "License");
+ # you may not use this file except in compliance with the License.
+ # You may obtain a copy of the License at
+ #
+ # http://www.apache.org/licenses/LICENSE-2.0
+ #
+ # Unless required by applicable law or agreed to in writing, software
+ # distributed under the License is distributed on an "AS IS" BASIS,
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ # See the License for the specific language governing permissions and
+ # limitations under the License.
tracdap/rt/_impl/grpc/codec.py ADDED
@@ -0,0 +1,44 @@
+ # Copyright 2024 Accenture Global Solutions Limited
+ #
+ # Licensed under the Apache License, Version 2.0 (the "License");
+ # you may not use this file except in compliance with the License.
+ # You may obtain a copy of the License at
+ #
+ # http://www.apache.org/licenses/LICENSE-2.0
+ #
+ # Unless required by applicable law or agreed to in writing, software
+ # distributed under the License is distributed on an "AS IS" BASIS,
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ # See the License for the specific language governing permissions and
+ # limitations under the License.
+
+ import enum
+ import typing as tp
+
+
+ def encode(obj: tp.Any) -> tp.Any:
+
+     # Translate TRAC domain objects into generic dict / list structures
+     # These can be accepted by gRPC message constructors, do not try to build messages directly
+     # Use shallow copies and builtins to minimize performance impact
+
+     if obj is None:
+         return None
+
+     if isinstance(obj, str) or isinstance(obj, bool) or isinstance(obj, int) or isinstance(obj, float):
+         return obj
+
+     if isinstance(obj, enum.Enum):
+         return obj.value
+
+     if isinstance(obj, list):
+         return list(map(encode, obj))
+
+     if isinstance(obj, dict):
+         return dict(map(lambda kv: (kv[0], encode(kv[1])), obj.items()))
+
+     # Filter classes for TRAC domain objects (sanity check, not a watertight validation)
+     if hasattr(obj, "__module__") and "tracdap" in obj.__module__:
+         return dict(map(lambda kv: (kv[0], encode(kv[1])), obj.__dict__.items()))
+
+     raise RuntimeError(f"Cannot encode object of type [{type(obj).__name__}] for gRPC")
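A usage sketch for encode(); the enum here is an illustrative stand-in, not a real tracdap type. Only builtins, enums, lists, dicts and tracdap domain objects are accepted, anything else raises:

    import enum
    from tracdap.rt._impl.grpc.codec import encode

    class JobStatusCode(enum.Enum):  # illustrative stand-in for a tracdap enum
        SUCCEEDED = 5

    encoded = encode({"statusCode": JobStatusCode.SUCCEEDED, "attempts": [1, 2], "error": None})
    assert encoded == {"statusCode": 5, "attempts": [1, 2], "error": None}

    # encode(object())  # would raise RuntimeError: cannot encode type [object] for gRPC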