hpcflow-new2 0.2.0a69__py3-none-any.whl → 0.2.0a71__py3-none-any.whl

This diff shows the changes between two publicly released versions of the package, as published to one of the supported registries. It is provided for informational purposes only and reflects the package contents exactly as they appear in the public registry.
hpcflow/sdk/core/task.py CHANGED
@@ -113,7 +113,7 @@ class ElementSet(JSONLike):
  input_files: Optional[List[app.InputFile]] = None,
  sequences: Optional[List[app.ValueSequence]] = None,
  resources: Optional[Dict[str, Dict]] = None,
- repeats: Optional[Union[int, List[int]]] = 1,
+ repeats: Optional[List[Dict]] = None,
  groups: Optional[List[app.ElementGroup]] = None,
  input_sources: Optional[Dict[str, app.InputSource]] = None,
  nesting_order: Optional[List] = None,
@@ -143,7 +143,7 @@ class ElementSet(JSONLike):

  self.inputs = inputs or []
  self.input_files = input_files or []
- self.repeats = repeats
+ self.repeats = repeats or []
  self.groups = groups or []
  self.resources = resources
  self.sequences = sequences or []
@@ -216,7 +216,7 @@ class ElementSet(JSONLike):

  @property
  def input_types(self):
- return [i.parameter.typ for i in self.inputs]
+ return [i.labelled_type for i in self.inputs]

  @property
  def element_local_idx_range(self):
@@ -266,7 +266,7 @@ class ElementSet(JSONLike):

  seq_inp_types = []
  for seq_i in self.sequences:
- inp_type = seq_i.input_type
+ inp_type = seq_i.labelled_type
  if inp_type:
  bad_inp = {inp_type} - self.task_template.all_schema_input_types
  allowed_str = ", ".join(
@@ -282,6 +282,11 @@ class ElementSet(JSONLike):
  if seq_i.path not in self.nesting_order:
  self.nesting_order.update({seq_i.path: seq_i.nesting_order})

+ for rep_spec in self.repeats:
+ reps_path_i = f'repeats.{rep_spec["name"]}'
+ if reps_path_i not in self.nesting_order:
+ self.nesting_order[reps_path_i] = rep_spec["nesting_order"]
+
  for k, v in self.nesting_order.items():
  if v < 0:
  raise TaskTemplateInvalidNesting(
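The `repeats` argument of `ElementSet` (and of `Task`, further down) is now a list of dicts rather than an int or list of ints. A minimal sketch of the implied format; the keys are inferred from the accesses in this diff ("name", "nesting_order", and "number", used later when building the data index), and the values are illustrative only:

    repeats = [{"name": "r1", "number": 3, "nesting_order": 0}]  # hypothetical values
    # ElementSet stores this list as-is; the validation loop added above then ensures
    # a nesting-order entry keyed "repeats.r1" exists, defaulting to the spec's
    # "nesting_order" value.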
@@ -408,22 +413,44 @@ class ElementSet(JSONLike):

  return deps

- def is_input_type_provided(self, typ: str) -> bool:
+ def is_input_type_provided(self, labelled_path: str) -> bool:
  """Check if an input is provided locally as an InputValue or a ValueSequence."""

  for inp in self.inputs:
- if typ == inp.parameter.typ:
+ if labelled_path == inp.normalised_inputs_path:
  return True

  for seq in self.sequences:
  if seq.parameter:
  # i.e. not a resource:
- if not seq.is_sub_value and typ == seq.parameter.typ:
+ if labelled_path == seq.normalised_inputs_path:
  return True

  return False


+ class OutputLabel(JSONLike):
+ """Class to represent schema input labels that should be applied to a subset of task
+ outputs"""
+
+ _child_objects = (
+ ChildObjectSpec(
+ name="where",
+ class_name="ElementFilter",
+ ),
+ )
+
+ def __init__(
+ self,
+ parameter: str,
+ label: str,
+ where: Optional[List[app.ElementFilter]] = None,
+ ) -> None:
+ self.parameter = parameter
+ self.label = label
+ self.where = where
+
+
  class Task(JSONLike):
  """Parametrisation of an isolated task for which a subset of input values are given
  "locally". The remaining input values are expected to be satisfied by other
@@ -444,12 +471,17 @@ class Task(JSONLike):
  is_multiple=True,
  parent_ref="task_template",
  ),
+ ChildObjectSpec(
+ name="output_labels",
+ class_name="OutputLabel",
+ is_multiple=True,
+ ),
  )

  def __init__(
  self,
  schemas: Union[app.TaskSchema, str, List[app.TaskSchema], List[str]],
- repeats: Optional[Union[int, List[int]]] = None,
+ repeats: Optional[List[Dict]] = None,
  groups: Optional[List[app.ElementGroup]] = None,
  resources: Optional[Dict[str, Dict]] = None,
  inputs: Optional[List[app.InputValue]] = None,
@@ -458,6 +490,7 @@ class Task(JSONLike):
  input_sources: Optional[Dict[str, app.InputSource]] = None,
  nesting_order: Optional[List] = None,
  element_sets: Optional[List[app.ElementSet]] = None,
+ output_labels: Optional[List[app.OutputLabel]] = None,
  sourceable_elem_iters: Optional[List[int]] = None,
  ):
  """
@@ -515,6 +548,7 @@ class Task(JSONLike):
  element_sets=element_sets,
  sourceable_elem_iters=sourceable_elem_iters,
  )
+ self._output_labels = output_labels or []

  # appended to when new element sets are added and reset on dump to disk:
  self._pending_element_sets = []
@@ -700,6 +734,10 @@ class Task(JSONLike):
  else:
  return None

+ @property
+ def output_labels(self):
+ return self._output_labels
+
  @property
  def _element_indices(self):
  return self.workflow_template.workflow.tasks[self.index].element_indices
@@ -707,7 +745,7 @@ class Task(JSONLike):
  def get_available_task_input_sources(
  self,
  element_set: app.ElementSet,
- source_tasks: Optional[List[app.Task]] = None,
+ source_tasks: Optional[List[app.WorkflowTask]] = None,
  ) -> List[app.InputSource]:
  """For each input parameter of this task, generate a list of possible input sources
  that derive from inputs or outputs of this and other provided tasks.
@@ -715,8 +753,6 @@ class Task(JSONLike):
  Note this only produces a subset of available input sources for each input
  parameter; other available input sources may exist from workflow imports."""

- # TODO: also search sub-parameters in the source tasks!
-
  if source_tasks:
  # ensure parameters provided by later tasks are added to the available sources
  # list first, meaning they take precedence when choosing an input source:
@@ -726,30 +762,32 @@ class Task(JSONLike):

  available = {}
  for inputs_path, inp_status in self.get_input_statuses(element_set).items():
- available[inputs_path] = []
-
  # local specification takes precedence:
  if inputs_path in element_set.get_locally_defined_inputs():
+ if inputs_path not in available:
+ available[inputs_path] = []
  available[inputs_path].append(self.app.InputSource.local())

  # search for task sources:
- for src_task_i in source_tasks:
+ for src_wk_task_i in source_tasks:
  # ensure we process output types before input types, so they appear in the
  # available sources list first, meaning they take precedence when choosing
  # an input source:
- for param_i in sorted(
- src_task_i.provides_parameters,
- key=lambda x: x.input_or_output,
+ src_task_i = src_wk_task_i.template
+ for in_or_out, labelled_path in sorted(
+ src_task_i.provides_parameters(),
+ key=lambda x: x[0],
  reverse=True,
  ):
- if param_i.typ == inputs_path:
- if param_i.input_or_output == "input":
+ if inputs_path in labelled_path:
+ avail_src_path = labelled_path
+ if in_or_out == "input":
  # input parameter might not be provided e.g. if it only used
  # to generate an input file, and that input file is passed
  # directly, so consider only source task element sets that
  # provide the input locally:
  es_idx = src_task_i.get_param_provided_element_sets(
- param_i.typ
+ labelled_path
  )
  else:
  # outputs are always available, so consider all source task
@@ -774,17 +812,69 @@ class Task(JSONLike):
  set(element_set.sourceable_elem_iters)
  & set(src_elem_iters)
  )
- if not src_elem_iters:
- continue

- task_source = self.app.InputSource.task(
- task_ref=src_task_i.insert_ID,
- task_source_type=param_i.input_or_output,
- element_iters=src_elem_iters,
- )
- available[inputs_path].append(task_source)
+ elif labelled_path in inputs_path and in_or_out == "output":
+ avail_src_path = inputs_path
+
+ inputs_path_label = None
+ out_label = None
+ try:
+ inputs_path_label = inputs_path.split("[")[1].split("]")[0]
+ except IndexError:
+ pass
+ if inputs_path_label:
+ for out_lab_i in src_task_i.output_labels:
+ if out_lab_i.label == inputs_path_label:
+ out_label = out_lab_i
+ if out_label:
+ # find element iteration IDs that match the output label
+ # filter:
+ param_path = ".".join(
+ i.condition.callable.kwargs["value"]
+ for i in out_label.where.path
+ )
+ param_path_split = param_path.split(".")
+
+ src_elem_iters = []
+ for elem_i in src_wk_task_i.elements[:]:
+ params = getattr(elem_i, param_path_split[0])
+ param_dat = getattr(params, param_path_split[1]).value
+
+ # for remaining paths components try both getattr and getitem:
+ for path_k in param_path_split[2:]:
+ try:
+ param_dat = param_dat[path_k]
+ except TypeError:
+ param_dat = getattr(param_dat, path_k)
+
+ rule = Rule(
+ path=[0],
+ condition=out_label.where.condition,
+ cast=out_label.where.cast,
+ )
+ if rule.test([param_dat]).is_valid:
+ src_elem_iters.append(elem_i.iterations[0].id_)
+
+ else:
+ continue
+
+ if not src_elem_iters:
+ continue
+
+ task_source = self.app.InputSource.task(
+ task_ref=src_task_i.insert_ID,
+ task_source_type=in_or_out,
+ element_iters=src_elem_iters,
+ )
+
+ if avail_src_path not in available:
+ available[avail_src_path] = []
+
+ available[avail_src_path].append(task_source)

  if inp_status.has_default:
+ if inputs_path not in available:
+ available[inputs_path] = []
  available[inputs_path].append(self.app.InputSource.default())

  return available
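A sketch of how the new source matching treats labelled input paths; the path "p2[left]" is illustrative only:

    inputs_path = "p2[left]"                            # labelled schema input path
    label = inputs_path.split("[")[1].split("]")[0]     # -> "left"
    # If the source task defines an OutputLabel with this label, only element
    # iterations whose parameter data passes that label's `where` rule are added
    # to the task source's `element_iters`.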
@@ -885,18 +975,20 @@ class Task(JSONLike):

  provided_files = [i.file for i in element_set.input_files]
  for schema in self.schemas:
+ if not schema.actions:
+ return True # for empty tasks that are used merely for defining inputs
  for act in schema.actions:
  if act.is_input_type_required(typ, provided_files):
  return True

  return False

- def get_param_provided_element_sets(self, typ: str) -> List[int]:
+ def get_param_provided_element_sets(self, labelled_path: str) -> List[int]:
  """Get the element set indices of this task for which a specified parameter type
  is locally provided."""
  es_idx = []
  for idx, src_es in enumerate(self.element_sets):
- if src_es.is_input_type_provided(typ):
+ if src_es.is_input_type_provided(labelled_path):
  es_idx.append(idx)
  return es_idx

@@ -913,19 +1005,18 @@ class Task(JSONLike):

  status = {}
  for schema_input in self.all_schema_inputs:
- typ = schema_input.parameter.typ
- status[typ] = InputStatus(
- has_default=schema_input.default_value is not None,
- is_provided=elem_set.is_input_type_provided(typ),
- is_required=self.is_input_type_required(typ, elem_set),
- )
+ for lab_info in schema_input.labelled_info():
+ labelled_type = lab_info["labelled_type"]
+ status[labelled_type] = InputStatus(
+ has_default="default_value" in lab_info,
+ is_provided=elem_set.is_input_type_provided(labelled_type),
+ is_required=self.is_input_type_required(labelled_type, elem_set),
+ )

  for inp_path in elem_set.get_defined_sub_parameter_types():
  root_param = ".".join(inp_path.split(".")[:-1])
- # Sub-parameters can only be specified locally (currently), so "is_provided"
- # is True by definition, and if the root parameter is required then the
- # sub-parameter should also be required, otherwise there would be no point in
- # specifying it:
+ # If the root parameter is required then the sub-parameter should also be
+ # required, otherwise there would be no point in specifying it:
  status[inp_path] = InputStatus(
  has_default=False,
  is_provided=True,
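The per-label keys read from `SchemaInput.labelled_info()` in this diff are "labelled_type", "group", and (optionally) "default_value"; a sketch of the item shape inferred from those accesses, with illustrative values:

    lab_info = {"labelled_type": "p1[one]", "group": None}    # inferred shape; no default here
    labelled_type = lab_info["labelled_type"]                 # e.g. "p1" or "p1[one]"
    group = lab_info.get("group")                             # group name, if any
    has_default = "default_value" in lab_info                 # only True when a default exists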
@@ -934,19 +1025,15 @@ class Task(JSONLike):

  return status

- def get_all_required_schema_inputs(self, element_set):
- stats = self.get_input_statuses(element_set)
- return tuple(
- i for i in self.all_schema_inputs if stats[i.parameter.typ].is_required
- )
-
  @property
  def universal_input_types(self):
  """Get input types that are associated with all schemas"""
+ raise NotImplementedError()

  @property
  def non_universal_input_types(self):
  """Get input types for each schema that are non-universal."""
+ raise NotImplementedError()

  @property
  def defined_input_types(self):
@@ -970,15 +1057,26 @@ class Task(JSONLike):
  """Get schema input types for which no input sources are currently specified."""
  return self.all_schema_input_types - set(self.input_sources.keys())

- @property
- def provides_parameters(self):
- return tuple(j for schema in self.schemas for j in schema.provides_parameters)
+ def provides_parameters(self) -> Tuple[Tuple[str, str]]:
+ """Get all provided parameter labelled types and whether they are inputs and
+ outputs, considering all element sets.
+
+ """
+ out = []
+ for schema in self.schemas:
+ for in_or_out, labelled_type in schema.provides_parameters:
+ out.append((in_or_out, labelled_type))

- def get_sub_parameter_input_values(self):
- return [i for i in self.inputs if i.is_sub_value]
+ # add sub-parameter input values and sequences:
+ for es_i in self.element_sets:
+ for inp_j in es_i.inputs:
+ if inp_j.is_sub_value:
+ out.append(("input", inp_j.normalised_inputs_path))
+ for seq_j in es_i.sequences:
+ if seq_j.is_sub_value:
+ out.append(("input", seq_j.normalised_inputs_path))

- def get_non_sub_parameter_input_values(self):
- return [i for i in self.inputs if not i.is_sub_value]
+ return tuple(out)

  def add_group(
  self, name: str, where: app.ElementFilter, group_by_distinct: app.ParameterPath
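`provides_parameters` is now a method returning `(input_or_output, labelled_type)` pairs, including sub-parameter paths from element-set inputs and sequences. A sketch of the returned shape (the parameter names are illustrative):

    provided = (("output", "p2"), ("input", "p1"), ("input", "p1.sub_param"))  # illustrative
    # "output" sorts after "input" alphabetically, which is why the caller in
    # get_available_task_input_sources sorts on the first tuple element with
    # reverse=True to process outputs first.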
@@ -1099,13 +1197,6 @@ class WorkflowTask:
  sequence_idx = {}
  source_idx = {}

- # from pprint import pprint
-
- # print(f"{element_set.groups=}")
- # print(f"{element_set.inputs=}")
- # print("element_set.input_sources")
- # pprint(element_set.input_sources)
-
  # Assign first assuming all locally defined values are to be used:
  param_src = {
  "type": "local_input",
@@ -1151,25 +1242,39 @@
  except ValueError:
  pass

+ for rep_spec in element_set.repeats:
+ seq_key = f"repeats.{rep_spec['name']}"
+ num_range = list(range(rep_spec["number"]))
+ input_data_idx[seq_key] = num_range
+ sequence_idx[seq_key] = num_range
+
  # Now check for task- and default-sources and overwrite or append to local sources:
- for schema_input in self.template.get_all_required_schema_inputs(element_set):
- key = f"inputs.{schema_input.typ}"
- sources = element_set.input_sources[schema_input.typ]
+ inp_stats = self.template.get_input_statuses(element_set)
+ for labelled_path_i, sources_i in element_set.input_sources.items():
+ path_i_split = labelled_path_i.split(".")
+ is_path_i_sub = len(path_i_split) > 1
+ if is_path_i_sub:
+ path_i_root = path_i_split[0]
+ else:
+ path_i_root = labelled_path_i
+ if not inp_stats[path_i_root].is_required:
+ continue

- inp_group_name = schema_input.group
- # print(f"{inp_group_name=}")
+ inp_group_name, def_val = None, None
+ for schema_input in self.template.all_schema_inputs:
+ for lab_info in schema_input.labelled_info():
+ if lab_info["labelled_type"] == path_i_root:
+ inp_group_name = lab_info["group"]
+ if "default_value" in lab_info:
+ def_val = lab_info["default_value"]
+ break

- for inp_src_idx, inp_src in enumerate(sources):
- if inp_src.source_type is InputSourceType.TASK:
- # print(f" inp_src: {inp_src}")
+ key = f"inputs.{labelled_path_i}"

+ for inp_src_idx, inp_src in enumerate(sources_i):
+ if inp_src.source_type is InputSourceType.TASK:
  src_task = inp_src.get_task(self.workflow)
-
- # print(f" src_task: {src_task}")
- # print(f" {src_task.template.element_sets[0].groups=}")
-
  src_elem_iters = src_task.get_all_element_iterations()
- # print(f" {src_elem_iters=}")

  if inp_src.element_iters:
  # only include "sourceable" element iterations:
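A sketch of the pseudo-sequence entries generated for each repeats spec (values illustrative):

    input_data_idx, sequence_idx = {}, {}                            # stand-ins
    rep_spec = {"name": "r1", "number": 3, "nesting_order": 0}       # hypothetical
    seq_key = f"repeats.{rep_spec['name']}"                          # "repeats.r1"
    input_data_idx[seq_key] = list(range(rep_spec["number"]))        # [0, 1, 2]
    sequence_idx[seq_key] = list(range(rep_spec["number"]))
    # Repeat indices then multiply out against real sequences during element resolution.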
@@ -1180,34 +1285,70 @@ class WorkflowTask:
  src_elem_set_idx = [
  i.element.element_set_idx for i in src_elem_iters
  ]
- # print(f" {src_elem_set_idx=}")

  if not src_elem_iters:
  continue

  task_source_type = inp_src.task_source_type.name.lower()
- src_key = f"{task_source_type}s.{schema_input.typ}"
+ if task_source_type == "output" and "[" in labelled_path_i:
+ src_key = f"{task_source_type}s.{labelled_path_i.split('[')[0]}"
+ else:
+ src_key = f"{task_source_type}s.{labelled_path_i}"
+
  grp_idx = [
  iter_i.get_data_idx()[src_key] for iter_i in src_elem_iters
  ]

- # print(f" grp_idx (1): {grp_idx}")
-
  if inp_group_name:
- # print(
- # f" only use elements which are part of a group definition named: {inp_group_name}."
- # )
  group_dat_idx = []
- for dat_idx_i, src_set_idx_i in zip(grp_idx, src_elem_set_idx):
+ for dat_idx_i, src_set_idx_i, src_iter in zip(
+ grp_idx, src_elem_set_idx, src_elem_iters
+ ):
  src_es = src_task.template.element_sets[src_set_idx_i]
  if inp_group_name in [i.name for i in src_es.groups or []]:
  # print(f"IN GROUP; {dat_idx_i}; {src_set_idx_i=}")
  group_dat_idx.append(dat_idx_i)
+ else:
+ # if for any recursive iteration dependency, this group is
+ # defined, assign:
+ src_iter_i = src_iter
+ src_iter_deps = (
+ self.workflow.get_element_iterations_from_IDs(
+ src_iter_i.get_element_iteration_dependencies(),
+ )
+ )
+
+ src_iter_deps_groups = [
+ j
+ for i in src_iter_deps
+ for j in i.element.element_set.groups
+ ]
+
+ if inp_group_name in [
+ i.name for i in src_iter_deps_groups or []
+ ]:
+ group_dat_idx.append(dat_idx_i)
+
+ # also check input dependencies
+ for (
+ k,
+ v,
+ ) in src_iter.element.get_input_dependencies().items():
+ k_es_idx = v["element_set_idx"]
+ k_task_iID = v["task_insert_ID"]
+ k_es = self.workflow.tasks.get(
+ insert_ID=k_task_iID
+ ).template.element_sets[k_es_idx]
+ if inp_group_name in [
+ i.name for i in k_es.groups or []
+ ]:
+ group_dat_idx.append(dat_idx_i)
+
+ # TODO: this only goes to one level of dependency

  grp_idx = [group_dat_idx] # TODO: generalise to multiple groups
- # print(f" grp_idx (2): {grp_idx}")

- if self.app.InputSource.local() in sources:
+ if self.app.InputSource.local() in sources_i:
  # add task source to existing local source:
  input_data_idx[key] += grp_idx
  source_idx[key] += [inp_src_idx] * len(grp_idx)
@@ -1221,8 +1362,8 @@
  seq = element_set.get_sequence_by_path(key)

  elif inp_src.source_type is InputSourceType.DEFAULT:
- grp_idx = [schema_input.default_value._value_group_idx]
- if self.app.InputSource.local() in sources:
+ grp_idx = [def_val._value_group_idx]
+ if self.app.InputSource.local() in sources_i:
  input_data_idx[key] += grp_idx
  source_idx[key] += [inp_src_idx] * len(grp_idx)

@@ -1232,19 +1373,23 @@

  # sort smallest to largest path, so more-specific items overwrite less-specific
  # items parameter retrieval:
- # TODO: is this still necessary?
+ input_data_idx = dict(sorted(input_data_idx.items()))

  return (input_data_idx, sequence_idx, source_idx)

  def ensure_input_sources(self, element_set):
  """Check valid input sources are specified for a new task to be added to the
  workflow in a given position. If none are specified, set them according to the
- default behaviour."""
+ default behaviour.

- # this just depends on this schema and other schemas:
+ This method mutates `element_set.input_sources`.
+
+ """
+
+ # this depends on this schema, other task schemas and inputs/sequences:
  available_sources = self.template.get_available_task_input_sources(
  element_set=element_set,
- source_tasks=self.workflow.template.tasks[: self.index],
+ source_tasks=self.workflow.tasks[: self.index],
  )

  unreq_sources = set(element_set.input_sources.keys()) - set(
@@ -1264,33 +1409,40 @@

  all_stats = self.template.get_input_statuses(element_set)

+ # an input is not required if it is only used to generate an input file that is
+ # passed directly:
+ req_types = set(k for k, v in all_stats.items() if v.is_required)
+
  # check any specified sources are valid, and replace them with those computed in
- # available_sources since this will have `element_iters` assigned:
- for inputs_path in all_stats:
+ # `available_sources` since these will have `element_iters` assigned:
+ for path_i, avail_i in available_sources.items():
+ # for each sub-path in available sources, if the "root-path" source is
+ # required, then add the sub-path source to `req_types` as well:
+ path_i_split = path_i.split(".")
+ is_path_i_sub = len(path_i_split) > 1
+ if is_path_i_sub:
+ path_i_root = path_i_split[0]
+ if path_i_root in req_types:
+ req_types.add(path_i)
+
  for s_idx, specified_source in enumerate(
- element_set.input_sources.get(inputs_path, [])
+ element_set.input_sources.get(path_i, [])
  ):
  self.workflow._resolve_input_source_task_reference(
  specified_source, self.unique_name
  )
- avail_idx = specified_source.is_in(available_sources[inputs_path])
+ avail_idx = specified_source.is_in(avail_i)
  if avail_idx is None:
  raise ValueError(
  f"The input source {specified_source.to_string()!r} is not "
- f"available for input path {inputs_path!r}. Available "
- f"input sources are: "
- f"{[i.to_string() for i in available_sources[inputs_path]]}"
+ f"available for input path {path_i!r}. Available "
+ f"input sources are: {[i.to_string() for i in avail_i]}."
  )
  else:
  # overwrite with the source from available_sources, since it will have
  # the `element_iters` attribute assigned:
- element_set.input_sources[inputs_path][s_idx] = available_sources[
- inputs_path
- ][avail_idx]
+ element_set.input_sources[path_i][s_idx] = avail_i[avail_idx]

- # an input is not required if it is only used to generate an input file that is
- # passed directly:
- req_types = set(k for k, v in all_stats.items() if v.is_required)
  unsourced_inputs = req_types - set(element_set.input_sources.keys())

  extra_types = set(k for k, v in all_stats.items() if v.is_extra)
@@ -1307,7 +1459,8 @@
  # set source for any unsourced inputs:
  missing = []
  for input_type in unsourced_inputs:
- inp_i_sources = available_sources[input_type]
+ inp_i_sources = available_sources.get(input_type, [])
+
  source = None
  try:
  # first element is defined by default to take precedence in
@@ -1336,6 +1489,29 @@
  # element iterations for which all parameters are available (the set
  # intersection):
  for sources in sources_by_task.values():
+ # if a parameter has multiple labels, disregard from this by removing all
+ # parameters:
+ seen_labelled = {}
+ for src_i in sources.keys():
+ if "[" in src_i:
+ unlabelled = src_i.split("[")[0]
+ if unlabelled not in seen_labelled:
+ seen_labelled[unlabelled] = 1
+ else:
+ seen_labelled[unlabelled] += 1
+
+ for unlabelled, count in seen_labelled.items():
+ if count > 1:
+ # remove:
+ sources = {
+ k: v
+ for k, v in sources.items()
+ if not k.startswith(unlabelled)
+ }
+
+ if len(sources) < 2:
+ continue
+
  first_src = next(iter(sources.values()))
  intersect_task_i = set(first_src.element_iters)
  for src_i in sources.values():
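A sketch of the multi-label filtering added above, with illustrative keys and placeholder values. When one source task supplies a parameter under more than one label, all of its labelled entries are dropped before intersecting element iterations, and the intersection is skipped if fewer than two sources remain:

    sources = {"p1": 1, "p2[left]": 2, "p2[right]": 3}   # hypothetical placeholder values
    # "p2" is seen twice via its labels, so both "p2[...]" entries are removed,
    # leaving {"p1": 1}; with fewer than two entries the intersection step is skipped.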
@@ -1537,7 +1713,6 @@ class WorkflowTask:

  """

- # print()
  self.template.set_sequence_parameters(element_set)

  self.ensure_input_sources(element_set) # may modify element_set.input_sources
@@ -1547,29 +1722,14 @@
  element_set_idx=self.num_element_sets,
  )

- # from pprint import pprint
-
- # print("input_data_idx")
- # pprint(input_data_idx)
-
  element_set.task_template = self.template # may modify element_set.nesting_order

  multiplicities = self.template.prepare_element_resolution(
  element_set, input_data_idx
  )

- # print("multiplicities")
- # pprint(multiplicities)
-
  element_inp_data_idx = self.resolve_element_data_indices(multiplicities)

- # print("element_inp_data_idx")
- # pprint(element_inp_data_idx)
-
- # global_element_iter_idx_range = [
- # self.workflow.num_element_iterations,
- # self.workflow.num_element_iterations + len(element_inp_data_idx),
- # ]
  local_element_idx_range = [
  self.num_elements,
  self.num_elements + len(element_inp_data_idx),
@@ -1583,9 +1743,6 @@
  local_element_idx_range=local_element_idx_range,
  )

- # print("output_data_idx")
- # pprint(output_data_idx)
-
  (element_data_idx, element_seq_idx, element_src_idx) = self.generate_new_elements(
  input_data_idx,
  output_data_idx,
@@ -1593,21 +1750,11 @@
  seq_idx,
  src_idx,
  )
- # print("element_data_idx")
- # pprint(element_data_idx)

  iter_IDs = []
  elem_IDs = []
  for elem_idx, data_idx in enumerate(element_data_idx):
  schema_params = set(i for i in data_idx.keys() if len(i.split(".")) == 2)
- # elements.append(
- # {
- # "iterations_idx": [self.num_elements + elem_idx],
- # "es_idx": self.num_element_sets - 1,
- # "seq_idx": ,
- # "src_idx": ,
- # }
- # )
  elem_ID_i = self.workflow._store.add_element(
  task_ID=self.insert_ID,
  es_idx=self.num_element_sets - 1,
@@ -1622,27 +1769,7 @@
  iter_IDs.append(iter_ID_i)
  elem_IDs.append(elem_ID_i)

- # element_iterations.append(
- # {
- # "global_idx": self.workflow.num_element_iterations + elem_idx,
- # "data_idx": data_idx,
- # "EARs_initialised": False,
- # "actions": {},
- # "schema_parameters": list(schema_params),
- # "loop_idx": {},
- # }
- # )
-
- # self.workflow._store.add_elements(
- # self.index,
- # self.insert_ID,
- # elements,
- # element_iterations,
- # )
  self._pending_element_IDs += elem_IDs
- # self._pending_num_elements += len(element_data_idx)
- # self._pending_num_element_iterations += len(element_data_idx)
-
  self.initialise_EARs()

  return iter_IDs
@@ -1895,9 +2022,13 @@
  return

  if path[0] == "inputs":
+ try:
+ path_1 = path[1].split("[")[0]
+ except IndexError:
+ path_1 = path[1]
  for i in self.template.schemas:
  for j in i.inputs:
- if j.parameter.typ == path[1]:
+ if j.parameter.typ == path_1:
  return j.parameter

  elif path[0] == "outputs":
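A sketch of the label stripping added above (the path is illustrative): labelled data paths are matched against schema inputs by their unlabelled parameter type:

    path = "inputs.p1[one]".split(".")       # hypothetical labelled data path
    path_1 = path[1].split("[")[0]           # -> "p1"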
@@ -1950,29 +2081,33 @@ class WorkflowTask:

  data = []
  for data_idx_i_j in data_idx_i:
- param_j = self.workflow.get_parameter(data_idx_i_j)
- if param_j.file:
- if param_j.file["store_contents"]:
- data_j = Path(self.workflow.path) / param_j.file["path"]
- else:
- data_j = Path(param_j.file["path"])
- data_j = data_j.as_posix()
+ if path_i[0] == "repeats":
+ # data is an integer repeats index, rather than a parameter ID:
+ data_j = data_idx_i_j
  else:
- data_j = param_j.data
- if parameter and len(path_i) == 2:
- # retrieve the source if this is a non-sub parameter, so we can,
- # in the case that there is an associated `ParameterValue` class,
- # get the class method that should be invoked to initialise the
- # object:
- if is_multi:
- sources.append(param_j.source)
+ param_j = self.workflow.get_parameter(data_idx_i_j)
+ if param_j.file:
+ if param_j.file["store_contents"]:
+ data_j = Path(self.workflow.path) / param_j.file["path"]
  else:
- sources = param_j.source
- if raise_on_unset and not param_j.is_set:
- raise UnsetParameterDataError(
- f"Element data path {path!r} resolves to unset data for (at "
- f"least) data index path: {path_i!r}."
- )
+ data_j = Path(param_j.file["path"])
+ data_j = data_j.as_posix()
+ else:
+ data_j = param_j.data
+ if parameter and len(path_i) == 2:
+ # retrieve the source if this is a non-sub parameter, so we can,
+ # in the case that there is an associated `ParameterValue` class,
+ # get the class method that should be invoked to initialise the
+ # object:
+ if is_multi:
+ sources.append(param_j.source)
+ else:
+ sources = param_j.source
+ if raise_on_unset and not param_j.is_set:
+ raise UnsetParameterDataError(
+ f"Element data path {path!r} resolves to unset data for (at "
+ f"least) data index path: {path_i!r}."
+ )
  if not is_multi:
  data = data_j
  else:
@@ -2000,9 +2135,10 @@
  current_value = default

  if parameter and parameter._value_class:
+ # TODO: retrieve value class method case-insensitively!
  if isinstance(current_value, dict):
  # return a ParameterValue instance:
- method_name = sources["value_class_method"]
+ method_name = sources.get("value_class_method")
  if method_name:
  method = getattr(parameter._value_class, method_name)
  else:
@@ -2013,7 +2149,7 @@
  # return a list of ParameterValue instances:
  current_value_ = []
  for cur_val, src in zip(current_value, sources):
- method_name = src["value_class_method"]
+ method_name = src.get("value_class_method")
  if method_name:
  method = getattr(parameter._value_class, method_name)
  else: