PyPI - label-studio-sdk - Versions diffs - 0.0.32__py3-none-any.whl → 0.0.34__py3-none-any.whl - Mend

label-studio-sdk 0.0.32py3-none-any.whl → 0.0.34py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of label-studio-sdk might be problematic. Click here for more details.

Files changed (38) hide show

label_studio_sdk/__init__.py +4 -1
label_studio_sdk/client.py +94 -78
label_studio_sdk/data_manager.py +32 -23
label_studio_sdk/exceptions.py +10 -0
label_studio_sdk/label_interface/__init__.py +1 -0
label_studio_sdk/label_interface/base.py +77 -0
label_studio_sdk/label_interface/control_tags.py +756 -0
label_studio_sdk/label_interface/interface.py +922 -0
label_studio_sdk/label_interface/label_tags.py +72 -0
label_studio_sdk/label_interface/object_tags.py +292 -0
label_studio_sdk/label_interface/region.py +43 -0
label_studio_sdk/objects.py +35 -0
label_studio_sdk/project.py +711 -258
label_studio_sdk/schema/label_config_schema.json +226 -0
label_studio_sdk/users.py +15 -13
label_studio_sdk/utils.py +31 -30
label_studio_sdk/workspaces.py +13 -11
{label_studio_sdk-0.0.32.dist-info → label_studio_sdk-0.0.34.dist-info}/METADATA +3 -1
label_studio_sdk-0.0.34.dist-info/RECORD +37 -0
{label_studio_sdk-0.0.32.dist-info → label_studio_sdk-0.0.34.dist-info}/WHEEL +1 -1
{label_studio_sdk-0.0.32.dist-info → label_studio_sdk-0.0.34.dist-info}/top_level.txt +0 -1
tests/test_client.py +21 -10
tests/test_export.py +105 -0
tests/test_interface/__init__.py +1 -0
tests/test_interface/configs.py +137 -0
tests/test_interface/mockups.py +22 -0
tests/test_interface/test_compat.py +64 -0
tests/test_interface/test_control_tags.py +55 -0
tests/test_interface/test_data_generation.py +45 -0
tests/test_interface/test_lpi.py +15 -0
tests/test_interface/test_main.py +196 -0
tests/test_interface/test_object_tags.py +36 -0
tests/test_interface/test_region.py +36 -0
tests/test_interface/test_validate_summary.py +35 -0
tests/test_interface/test_validation.py +59 -0
docs/__init__.py +0 -3
label_studio_sdk-0.0.32.dist-info/RECORD +0 -15
{label_studio_sdk-0.0.32.dist-info → label_studio_sdk-0.0.34.dist-info}/LICENSE +0 -0

label_studio_sdk/label_interface/interface.py ADDED Viewed

@@ -0,0 +1,922 @@
+"""
+"""
+import os
+import copy
+import logging
+import re
+import json
+import jsonschema
+from typing import Dict, Optional, List, Tuple, Any, Callable, Union
+from pydantic import BaseModel
+# from typing import Dict, Optional, List, Tuple, Any
+from collections import defaultdict
+from lxml import etree
+import xmljson
+from label_studio_sdk.exceptions import (
+    LSConfigParseException,
+    LabelStudioXMLSyntaxErrorSentryIgnored,
+    LabelStudioValidationErrorSentryIgnored,
+)
+from label_studio_sdk.label_interface.control_tags import (
+    ControlTag,
+    ChoicesTag,
+    LabelsTag,
+)
+from label_studio_sdk.label_interface.object_tags import ObjectTag
+from label_studio_sdk.label_interface.label_tags import LabelTag
+from label_studio_sdk.objects import AnnotationValue, TaskValue, PredictionValue
+dir_path = os.path.dirname(os.path.realpath(__file__))
+file_path = os.path.join(dir_path, "..", "schema", "label_config_schema.json")
+with open(file_path) as f:
+    _LABEL_CONFIG_SCHEMA_DATA = json.load(f)
+_LABEL_TAGS = {"Label", "Choice", "Relation"}
+_DIR_APP_NAME = "label-studio"
+_VIDEO_TRACKING_TAGS = {"videorectangle"}
+RESULT_KEY = "result"
+############ core/label_config.py
+def merge_labels_counters(dict1, dict2):
+    """
+    Merge two dictionaries with nested dictionary values into a single dictionary.
+    Args:
+        dict1 (dict): The first dictionary to merge.
+        dict2 (dict): The second dictionary to merge.
+    Returns:
+        dict: A new dictionary with the merged nested dictionaries.
+    Example:
+        dict1 = {'sentiment': {'Negative': 1, 'Positive': 1}}
+        dict2 = {'sentiment': {'Positive': 2, 'Neutral': 1}}
+        result_dict = merge_nested_dicts(dict1, dict2)
+        # {'sentiment': {'Negative': 1, 'Positive': 3, 'Neutral': 1}}
+    """
+    result_dict = {}
+    # iterate over keys in both dictionaries
+    for key in set(dict1.keys()) | set(dict2.keys()):
+        # add the corresponding values if they exist in both dictionaries
+        value = {}
+        if key in dict1:
+            value.update(dict1[key])
+        if key in dict2:
+            for subkey in dict2[key]:
+                value[subkey] = value.get(subkey, 0) + dict2[key][subkey]
+        # add the key-value pair to the result dictionary
+        result_dict[key] = value
+    return result_dict
+def _fix_choices(config):
+    """
+    workaround for single choice
+    https://github.com/heartexlabs/label-studio/issues/1259
+    """
+    if "Choices" in config:
+        # for single Choices tag in View
+        if "Choice" in config["Choices"] and not isinstance(
+            config["Choices"]["Choice"], list
+        ):
+            config["Choices"]["Choice"] = [config["Choices"]["Choice"]]
+        # for several Choices tags in View
+        elif isinstance(config["Choices"], list) and all(
+            "Choice" in tag_choices for tag_choices in config["Choices"]
+        ):
+            for n in range(len(config["Choices"])):
+                # check that Choices tag has only 1 choice
+                if not isinstance(config["Choices"][n]["Choice"], list):
+                    config["Choices"][n]["Choice"] = [config["Choices"][n]["Choice"]]
+    if "View" in config:
+        if isinstance(config["View"], OrderedDict):
+            config["View"] = _fix_choices(config["View"])
+        else:
+            config["View"] = [_fix_choices(view) for view in config["View"]]
+    return config
+def get_annotation_tuple(from_name, to_name, type):
+    if isinstance(to_name, list):
+        to_name = ",".join(to_name)
+    return "|".join([from_name, to_name, type.lower()])
+def get_all_control_tag_tuples(label_config):
+    # "chc|text|choices"
+    outputs = parse_config(label_config)
+    out = []
+    for control_name, info in outputs.items():
+        out.append(get_annotation_tuple(control_name, info["to_name"], info["type"]))
+    return out
+def get_all_types(label_config):
+    """
+    Get all types from label_config
+    """
+    outputs = parse_config(label_config)
+    out = []
+    for control_name, info in outputs.items():
+        out.append(info["type"].lower())
+    return out
+def display_count(count: int, type: str) -> Optional[str]:
+    """Helper for displaying pluralized sources of validation errors,
+    eg "1 draft" or "3 annotations"
+    """
+    if not count:
+        return None
+    return f'{count} {type}{"s" if count > 1 else ""}'
+######################
+class LabelInterface:
+    """The LabelInterface class serves as an interface to parse and
+    validate labeling configurations, annotations, and predictions
+    within the Label Studio ecosystem.
+    It is designed to be compatible at the data structure level with
+    an existing parser widely used within the Label Studio ecosystem.
+    This ensures that it works seamlessly with most of the existing functions,
+    either by directly supporting them or by offering re-implemented versions
+    through the new interface.
+    Moreover, the parser adds value by offering functionality to
+    validate predictions and annotations against the specified
+    labeling configuration. Below is a simple example of how to use
+    the new API:
+    ```python
+    from label_studio_sdk.label_interface import LabelInterface
+    config = "<View><Text name='txt' value='$val' /><Choices name='chc' toName='txt'><Choice value='one'/> <Choice value='two'/></Choices></View>"
+    li = LabelInterface(config)
+    region = li.get_tag("chc").label("one")
+    # returns a JSON representing a Label Studio region
+    region.as_json()
+    # returns True
+    li.validate_prediction({
+      "model_version": "0.0.1",
+      "score": 0.90,
+      "result": [{
+          "from_name": "chc",
+          "to_name": "txt",
+          "type": "choices",
+          "value": { "choices": ["one"] }
+      }]
+    })
+    ```
+    """
+    def __init__(self, config: str, *args, **kwargs):
+        """
+        Create LabelInterface instance from the config string
+        Example:
+        ```
+        label_config = LabelInterface('''
+        <View>
+        <Choices name="sentiment" toName="txt">
+            <Choice value="Positive" />
+            <Choice value="Negative" />
+            <Choice value="Neutral" />
+        </Choices>
+        <Text name="txt" value="$text" />
+        ''')
+        """
+        self._config = config
+        # extract predefined task from the config
+        _task_data, _ann, _pred = LabelInterface.get_task_from_labeling_config(config)
+        self._sample_config_task = _task_data
+        self._sample_config_ann = _ann
+        self._sample_config_pred = _pred
+        controls, objects, labels, tree = self.parse(config)
+        controls = self._link_controls(controls, objects, labels)
+        # list of control tags that this config has
+        self._control_tags = set(controls.keys())
+        self._object_tags = set(objects.keys())
+        # self._label_names = set(labels.keys())
+        self._controls = controls
+        self._objects = objects
+        self._labels = labels
+        self._tree = tree
+    ##### NEW API
+    @property
+    def controls(self):
+        """Returns list of control tags"""
+        return self._controls and self._controls.values()
+    @property
+    def objects(self):
+        """Returns list of object tags"""
+        return self._objects and self._objects.values()
+    @property
+    def labels(self):
+        """Returns list of label tags"""
+        return self._labels and self._labels.values()
+    def _link_controls(self, controls: Dict, objects: Dict, labels: Dict) -> Dict:
+        """ """
+        for name, tag in controls.items():
+            inputs = []
+            for object_tag_name in tag.to_name:
+                if object_tag_name not in objects:
+                    # logger.info(
+                    #     f'to_name={object_tag_name} is specified for output tag name={name}, '
+                    #     'but we can\'t find it among input tags'
+                    # )
+                    continue
+                inputs.append(objects[object_tag_name])
+            tag.set_objects(inputs)
+            tag.set_labels(list(labels[name]))
+            tag.set_labels_attrs(labels[name])
+        return controls
+    def _get_tag(self, name, tag_store):
+        """ """
+        if name is not None:
+            if name not in tag_store:
+                raise Exception(
+                    f"Name {name} is not found, available names: {tag_store.keys()}"
+                )
+            else:
+                return tag_store[name]
+        if tag_store and len(tag_store.keys()) > 1:
+            raise Exception("Multiple object tags connected, you should specify name")
+        return list(tag_store.values())[0]
+    def get_tag(self, name):
+        """Method to retrieve the tag object by its name from the current instance.
+        The method checks if the tag with the provided name exists in
+        either `_controls` or `_objects` attributes of the current
+        instance.  If a match is found, it returns the tag. If the tag
+        is not found an exception is raised.
+        Args:
+            name (str): Name of the tag to be retrieved.
+        Returns:
+            object: The tag object if it exists in either `_controls` or `_objects`.
+        Raises:
+            Exception: If the tag with the given name does not exist in both `_controls` and `_objects`.
+        """
+        if name in self._controls:
+            return self._controls[name]
+        if name in self._objects:
+            return self._objects[name]
+        raise Exception(f"Tag with name {name} not found")
+    def get_object(self, name=None):
+        """Retrieves the object with the given name from `_objects`.
+        This utilizes the `_get_tag` method to obtain the named object.
+        Args:
+            name (str, optional): The name of the object to be retrieved from `_objects`.
+        Returns: object: The corresponding object if it exists in
+            `_objects`.
+        """
+        return self._get_tag(name, self._objects)
+    def get_output(self, name=None):
+        """Provides an alias for the `get_control` method."""
+        return self.get_control(name)
+    def get_control(self, name=None):
+        """Retrieves the control tag that the control tag maps to.
+        This uses the `_get_tag` method to obtain the named control.
+        Args:
+            name (str, optional): The name of the control to be retrieved.
+        Returns: object: The corresponding control if it exists in
+            `_controls`.
+        """
+        return self._get_tag(name, self._controls)
+    def find_tags_by_class(self, tag_class) -> List:
+        """Finds tags by their class type.
+        The function looks into both `self.objects` and
+        `self.controls` to find tags that are instances of the
+        provided class(es)
+        Args:
+            tag_class (class or list of classes): The class type(s) of the tags to be found.
+        Returns:
+            list: A list of tags that are instances of the provided `tag_class`(es).
+        """
+        lst = list(self.objects) + list(self.controls)
+        tag_classes = [tag_class] if not isinstance(tag_class, list) else tag_class
+        return [tag for tag in lst for cls in tag_classes if isinstance(tag, cls)]
+    def find_tags(
+        self, tag_type: Optional[str] = None, match_fn: Optional[Callable] = None
+    ) -> List:
+        """Finds tags that match the given function in the entire parsed tree.
+        This function searches through both `objects` and `controls`
+        based on `tag_type`, and applies the `match_fn` (if provided)
+        to filter matching tags.
+        Args:
+            tag_type (str, optional): The type of tags to be
+                searched. Categories include 'objects', 'controls',
+                'inputs' (alias for 'objects'), 'outputs' (alias for
+                'controls'). If not specified, searches both 'objects'
+                and 'controls'.
+            match_fn (Callable, optional): A function that takes a tag
+                as an input and returns a boolean value indicating
+                whether the tag matches the required condition.
+        Returns: list: A list of tags that match the given type and
+        satisfy `match_fn`.
+        """
+        tag_types = {
+            "objects": self.objects,
+            "controls": self.controls,
+            # aliases
+            "inputs": self.objects,
+            "outputs": self.controls,
+        }
+        lst = tag_types.get(tag_type, list(self.objects) + list(self.controls))
+        if match_fn is not None:
+            lst = list(filter(match_fn, lst))
+        return lst
+    def parse(self, config_string: str) -> Tuple[Dict, Dict, Dict, etree._Element]:
+        """Parses the received configuration string into dictionaries
+        of ControlTags, ObjectTags, and Labels, along with an XML tree
+        of the configuration.
+        Args:
+            config_string (str): the configuration string to be parsed.
+        Returns:
+            Tuple of:
+            - Dictionary where keys are control tag names and values are ControlTag instances.
+            - Dictionary where keys are object tag names and values are ObjectTag instances.
+            - Dictionary of dictionaries where primary keys are label parent names
+              and secondary keys are label values and values are LabelTag instances.
+            - An XML tree of the configuration.
+        """
+        try:
+            xml_tree = etree.fromstring(config_string)
+        except etree.XMLSyntaxError as e:
+            raise LabelStudioXMLSyntaxErrorSentryIgnored(str(e))
+        objects, controls, labels = {}, {}, defaultdict(dict)
+        variables = []
+        for tag in xml_tree.iter():
+            if tag.attrib and "indexFlag" in tag.attrib:
+                variables.append(tag.attrib["indexFlag"])
+            if ControlTag.validate_node(tag):
+                controls[tag.attrib["name"]] = ControlTag.parse_node(tag)
+            elif ObjectTag.validate_node(tag):
+                objects[tag.attrib["name"]] = ObjectTag.parse_node(tag)
+            elif LabelTag.validate_node(tag):
+                lb = LabelTag.parse_node(tag, controls)
+                labels[lb.parent_name][lb.value] = lb
+        return controls, objects, labels, xml_tree
+    @classmethod
+    def parse_config_to_json(cls, config_string):
+        """ """
+        try:
+            xml = etree.fromstring(config_string)
+        except TypeError:
+            raise etree.ParseError("can only parse strings")
+        if xml is None:
+            raise etree.ParseError("xml is empty or incorrect")
+        config = xmljson.badgerfish.data(xml)
+        config = _fix_choices(config)
+        return config
+    def _schema_validation(self, config_string):
+        """ """
+        try:
+            config = LabelInterface.parse_config_to_json(config_string)
+            jsonschema.validate(config, _LABEL_CONFIG_SCHEMA_DATA)
+        except (etree.ParseError, ValueError) as exc:
+            raise LabelStudioValidationErrorSentryIgnored(str(exc))
+        except jsonschema.exceptions.ValidationError as exc:
+            error_message = exc.context[-1].message if len(exc.context) else exc.message
+            error_message = "Validation failed on {}: {}".format(
+                "/".join(map(str, exc.path)), error_message.replace("@", "")
+            )
+            raise LabelStudioValidationErrorSentryIgnored(error_message)
+    def _to_name_validation(self, config_string):
+        """ """
+        # toName points to existent name
+        all_names = re.findall(r'name="([^"]*)"', config_string)
+        names = set(all_names)
+        toNames = re.findall(r'toName="([^"]*)"', config_string)
+        for toName_ in toNames:
+            for toName in toName_.split(","):
+                if toName not in names:
+                    raise LabelStudioValidationErrorSentryIgnored(
+                        f'toName="{toName}" not found in names: {sorted(names)}'
+                    )
+    def _unique_names_validation(self, config_string):
+        """ """
+        # unique names in config # FIXME: 'name =' (with spaces) won't work
+        all_names = re.findall(r'name="([^"]*)"', config_string)
+        if len(set(all_names)) != len(all_names):
+            raise LabelStudioValidationErrorSentryIgnored(
+                "Label config contains non-unique names"
+            )
+    def load_task(self, task):
+        """Loads a task and substitutes the value in each object tag
+        with actual data from the task, returning a copy of the
+        LabelConfig object.
+        If the `value` field in an object tag is designed to take
+        variable input (i.e., `value_is_variable` is True), the
+        function replaces this value with the corresponding value from
+        the task dictionary.
+        Args:
+            task (dict): Dictionary representing the task, where
+            each key-value pair denotes an attribute-value of the
+            task.
+        Returns:
+            LabelInterface: A deep copy of the current LabelIntreface
+            instance with the object tags' value fields populated with
+            data from the task.
+        """
+        tree = copy.deepcopy(self)
+        for obj in tree.objects:
+            if obj.value_is_variable and obj.value_name in task:
+                obj.value = task.get(obj.value_name)
+        return tree
+    @property
+    def is_valid(self):
+        """ """
+        try:
+            self.validate()
+            return True
+        except LabelStudioValidationErrorSentryIgnored:
+            return False
+    def validate(self):
+        """Validates the provided configuration string against various validation criteria.
+        This method applies a series of validation checks to
+        `_config`, including schema validation, checking for
+        uniqueness of names used in the configuration, and the
+        "to_name" validation. It throws exceptions if any of these
+        validations fail.
+        Raises:
+            Exception: If any validation fails, specific to the type of validation.
+        """
+        config_string = self._config
+        self._schema_validation(config_string)
+        self._unique_names_validation(config_string)
+        self._to_name_validation(config_string)
+    @classmethod
+    def validate_with_data(cls, config):
+        """ """
+        raise NotImplemented()
+    def validate_task(self, task: "TaskValue", validate_regions_only=False):
+        """ """
+        # TODO this might not be always true, and we need to use
+        # "strict" param above to be able to configure
+        # for every object tag we've got that has value as it's
+        # variable we need to have an associated item in the task data
+        for obj in self.objects:
+            if obj.value_is_variable and task["data"].get(obj.value_name, None) is None:
+                return False
+        if "annotations" in task and not self.validate_annotation():
+            return False
+        if "predictions" in task and not self.validate_prediction():
+            return False
+        return True
+    def validate_annotation(self, annotation):
+        """Validates the given annotation against the current configuration.
+        This method applies the `validate_region` method to each
+        region in the annotation and returns False if any of these
+        validations fail. If all the regions pass the validation, it
+        returns True.
+        Args:
+            annotation (dict): The annotation to be validated, where
+            each key-value pair denotes an attribute-value of the
+            annotation.
+        Returns:
+            bool: True if all regions in the annotation pass the
+            validation, False otherwise.
+        """
+        return all(self.validate_region(r) for r in annotation.get(RESULT_KEY))
+    def validate_prediction(self, prediction):
+        """Same as validate_annotation right now"""
+        return all(self.validate_region(r) for r in prediction.get(RESULT_KEY))
+    def validate_region(self, region) -> bool:
+        """Validates a region from the annotation against the current
+        configuration.
+        The validation checks the following:
+        - Both control and object items are present in the labeling configuration.
+        - The type of the region matches the control tag name.
+        - The 'to_name' in the region data connects to the same tag as in the configuration.
+        - The actual value for example in <Labels /> tag is producing start, end, and labels.
+        If any of these validations fail, the function immediately
+        returns False. If all validations pass for a region, it
+        returns True.
+        Args:
+            region (dict): The region to be validated.
+        Returns:
+            bool: True if all checks pass for the region, False otherwise.
+        """
+        control = self.get_control(region["from_name"])
+        obj = self.get_object(region["to_name"])
+        # we should have both items present in the labeling config
+        if not control or not obj:
+            return False
+        # type of the region should match the tag name
+        if control.tag.lower() != region["type"]:
+            return False
+        # make sure that in config it connects to the same tag as
+        # immplied by the region data
+        if region["to_name"] not in control.to_name:
+            return False
+        # validate the actual value, for example that <Labels /> tag
+        # is producing start, end, and labels
+        if not control.validate_value(region["value"]):
+            return False
+        return True
+    ### Generation
+    def _sample_task(self, secure_mode=False):
+        """ """
+        # predefined_task, annotations, predictions = get_task_from_labeling_config(label_config)
+        generated_task = self.generate_sample_task(
+            mode="editor_preview", secure_mode=secure_mode
+        )
+        if self._sample_config_task is not None:
+            generated_task.update(self._sample_config_task)
+        return generated_task, self._sample_config_ann, self._sample_config_pred
+    def generate_sample_task(self, mode="upload", secure_mode=False):
+        """Generates a sample task based on the provided mode and
+        secure_mode.
+        This function generates an example value for each object in
+        `self.objects` using the specified `mode` and
+        `secure_mode`. The resulting task is a dictionary where each
+        key-value pair denotes an object's value-name and example
+        value.
+        Args:
+            mode (str, optional): The operation mode. Accepts any string but defaults to 'upload'.
+            secure_mode (bool, optional): The security mode. Defaults to False.
+        Returns:
+            dict: A dictionary representing the sample task.
+        """
+        task = {
+            obj.value_name: obj.generate_example_value(
+                mode=mode, secure_mode=secure_mode
+            )
+            for obj in self.objects
+        }
+        return task
+    def generate_sample_annotation(self):
+        """ """
+        raise NotImplemented()
+    #####
+    ##### COMPATIBILITY LAYER
+    #####
+    ##### This are re-implmenetation of functions found in different
+    ##### label_config.py files across the repo. Not all of this were
+    ##### tested, therefore I suggest to write a test first, and then
+    ##### replace where it's being used in the repo.
+    def config_essential_data_has_changed(self, new_config_str):
+        """Detect essential changes of the labeling config"""
+        new_obj = LabelInterface(config=new_config_str)
+        for new_tag_name, new_tag in new_obj._controls.items():
+            if new_tag_name not in self._controls:
+                return True
+            old_tag = self._controls[new_tag_name]
+            if new_tag.tag != old_tag.tag:
+                return True
+            if new_tag.objects != old_tag.objects:
+                return True
+            if not set(old_tag.labels).issubset(new_tag.labels):
+                return True
+        return False
+    def generate_sample_task_without_check(
+        label_config, mode="upload", secure_mode=False
+    ):
+        """ """
+        raise NotImplemented()
+    @classmethod
+    def get_task_from_labeling_config(cls, config):
+        """Get task, annotations and predictions from labeling config comment,
+        it must start from "<!-- {" and end as "} -->"
+        """
+        # try to get task data, annotations & predictions from config comment
+        task_data, annotations, predictions = {}, None, None
+        start = config.find("<!-- {")
+        start = start if start >= 0 else config.find("<!--{")
+        start += 4
+        end = config[start:].find("-->") if start >= 0 else -1
+        if 3 < start < start + end:
+            try:
+                # logger.debug('Parse ' + config[start : start + end])
+                body = json.loads(config[start : start + end])
+            except Exception:
+                # logger.error("Can't parse task from labeling config", exc_info=True)
+                pass
+            else:
+                # logger.debug(json.dumps(body, indent=2))
+                dont_use_root = "predictions" in body or "annotations" in body
+                task_data = (
+                    body["data"]
+                    if "data" in body
+                    else (None if dont_use_root else body)
+                )
+                predictions = body["predictions"] if "predictions" in body else None
+                annotations = body["annotations"] if "annotations" in body else None
+        return task_data, annotations, predictions
+    @classmethod
+    def config_line_stipped(self, c):
+        tree = etree.fromstring(c, forbid_dtd=False)
+        comments = tree.xpath("//comment()")
+        for c in comments:
+            p = c.getparent()
+            if p is not None:
+                p.remove(c)
+            c = etree.tostring(tree, method="html").decode("utf-8")
+        return c.replace("\n", "").replace("\r", "")
+    def get_all_control_tag_tuples(label_config):
+        """ """
+        return [tag.as_tuple() for tag in self.controls]
+    def get_first_tag_occurence(
+        self,
+        control_type: Union[str, Tuple],
+        object_type: Union[str, Tuple],
+        name_filter: Optional[Callable] = None,
+        to_name_filter: Optional[Callable] = None,
+    ) -> Tuple[str, str, str]:
+        """
+        Reads config and fetches the first control tag along with first object tag that matches the type.
+        Args:
+          control_type (str or tuple): The control type for checking tag matches.
+          object_type (str or tuple): The object type for checking tag matches.
+          name_filter (function, optional): If given, only tags with this name will be considered.
+                                           Default is None.
+          to_name_filter (function, optional): If given, only tags with this name will be considered.
+                                              Default is None.
+        Returns:
+          tuple: (from_name, to_name, value), representing control tag, object tag and input value.
+        """
+        for tag in self.controls:
+            if tag.match(control_type, name_filter_fn=name_filter):
+                for object_tag in tag.objects:
+                    if object_tag.match(object_type, to_name_filter_fn=to_name_filter):
+                        return tag.name, object_tag.name, object_tag.value_name
+        raise ValueError(
+            f"No control tag of type {control_type} and object tag of type {object_type} found in label config"
+        )
+    def get_all_labels(self):
+        """ """
+        dynamic_values = {c.name: True for c in self.controls if c.dynamic_value}
+        return self._labels, dynamic_values
+    def get_all_object_tag_names(self):
+        """ """
+        return self._objects.keys()
+    def extract_data_types(self):
+        """ """
+        return self._objects
+    def is_video_object_tracking(self):
+        """ """
+        match_fn = lambda tag: tag.tag.lower() in _VIDEO_TRACKING_TAGS
+        tags = self.find_tags(match_fn=match_fn)
+        return bool(tags)
+    def is_type(self, tag_type=None):
+        """ """
+        raise NotImplemented
+    # NOTE: you can use validate() instead
+    # def validate_label_config(self, config_string):
+    #     # xml and schema
+    #     self._schema_validation(config_string)
+    #     self._unique_names_validation(config_string)
+    #     self._to_name_validation(config_string)
+    def validate_config_using_summary(self, summary, strict=False):
+        """Validate current config using LS Project Summary"""
+        # this is a rewrite of project.validate_config function
+        # self.validate_label_config(config_string)
+        if not self._objects:
+            return False
+        created_labels = summary.created_labels
+        created_labels_drafts = summary.created_labels_drafts
+        annotations_summary = summary.created_annotations
+        self.validate_annotations_consistency(annotations_summary)
+        self.validate_lables_consistency(created_labels, created_labels_drafts)
+    def validate_lables_consistency(self, created_labels, created_labels_drafts):
+        """ """
+        # validate labels consistency
+        # labels_from_config, dynamic_values_tags = self.get_all_labels(config_string)
+        created_labels = merge_labels_counters(created_labels, created_labels_drafts)
+        # <Labels name="sentinement" ...><Label value="Negative" ... />
+        # {'sentiment': {'Negative': 1, 'Positive': 3, 'Neutral': 1}}
+        for control_tag_from_data, labels_from_data in created_labels.items():
+            # Check if labels created in annotations, and their control tag has been removed
+            control_from_config = self.get_control(control_tag_from_data)
+            if labels_from_data and not control_from_config:
+                raise LabelStudioValidationErrorSentryIgnored(
+                    f"There are {sum(labels_from_data.values(), 0)} annotation(s) created with tag "
+                    f'"{control_tag_from_data}", you can\'t remove it'
+                )
+            removed_labels = []
+            # Check that labels themselves were not removed
+            for label_name, label_value in labels_from_data.items():
+                if label_value > 0 and not control_from_config.labels_attrs.get(
+                    label_name, None
+                ):
+                    # that label was used in labeling before, but not
+                    # present in the current config
+                    removed_labels.append(label_name)
+            # TODO that needs to be added back
+            # if 'VideoRectangle' in tag_types:
+            #     for key in labels_from_config:
+            #         labels_from_config_by_tag |= set(labels_from_config[key])
+            # if 'Taxonomy' in tag_types:
+            #     custom_tags = Label.objects.filter(links__project=self).values_list('value', flat=True)
+            #     flat_custom_tags = set([item for sublist in custom_tags for item in sublist])
+            #     labels_from_config_by_tag |= flat_custom_tags
+            if len(removed_labels):
+                raise LabelStudioValidationErrorSentryIgnored(
+                    f'These labels still exist in annotations or drafts:\n{",".join(removed_labels)}'
+                    f'Please add labels to tag with name="{str(control_tag_from_data)}".'
+                )
+    def validate_annotations_consistency(self, annotations_summary):
+        """ """
+        # annotations_summary is coming from LS Project Summary, it's
+        # format is: { "chc|text|choices": 10 }
+        # which means that there are two tags, Choices, and one of
+        # object tags and there are 10 annotations
+        err = []
+        annotations_from_data = set(annotations_summary)
+        for ann in annotations_from_data:
+            from_name, to_name, tag_type = ann.split("|")
+            # avoid textarea to_name check (see DEV-1598)
+            if tag_type.lower() == "textarea":
+                continue
+            try:
+                control = self.get_control(from_name)
+                if not control or not control.get_object(to_name):
+                    err.append(
+                        f"with from_name={from_name}, to_name={to_name}, type={tag_type}"
+                    )
+            except Exception as ex:
+                err.append(
+                    f"Error occurred while processing from_name={from_name}, to_name={to_name}, type={tag_type}, error: {str(ex)}"
+                )
+            # control = self.get_control(from_name)
+            # if not control or not control.get_object(to_name):
+            #     err.append(f'with from_name={from_name}, to_name={to_name}, type={tag_type}')
+        if err:
+            diff_str = "\n".join(err)
+            raise LabelStudioValidationErrorSentryIgnored(
+                f"Created annotations are incompatible with provided labeling schema, we found:\n{diff_str}"
+            )

label-studio-sdk 0.0.32__py3-none-any.whl → 0.0.34__py3-none-any.whl

Potentially problematic release.

label-studio-sdk 0.0.32py3-none-any.whl → 0.0.34py3-none-any.whl