PyPI - dtlpy - Versions diffs - 1.115.44__py3-none-any.whl → 1.116.6__py3-none-any.whl - Mend

dtlpy 1.115.44__py3-none-any.whl → 1.116.6__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (238)

dtlpy/__init__.py +491 -491
dtlpy/__version__.py +1 -1
dtlpy/assets/__init__.py +26 -26
dtlpy/assets/code_server/config.yaml +2 -2
dtlpy/assets/code_server/installation.sh +24 -24
dtlpy/assets/code_server/launch.json +13 -13
dtlpy/assets/code_server/settings.json +2 -2
dtlpy/assets/main.py +53 -53
dtlpy/assets/main_partial.py +18 -18
dtlpy/assets/mock.json +11 -11
dtlpy/assets/model_adapter.py +83 -83
dtlpy/assets/package.json +61 -61
dtlpy/assets/package_catalog.json +29 -29
dtlpy/assets/package_gitignore +307 -307
dtlpy/assets/service_runners/__init__.py +33 -33
dtlpy/assets/service_runners/converter.py +96 -96
dtlpy/assets/service_runners/multi_method.py +49 -49
dtlpy/assets/service_runners/multi_method_annotation.py +54 -54
dtlpy/assets/service_runners/multi_method_dataset.py +55 -55
dtlpy/assets/service_runners/multi_method_item.py +52 -52
dtlpy/assets/service_runners/multi_method_json.py +52 -52
dtlpy/assets/service_runners/single_method.py +37 -37
dtlpy/assets/service_runners/single_method_annotation.py +43 -43
dtlpy/assets/service_runners/single_method_dataset.py +43 -43
dtlpy/assets/service_runners/single_method_item.py +41 -41
dtlpy/assets/service_runners/single_method_json.py +42 -42
dtlpy/assets/service_runners/single_method_multi_input.py +45 -45
dtlpy/assets/voc_annotation_template.xml +23 -23
dtlpy/caches/base_cache.py +32 -32
dtlpy/caches/cache.py +473 -473
dtlpy/caches/dl_cache.py +201 -201
dtlpy/caches/filesystem_cache.py +89 -89
dtlpy/caches/redis_cache.py +84 -84
dtlpy/dlp/__init__.py +20 -20
dtlpy/dlp/cli_utilities.py +367 -367
dtlpy/dlp/command_executor.py +764 -764
dtlpy/dlp/dlp +1 -1
dtlpy/dlp/dlp.bat +1 -1
dtlpy/dlp/dlp.py +128 -128
dtlpy/dlp/parser.py +651 -651
dtlpy/entities/__init__.py +83 -83
dtlpy/entities/analytic.py +347 -347
dtlpy/entities/annotation.py +1879 -1879
dtlpy/entities/annotation_collection.py +699 -699
dtlpy/entities/annotation_definitions/__init__.py +20 -20
dtlpy/entities/annotation_definitions/base_annotation_definition.py +100 -100
dtlpy/entities/annotation_definitions/box.py +195 -195
dtlpy/entities/annotation_definitions/classification.py +67 -67
dtlpy/entities/annotation_definitions/comparison.py +72 -72
dtlpy/entities/annotation_definitions/cube.py +204 -204
dtlpy/entities/annotation_definitions/cube_3d.py +149 -149
dtlpy/entities/annotation_definitions/description.py +32 -32
dtlpy/entities/annotation_definitions/ellipse.py +124 -124
dtlpy/entities/annotation_definitions/free_text.py +62 -62
dtlpy/entities/annotation_definitions/gis.py +69 -69
dtlpy/entities/annotation_definitions/note.py +139 -139
dtlpy/entities/annotation_definitions/point.py +117 -117
dtlpy/entities/annotation_definitions/polygon.py +182 -182
dtlpy/entities/annotation_definitions/polyline.py +111 -111
dtlpy/entities/annotation_definitions/pose.py +92 -92
dtlpy/entities/annotation_definitions/ref_image.py +86 -86
dtlpy/entities/annotation_definitions/segmentation.py +240 -240
dtlpy/entities/annotation_definitions/subtitle.py +34 -34
dtlpy/entities/annotation_definitions/text.py +85 -85
dtlpy/entities/annotation_definitions/undefined_annotation.py +74 -74
dtlpy/entities/app.py +220 -220
dtlpy/entities/app_module.py +107 -107
dtlpy/entities/artifact.py +174 -174
dtlpy/entities/assignment.py +399 -399
dtlpy/entities/base_entity.py +214 -214
dtlpy/entities/bot.py +113 -113
dtlpy/entities/codebase.py +292 -292
dtlpy/entities/collection.py +38 -38
dtlpy/entities/command.py +169 -169
dtlpy/entities/compute.py +449 -449
dtlpy/entities/dataset.py +1299 -1299
dtlpy/entities/directory_tree.py +44 -44
dtlpy/entities/dpk.py +470 -470
dtlpy/entities/driver.py +235 -235
dtlpy/entities/execution.py +397 -397
dtlpy/entities/feature.py +124 -124
dtlpy/entities/feature_set.py +145 -145
dtlpy/entities/filters.py +798 -798
dtlpy/entities/gis_item.py +107 -107
dtlpy/entities/integration.py +184 -184
dtlpy/entities/item.py +959 -959
dtlpy/entities/label.py +123 -123
dtlpy/entities/links.py +85 -85
dtlpy/entities/message.py +175 -175
dtlpy/entities/model.py +684 -684
dtlpy/entities/node.py +1005 -1005
dtlpy/entities/ontology.py +810 -803
dtlpy/entities/organization.py +287 -287
dtlpy/entities/package.py +657 -657
dtlpy/entities/package_defaults.py +5 -5
dtlpy/entities/package_function.py +185 -185
dtlpy/entities/package_module.py +113 -113
dtlpy/entities/package_slot.py +118 -118
dtlpy/entities/paged_entities.py +299 -299
dtlpy/entities/pipeline.py +624 -624
dtlpy/entities/pipeline_execution.py +279 -279
dtlpy/entities/project.py +394 -394
dtlpy/entities/prompt_item.py +505 -505
dtlpy/entities/recipe.py +301 -301
dtlpy/entities/reflect_dict.py +102 -102
dtlpy/entities/resource_execution.py +138 -138
dtlpy/entities/service.py +963 -963
dtlpy/entities/service_driver.py +117 -117
dtlpy/entities/setting.py +294 -294
dtlpy/entities/task.py +495 -495
dtlpy/entities/time_series.py +143 -143
dtlpy/entities/trigger.py +426 -426
dtlpy/entities/user.py +118 -118
dtlpy/entities/webhook.py +124 -124
dtlpy/examples/__init__.py +19 -19
dtlpy/examples/add_labels.py +135 -135
dtlpy/examples/add_metadata_to_item.py +21 -21
dtlpy/examples/annotate_items_using_model.py +65 -65
dtlpy/examples/annotate_video_using_model_and_tracker.py +75 -75
dtlpy/examples/annotations_convert_to_voc.py +9 -9
dtlpy/examples/annotations_convert_to_yolo.py +9 -9
dtlpy/examples/convert_annotation_types.py +51 -51
dtlpy/examples/converter.py +143 -143
dtlpy/examples/copy_annotations.py +22 -22
dtlpy/examples/copy_folder.py +31 -31
dtlpy/examples/create_annotations.py +51 -51
dtlpy/examples/create_video_annotations.py +83 -83
dtlpy/examples/delete_annotations.py +26 -26
dtlpy/examples/filters.py +113 -113
dtlpy/examples/move_item.py +23 -23
dtlpy/examples/play_video_annotation.py +13 -13
dtlpy/examples/show_item_and_mask.py +53 -53
dtlpy/examples/triggers.py +49 -49
dtlpy/examples/upload_batch_of_items.py +20 -20
dtlpy/examples/upload_items_and_custom_format_annotations.py +55 -55
dtlpy/examples/upload_items_with_modalities.py +43 -43
dtlpy/examples/upload_segmentation_annotations_from_mask_image.py +44 -44
dtlpy/examples/upload_yolo_format_annotations.py +70 -70
dtlpy/exceptions.py +125 -125
dtlpy/miscellaneous/__init__.py +20 -20
dtlpy/miscellaneous/dict_differ.py +95 -95
dtlpy/miscellaneous/git_utils.py +217 -217
dtlpy/miscellaneous/json_utils.py +14 -14
dtlpy/miscellaneous/list_print.py +105 -105
dtlpy/miscellaneous/zipping.py +130 -130
dtlpy/ml/__init__.py +20 -20
dtlpy/ml/base_feature_extractor_adapter.py +27 -27
dtlpy/ml/base_model_adapter.py +1257 -1230
dtlpy/ml/metrics.py +461 -461
dtlpy/ml/predictions_utils.py +274 -274
dtlpy/ml/summary_writer.py +57 -57
dtlpy/ml/train_utils.py +60 -60
dtlpy/new_instance.py +252 -252
dtlpy/repositories/__init__.py +56 -56
dtlpy/repositories/analytics.py +85 -85
dtlpy/repositories/annotations.py +916 -916
dtlpy/repositories/apps.py +383 -383
dtlpy/repositories/artifacts.py +452 -452
dtlpy/repositories/assignments.py +599 -599
dtlpy/repositories/bots.py +213 -213
dtlpy/repositories/codebases.py +559 -559
dtlpy/repositories/collections.py +332 -332
dtlpy/repositories/commands.py +152 -152
dtlpy/repositories/compositions.py +61 -61
dtlpy/repositories/computes.py +439 -439
dtlpy/repositories/datasets.py +1504 -1504
dtlpy/repositories/downloader.py +976 -923
dtlpy/repositories/dpks.py +433 -433
dtlpy/repositories/drivers.py +482 -482
dtlpy/repositories/executions.py +815 -815
dtlpy/repositories/feature_sets.py +226 -226
dtlpy/repositories/features.py +255 -255
dtlpy/repositories/integrations.py +484 -484
dtlpy/repositories/items.py +912 -912
dtlpy/repositories/messages.py +94 -94
dtlpy/repositories/models.py +1000 -1000
dtlpy/repositories/nodes.py +80 -80
dtlpy/repositories/ontologies.py +511 -511
dtlpy/repositories/organizations.py +525 -525
dtlpy/repositories/packages.py +1941 -1941
dtlpy/repositories/pipeline_executions.py +451 -451
dtlpy/repositories/pipelines.py +640 -640
dtlpy/repositories/projects.py +539 -539
dtlpy/repositories/recipes.py +419 -399
dtlpy/repositories/resource_executions.py +137 -137
dtlpy/repositories/schema.py +120 -120
dtlpy/repositories/service_drivers.py +213 -213
dtlpy/repositories/services.py +1704 -1704
dtlpy/repositories/settings.py +339 -339
dtlpy/repositories/tasks.py +1477 -1477
dtlpy/repositories/times_series.py +278 -278
dtlpy/repositories/triggers.py +536 -536
dtlpy/repositories/upload_element.py +257 -257
dtlpy/repositories/uploader.py +661 -661
dtlpy/repositories/webhooks.py +249 -249
dtlpy/services/__init__.py +22 -22
dtlpy/services/aihttp_retry.py +131 -131
dtlpy/services/api_client.py +1785 -1785
dtlpy/services/api_reference.py +40 -40
dtlpy/services/async_utils.py +133 -133
dtlpy/services/calls_counter.py +44 -44
dtlpy/services/check_sdk.py +68 -68
dtlpy/services/cookie.py +115 -115
dtlpy/services/create_logger.py +156 -156
dtlpy/services/events.py +84 -84
dtlpy/services/logins.py +235 -235
dtlpy/services/reporter.py +256 -256
dtlpy/services/service_defaults.py +91 -91
dtlpy/utilities/__init__.py +20 -20
dtlpy/utilities/annotations/__init__.py +16 -16
dtlpy/utilities/annotations/annotation_converters.py +269 -269
dtlpy/utilities/base_package_runner.py +285 -264
dtlpy/utilities/converter.py +1650 -1650
dtlpy/utilities/dataset_generators/__init__.py +1 -1
dtlpy/utilities/dataset_generators/dataset_generator.py +670 -670
dtlpy/utilities/dataset_generators/dataset_generator_tensorflow.py +23 -23
dtlpy/utilities/dataset_generators/dataset_generator_torch.py +21 -21
dtlpy/utilities/local_development/__init__.py +1 -1
dtlpy/utilities/local_development/local_session.py +179 -179
dtlpy/utilities/reports/__init__.py +2 -2
dtlpy/utilities/reports/figures.py +343 -343
dtlpy/utilities/reports/report.py +71 -71
dtlpy/utilities/videos/__init__.py +17 -17
dtlpy/utilities/videos/video_player.py +598 -598
dtlpy/utilities/videos/videos.py +470 -470
{dtlpy-1.115.44.data → dtlpy-1.116.6.data}/scripts/dlp +1 -1
dtlpy-1.116.6.data/scripts/dlp.bat +2 -0
{dtlpy-1.115.44.data → dtlpy-1.116.6.data}/scripts/dlp.py +128 -128
{dtlpy-1.115.44.dist-info → dtlpy-1.116.6.dist-info}/METADATA +186 -186
dtlpy-1.116.6.dist-info/RECORD +239 -0
{dtlpy-1.115.44.dist-info → dtlpy-1.116.6.dist-info}/WHEEL +1 -1
{dtlpy-1.115.44.dist-info → dtlpy-1.116.6.dist-info}/licenses/LICENSE +200 -200
tests/features/environment.py +551 -551
dtlpy/assets/__pycache__/__init__.cpython-310.pyc +0 -0
dtlpy-1.115.44.data/scripts/dlp.bat +0 -2
dtlpy-1.115.44.dist-info/RECORD +0 -240
{dtlpy-1.115.44.dist-info → dtlpy-1.116.6.dist-info}/entry_points.txt +0 -0
{dtlpy-1.115.44.dist-info → dtlpy-1.116.6.dist-info}/top_level.txt +0 -0

dtlpy/entities/prompt_item.py CHANGED Viewed

@@ -1,506 +1,506 @@
-import requests
-import logging
-import base64
-import enum
-import json
-import io
-import os
-from typing import List, Optional
-from concurrent.futures import ThreadPoolExecutor
-from .. import entities, repositories
-from dtlpy.services.api_client import client as client_api
-logger = logging.getLogger(name='dtlpy')
-class PromptType(str, enum.Enum):
-    TEXT = 'application/text'
-    IMAGE = 'image/*'
-    AUDIO = 'audio/*'
-    VIDEO = 'video/*'
-    METADATA = 'metadata'
-class Prompt:
-    def __init__(self, key, role='user'):
-        """
-        Create a single Prompt. Prompt can contain multiple mimetype elements, e.g. text sentence and an image.
-        :param key: unique identifier of the prompt in the item
-        """
-        self.key = key
-        self.elements = list()
-        # to avoid broken stream of json files - DAT-75653
-        client_api.default_headers['x-dl-sanitize'] = '0'
-        self._items = repositories.Items(client_api=client_api)
-        self.metadata = {'role': role}
-    def add_element(self, value, mimetype='application/text'):
-        """
-        :param value: url or string of the input
-        :param mimetype: mimetype of the input. options: `text`, `image/*`, `video/*`, `audio/*`
-        :return:
-        """
-        allowed_prompt_types = [prompt_type for prompt_type in PromptType]
-        if mimetype not in allowed_prompt_types:
-            raise ValueError(f'Invalid mimetype: {mimetype}. Allowed values: {allowed_prompt_types}')
-        if mimetype == PromptType.METADATA and isinstance(value, dict):
-            self.metadata.update(value)
-        else:
-            self.elements.append({'mimetype': mimetype,
-                                  'value': value})
-    def to_json(self):
-        """
-        Convert Prompt entity to the item json
-        :return:
-        """
-        elements_json = [
-            {
-                "mimetype": e['mimetype'],
-                "value": e['value'],
-            } for e in self.elements if not e['mimetype'] == PromptType.METADATA
-        ]
-        elements_json.append({
-            "mimetype": PromptType.METADATA,
-            "value": self.metadata
-        })
-        return {
-            self.key: elements_json
-        }
-    def _convert_stream_to_binary(self, image_url: str):
-        """
-        Convert a stream to binary
-        :param image_url: dataloop image stream url
-        :return: binary object
-        """
-        image_buffer = None
-        if '.' in image_url and 'dataloop.ai' not in image_url:
-            # URL and not DL item stream
-            try:
-                response = requests.get(image_url, stream=True)
-                response.raise_for_status()  # Raise an exception for bad status codes
-                # Check for valid image content type
-                if response.headers["Content-Type"].startswith("image/"):
-                    # Read the image data in chunks to avoid loading large images in memory
-                    image_buffer = b"".join(chunk for chunk in response.iter_content(1024))
-            except requests.exceptions.RequestException as e:
-                logger.error(f"Failed to download image from URL: {image_url}, error: {e}")
-        elif '.' in image_url and 'stream' in image_url:
-            # DL Stream URL
-            item_id = image_url.split("/stream")[0].split("/items/")[-1]
-            image_buffer = self._items.get(item_id=item_id).download(save_locally=False).getvalue()
-        else:
-            # DL item ID
-            image_buffer = self._items.get(item_id=image_url).download(save_locally=False).getvalue()
-        if image_buffer is not None:
-            encoded_image = base64.b64encode(image_buffer).decode()
-        else:
-            logger.error(f'Invalid image url: {image_url}')
-            return None
-        return f'data:image/jpeg;base64,{encoded_image}'
-    def messages(self):
-        """
-        return a list of messages in the prompt item,
-        messages are returned following the openai SDK format https://platform.openai.com/docs/guides/vision
-        """
-        messages = []
-        for element in self.elements:
-            if element['mimetype'] == PromptType.TEXT:
-                data = {
-                    "type": "text",
-                    "text": element['value']
-                }
-                messages.append(data)
-            elif element['mimetype'] == PromptType.IMAGE:
-                image_url = self._convert_stream_to_binary(element['value'])
-                data = {
-                    "type": "image_url",
-                    "image_url": {
-                        "url": image_url
-                    }
-                }
-                messages.append(data)
-            elif element['mimetype'] == PromptType.AUDIO:
-                raise NotImplementedError('Audio prompt is not supported yet')
-            elif element['mimetype'] == PromptType.VIDEO:
-                data = {
-                    "type": "video_url",
-                    "video_url": {
-                        "url": element['value']
-                    }
-                }
-                messages.append(data)
-            else:
-                raise ValueError(f'Invalid mimetype: {element["mimetype"]}')
-        return messages, self.key
-class PromptItem:
-    def __init__(self, name, item: entities.Item = None, role_mapping=None):
-        if role_mapping is None:
-            role_mapping = {'user': 'item',
-                            'assistant': 'annotation'}
-        if not isinstance(role_mapping, dict):
-            raise ValueError(f'input role_mapping must be dict. type: {type(role_mapping)}')
-        self.role_mapping = role_mapping
-        # prompt item name
-        self.name = name
-        # list of user prompts in the prompt item
-        self.prompts = list()
-        self.assistant_prompts = list()
-        # list of assistant (annotations) prompts in the prompt item
-        # Dataloop Item
-        self._item: entities.Item = item
-        self._messages = []
-        self._annotations: entities.AnnotationCollection = None
-        if item is not None:
-            if 'json' not in item.mimetype or item.system.get('shebang', dict()).get('dltype') != 'prompt':
-                raise ValueError('Expecting a json item with system.shebang.dltype = prompt')
-            self._items = item.items
-            self.fetch()
-        else:
-            self._items = repositories.Items(client_api=client_api)
-        # to avoid broken stream of json files - DAT-75653
-        self._items._client_api.default_headers['x-dl-sanitize'] = '0'
-    @classmethod
-    def from_messages(cls, messages: list):
-        ...
-    @classmethod
-    def from_item(cls, item: entities.Item):
-        """
-        Load a prompt item from the platform
-        :param item : Item object
-        :return: PromptItem object
-        """
-        if 'json' not in item.mimetype or item.system.get('shebang', dict()).get('dltype') != 'prompt':
-            raise ValueError('Expecting a json item with system.shebang.dltype = prompt')
-        return cls(name=item.name, item=item)
-    @classmethod
-    def from_local_file(cls, filepath):
-        """
-        Create a new prompt item from a file
-        :param filepath: path to the file
-        :return: PromptItem object
-        """
-        if os.path.exists(filepath) is False:
-            raise FileNotFoundError(f'File does not exists: {filepath}')
-        if 'json' not in os.path.splitext(filepath)[-1]:
-            raise ValueError(f'Expected path to json item, got {os.path.splitext(filepath)[-1]}')
-        prompt_item = cls(name=filepath)
-        with open(filepath, 'r', encoding='utf-8') as f:
-            data = json.load(f)
-        prompt_item.prompts = prompt_item._load_item_prompts(data=data)
-        return prompt_item
-    @staticmethod
-    def _load_item_prompts(data):
-        prompts = list()
-        for prompt_key, prompt_elements in data.get('prompts', dict()).items():
-            content = list()
-            for element in prompt_elements:
-                content.append({'value': element.get('value', dict()),
-                                'mimetype': element['mimetype']})
-            prompt = Prompt(key=prompt_key, role="user")
-            for element in content:
-                prompt.add_element(value=element.get('value', ''),
-                                   mimetype=element.get('mimetype', PromptType.TEXT))
-            prompts.append(prompt)
-        return prompts
-    @staticmethod
-    def _load_annotations_prompts(annotations: entities.AnnotationCollection):
-        """
-        Get all the annotations in the item for the assistant messages
-        """
-        # clearing the assistant prompts from previous annotations that might not belong
-        assistant_prompts = list()
-        for annotation in annotations:
-            prompt_id = annotation.metadata.get('system', dict()).get('promptId', None)
-            model_info = annotation.metadata.get('user', dict()).get('model', dict())
-            annotation_id = annotation.id
-            if annotation.type == 'ref_image':
-                prompt = Prompt(key=prompt_id, role='assistant')
-                prompt.add_element(value=annotation.annotation_definition.coordinates.get('ref'),
-                                   mimetype=PromptType.IMAGE)
-            elif annotation.type == 'text':
-                prompt = Prompt(key=prompt_id, role='assistant')
-                prompt.add_element(value=annotation.annotation_definition.coordinates,
-                                   mimetype=PromptType.TEXT)
-            else:
-                raise ValueError(f"Unsupported annotation type: {annotation.type}")
-            prompt.add_element(value={'id': annotation_id,
-                                      'model_info': model_info},
-                               mimetype=PromptType.METADATA)
-            assistant_prompts.append(prompt)
-        return assistant_prompts
-    def to_json(self):
-        """
-        Convert the entity to a platform item.
-        :return:
-        """
-        prompts_json = {
-            "shebang": "dataloop",
-            "metadata": {
-                "dltype": 'prompt'
-            },
-            "prompts": {}
-        }
-        for prompt in self.prompts:
-            for prompt_key, prompt_values in prompt.to_json().items():
-                prompts_json["prompts"][prompt_key] = prompt_values
-        return prompts_json
-    def to_messages(self, model_name=None, include_assistant=True):
-        all_prompts_messages = dict()
-        for prompt in self.prompts:
-            if prompt.key not in all_prompts_messages:
-                all_prompts_messages[prompt.key] = list()
-            prompt_messages, prompt_key = prompt.messages()
-            messages = {
-                'role': prompt.metadata.get('role', 'user'),
-                'content': prompt_messages
-            }
-            all_prompts_messages[prompt.key].append(messages)
-        if include_assistant is True:
-            # reload to filer model annotations
-            for prompt in self.assistant_prompts:
-                prompt_model_name = prompt.metadata.get('model_info', dict()).get('name')
-                if model_name is not None and prompt_model_name != model_name:
-                    continue
-                if prompt.key not in all_prompts_messages:
-                    logger.warning(
-                        f'Prompt key {prompt.key} is not found in the user prompts, skipping Assistant prompt')
-                    continue
-                prompt_messages, prompt_key = prompt.messages()
-                assistant_messages = {
-                    'role': 'assistant',
-                    'content': prompt_messages
-                }
-                all_prompts_messages[prompt.key].append(assistant_messages)
-        res = list()
-        for prompts in all_prompts_messages.values():
-            for prompt in prompts:
-                res.append(prompt)
-        self._messages = res
-        return self._messages
-    def to_bytes_io(self):
-        # Used for item upload, do not delete
-        byte_io = io.BytesIO()
-        byte_io.name = self.name
-        byte_io.write(json.dumps(self.to_json()).encode())
-        byte_io.seek(0)
-        return byte_io
-    def fetch(self):
-        if self._item is None:
-            raise ValueError('Missing item, nothing to fetch..')
-        self._item = self._items.get(item_id=self._item.id)
-        self._annotations = self._item.annotations.list()
-        self.prompts = self._load_item_prompts(data=json.load(self._item.download(save_locally=False)))
-        self.assistant_prompts = self._load_annotations_prompts(self._annotations)
-    def build_context(self, nearest_items, add_metadata=None) -> str:
-        """
-        Create a context stream from nearest items list.
-        add_metadata is a list of location in the item.metadata to add to the context, for instance ['system.document.source']
-        :param nearest_items: list of item ids
-        :param add_metadata: list of metadata location to add metadata to context
-        :return:
-        """
-        if add_metadata is None:
-            add_metadata = list()
-        def stream_single(w_id):
-            context_item = self._items.get(item_id=w_id)
-            buf = context_item.download(save_locally=False)
-            text = buf.read().decode(encoding='utf-8')
-            m = ""
-            for path in add_metadata:
-                parts = path.split('.')
-                value = context_item.metadata
-                part = ""
-                for part in parts:
-                    if isinstance(value, dict):
-                        value = value.get(part)
-                    else:
-                        value = ""
-                m += f"{part}:{value}\n"
-            return text, m
-        pool = ThreadPoolExecutor(max_workers=32)
-        context = ""
-        if len(nearest_items) > 0:
-            # build context
-            results = pool.map(stream_single, nearest_items)
-            for res in results:
-                context += f"\n<source>\n{res[1]}\n</source>\n<text>\n{res[0]}\n</text>"
-        return context
-    def add(self,
-            message: dict,
-            prompt_key: str = None,
-            model_info: dict = None):
-        """
-        add a prompt to the prompt item
-        prompt: a dictionary. keys are prompt message id, values are prompt messages
-        responses: a list of annotations representing responses to the prompt
-        :param message:
-        :param prompt_key:
-        :param model_info:
-        :return:
-        """
-        role = message.get('role', 'user')
-        content = message.get('content', list())
-        if self.role_mapping.get(role, 'item') == 'item':
-            if prompt_key is None:
-                prompt_key = str(len(self.prompts) + 1)
-            # for new prompt we need a new key
-            prompt = Prompt(key=prompt_key, role=role)
-            for element in content:
-                prompt.add_element(value=element.get('value', ''),
-                                   mimetype=element.get('mimetype', PromptType.TEXT))
-            # create new prompt and add to prompts
-            self.prompts.append(prompt)
-            if self._item is not None:
-                self._item._Item__update_item_binary(_json=self.to_json())
-        else:
-            if prompt_key is None:
-                prompt_key = str(len(self.prompts))
-            assistant_message = content[0]
-            assistant_mimetype = assistant_message.get('mimetype', PromptType.TEXT)
-            uploaded_annotation = None
-            # find if prompt
-            if model_info is None:
-                # dont search for existing if there's no model information
-                existing_prompt = None
-            else:
-                existing_prompts = list()
-                for prompt in self.assistant_prompts:
-                    prompt_id = prompt.key
-                    model_name = prompt.metadata.get('model_info', dict()).get('name')
-                    if prompt_id == prompt_key and model_name == model_info.get('name'):
-                        # TODO how to handle multiple annotations
-                        existing_prompts.append(prompt)
-                if len(existing_prompts) > 1:
-                    assert False, "shouldn't be here! more than 1 annotation for a single model"
-                elif len(existing_prompts) == 1:
-                    # found model annotation to upload
-                    existing_prompt = existing_prompts[0]
-                else:
-                    # no annotation found
-                    existing_prompt = None
-            if existing_prompt is None:
-                prompt = Prompt(key=prompt_key)
-                if assistant_mimetype == PromptType.TEXT:
-                    annotation_definition = entities.FreeText(text=assistant_message.get('value'))
-                    prompt.add_element(value=annotation_definition.to_coordinates(None),
-                                       mimetype=PromptType.TEXT)
-                elif assistant_mimetype == PromptType.IMAGE:
-                    annotation_definition = entities.RefImage(ref=assistant_message.get('value'))
-                    prompt.add_element(value=annotation_definition.to_coordinates(None).get('ref'),
-                                       mimetype=PromptType.IMAGE)
-                else:
-                    raise NotImplementedError('Only images of mimetype image and text are supported')
-                metadata = {'system': {'promptId': prompt_key},
-                            'user': {'model': model_info}}
-                prompt.add_element(mimetype=PromptType.METADATA,
-                                   value={"model_info": model_info})
-                existing_annotation = entities.Annotation.new(item=self._item,
-                                                              metadata=metadata,
-                                                              annotation_definition=annotation_definition)
-                uploaded_annotation = existing_annotation.upload()
-                prompt.add_element(mimetype=PromptType.METADATA,
-                                   value={"id": uploaded_annotation.id})
-                existing_prompt = prompt
-                self.assistant_prompts.append(prompt)
-            existing_prompt_element = [element for element in existing_prompt.elements if
-                                       element['mimetype'] != PromptType.METADATA][-1]
-            existing_prompt_element['value'] = assistant_message.get('value')
-            if uploaded_annotation is None:
-                # Creating annotation with old dict to match platform dict
-                annotation_definition = entities.FreeText(text='')
-                metadata = {'system': {'promptId': prompt_key},
-                            'user': {'model': existing_prompt.metadata.get('model_info')}}
-                annotation = entities.Annotation.new(item=self._item,
-                                                     metadata=metadata,
-                                                     annotation_definition=annotation_definition
-                                                     )
-                annotation.id = existing_prompt.metadata['id']
-                # set the platform dict to match the old annotation for the dict difference check, otherwise it won't
-                # update
-                annotation._platform_dict = annotation.to_json()
-                # update the annotation with the new text
-                annotation.annotation_definition.text = existing_prompt_element['value']
-                self._item.annotations.update(annotation)
-    def update(self):
-        """
-        Update the prompt item in the platform.
-        """
-        if self._item is not None:
-            self._item._Item__update_item_binary(_json=self.to_json())
-            self._item = self._item.update()
-        else:
-            raise ValueError('Cannot update PromptItem without an item.')
-    # Properties
-    @property
-    def item(self) -> Optional['entities.Item']:
-        """
-        Get the underlying Item object.
-        :return: The Item object associated with this PromptItem, or None.
-        :rtype: Optional[dtlpy.entities.Item]
-        """
-        return self._item
-    @item.setter
-    def item(self, item: Optional['entities.Item']):
-        """
-        Set the underlying Item object.
-        :param item: The Item object to associate with this PromptItem, or None.
-        :type item: Optional[dtlpy.entities.Item]
-        """
-        if item is not None and not isinstance(item, entities.Item):
-            raise ValueError(f"Expected dtlpy.entities.Item or None, got {type(item)}")
-        self._item = item
-    @property
-    def metadata(self) -> dict:
-        """
-        Get the metadata from the underlying Item object.
-        :return: Metadata dictionary from the item, or empty dict if no item exists.
-        :rtype: dict
-        """
-        if self._item is not None:
-            return self._item.metadata
-        else:
+import requests
+import logging
+import base64
+import enum
+import json
+import io
+import os
+from typing import List, Optional
+from concurrent.futures import ThreadPoolExecutor
+from .. import entities, repositories
+from dtlpy.services.api_client import client as client_api
+logger = logging.getLogger(name='dtlpy')
+class PromptType(str, enum.Enum):
+    """
+    Mimetype tags that a prompt element can carry.
+    Members also subclass str, so a member compares equal to its plain string value.
+    """
+    TEXT = 'application/text'
+    IMAGE = 'image/*'
+    AUDIO = 'audio/*'
+    VIDEO = 'video/*'
+    # not a stored element type: Prompt.add_element merges a dict tagged with it into Prompt.metadata
+    METADATA = 'metadata'
+class Prompt:
+    def __init__(self, key, role='user'):
+        """
+        Create a single Prompt. Prompt can contain multiple mimetype elements, e.g. text sentence and an image.
+        :param key: unique identifier of the prompt in the item
+        """
+        self.key = key
+        self.elements = list()
+        # to avoid broken stream of json files - DAT-75653
+        client_api.default_headers['x-dl-sanitize'] = '0'
+        self._items = repositories.Items(client_api=client_api)
+        self.metadata = {'role': role}
+    def add_element(self, value, mimetype='application/text'):
+        """
+        :param value: url or string of the input
+        :param mimetype: mimetype of the input. options: `text`, `image/*`, `video/*`, `audio/*`
+        :return:
+        """
+        allowed_prompt_types = [prompt_type for prompt_type in PromptType]
+        if mimetype not in allowed_prompt_types:
+            raise ValueError(f'Invalid mimetype: {mimetype}. Allowed values: {allowed_prompt_types}')
+        if mimetype == PromptType.METADATA and isinstance(value, dict):
+            self.metadata.update(value)
+        else:
+            self.elements.append({'mimetype': mimetype,
+                                  'value': value})
+    def to_json(self):
+        """
+        Convert Prompt entity to the item json
+        :return:
+        """
+        elements_json = [
+            {
+                "mimetype": e['mimetype'],
+                "value": e['value'],
+            } for e in self.elements if not e['mimetype'] == PromptType.METADATA
+        ]
+        elements_json.append({
+            "mimetype": PromptType.METADATA,
+            "value": self.metadata
+        })
+        return {
+            self.key: elements_json
+        }
+    def _convert_stream_to_binary(self, image_url: str):
+        """
+        Convert a stream to binary
+        :param image_url: dataloop image stream url
+        :return: binary object
+        """
+        image_buffer = None
+        if '.' in image_url and 'dataloop.ai' not in image_url:
+            # URL and not DL item stream
+            try:
+                response = requests.get(image_url, stream=True)
+                response.raise_for_status()  # Raise an exception for bad status codes
+                # Check for valid image content type
+                if response.headers["Content-Type"].startswith("image/"):
+                    # Read the image data in chunks to avoid loading large images in memory
+                    image_buffer = b"".join(chunk for chunk in response.iter_content(1024))
+            except requests.exceptions.RequestException as e:
+                logger.error(f"Failed to download image from URL: {image_url}, error: {e}")
+        elif '.' in image_url and 'stream' in image_url:
+            # DL Stream URL
+            item_id = image_url.split("/stream")[0].split("/items/")[-1]
+            image_buffer = self._items.get(item_id=item_id).download(save_locally=False).getvalue()
+        else:
+            # DL item ID
+            image_buffer = self._items.get(item_id=image_url).download(save_locally=False).getvalue()
+        if image_buffer is not None:
+            encoded_image = base64.b64encode(image_buffer).decode()
+        else:
+            logger.error(f'Invalid image url: {image_url}')
+            return None
+        return f'data:image/jpeg;base64,{encoded_image}'
+    def messages(self):
+        """
+        return a list of messages in the prompt item,
+        messages are returned following the openai SDK format https://platform.openai.com/docs/guides/vision
+        """
+        messages = []
+        for element in self.elements:
+            if element['mimetype'] == PromptType.TEXT:
+                data = {
+                    "type": "text",
+                    "text": element['value']
+                }
+                messages.append(data)
+            elif element['mimetype'] == PromptType.IMAGE:
+                image_url = self._convert_stream_to_binary(element['value'])
+                data = {
+                    "type": "image_url",
+                    "image_url": {
+                        "url": image_url
+                    }
+                }
+                messages.append(data)
+            elif element['mimetype'] == PromptType.AUDIO:
+                raise NotImplementedError('Audio prompt is not supported yet')
+            elif element['mimetype'] == PromptType.VIDEO:
+                data = {
+                    "type": "video_url",
+                    "video_url": {
+                        "url": element['value']
+                    }
+                }
+                messages.append(data)
+            else:
+                raise ValueError(f'Invalid mimetype: {element["mimetype"]}')
+        return messages, self.key
+class PromptItem:
+    def __init__(self, name, item: entities.Item = None, role_mapping=None):
+        """
+        Create a prompt item, optionally bound to an existing platform item.
+        When an item is given it is validated and its prompts and annotations are loaded right away via fetch().
+        :param name: prompt item name
+        :param item: optional json Item whose system.shebang.dltype is 'prompt'
+        :param role_mapping: dict mapping a message role to 'item' or 'annotation'.
+            default: {'user': 'item', 'assistant': 'annotation'}
+        :raises ValueError: if role_mapping is not a dict, or the item is not a json prompt item
+        """
+        if role_mapping is None:
+            role_mapping = {'user': 'item',
+                            'assistant': 'annotation'}
+        if not isinstance(role_mapping, dict):
+            raise ValueError(f'input role_mapping must be dict. type: {type(role_mapping)}')
+        self.role_mapping = role_mapping
+        # prompt item name
+        self.name = name
+        # list of user prompts in the prompt item
+        self.prompts = list()
+        # list of assistant (annotations) prompts in the prompt item
+        self.assistant_prompts = list()
+        # Dataloop Item
+        self._item: entities.Item = item
+        # result of the last to_messages() call
+        self._messages = []
+        # annotations of the item, filled by fetch()
+        self._annotations: entities.AnnotationCollection = None
+        if item is not None:
+            if 'json' not in item.mimetype or item.system.get('shebang', dict()).get('dltype') != 'prompt':
+                raise ValueError('Expecting a json item with system.shebang.dltype = prompt')
+            # reuse the items repository of the given item
+            self._items = item.items
+            self.fetch()
+        else:
+            self._items = repositories.Items(client_api=client_api)
+        # to avoid broken stream of json files - DAT-75653
+        self._items._client_api.default_headers['x-dl-sanitize'] = '0'
+    @classmethod
+    def from_messages(cls, messages: list):
+        """
+        Placeholder for building a PromptItem from a list of messages.
+        Not implemented: the body is a bare Ellipsis, so a call returns None.
+        :param messages: list of messages (currently unused)
+        """
+        ...
+    @classmethod
+    def from_item(cls, item: entities.Item):
+        """
+        Load a prompt item from the platform
+        :param item : Item object
+        :return: PromptItem object
+        """
+        if 'json' not in item.mimetype or item.system.get('shebang', dict()).get('dltype') != 'prompt':
+            raise ValueError('Expecting a json item with system.shebang.dltype = prompt')
+        return cls(name=item.name, item=item)
+    @classmethod
+    def from_local_file(cls, filepath):
+        """
+        Create a new prompt item from a file
+        :param filepath: path to the file
+        :return: PromptItem object
+        """
+        if os.path.exists(filepath) is False:
+            raise FileNotFoundError(f'File does not exists: {filepath}')
+        if 'json' not in os.path.splitext(filepath)[-1]:
+            raise ValueError(f'Expected path to json item, got {os.path.splitext(filepath)[-1]}')
+        prompt_item = cls(name=filepath)
+        with open(filepath, 'r', encoding='utf-8') as f:
+            data = json.load(f)
+        prompt_item.prompts = prompt_item._load_item_prompts(data=data)
+        return prompt_item
+    @staticmethod
+    def _load_item_prompts(data):
+        prompts = list()
+        for prompt_key, prompt_elements in data.get('prompts', dict()).items():
+            content = list()
+            for element in prompt_elements:
+                content.append({'value': element.get('value', dict()),
+                                'mimetype': element['mimetype']})
+            prompt = Prompt(key=prompt_key, role="user")
+            for element in content:
+                prompt.add_element(value=element.get('value', ''),
+                                   mimetype=element.get('mimetype', PromptType.TEXT))
+            prompts.append(prompt)
+        return prompts
+    @staticmethod
+    def _load_annotations_prompts(annotations: entities.AnnotationCollection):
+        """
+        Get all the annotations in the item for the assistant messages
+        """
+        # clearing the assistant prompts from previous annotations that might not belong
+        assistant_prompts = list()
+        for annotation in annotations:
+            prompt_id = annotation.metadata.get('system', dict()).get('promptId', None)
+            model_info = annotation.metadata.get('user', dict()).get('model', dict())
+            annotation_id = annotation.id
+            if annotation.type == 'ref_image':
+                prompt = Prompt(key=prompt_id, role='assistant')
+                prompt.add_element(value=annotation.annotation_definition.coordinates.get('ref'),
+                                   mimetype=PromptType.IMAGE)
+            elif annotation.type == 'text':
+                prompt = Prompt(key=prompt_id, role='assistant')
+                prompt.add_element(value=annotation.annotation_definition.coordinates,
+                                   mimetype=PromptType.TEXT)
+            else:
+                raise ValueError(f"Unsupported annotation type: {annotation.type}")
+            prompt.add_element(value={'id': annotation_id,
+                                      'model_info': model_info},
+                               mimetype=PromptType.METADATA)
+            assistant_prompts.append(prompt)
+        return assistant_prompts
+    def to_json(self):
+        """
+        Convert the entity to a platform item.
+        :return:
+        """
+        prompts_json = {
+            "shebang": "dataloop",
+            "metadata": {
+                "dltype": 'prompt'
+            },
+            "prompts": {}
+        }
+        for prompt in self.prompts:
+            for prompt_key, prompt_values in prompt.to_json().items():
+                prompts_json["prompts"][prompt_key] = prompt_values
+        return prompts_json
+    def to_messages(self, model_name=None, include_assistant=True):
+        all_prompts_messages = dict()
+        for prompt in self.prompts:
+            if prompt.key not in all_prompts_messages:
+                all_prompts_messages[prompt.key] = list()
+            prompt_messages, prompt_key = prompt.messages()
+            messages = {
+                'role': prompt.metadata.get('role', 'user'),
+                'content': prompt_messages
+            }
+            all_prompts_messages[prompt.key].append(messages)
+        if include_assistant is True:
+            # reload to filer model annotations
+            for prompt in self.assistant_prompts:
+                prompt_model_name = prompt.metadata.get('model_info', dict()).get('name')
+                if model_name is not None and prompt_model_name != model_name:
+                    continue
+                if prompt.key not in all_prompts_messages:
+                    logger.warning(
+                        f'Prompt key {prompt.key} is not found in the user prompts, skipping Assistant prompt')
+                    continue
+                prompt_messages, prompt_key = prompt.messages()
+                assistant_messages = {
+                    'role': 'assistant',
+                    'content': prompt_messages
+                }
+                all_prompts_messages[prompt.key].append(assistant_messages)
+        res = list()
+        for prompts in all_prompts_messages.values():
+            for prompt in prompts:
+                res.append(prompt)
+        self._messages = res
+        return self._messages
+    def to_bytes_io(self):
+        # Used for item upload, do not delete
+        byte_io = io.BytesIO()
+        byte_io.name = self.name
+        byte_io.write(json.dumps(self.to_json()).encode())
+        byte_io.seek(0)
+        return byte_io
+    def fetch(self):
+        if self._item is None:
+            raise ValueError('Missing item, nothing to fetch..')
+        self._item = self._items.get(item_id=self._item.id)
+        self._annotations = self._item.annotations.list()
+        self.prompts = self._load_item_prompts(data=json.load(self._item.download(save_locally=False)))
+        self.assistant_prompts = self._load_annotations_prompts(self._annotations)
+    def build_context(self, nearest_items, add_metadata=None) -> str:
+        """
+        Create a context stream from nearest items list.
+        add_metadata is a list of location in the item.metadata to add to the context, for instance ['system.document.source']
+        :param nearest_items: list of item ids
+        :param add_metadata: list of metadata location to add metadata to context
+        :return:
+        """
+        if add_metadata is None:
+            add_metadata = list()
+        def stream_single(w_id):
+            context_item = self._items.get(item_id=w_id)
+            buf = context_item.download(save_locally=False)
+            text = buf.read().decode(encoding='utf-8')
+            m = ""
+            for path in add_metadata:
+                parts = path.split('.')
+                value = context_item.metadata
+                part = ""
+                for part in parts:
+                    if isinstance(value, dict):
+                        value = value.get(part)
+                    else:
+                        value = ""
+                m += f"{part}:{value}\n"
+            return text, m
+        pool = ThreadPoolExecutor(max_workers=32)
+        context = ""
+        if len(nearest_items) > 0:
+            # build context
+            results = pool.map(stream_single, nearest_items)
+            for res in results:
+                context += f"\n<source>\n{res[1]}\n</source>\n<text>\n{res[0]}\n</text>"
+        return context
+    def add(self,
+            message: dict,
+            prompt_key: str = None,
+            model_info: dict = None):
+        """
+        add a prompt to the prompt item
+        prompt: a dictionary. keys are prompt message id, values are prompt messages
+        responses: a list of annotations representing responses to the prompt
+        :param message:
+        :param prompt_key:
+        :param model_info:
+        :return:
+        """
+        role = message.get('role', 'user')
+        content = message.get('content', list())
+        if self.role_mapping.get(role, 'item') == 'item':
+            if prompt_key is None:
+                prompt_key = str(len(self.prompts) + 1)
+            # for new prompt we need a new key
+            prompt = Prompt(key=prompt_key, role=role)
+            for element in content:
+                prompt.add_element(value=element.get('value', ''),
+                                   mimetype=element.get('mimetype', PromptType.TEXT))
+            # create new prompt and add to prompts
+            self.prompts.append(prompt)
+            if self._item is not None:
+                self._item._Item__update_item_binary(_json=self.to_json())
+        else:
+            if prompt_key is None:
+                prompt_key = str(len(self.prompts))
+            assistant_message = content[0]
+            assistant_mimetype = assistant_message.get('mimetype', PromptType.TEXT)
+            uploaded_annotation = None
+            # find if prompt
+            if model_info is None:
+                # dont search for existing if there's no model information
+                existing_prompt = None
+            else:
+                existing_prompts = list()
+                for prompt in self.assistant_prompts:
+                    prompt_id = prompt.key
+                    model_name = prompt.metadata.get('model_info', dict()).get('name')
+                    if prompt_id == prompt_key and model_name == model_info.get('name'):
+                        # TODO how to handle multiple annotations
+                        existing_prompts.append(prompt)
+                if len(existing_prompts) > 1:
+                    assert False, "shouldn't be here! more than 1 annotation for a single model"
+                elif len(existing_prompts) == 1:
+                    # found model annotation to upload
+                    existing_prompt = existing_prompts[0]
+                else:
+                    # no annotation found
+                    existing_prompt = None
+            if existing_prompt is None:
+                prompt = Prompt(key=prompt_key)
+                if assistant_mimetype == PromptType.TEXT:
+                    annotation_definition = entities.FreeText(text=assistant_message.get('value'))
+                    prompt.add_element(value=annotation_definition.to_coordinates(None),
+                                       mimetype=PromptType.TEXT)
+                elif assistant_mimetype == PromptType.IMAGE:
+                    annotation_definition = entities.RefImage(ref=assistant_message.get('value'))
+                    prompt.add_element(value=annotation_definition.to_coordinates(None).get('ref'),
+                                       mimetype=PromptType.IMAGE)
+                else:
+                    raise NotImplementedError('Only images of mimetype image and text are supported')
+                metadata = {'system': {'promptId': prompt_key},
+                            'user': {'model': model_info}}
+                prompt.add_element(mimetype=PromptType.METADATA,
+                                   value={"model_info": model_info})
+                existing_annotation = entities.Annotation.new(item=self._item,
+                                                              metadata=metadata,
+                                                              annotation_definition=annotation_definition)
+                uploaded_annotation = existing_annotation.upload()
+                prompt.add_element(mimetype=PromptType.METADATA,
+                                   value={"id": uploaded_annotation.id})
+                existing_prompt = prompt
+                self.assistant_prompts.append(prompt)
+            existing_prompt_element = [element for element in existing_prompt.elements if
+                                       element['mimetype'] != PromptType.METADATA][-1]
+            existing_prompt_element['value'] = assistant_message.get('value')
+            if uploaded_annotation is None:
+                # Creating annotation with old dict to match platform dict
+                annotation_definition = entities.FreeText(text='')
+                metadata = {'system': {'promptId': prompt_key},
+                            'user': {'model': existing_prompt.metadata.get('model_info')}}
+                annotation = entities.Annotation.new(item=self._item,
+                                                     metadata=metadata,
+                                                     annotation_definition=annotation_definition
+                                                     )
+                annotation.id = existing_prompt.metadata['id']
+                # set the platform dict to match the old annotation for the dict difference check, otherwise it won't
+                # update
+                annotation._platform_dict = annotation.to_json()
+                # update the annotation with the new text
+                annotation.annotation_definition.text = existing_prompt_element['value']
+                self._item.annotations.update(annotation)
+    def update(self):
+        """
+        Update the prompt item in the platform.
+        """
+        if self._item is not None:
+            self._item._Item__update_item_binary(_json=self.to_json())
+            self._item = self._item.update()
+        else:
+            raise ValueError('Cannot update PromptItem without an item.')
+    # Properties
+    @property
+    def item(self) -> Optional['entities.Item']:
+        """
+        Get the underlying Item object.
+        Returns the stored reference as-is, nothing is fetched from the platform.
+        :return: The Item object associated with this PromptItem, or None.
+        :rtype: Optional[dtlpy.entities.Item]
+        """
+        return self._item
+    @item.setter
+    def item(self, item: Optional['entities.Item']):
+        """
+        Set the underlying Item object.
+        :param item: The Item object to associate with this PromptItem, or None.
+        :type item: Optional[dtlpy.entities.Item]
+        """
+        if item is not None and not isinstance(item, entities.Item):
+            raise ValueError(f"Expected dtlpy.entities.Item or None, got {type(item)}")
+        self._item = item
+    @property
+    def metadata(self) -> dict:
+        """
+        Get the metadata from the underlying Item object.
+        :return: Metadata dictionary of the item.
+        :rtype: dict
+        :raises ValueError: if no item is attached to this PromptItem.
+        """
+        if self._item is not None:
+            return self._item.metadata
+        else:
             raise ValueError('No item found, cannot get metadata, to set item use prompt_item.item = item')

dtlpy 1.115.44__py3-none-any.whl → 1.116.6__py3-none-any.whl

dtlpy 1.115.44py3-none-any.whl → 1.116.6py3-none-any.whl