PyPI - supervisely - Versions diffs - 6.73.438__py3-none-any.whl → 6.73.513__py3-none-any.whl - Mend

supervisely: 6.73.438 (py3-none-any.whl) → 6.73.513 (py3-none-any.whl)

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (203) hide show

supervisely/__init__.py +137 -1
supervisely/_utils.py +81 -0
supervisely/annotation/annotation.py +8 -2
supervisely/annotation/json_geometries_map.py +14 -11
supervisely/annotation/label.py +80 -3
supervisely/api/annotation_api.py +14 -11
supervisely/api/api.py +59 -38
supervisely/api/app_api.py +11 -2
supervisely/api/dataset_api.py +74 -12
supervisely/api/entities_collection_api.py +10 -0
supervisely/api/entity_annotation/figure_api.py +52 -4
supervisely/api/entity_annotation/object_api.py +3 -3
supervisely/api/entity_annotation/tag_api.py +63 -12
supervisely/api/guides_api.py +210 -0
supervisely/api/image_api.py +72 -1
supervisely/api/labeling_job_api.py +83 -1
supervisely/api/labeling_queue_api.py +33 -7
supervisely/api/module_api.py +9 -0
supervisely/api/project_api.py +71 -26
supervisely/api/storage_api.py +3 -1
supervisely/api/task_api.py +13 -2
supervisely/api/team_api.py +4 -3
supervisely/api/video/video_annotation_api.py +119 -3
supervisely/api/video/video_api.py +65 -14
supervisely/api/video/video_figure_api.py +24 -11
supervisely/app/__init__.py +1 -1
supervisely/app/content.py +23 -7
supervisely/app/development/development.py +18 -2
supervisely/app/fastapi/__init__.py +1 -0
supervisely/app/fastapi/custom_static_files.py +1 -1
supervisely/app/fastapi/multi_user.py +105 -0
supervisely/app/fastapi/subapp.py +88 -42
supervisely/app/fastapi/websocket.py +77 -9
supervisely/app/singleton.py +21 -0
supervisely/app/v1/app_service.py +18 -2
supervisely/app/v1/constants.py +7 -1
supervisely/app/widgets/__init__.py +6 -0
supervisely/app/widgets/activity_feed/__init__.py +0 -0
supervisely/app/widgets/activity_feed/activity_feed.py +239 -0
supervisely/app/widgets/activity_feed/style.css +78 -0
supervisely/app/widgets/activity_feed/template.html +22 -0
supervisely/app/widgets/card/card.py +20 -0
supervisely/app/widgets/classes_list_selector/classes_list_selector.py +121 -9
supervisely/app/widgets/classes_list_selector/template.html +60 -93
supervisely/app/widgets/classes_mapping/classes_mapping.py +13 -12
supervisely/app/widgets/classes_table/classes_table.py +1 -0
supervisely/app/widgets/deploy_model/deploy_model.py +56 -35
supervisely/app/widgets/dialog/dialog.py +12 -0
supervisely/app/widgets/dialog/template.html +2 -1
supervisely/app/widgets/ecosystem_model_selector/ecosystem_model_selector.py +1 -1
supervisely/app/widgets/experiment_selector/experiment_selector.py +8 -0
supervisely/app/widgets/fast_table/fast_table.py +184 -60
supervisely/app/widgets/fast_table/template.html +1 -1
supervisely/app/widgets/heatmap/__init__.py +0 -0
supervisely/app/widgets/heatmap/heatmap.py +564 -0
supervisely/app/widgets/heatmap/script.js +533 -0
supervisely/app/widgets/heatmap/style.css +233 -0
supervisely/app/widgets/heatmap/template.html +21 -0
supervisely/app/widgets/modal/__init__.py +0 -0
supervisely/app/widgets/modal/modal.py +198 -0
supervisely/app/widgets/modal/template.html +10 -0
supervisely/app/widgets/object_class_view/object_class_view.py +3 -0
supervisely/app/widgets/radio_tabs/radio_tabs.py +18 -2
supervisely/app/widgets/radio_tabs/template.html +1 -0
supervisely/app/widgets/select/select.py +6 -3
supervisely/app/widgets/select_class/__init__.py +0 -0
supervisely/app/widgets/select_class/select_class.py +363 -0
supervisely/app/widgets/select_class/template.html +50 -0
supervisely/app/widgets/select_cuda/select_cuda.py +22 -0
supervisely/app/widgets/select_dataset_tree/select_dataset_tree.py +65 -7
supervisely/app/widgets/select_tag/__init__.py +0 -0
supervisely/app/widgets/select_tag/select_tag.py +352 -0
supervisely/app/widgets/select_tag/template.html +64 -0
supervisely/app/widgets/select_team/select_team.py +37 -4
supervisely/app/widgets/select_team/template.html +4 -5
supervisely/app/widgets/select_user/__init__.py +0 -0
supervisely/app/widgets/select_user/select_user.py +270 -0
supervisely/app/widgets/select_user/template.html +13 -0
supervisely/app/widgets/select_workspace/select_workspace.py +59 -10
supervisely/app/widgets/select_workspace/template.html +9 -12
supervisely/app/widgets/table/table.py +68 -13
supervisely/app/widgets/tree_select/tree_select.py +2 -0
supervisely/aug/aug.py +6 -2
supervisely/convert/base_converter.py +1 -0
supervisely/convert/converter.py +2 -2
supervisely/convert/image/csv/csv_converter.py +24 -15
supervisely/convert/image/image_converter.py +3 -1
supervisely/convert/image/image_helper.py +48 -4
supervisely/convert/image/label_studio/label_studio_converter.py +2 -0
supervisely/convert/image/medical2d/medical2d_helper.py +2 -24
supervisely/convert/image/multispectral/multispectral_converter.py +6 -0
supervisely/convert/image/pascal_voc/pascal_voc_converter.py +8 -5
supervisely/convert/image/pascal_voc/pascal_voc_helper.py +7 -0
supervisely/convert/pointcloud/kitti_3d/kitti_3d_converter.py +33 -3
supervisely/convert/pointcloud/kitti_3d/kitti_3d_helper.py +12 -5
supervisely/convert/pointcloud/las/las_converter.py +13 -1
supervisely/convert/pointcloud/las/las_helper.py +110 -11
supervisely/convert/pointcloud/nuscenes_conv/nuscenes_converter.py +27 -16
supervisely/convert/pointcloud/pointcloud_converter.py +91 -3
supervisely/convert/pointcloud_episodes/nuscenes_conv/nuscenes_converter.py +58 -22
supervisely/convert/pointcloud_episodes/nuscenes_conv/nuscenes_helper.py +21 -47
supervisely/convert/video/__init__.py +1 -0
supervisely/convert/video/multi_view/__init__.py +0 -0
supervisely/convert/video/multi_view/multi_view.py +543 -0
supervisely/convert/video/sly/sly_video_converter.py +359 -3
supervisely/convert/video/video_converter.py +24 -4
supervisely/convert/volume/dicom/dicom_converter.py +13 -5
supervisely/convert/volume/dicom/dicom_helper.py +30 -18
supervisely/geometry/constants.py +1 -0
supervisely/geometry/geometry.py +4 -0
supervisely/geometry/helpers.py +5 -1
supervisely/geometry/oriented_bbox.py +676 -0
supervisely/geometry/polyline_3d.py +110 -0
supervisely/geometry/rectangle.py +2 -1
supervisely/io/env.py +76 -1
supervisely/io/fs.py +21 -0
supervisely/nn/benchmark/base_evaluator.py +104 -11
supervisely/nn/benchmark/instance_segmentation/evaluator.py +1 -8
supervisely/nn/benchmark/object_detection/evaluator.py +20 -4
supervisely/nn/benchmark/object_detection/vis_metrics/pr_curve.py +10 -5
supervisely/nn/benchmark/semantic_segmentation/evaluator.py +34 -16
supervisely/nn/benchmark/semantic_segmentation/vis_metrics/confusion_matrix.py +1 -1
supervisely/nn/benchmark/semantic_segmentation/vis_metrics/frequently_confused.py +1 -1
supervisely/nn/benchmark/semantic_segmentation/vis_metrics/overview.py +1 -1
supervisely/nn/benchmark/visualization/evaluation_result.py +66 -4
supervisely/nn/inference/cache.py +43 -18
supervisely/nn/inference/gui/serving_gui_template.py +5 -2
supervisely/nn/inference/inference.py +916 -222
supervisely/nn/inference/inference_request.py +55 -10
supervisely/nn/inference/predict_app/gui/classes_selector.py +83 -12
supervisely/nn/inference/predict_app/gui/gui.py +676 -488
supervisely/nn/inference/predict_app/gui/input_selector.py +205 -26
supervisely/nn/inference/predict_app/gui/model_selector.py +2 -4
supervisely/nn/inference/predict_app/gui/output_selector.py +46 -6
supervisely/nn/inference/predict_app/gui/settings_selector.py +756 -59
supervisely/nn/inference/predict_app/gui/tags_selector.py +1 -1
supervisely/nn/inference/predict_app/gui/utils.py +236 -119
supervisely/nn/inference/predict_app/predict_app.py +2 -2
supervisely/nn/inference/session.py +43 -35
supervisely/nn/inference/tracking/bbox_tracking.py +118 -35
supervisely/nn/inference/tracking/point_tracking.py +5 -1
supervisely/nn/inference/tracking/tracker_interface.py +10 -1
supervisely/nn/inference/uploader.py +139 -12
supervisely/nn/live_training/__init__.py +7 -0
supervisely/nn/live_training/api_server.py +111 -0
supervisely/nn/live_training/artifacts_utils.py +243 -0
supervisely/nn/live_training/checkpoint_utils.py +229 -0
supervisely/nn/live_training/dynamic_sampler.py +44 -0
supervisely/nn/live_training/helpers.py +14 -0
supervisely/nn/live_training/incremental_dataset.py +146 -0
supervisely/nn/live_training/live_training.py +497 -0
supervisely/nn/live_training/loss_plateau_detector.py +111 -0
supervisely/nn/live_training/request_queue.py +52 -0
supervisely/nn/model/model_api.py +9 -0
supervisely/nn/model/prediction.py +2 -1
supervisely/nn/model/prediction_session.py +26 -14
supervisely/nn/prediction_dto.py +19 -1
supervisely/nn/tracker/base_tracker.py +11 -1
supervisely/nn/tracker/botsort/botsort_config.yaml +0 -1
supervisely/nn/tracker/botsort/tracker/mc_bot_sort.py +7 -4
supervisely/nn/tracker/botsort_tracker.py +94 -65
supervisely/nn/tracker/utils.py +4 -5
supervisely/nn/tracker/visualize.py +93 -93
supervisely/nn/training/gui/classes_selector.py +16 -1
supervisely/nn/training/gui/train_val_splits_selector.py +52 -31
supervisely/nn/training/train_app.py +46 -31
supervisely/project/data_version.py +115 -51
supervisely/project/download.py +1 -1
supervisely/project/pointcloud_episode_project.py +37 -8
supervisely/project/pointcloud_project.py +30 -2
supervisely/project/project.py +14 -2
supervisely/project/project_meta.py +27 -1
supervisely/project/project_settings.py +32 -18
supervisely/project/versioning/__init__.py +1 -0
supervisely/project/versioning/common.py +20 -0
supervisely/project/versioning/schema_fields.py +35 -0
supervisely/project/versioning/video_schema.py +221 -0
supervisely/project/versioning/volume_schema.py +87 -0
supervisely/project/video_project.py +717 -15
supervisely/project/volume_project.py +623 -5
supervisely/template/experiment/experiment.html.jinja +4 -4
supervisely/template/experiment/experiment_generator.py +14 -21
supervisely/template/live_training/__init__.py +0 -0
supervisely/template/live_training/header.html.jinja +96 -0
supervisely/template/live_training/live_training.html.jinja +51 -0
supervisely/template/live_training/live_training_generator.py +464 -0
supervisely/template/live_training/sly-style.css +402 -0
supervisely/template/live_training/template.html.jinja +18 -0
supervisely/versions.json +28 -26
supervisely/video/sampling.py +39 -20
supervisely/video/video.py +41 -12
supervisely/video_annotation/video_figure.py +38 -4
supervisely/video_annotation/video_object.py +29 -4
supervisely/volume/stl_converter.py +2 -0
supervisely/worker_api/agent_rpc.py +24 -1
supervisely/worker_api/rpc_servicer.py +31 -7
{supervisely-6.73.438.dist-info → supervisely-6.73.513.dist-info}/METADATA +58 -40
{supervisely-6.73.438.dist-info → supervisely-6.73.513.dist-info}/RECORD +203 -155
{supervisely-6.73.438.dist-info → supervisely-6.73.513.dist-info}/WHEEL +1 -1
supervisely_lib/__init__.py +6 -1
{supervisely-6.73.438.dist-info → supervisely-6.73.513.dist-info}/entry_points.txt +0 -0
{supervisely-6.73.438.dist-info → supervisely-6.73.513.dist-info/licenses}/LICENSE +0 -0
{supervisely-6.73.438.dist-info → supervisely-6.73.513.dist-info}/top_level.txt +0 -0

supervisely/nn/live_training/live_training.py ADDED Viewed

@@ -0,0 +1,497 @@
+import os
+import numpy as np
+from .api_server import start_api_server
+from .request_queue import RequestQueue, RequestType
+from .incremental_dataset import IncrementalDataset
+from .helpers import ClassMap
+import supervisely as sly
+from supervisely import logger
+from supervisely.nn import TaskType
+from datetime import datetime
+import signal
+import sys
+import time
+from .checkpoint_utils import resolve_checkpoint, save_state_json
+from .artifacts_utils import upload_artifacts
+from .loss_plateau_detector import LossPlateauDetector
+from pathlib import Path
+class Phase:
+    """Names of the lifecycle phases a live-training session reports."""
+    # Initial phase; assigned in LiveTraining.__init__ and again at the start of run().
+    READY_TO_START = "ready_to_start"
+    # Assigned while the session waits for the initial batch of samples.
+    WAITING_FOR_SAMPLES = "waiting_for_samples"
+    # Assigned by _handle_add_sample once enough initial samples have been collected.
+    INITIAL_TRAINING = "initial_training"
+    # Not assigned anywhere in this file; presumably set by framework-specific subclasses.
+    TRAINING = "training"
+class LiveTraining:
+    """
+    Base class for live training: a training session that also serves
+    add-sample, predict and status requests taken from a request queue.
+
+    Subclasses set ``task_type`` and ``framework_name`` and implement the
+    framework-specific hooks ``train``, ``predict``, ``prepare_artifacts``
+    and ``save_checkpoint``.
+    """
+    # Class-scope import: makes `nn` available to the annotations in the method signatures below.
+    from torch import nn  # pylint: disable=import-error
+    task_type: str = None  # Should be set in subclass
+    framework_name: str = None # Should be set in subclass
+    # Geometry types accepted for each task type; used by _init_class_map to filter object classes.
+    _task2geometries = {
+        TaskType.OBJECT_DETECTION: [sly.Rectangle],
+        TaskType.INSTANCE_SEGMENTATION: [sly.Bitmap, sly.Polygon],
+        TaskType.SEMANTIC_SEGMENTATION: [sly.Bitmap, sly.Polygon],
+    }
+    def __init__(
+            self,
+            initial_samples: int = 2,
+            filter_classes_by_task: bool = True,
+        ):
+        """
+        Set up the session: environment ids, application, API client, request queue and API server.
+
+        Args:
+            initial_samples: Number of samples the dataset must hold before
+                ``_wait_for_initial_samples`` stops waiting.
+            filter_classes_by_task: If True, keep only object classes whose geometry
+                is listed in ``_task2geometries`` for ``task_type``.
+
+        Raises:
+            ValueError: If ``task_type`` is unset while ``filter_classes_by_task`` is True,
+                or if ``framework_name`` is unset.
+        """
+        from torch import nn  # pylint: disable=import-error
+        self.initial_samples = initial_samples
+        self.filter_classes_by_task = filter_classes_by_task
+        # Validate the subclass configuration before touching the environment or the API.
+        if self.task_type is None and self.filter_classes_by_task:
+            raise ValueError("task_type must be set in subclass if filter_classes_by_task is set to True")
+        if self.framework_name is None:
+            raise ValueError("framework_name must be set in subclass")
+        # Identifiers are read from the environment; task_id may be missing (raise_not_found=False).
+        self.project_id = sly.env.project_id()
+        self.team_id = sly.env.team_id()
+        self.task_id = sly.env.task_id(raise_not_found=False)
+        self.app = sly.Application()
+        self.api = sly.Api()
+        self.request_queue = RequestQueue()
+        # Development mode only: bring the VPN up and create a debug task whose id replaces task_id.
+        if os.getenv("DEVELOP_AND_DEBUG") and not sly.is_production():
+            logger.info(f"🔧 Initializing Develop & Debug application for project {self.project_id}...")
+            sly.app.development.supervisely_vpn_network(action="up")
+            debug_task = sly.app.development.create_debug_task(self.team_id, port="8000", project_id=self.project_id)
+            self.task_id = debug_task['id']
+        # The API server is handed the request queue; requests are consumed by this class.
+        self._api_thread = start_api_server(self.app, self.request_queue)
+        self.phase = Phase.READY_TO_START
+        self.iter = 0
+        self._loss = None
+        self._is_paused = False
+        # Set by load_state when the restored state was saved while paused; consumed in after_train_step.
+        self._should_pause_after_continue = False
+        # ready_to_predict becomes True once `iter` exceeds this value.
+        self.initial_iters = 60  # TODO: remove later
+        self.project_meta = self._fetch_project_meta(self.project_id)
+        self.class_map = self._init_class_map(self.project_meta)
+        # Both are expected to be provided later through register_dataset / register_model.
+        self.dataset: IncrementalDataset = None
+        self.model: nn.Module  = None
+        self.loss_plateau_detector = self._init_loss_plateau_detector()
+        self.work_dir = 'app_data'
+        self.latest_checkpoint_path = f"{self.work_dir}/checkpoints/latest.pth"
+        # run() dispatches on this value: 'continue', 'finetune', anything else trains from scratch.
+        self.checkpoint_mode = os.getenv("modal.state.checkpointMode", "scratch")
+        selected_task_id_env = os.getenv("modal.state.selectedExperimentTaskId")
+        self.selected_experiment_task_id = int(selected_task_id_env) if selected_task_id_env else None
+        self.training_start_time = None
+        # Guards _upload_artifacts against re-entry (also checked by the shutdown signal handler).
+        self._upload_in_progress = False
+        # from . import live_training_instance
+        # live_training_instance = self  # for access from other modules
+    @property
+    def ready_to_predict(self):
+        return self.iter > self.initial_iters
+    def status(self):
+        return {
+            'phase': self.phase,
+            'samples_count': len(self.dataset) if self.dataset is not None else 0,
+            'waiting_samples': self.initial_samples,
+            'task_type': self.task_type,
+            'iteration': self.iter,
+            'loss': self._loss,
+            'training_paused': self._is_paused,
+            'ready_to_predict': self.ready_to_predict,
+            'initial_iters': self.initial_iters,
+        }
+    def run(self):
+        self.training_start_time = datetime.now().strftime("%Y-%m-%d %H:%M:%S")
+        self._add_shutdown_callback()
+        work_dir_path = Path(self.work_dir)
+        work_dir_path.mkdir(parents=True, exist_ok=True)
+        model_meta_path = work_dir_path / "model_meta.json"
+        sly.json.dump_json_file(self.project_meta.to_json(), str(model_meta_path))
+        try:
+            self.phase = Phase.READY_TO_START
+            self._wait_for_start()
+            if self.checkpoint_mode == 'continue':
+                self._run_continue()
+            elif self.checkpoint_mode == 'finetune':
+                self._run_finetune()
+            else:
+                self._run_from_scratch()
+        except Exception as e:
+            if not sly.is_production():
+                raise e
+            else:
+                logger.error(f"Live training failed: {e}", exc_info=True)
+                final_checkpoint = self.latest_checkpoint_path
+                self.save_checkpoint(final_checkpoint)
+                save_state_json(self.state(), final_checkpoint)
+                self._upload_artifacts()
+    def _run_from_scratch(self):
+        self.phase = Phase.WAITING_FOR_SAMPLES
+        self._wait_for_initial_samples()
+        self.train(checkpoint_path=None)
+    def _run_continue(self):
+        checkpoint_path, state = self._load_checkpoint()
+        self.load_state(state)
+        image_ids = state.get('image_ids', [])
+        if image_ids:
+            self._restore_dataset(image_ids)
+        self.train(checkpoint_path=checkpoint_path)
+    def _run_finetune(self):
+        checkpoint_path, _ = self._load_checkpoint()
+        self.phase = Phase.WAITING_FOR_SAMPLES
+        self._wait_for_initial_samples()
+        self.train(checkpoint_path=checkpoint_path)
+    def _wait_for_start(self):
+        request = self.request_queue.get()
+        while request.type != RequestType.START:
+            if request.type == RequestType.STATUS:
+                status = self.status()
+                request.future.set_result(status)
+            else:
+                request.future.set_exception(Exception(f"Unexpected request {request.type} while waiting for START"))
+            request = self.request_queue.get()
+        # When START is received
+        status = self.status()
+        status['phase'] = Phase.WAITING_FOR_SAMPLES
+        request.future.set_result(status)
+    def _wait_until_samples_added(
+        self,
+        samples_needed: int,
+        max_wait_time: int = None,
+    ):
+        sleep_interval = 0.5
+        elapsed_time = 0
+        samples_before = len(self.dataset)
+        while len(self.dataset) - samples_before < samples_needed:
+            if max_wait_time is not None and elapsed_time >= max_wait_time:
+                raise RuntimeError("Timeout waiting for samples")
+            if not self.request_queue.is_empty():
+                self._process_pending_requests()
+            time.sleep(sleep_interval)
+            elapsed_time += sleep_interval
+    def _wait_for_initial_samples(self):
+        if len(self.dataset) >= self.initial_samples:
+            return
+        self.phase = Phase.WAITING_FOR_SAMPLES
+        self._is_paused = True
+        samples_needed = self.initial_samples - len(self.dataset)
+        logger.info(f"Waiting for {samples_needed} initial samples")
+        self._wait_until_samples_added(
+            samples_needed=samples_needed,
+            max_wait_time=3600,
+        )
+        self._is_paused = False
+    def _process_pending_requests(self):
+        requests = self.request_queue.get_all()
+        if not requests:
+            return
+        new_samples_added = False
+        for request in requests:
+            try:
+                if request.type == RequestType.PREDICT:
+                    result = self._handle_predict(request.data)
+                    request.future.set_result(result)
+                elif request.type == RequestType.ADD_SAMPLE:
+                    result = self._handle_add_sample(request.data)
+                    request.future.set_result(result)
+                    new_samples_added = True
+                elif request.type == RequestType.STATUS:
+                    result = self.status()
+                    request.future.set_result(result)
+            except Exception as e:
+                logger.error(f"Error processing request {request.type}: {e}", exc_info=True)
+                request.future.set_exception(e)
+    def train(self, checkpoint_path: str = None):
+        """
+        Main training loop. Implement framework-specific training logic here.
+        Prepare model config, set hyperparameters and run training.
+        Handle phases: initial training, training
+        """
+        raise NotImplementedError
+    def predict(self, model: nn.Module, image_np, image_info) -> list:
+        """
+        Run inference on a single image and return predictions as a list of sly figures in json format.
+        """
+        raise NotImplementedError
+    def _handle_predict(self, data: dict):
+        image_np = data['image']
+        image_info = {'id': data['image_id']}
+        model = self.model
+        was_training = model.training
+        model.eval()
+        try:
+            objects = self.predict(self.model, image_np=image_np, image_info=image_info)
+            return {
+                'objects': objects,
+                'image_id': data['image_id'],
+                'status': self.status(),
+            }
+        finally:
+            # Restore training mode
+            if was_training:
+                model.train()
+    def add_sample(
+            self,
+            image_id: int,
+            image_np: np.ndarray,
+            annotation: sly.Annotation,
+            image_name: str
+        ) -> dict:
+        return self.dataset.add_or_update(image_id, image_np, annotation, image_name)
+    def _handle_add_sample(self, data: dict):
+        ann_json = data['annotation']
+        ann_json = self._filter_annotation(ann_json)
+        sly_ann = sly.Annotation.from_json(ann_json, self.project_meta)
+        self.add_sample(
+            image_id=data['image_id'],
+            image_np=data['image'],
+            annotation=sly_ann,
+            image_name=data['image_name']
+        )
+        if (len(self.dataset) >= self.initial_samples) and self.phase==Phase.WAITING_FOR_SAMPLES:
+            self.phase = Phase.INITIAL_TRAINING
+        return {
+            'image_id': data['image_id'],
+            'status': self.status(),
+        }
+    def _fetch_project_meta(self, project_id: int) -> sly.ProjectMeta:
+        project_meta = self.api.project.get_meta(project_id)
+        project_meta = sly.ProjectMeta.from_json(project_meta)
+        return project_meta
+    def _init_class_map(self, project_meta: sly.ProjectMeta) -> ClassMap:
+        obj_classes = list(project_meta.obj_classes)
+        if self.task_type == TaskType.SEMANTIC_SEGMENTATION:
+            obj_classes.insert(0, sly.ObjClass(name='_background_', geometry_type=sly.Bitmap))
+        if self.filter_classes_by_task:
+            allowed_geometries = self._task2geometries[self.task_type]
+            obj_classes = [
+                obj_class for obj_class in obj_classes
+                if obj_class.geometry_type in allowed_geometries
+            ]
+        return ClassMap(obj_classes)
+    def _filter_annotation(self, ann_json: dict) -> dict:
+        # Filter objects according to class_map
+        # Important: Must be filtered before sly.Annotation.from_json due to static project meta
+        filtered_objects = []
+        for obj in ann_json['objects']:
+            sly_id = obj['classId']
+            if sly_id in self.class_map.sly_ids:
+                filtered_objects.append(obj)
+        ann_json['objects'] = filtered_objects
+        return ann_json
+    def after_train_step(self, loss: float):
+        self.iter += 1
+        self._loss = loss
+        if self._should_pause_after_continue:
+            self._is_paused = True
+            logger.info("Training was paused. Waiting for 1 new sample before resuming...")
+            self._wait_until_samples_added(samples_needed=1, max_wait_time=None)
+            self._should_pause_after_continue = False
+            logger.info("New sample added. Resuming training...")
+            self._is_paused = False
+        if self.loss_plateau_detector is not None:
+            is_plateau = self.loss_plateau_detector.step(loss, self.iter)
+            if is_plateau:
+                self._is_paused = True
+                self._wait_until_samples_added(
+                    samples_needed=1,
+                    max_wait_time=None,
+                )
+                self._is_paused = False
+                self.loss_plateau_detector.reset()
+        self._process_pending_requests()
+    def register_model(self, model: nn.Module):
+        self.model = model
+    def register_dataset(self, dataset: IncrementalDataset):
+        assert hasattr(dataset, 'add_or_update'), "Dataset must implement add_or_update method. Consider inheriting from IncrementalDataset."
+        self.dataset = dataset
+    def _load_checkpoint(self) -> tuple:
+        """Resolve and configure checkpoint based on checkpoint_mode."""
+        self._process_pending_requests()
+        checkpoint_path, class_map, state = resolve_checkpoint(
+            checkpoint_mode=self.checkpoint_mode,
+            selected_experiment_task_id=self.selected_experiment_task_id,
+            class_map=self.class_map,
+            project_meta=self.project_meta,
+            api=self.api,
+            team_id=self.team_id,
+            work_dir=self.work_dir
+        )
+        self.class_map = class_map
+        self._process_pending_requests()
+        return checkpoint_path, state
+    def state(self):
+        state = {
+            'phase': self.phase,
+            'iter': self.iter,
+            'loss': self._loss,
+            'clases': [cls.name for cls in self.class_map.obj_classes],
+            'image_ids': self.dataset.get_image_ids() if self.dataset else [],
+            'dataset_size': len(self.dataset) if self.dataset else 0,
+            'is_paused': self._is_paused
+        }
+        return state
+    def load_state(self, state: dict):
+        self.phase = state.get('phase', Phase.READY_TO_START)
+        self.iter = state.get('iter', 0)
+        self._loss = state.get('loss', None)
+        self.image_ids = state.get('image_ids', [])
+        if state.get('is_paused', False):
+            self._should_pause_after_continue = True
+        dataset_size = state.get('dataset_size', 0)
+    def _restore_dataset(self, image_ids: list):
+        if not image_ids:
+            return
+        logger.info(f"Restoring {len(image_ids)} images from Supervisely...")
+        restored_count = 0
+        for img_id in image_ids:
+            img_info = self.api.image.get_info_by_id(img_id)
+            if img_info is None:
+                logger.warning(f"Image {img_id} not found, skipping")
+                continue
+            image_np = self.api.image.download_np(img_id)
+            ann_json = self.api.annotation.download_json(img_id)
+            ann = sly.Annotation.from_json(ann_json, self.project_meta)
+            self.dataset.add_or_update(
+                image_id=img_id,
+                image_np=image_np,
+                annotation=ann,
+                image_name=img_info.name
+            )
+            restored_count += 1
+            if restored_count % 10 == 0:
+                logger.info(f"Restored {restored_count}/{len(image_ids)}")
+        logger.info(f"Restored {restored_count} images")
+    def prepare_artifacts(self) -> dict:
+        """
+        Prepare all artifacts for upload (framework-specific).
+        Returns:
+            Dict with:
+                - checkpoint_path: path to checkpoint file
+                - checkpoint_info: dict with {name, iteration, loss}
+                - config_path: path to config file
+                - logs_dir: path to logs directory or None
+                - model_name: model name
+                - model_config: model configuration dict
+                - loss_history: dict with loss history
+        """
+        raise NotImplementedError(
+            f"{self.__class__.__name__} must implement prepare_artifacts()"
+        )
+    def _get_session_info(self) -> dict:
+        """Collect training session context"""
+        return {
+            'team_id': self.team_id,
+            'task_id': self.task_id,
+            'project_id': self.project_id,
+            'framework_name': self.framework_name,
+            'task_type': self.task_type,
+            'class_map': self.class_map,
+            'start_time': self.training_start_time,
+            'train_size': len(self.dataset) if self.dataset else 0,
+            'initial_samples': self.initial_samples
+        }
+    def _upload_artifacts(self):
+        if self._upload_in_progress:
+            return
+        self._upload_in_progress = True
+        try:
+            session_info = self._get_session_info()
+            artifacts = self.prepare_artifacts()
+            report_url = upload_artifacts(
+                api=self.api,
+                session_info=session_info,
+                artifacts=artifacts
+            )
+            logger.info(f"Report: {report_url}")
+        except Exception as e:
+            logger.error(f"Upload failed: {e}", exc_info=True)
+        finally:
+            self._upload_in_progress = False
+    def save_checkpoint(self, checkpoint_path: str):
+        pass
+    def _init_loss_plateau_detector(self):
+        loss_plateau_detector = LossPlateauDetector()
+        loss_plateau_detector.register_save_checkpoint_callback(self.save_checkpoint)
+        return loss_plateau_detector
+    def _add_shutdown_callback(self):
+        """Setup graceful shutdown: save experiment on SIGINT/SIGTERM"""
+        self._upload_in_progress = False
+        def signal_handler(signum, frame):
+            if self._upload_in_progress:
+                # Already uploading - force exit on second signal
+                signal.signal(signal.SIGINT, lambda s, f: sys.exit(1))
+                signal.signal(signal.SIGTERM, lambda s, f: sys.exit(1))
+                return
+            # Save checkpoint and state before upload
+            logger.info("Received shutdown signal, saving checkpoint...")
+            self.save_checkpoint(self.latest_checkpoint_path)
+            save_state_json(self.state(), self.latest_checkpoint_path)
+            self._upload_artifacts()
+            sys.exit(0)
+        signal.signal(signal.SIGINT, signal_handler)
+        signal.signal(signal.SIGTERM, signal_handler)

supervisely/nn/live_training/loss_plateau_detector.py ADDED Viewed

@@ -0,0 +1,111 @@
+import numpy as np
+from typing import Callable
+class LossPlateauDetector:
+    """
+    Detect plateau in training loss using moving average comparison.
+    Args:
+        window_size: Number of iterations for moving average
+        threshold: Relative change threshold (e.g., 0.005 = 0.5%)
+        patience: Number of consecutive plateau detections before action
+        check_interval: Check frequency (every N iterations)
+    """
+    def __init__(
+        self,
+        window_size: int = 20,
+        threshold: float = 0.005,
+        patience: int = 1,
+        check_interval: int = 1,
+    ):
+        self.window_size = window_size
+        self.threshold = threshold
+        self.check_interval = check_interval
+        self.patience = patience
+        self._min_iterations = 2 * window_size
+        # State
+        self.loss_history = []
+        self.consecutive_plateau_count = 0
+        self._save_checkpoint_fn = None
+    def register_save_checkpoint_callback(self, fn: Callable[[], None]):
+        """Register callback function to save checkpoint when plateau detected"""
+        self._save_checkpoint_fn = fn
+    def reset(self):
+        """Reset detector state"""
+        self.loss_history = []
+        self.consecutive_plateau_count = 0
+    def step(self, loss: float, current_iter: int) -> bool:
+        """
+        Process one training iteration.
+        Args:
+            loss: Current loss value
+            current_iter: Current iteration number
+        Returns:
+            True if plateau confirmed and checkpoint saved, False otherwise
+        """
+        self.loss_history.append(loss)
+        # Check only at specified intervals
+        if (current_iter + 1) % self.check_interval != 0:
+            return False
+        # Need enough data
+        if len(self.loss_history) < self._min_iterations:
+            return False
+        # Check for plateau
+        is_plateau, info = self._check_plateau(current_iter)
+        if is_plateau:
+            self.consecutive_plateau_count += 1
+            print(
+                f'[Plateau Detection] Iteration {current_iter}: '
+                f'Signal {self.consecutive_plateau_count}/{self.patience} '
+                f'(change: {info["metric"]:.6f}, threshold: {self.threshold})'
+            )
+            # Trigger action when patience reached
+            if self.consecutive_plateau_count >= self.patience:
+                print(f'[Plateau Detection] Plateau confirmed, saving checkpoint...')
+                if self._save_checkpoint_fn is not None:
+                    self._save_checkpoint_fn()
+                    print(f'[Plateau Detection] Checkpoint saved')
+                else:
+                    print(f'[Plateau Detection] No callback registered')
+                self.consecutive_plateau_count = 0
+                return True
+        return False
+    def _check_plateau(self, current_iter: int) -> tuple:
+        """Check if current window shows plateau"""
+        # Current window average
+        current_window = self.loss_history[-self.window_size:]
+        current_avg = np.mean(current_window)
+        # Previous window average
+        previous_window = self.loss_history[-2*self.window_size:-self.window_size]
+        previous_avg = np.mean(previous_window)
+        change = previous_avg - current_avg
+        is_plateau = change < self.threshold
+        info = {
+            'iter': current_iter,
+            'metric': change,
+            'threshold': self.threshold,
+            'previous_avg': previous_avg,
+            'current_avg': current_avg,
+        }
+        return is_plateau, info

supervisely/nn/live_training/request_queue.py ADDED Viewed

@@ -0,0 +1,52 @@
+import queue
+import asyncio
+from typing import Any, Optional, List
+from enum import Enum
+class RequestType(Enum):
+    """Kinds of API requests carried by Request objects on the RequestQueue."""
+    # Each member's value is the string form of the request kind.
+    START = "start"
+    PREDICT = "predict"
+    ADD_SAMPLE = "add-sample"
+    STATUS = "status"
+class Request:
+    """A simple representation of an API request."""
+    def __init__(self, request_type: RequestType, data: Optional[dict] = None, future: Optional[asyncio.Future] = None):
+        self.type = request_type
+        self.data = data
+        self.future = future
+    def to_tuple(self):
+        return (self.type, self.data, self.future)
+class RequestQueue:
+    """Thread-safe queue for API requests."""
+    def __init__(self):
+        self._queue = queue.Queue()
+    def put(self, request_type: RequestType, data: Optional[dict] = None) -> asyncio.Future:
+        """Add request and return future for result."""
+        future = asyncio.Future()
+        self._queue.put(Request(request_type, data, future))
+        return future
+    def get_all(self) -> List[Request]:
+        """Get all pending requests (non-blocking)."""
+        requests = []
+        while not self._queue.empty():
+            try:
+                requests.append(self._queue.get_nowait())
+            except queue.Empty:
+                break
+        return requests
+    def is_empty(self) -> bool:
+        return self._queue.empty()
+    def get(self, timeout: float = None) -> Request:
+        """Get a single request from the queue."""
+        return self._queue.get(timeout=timeout)

supervisely/nn/model/model_api.py CHANGED Viewed

@@ -72,6 +72,15 @@ class ModelAPI:
         else:
             return self._post("get_custom_inference_settings", {})["settings"]
+    def get_tracking_settings(self):
+        # @TODO: botsort hardcoded
+        # Add dropdown selector for tracking algorithms later
+        if self.task_id is not None:
+            return self.api.task.send_request(self.task_id, "get_tracking_settings", {})["botsort"]
+        else:
+            return self._post("get_tracking_settings", {})["botsort"]
     def get_model_meta(self):
         if self.task_id is not None:
             return ProjectMeta.from_json(

supervisely/nn/model/prediction.py CHANGED Viewed

@@ -59,6 +59,7 @@ class Prediction:
         self.source = source
         if isinstance(annotation_json, Annotation):
             annotation_json = annotation_json.to_json()
         self.annotation_json = annotation_json
         self.model_meta = model_meta
         if isinstance(self.model_meta, dict):
@@ -157,7 +158,7 @@ class Prediction:
     @property
     def annotation(self) -> Annotation:
-        if self._annotation is None:
+        if self._annotation is None and self.annotation_json is not None:
             if self.model_meta is None:
                 raise ValueError("Model meta is not provided. Cannot create annotation.")
             model_meta = get_meta_from_annotation(self.annotation_json, self.model_meta)

supervisely 6.73.438__py3-none-any.whl → 6.73.513__py3-none-any.whl

supervisely 6.73.438py3-none-any.whl → 6.73.513py3-none-any.whl