PyPI - mlrun - Versions diffs - 1.4.0rc25__py3-none-any.whl → 1.5.0rc2__py3-none-any.whl - Mend

mlrun 1.4.0rc25-py3-none-any.whl → 1.5.0rc2-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of mlrun might be problematic. Click here for more details.

Files changed (184)

mlrun/__init__.py +2 -35
mlrun/__main__.py +3 -41
mlrun/api/api/api.py +6 -0
mlrun/api/api/endpoints/feature_store.py +0 -4
mlrun/api/api/endpoints/files.py +14 -2
mlrun/api/api/endpoints/frontend_spec.py +2 -1
mlrun/api/api/endpoints/functions.py +95 -59
mlrun/api/api/endpoints/grafana_proxy.py +9 -9
mlrun/api/api/endpoints/logs.py +17 -3
mlrun/api/api/endpoints/model_endpoints.py +3 -2
mlrun/api/api/endpoints/pipelines.py +1 -5
mlrun/api/api/endpoints/projects.py +88 -0
mlrun/api/api/endpoints/runs.py +48 -6
mlrun/api/api/endpoints/submit.py +2 -1
mlrun/api/api/endpoints/workflows.py +355 -0
mlrun/api/api/utils.py +3 -4
mlrun/api/crud/__init__.py +1 -0
mlrun/api/crud/client_spec.py +6 -2
mlrun/api/crud/feature_store.py +5 -0
mlrun/api/crud/model_monitoring/__init__.py +1 -0
mlrun/api/crud/model_monitoring/deployment.py +497 -0
mlrun/api/crud/model_monitoring/grafana.py +96 -42
mlrun/api/crud/model_monitoring/helpers.py +159 -0
mlrun/api/crud/model_monitoring/model_endpoints.py +202 -476
mlrun/api/crud/notifications.py +9 -4
mlrun/api/crud/pipelines.py +6 -11
mlrun/api/crud/projects.py +2 -2
mlrun/api/crud/runtime_resources.py +4 -3
mlrun/api/crud/runtimes/nuclio/helpers.py +5 -1
mlrun/api/crud/secrets.py +21 -0
mlrun/api/crud/workflows.py +352 -0
mlrun/api/db/base.py +16 -1
mlrun/api/db/init_db.py +2 -4
mlrun/api/db/session.py +1 -1
mlrun/api/db/sqldb/db.py +129 -31
mlrun/api/db/sqldb/models/models_mysql.py +15 -1
mlrun/api/db/sqldb/models/models_sqlite.py +16 -2
mlrun/api/launcher.py +38 -6
mlrun/api/main.py +3 -2
mlrun/api/rundb/__init__.py +13 -0
mlrun/{db → api/rundb}/sqldb.py +36 -84
mlrun/api/runtime_handlers/__init__.py +56 -0
mlrun/api/runtime_handlers/base.py +1247 -0
mlrun/api/runtime_handlers/daskjob.py +209 -0
mlrun/api/runtime_handlers/kubejob.py +37 -0
mlrun/api/runtime_handlers/mpijob.py +147 -0
mlrun/api/runtime_handlers/remotesparkjob.py +29 -0
mlrun/api/runtime_handlers/sparkjob.py +148 -0
mlrun/api/schemas/__init__.py +17 -6
mlrun/api/utils/builder.py +1 -4
mlrun/api/utils/clients/chief.py +14 -0
mlrun/api/utils/clients/iguazio.py +33 -33
mlrun/api/utils/clients/nuclio.py +2 -2
mlrun/api/utils/periodic.py +9 -2
mlrun/api/utils/projects/follower.py +14 -7
mlrun/api/utils/projects/leader.py +2 -1
mlrun/api/utils/projects/remotes/nop_follower.py +2 -2
mlrun/api/utils/projects/remotes/nop_leader.py +2 -2
mlrun/api/utils/runtimes/__init__.py +14 -0
mlrun/api/utils/runtimes/nuclio.py +43 -0
mlrun/api/utils/scheduler.py +98 -15
mlrun/api/utils/singletons/db.py +5 -1
mlrun/api/utils/singletons/project_member.py +4 -1
mlrun/api/utils/singletons/scheduler.py +1 -1
mlrun/artifacts/base.py +6 -6
mlrun/artifacts/dataset.py +4 -4
mlrun/artifacts/manager.py +2 -3
mlrun/artifacts/model.py +2 -2
mlrun/artifacts/plots.py +8 -8
mlrun/common/db/__init__.py +14 -0
mlrun/common/helpers.py +37 -0
mlrun/{mlutils → common/model_monitoring}/__init__.py +3 -2
mlrun/common/model_monitoring/helpers.py +69 -0
mlrun/common/schemas/__init__.py +13 -1
mlrun/common/schemas/auth.py +4 -1
mlrun/common/schemas/client_spec.py +1 -1
mlrun/common/schemas/function.py +17 -0
mlrun/common/schemas/model_monitoring/__init__.py +48 -0
mlrun/common/{model_monitoring.py → schemas/model_monitoring/constants.py} +11 -23
mlrun/common/schemas/model_monitoring/grafana.py +55 -0
mlrun/common/schemas/{model_endpoints.py → model_monitoring/model_endpoints.py} +32 -65
mlrun/common/schemas/notification.py +1 -0
mlrun/common/schemas/object.py +4 -0
mlrun/common/schemas/project.py +1 -0
mlrun/common/schemas/regex.py +1 -1
mlrun/common/schemas/runs.py +1 -8
mlrun/common/schemas/schedule.py +1 -8
mlrun/common/schemas/workflow.py +54 -0
mlrun/config.py +45 -42
mlrun/datastore/__init__.py +21 -0
mlrun/datastore/base.py +1 -1
mlrun/datastore/datastore.py +9 -0
mlrun/datastore/dbfs_store.py +168 -0
mlrun/datastore/helpers.py +18 -0
mlrun/datastore/sources.py +1 -0
mlrun/datastore/store_resources.py +2 -5
mlrun/datastore/v3io.py +1 -2
mlrun/db/__init__.py +4 -68
mlrun/db/base.py +12 -0
mlrun/db/factory.py +65 -0
mlrun/db/httpdb.py +175 -20
mlrun/db/nopdb.py +4 -2
mlrun/execution.py +4 -2
mlrun/feature_store/__init__.py +1 -0
mlrun/feature_store/api.py +1 -2
mlrun/feature_store/common.py +2 -1
mlrun/feature_store/feature_set.py +1 -11
mlrun/feature_store/feature_vector.py +340 -2
mlrun/feature_store/ingestion.py +5 -10
mlrun/feature_store/retrieval/base.py +118 -104
mlrun/feature_store/retrieval/dask_merger.py +17 -10
mlrun/feature_store/retrieval/job.py +4 -1
mlrun/feature_store/retrieval/local_merger.py +18 -18
mlrun/feature_store/retrieval/spark_merger.py +21 -14
mlrun/feature_store/retrieval/storey_merger.py +22 -16
mlrun/kfpops.py +3 -9
mlrun/launcher/base.py +57 -53
mlrun/launcher/client.py +5 -4
mlrun/launcher/factory.py +24 -13
mlrun/launcher/local.py +6 -6
mlrun/launcher/remote.py +4 -4
mlrun/lists.py +0 -11
mlrun/model.py +11 -17
mlrun/model_monitoring/__init__.py +2 -22
mlrun/model_monitoring/features_drift_table.py +1 -1
mlrun/model_monitoring/helpers.py +22 -210
mlrun/model_monitoring/model_endpoint.py +1 -1
mlrun/model_monitoring/model_monitoring_batch.py +127 -50
mlrun/model_monitoring/prometheus.py +219 -0
mlrun/model_monitoring/stores/__init__.py +16 -11
mlrun/model_monitoring/stores/kv_model_endpoint_store.py +95 -23
mlrun/model_monitoring/stores/models/mysql.py +47 -29
mlrun/model_monitoring/stores/models/sqlite.py +47 -29
mlrun/model_monitoring/stores/sql_model_endpoint_store.py +31 -19
mlrun/model_monitoring/{stream_processing_fs.py → stream_processing.py} +206 -64
mlrun/model_monitoring/tracking_policy.py +104 -0
mlrun/package/packager.py +6 -8
mlrun/package/packagers/default_packager.py +121 -10
mlrun/package/packagers/numpy_packagers.py +1 -1
mlrun/platforms/__init__.py +0 -2
mlrun/platforms/iguazio.py +0 -56
mlrun/projects/pipelines.py +53 -159
mlrun/projects/project.py +10 -37
mlrun/render.py +1 -1
mlrun/run.py +8 -124
mlrun/runtimes/__init__.py +6 -42
mlrun/runtimes/base.py +29 -1249
mlrun/runtimes/daskjob.py +2 -198
mlrun/runtimes/funcdoc.py +0 -9
mlrun/runtimes/function.py +25 -29
mlrun/runtimes/kubejob.py +5 -29
mlrun/runtimes/local.py +1 -1
mlrun/runtimes/mpijob/__init__.py +2 -2
mlrun/runtimes/mpijob/abstract.py +10 -1
mlrun/runtimes/mpijob/v1.py +0 -76
mlrun/runtimes/mpijob/v1alpha1.py +1 -74
mlrun/runtimes/nuclio.py +3 -2
mlrun/runtimes/pod.py +28 -18
mlrun/runtimes/remotesparkjob.py +1 -15
mlrun/runtimes/serving.py +14 -6
mlrun/runtimes/sparkjob/__init__.py +0 -1
mlrun/runtimes/sparkjob/abstract.py +4 -131
mlrun/runtimes/utils.py +0 -26
mlrun/serving/routers.py +7 -7
mlrun/serving/server.py +11 -8
mlrun/serving/states.py +7 -1
mlrun/serving/v2_serving.py +6 -6
mlrun/utils/helpers.py +23 -42
mlrun/utils/notifications/notification/__init__.py +4 -0
mlrun/utils/notifications/notification/webhook.py +61 -0
mlrun/utils/notifications/notification_pusher.py +5 -25
mlrun/utils/regex.py +7 -2
mlrun/utils/version/version.json +2 -2
{mlrun-1.4.0rc25.dist-info → mlrun-1.5.0rc2.dist-info}/METADATA +26 -25
{mlrun-1.4.0rc25.dist-info → mlrun-1.5.0rc2.dist-info}/RECORD +180 -158
{mlrun-1.4.0rc25.dist-info → mlrun-1.5.0rc2.dist-info}/WHEEL +1 -1
mlrun/mlutils/data.py +0 -160
mlrun/mlutils/models.py +0 -78
mlrun/mlutils/plots.py +0 -902
mlrun/utils/model_monitoring.py +0 -249
mlrun/{api/db/sqldb/session.py → common/db/sql_session.py} +0 -0
{mlrun-1.4.0rc25.dist-info → mlrun-1.5.0rc2.dist-info}/LICENSE +0 -0
{mlrun-1.4.0rc25.dist-info → mlrun-1.5.0rc2.dist-info}/entry_points.txt +0 -0
{mlrun-1.4.0rc25.dist-info → mlrun-1.5.0rc2.dist-info}/top_level.txt +0 -0

mlrun/api/crud/model_monitoring/model_endpoints.py CHANGED

@@ -12,29 +12,22 @@
 # See the License for the specific language governing permissions and
 # limitations under the License.
 #
-import json
 import os
 import typing
 import warnings
 import sqlalchemy.orm
-import mlrun.api.api.endpoints.functions
 import mlrun.api.api.utils
-import mlrun.api.crud.runtimes.nuclio.function
-import mlrun.api.utils.singletons.k8s
+import mlrun.api.crud.model_monitoring.deployment
+import mlrun.api.crud.model_monitoring.helpers
+import mlrun.api.crud.secrets
+import mlrun.api.rundb.sqldb
 import mlrun.artifacts
-import mlrun.common.model_monitoring as model_monitoring_constants
-import mlrun.common.schemas
-import mlrun.common.schemas.model_endpoints
-import mlrun.config
-import mlrun.datastore.store_resources
-import mlrun.errors
+import mlrun.common.helpers
+import mlrun.common.schemas.model_monitoring
 import mlrun.feature_store
-import mlrun.model_monitoring.helpers
-import mlrun.utils.helpers
-import mlrun.utils.model_monitoring
-import mlrun.utils.v3io_clients
 from mlrun.model_monitoring.stores import get_model_endpoint_store
 from mlrun.utils import logger
@@ -115,7 +108,8 @@ class ModelEndpoints:
             # Get labels from model object if not found in model endpoint object
             if not model_endpoint.spec.label_names and model_obj.spec.outputs:
                 model_label_names = [
-                    self._clean_feature_name(f.name) for f in model_obj.spec.outputs
+                    mlrun.api.crud.model_monitoring.helpers.clean_feature_name(f.name)
+                    for f in model_obj.spec.outputs
                 ]
                 model_endpoint.spec.label_names = model_label_names
@@ -126,7 +120,7 @@ class ModelEndpoints:
             # Create monitoring feature set if monitoring found in model endpoint object
             if (
                 model_endpoint.spec.monitoring_mode
-                == mlrun.common.model_monitoring.ModelMonitoringMode.enabled.value
+                == mlrun.common.schemas.model_monitoring.ModelMonitoringMode.enabled.value
             ):
                 monitoring_feature_set = self.create_monitoring_feature_set(
                     model_endpoint, model_obj, db_session, run_db
@@ -143,7 +137,7 @@ class ModelEndpoints:
             logger.info("Feature stats found, cleaning feature names")
             if model_endpoint.spec.feature_names:
                 # Validate that the length of feature_stats is equal to the length of feature_names and label_names
-                self._validate_length_features_and_labels(model_endpoint)
+                self._validate_length_features_and_labels(model_endpoint=model_endpoint)
                 # Clean feature names in both feature_stats and feature_names
             (
@@ -163,6 +157,9 @@ class ModelEndpoints:
         # Write the new model endpoint
         model_endpoint_store = get_model_endpoint_store(
             project=model_endpoint.metadata.project,
+            secret_provider=mlrun.api.crud.secrets.get_project_secret_provider(
+                project=model_endpoint.metadata.project
+            ),
         )
         model_endpoint_store.write_model_endpoint(endpoint=model_endpoint.flat_dict())
@@ -170,12 +167,51 @@ class ModelEndpoints:
         return model_endpoint
-    def create_monitoring_feature_set(
+    def patch_model_endpoint(
         self,
+        project: str,
+        endpoint_id: str,
+        attributes: dict,
+    ) -> mlrun.common.schemas.ModelEndpoint:
+        """
+        Update a model endpoint record with a given attributes.
+        :param project: The name of the project.
+        :param endpoint_id: The unique id of the model endpoint.
+        :param attributes: Dictionary of attributes that will be used for update the model endpoint. Note that the keys
+                           of the attributes dictionary should exist in the DB table. More details about the model
+                           endpoint available attributes can be found under
+                           :py:class:`~mlrun.common.schemas.ModelEndpoint`.
+        :return: A patched `ModelEndpoint` object.
+        """
+        # Generate a model endpoint store object and apply the update process
+        model_endpoint_store = get_model_endpoint_store(
+            project=project,
+            secret_provider=mlrun.api.crud.secrets.get_project_secret_provider(
+                project=project
+            ),
+        )
+        model_endpoint_store.update_model_endpoint(
+            endpoint_id=endpoint_id, attributes=attributes
+        )
+        logger.info("Model endpoint table updated", endpoint_id=endpoint_id)
+        # Get the patched model endpoint record
+        model_endpoint_record = model_endpoint_store.get_model_endpoint(
+            endpoint_id=endpoint_id,
+        )
+        return self._convert_into_model_endpoint_object(endpoint=model_endpoint_record)
+    @staticmethod
+    def create_monitoring_feature_set(
         model_endpoint: mlrun.common.schemas.ModelEndpoint,
         model_obj: mlrun.artifacts.ModelArtifact,
         db_session: sqlalchemy.orm.Session,
-        run_db: mlrun.db.sqldb.SQLDB,
+        run_db: mlrun.api.rundb.sqldb.SQLRunDB,
     ):
         """
         Create monitoring feature set with the relevant parquet target.
@@ -190,7 +226,12 @@ class ModelEndpoints:
         """
         # Define a new feature set
-        _, serving_function_name, _, _ = mlrun.utils.helpers.parse_versioned_object_uri(
+        (
+            _,
+            serving_function_name,
+            _,
+            _,
+        ) = mlrun.common.helpers.parse_versioned_object_uri(
             model_endpoint.spec.function_uri
         )
@@ -198,15 +239,15 @@ class ModelEndpoints:
         feature_set = mlrun.feature_store.FeatureSet(
             f"monitoring-{serving_function_name}-{model_name}",
-            entities=[model_monitoring_constants.EventFieldType.ENDPOINT_ID],
-            timestamp_key=model_monitoring_constants.EventFieldType.TIMESTAMP,
+            entities=[mlrun.common.schemas.model_monitoring.EventFieldType.ENDPOINT_ID],
+            timestamp_key=mlrun.common.schemas.model_monitoring.EventFieldType.TIMESTAMP,
             description=f"Monitoring feature set for endpoint: {model_endpoint.spec.model}",
         )
         feature_set.metadata.project = model_endpoint.metadata.project
         feature_set.metadata.labels = {
-            model_monitoring_constants.EventFieldType.ENDPOINT_ID: model_endpoint.metadata.uid,
-            model_monitoring_constants.EventFieldType.MODEL_CLASS: model_endpoint.spec.model_class,
+            mlrun.common.schemas.model_monitoring.EventFieldType.ENDPOINT_ID: model_endpoint.metadata.uid,
+            mlrun.common.schemas.model_monitoring.EventFieldType.MODEL_CLASS: model_endpoint.spec.model_class,
         }
         # Add features to the feature set according to the model object
@@ -239,14 +280,14 @@ class ModelEndpoints:
         # Define parquet target for this feature set
         parquet_path = (
-            self._get_monitoring_parquet_path(
+            mlrun.api.crud.model_monitoring.helpers.get_monitoring_parquet_path(
                 db_session=db_session, project=model_endpoint.metadata.project
             )
             + f"/key={model_endpoint.metadata.uid}"
         )
         parquet_target = mlrun.datastore.targets.ParquetTarget(
-            model_monitoring_constants.FileTargetKind.PARQUET, parquet_path
+            mlrun.common.schemas.model_monitoring.FileTargetKind.PARQUET, parquet_path
         )
         driver = mlrun.datastore.targets.get_target_driver(parquet_target, feature_set)
@@ -257,7 +298,6 @@ class ModelEndpoints:
         driver.update_resource_status("created")
         # Save the new feature set
-        feature_set._override_run_db(db_session)
         feature_set.save()
         logger.info(
             "Monitoring feature set created",
@@ -267,125 +307,6 @@ class ModelEndpoints:
         return feature_set
-    @staticmethod
-    def _get_monitoring_parquet_path(
-        db_session: sqlalchemy.orm.Session, project: str
-    ) -> str:
-        """Getting model monitoring parquet target for the current project. The parquet target path is based on the
-        project artifact path. If project artifact path is not defined, the parquet target path will be based on MLRun
-        artifact path.
-        :param db_session: A session that manages the current dialog with the database. Will be used in this function
-                           to get the project record from DB.
-        :param project:    Project name.
-        :return:           Monitoring parquet target path.
-        """
-        # Get the artifact path from the project record that was stored in the DB
-        project_obj = mlrun.api.crud.projects.Projects().get_project(
-            session=db_session, name=project
-        )
-        artifact_path = project_obj.spec.artifact_path
-        # Generate monitoring parquet path value
-        parquet_path = mlrun.mlconf.get_model_monitoring_file_target_path(
-            project=project,
-            kind=model_monitoring_constants.FileTargetKind.PARQUET,
-            target="offline",
-            artifact_path=artifact_path,
-        )
-        return parquet_path
-    @staticmethod
-    def _validate_length_features_and_labels(model_endpoint):
-        """
-        Validate that the length of feature_stats is equal to the length of `feature_names` and `label_names`
-        :param model_endpoint:    An object representing the model endpoint.
-        """
-        # Getting the length of label names, feature_names and feature_stats
-        len_of_label_names = (
-            0
-            if not model_endpoint.spec.label_names
-            else len(model_endpoint.spec.label_names)
-        )
-        len_of_feature_names = len(model_endpoint.spec.feature_names)
-        len_of_feature_stats = len(model_endpoint.status.feature_stats)
-        if len_of_feature_stats != len_of_feature_names + len_of_label_names:
-            raise mlrun.errors.MLRunInvalidArgumentError(
-                f"The length of model endpoint feature_stats is not equal to the "
-                f"length of model endpoint feature names and labels "
-                f"feature_stats({len_of_feature_stats}), "
-                f"feature_names({len_of_feature_names}),"
-                f"label_names({len_of_label_names}"
-            )
-    def _adjust_feature_names_and_stats(
-        self, model_endpoint
-    ) -> typing.Tuple[typing.Dict, typing.List]:
-        """
-        Create a clean matching version of feature names for both `feature_stats` and `feature_names`. Please note that
-        label names exist only in `feature_stats` and `label_names`.
-        :param model_endpoint:    An object representing the model endpoint.
-        :return: A tuple of:
-             [0] = Dictionary of feature stats with cleaned names
-             [1] = List of cleaned feature names
-        """
-        clean_feature_stats = {}
-        clean_feature_names = []
-        for i, (feature, stats) in enumerate(
-            model_endpoint.status.feature_stats.items()
-        ):
-            clean_name = self._clean_feature_name(feature)
-            clean_feature_stats[clean_name] = stats
-            # Exclude the label columns from the feature names
-            if (
-                model_endpoint.spec.label_names
-                and clean_name in model_endpoint.spec.label_names
-            ):
-                continue
-            clean_feature_names.append(clean_name)
-        return clean_feature_stats, clean_feature_names
-    def patch_model_endpoint(
-        self,
-        project: str,
-        endpoint_id: str,
-        attributes: dict,
-    ) -> mlrun.common.schemas.ModelEndpoint:
-        """
-        Update a model endpoint record with a given attributes.
-        :param project: The name of the project.
-        :param endpoint_id: The unique id of the model endpoint.
-        :param attributes: Dictionary of attributes that will be used for update the model endpoint. Note that the keys
-                           of the attributes dictionary should exist in the DB table. More details about the model
-                           endpoint available attributes can be found under
-                           :py:class:`~mlrun.common.schemas.ModelEndpoint`.
-        :return: A patched `ModelEndpoint` object.
-        """
-        # Generate a model endpoint store object and apply the update process
-        model_endpoint_store = get_model_endpoint_store(
-            project=project,
-        )
-        model_endpoint_store.update_model_endpoint(
-            endpoint_id=endpoint_id, attributes=attributes
-        )
-        logger.info("Model endpoint table updated", endpoint_id=endpoint_id)
-        # Get the patched model endpoint record
-        model_endpoint_record = model_endpoint_store.get_model_endpoint(
-            endpoint_id=endpoint_id,
-        )
-        return self._convert_into_model_endpoint_object(endpoint=model_endpoint_record)
     @staticmethod
     def delete_model_endpoint(
         project: str,
@@ -399,6 +320,9 @@ class ModelEndpoints:
         """
         model_endpoint_store = get_model_endpoint_store(
             project=project,
+            secret_provider=mlrun.api.crud.secrets.get_project_secret_provider(
+                project=project
+            ),
         )
         model_endpoint_store.delete_model_endpoint(endpoint_id=endpoint_id)
@@ -447,7 +371,11 @@ class ModelEndpoints:
         # Generate a model endpoint store object and get the model endpoint record as a dictionary
         model_endpoint_store = get_model_endpoint_store(
-            project=project, access_key=auth_info.data_session
+            project=project,
+            access_key=auth_info.data_session,
+            secret_provider=mlrun.api.crud.secrets.get_project_secret_provider(
+                project=project
+            ),
         )
         model_endpoint_record = model_endpoint_store.get_model_endpoint(
@@ -536,13 +464,15 @@ class ModelEndpoints:
         )
         # Initialize an empty model endpoints list
-        endpoint_list = mlrun.common.schemas.model_endpoints.ModelEndpointList(
-            endpoints=[]
-        )
+        endpoint_list = mlrun.common.schemas.ModelEndpointList(endpoints=[])
         # Generate a model endpoint store object and get a list of model endpoint dictionaries
         endpoint_store = get_model_endpoint_store(
-            access_key=auth_info.data_session, project=project
+            access_key=auth_info.data_session,
+            project=project,
+            secret_provider=mlrun.api.crud.secrets.get_project_secret_provider(
+                project=project
+            ),
         )
         endpoint_dictionary_list = endpoint_store.list_model_endpoints(
@@ -554,7 +484,6 @@ class ModelEndpoints:
         )
         for endpoint_dict in endpoint_dictionary_list:
             # Convert to `ModelEndpoint` object
             endpoint_obj = self._convert_into_model_endpoint_object(
                 endpoint=endpoint_dict
@@ -575,9 +504,116 @@ class ModelEndpoints:
         return endpoint_list
+    def verify_project_has_no_model_endpoints(self, project_name: str):
+        """Verify that there no  model endpoint records in the DB by trying to list all of the project model endpoints.
+        This method is usually being used during the process of deleting a project.
+        :param project_name: project name.
+        """
+        auth_info = mlrun.common.schemas.AuthInfo(
+            data_session=os.getenv("V3IO_ACCESS_KEY")
+        )
+        if not mlrun.mlconf.igz_version or not mlrun.mlconf.v3io_api:
+            return
+        endpoints = self.list_model_endpoints(auth_info, project_name)
+        if endpoints.endpoints:
+            raise mlrun.errors.MLRunPreconditionFailedError(
+                f"Project {project_name} can not be deleted since related resources found: model endpoints"
+            )
+    @staticmethod
+    def delete_model_endpoints_resources(project_name: str):
+        """
+        Delete all model endpoints resources.
+        :param project_name: The name of the project.
+        """
+        auth_info = mlrun.common.schemas.AuthInfo(
+            data_session=os.getenv("V3IO_ACCESS_KEY")
+        )
+        # We would ideally base on config.v3io_api but can't for backwards compatibility reasons,
+        # we're using the igz version heuristic
+        if not mlrun.mlconf.igz_version or not mlrun.mlconf.v3io_api:
+            return
+        # Generate a model endpoint store object and get a list of model endpoint dictionaries
+        endpoint_store = get_model_endpoint_store(
+            access_key=auth_info.data_session,
+            project=project_name,
+            secret_provider=mlrun.api.crud.secrets.get_project_secret_provider(
+                project=project_name
+            ),
+        )
+        endpoints = endpoint_store.list_model_endpoints()
+        # Delete model endpoints resources from databases using the model endpoint store object
+        endpoint_store.delete_model_endpoints_resources(endpoints)
+    @staticmethod
+    def _validate_length_features_and_labels(
+        model_endpoint: mlrun.common.schemas.ModelEndpoint,
+    ):
+        """
+        Validate that the length of feature_stats is equal to the length of `feature_names` and `label_names`
+        :param model_endpoint:    An object representing the model endpoint.
+        """
+        # Getting the length of label names, feature_names and feature_stats
+        len_of_label_names = (
+            0
+            if not model_endpoint.spec.label_names
+            else len(model_endpoint.spec.label_names)
+        )
+        len_of_feature_names = len(model_endpoint.spec.feature_names)
+        len_of_feature_stats = len(model_endpoint.status.feature_stats)
+        if len_of_feature_stats != len_of_feature_names + len_of_label_names:
+            raise mlrun.errors.MLRunInvalidArgumentError(
+                f"The length of model endpoint feature_stats is not equal to the "
+                f"length of model endpoint feature names and labels "
+                f"feature_stats({len_of_feature_stats}), "
+                f"feature_names({len_of_feature_names}),"
+                f"label_names({len_of_label_names}"
+            )
+    @staticmethod
+    def _adjust_feature_names_and_stats(
+        model_endpoint,
+    ) -> typing.Tuple[typing.Dict, typing.List]:
+        """
+        Create a clean matching version of feature names for both `feature_stats` and `feature_names`. Please note that
+        label names exist only in `feature_stats` and `label_names`.
+        :param model_endpoint:    An object representing the model endpoint.
+        :return: A tuple of:
+             [0] = Dictionary of feature stats with cleaned names
+             [1] = List of cleaned feature names
+        """
+        clean_feature_stats = {}
+        clean_feature_names = []
+        for i, (feature, stats) in enumerate(
+            model_endpoint.status.feature_stats.items()
+        ):
+            clean_name = mlrun.api.crud.model_monitoring.helpers.clean_feature_name(
+                feature
+            )
+            clean_feature_stats[clean_name] = stats
+            # Exclude the label columns from the feature names
+            if (
+                model_endpoint.spec.label_names
+                and clean_name in model_endpoint.spec.label_names
+            ):
+                continue
+            clean_feature_names.append(clean_name)
+        return clean_feature_stats, clean_feature_names
     @staticmethod
     def _add_real_time_metrics(
-        model_endpoint_store: mlrun.model_monitoring.stores.ModelEndpointStore,
+        model_endpoint_store: mlrun.model_monitoring.ModelEndpointStore,
         model_endpoint_object: mlrun.common.schemas.ModelEndpoint,
         metrics: typing.List[str] = None,
         start: str = "now-1h",
@@ -616,22 +652,23 @@ class ModelEndpoints:
         )
         if endpoint_metrics:
             model_endpoint_object.status.metrics[
-                model_monitoring_constants.EventKeyMetrics.REAL_TIME
+                mlrun.common.schemas.model_monitoring.EventKeyMetrics.REAL_TIME
             ] = endpoint_metrics
         return model_endpoint_object
+    @staticmethod
     def _convert_into_model_endpoint_object(
-        self, endpoint: typing.Dict[str, typing.Any], feature_analysis: bool = False
+        endpoint: typing.Dict[str, typing.Any], feature_analysis: bool = False
     ) -> mlrun.common.schemas.ModelEndpoint:
         """
         Create a `ModelEndpoint` object according to a provided model endpoint dictionary.
-        :param endpoint:         Dictinoary that represents a DB record of a model endpoint which need to be converted
+        :param endpoint:         Dictionary that represents a DB record of a model endpoint which need to be converted
                                  into a valid `ModelEndpoint` object.
         :param feature_analysis: When True, the base feature statistics and current feature statistics will be added to
                                  the output of the resulting object.
-        :return: A `ModelEndpoint` object.
+        :return: A `~mlrun.common.schemas.ModelEndpoint` object.
         """
         # Convert into `ModelEndpoint` object
@@ -639,332 +676,21 @@ class ModelEndpoints:
         # If feature analysis was applied, add feature stats and current stats to the model endpoint result
         if feature_analysis and endpoint_obj.spec.feature_names:
-            endpoint_features = self.get_endpoint_features(
-                feature_names=endpoint_obj.spec.feature_names,
-                feature_stats=endpoint_obj.status.feature_stats,
-                current_stats=endpoint_obj.status.current_stats,
+            endpoint_features = (
+                mlrun.api.crud.model_monitoring.deployment.get_endpoint_features(
+                    feature_names=endpoint_obj.spec.feature_names,
+                    feature_stats=endpoint_obj.status.feature_stats,
+                    current_stats=endpoint_obj.status.current_stats,
+                )
             )
             if endpoint_features:
                 endpoint_obj.status.features = endpoint_features
                 # Add the latest drift measures results (calculated by the model monitoring batch)
-                drift_measures = self._json_loads_if_not_none(
+                drift_measures = mlrun.api.crud.model_monitoring.helpers.json_loads_if_not_none(
                     endpoint.get(
-                        model_monitoring_constants.EventFieldType.DRIFT_MEASURES
+                        mlrun.common.schemas.model_monitoring.EventFieldType.DRIFT_MEASURES
                     )
                 )
                 endpoint_obj.status.drift_measures = drift_measures
         return endpoint_obj
-    @staticmethod
-    def get_endpoint_features(
-        feature_names: typing.List[str],
-        feature_stats: dict = None,
-        current_stats: dict = None,
-    ) -> typing.List[mlrun.common.schemas.Features]:
-        """
-        Getting a new list of features that exist in feature_names along with their expected (feature_stats) and
-        actual (current_stats) stats. The expected stats were calculated during the creation of the model endpoint,
-        usually based on the data from the Model Artifact. The actual stats are based on the results from the latest
-        model monitoring batch job.
-        param feature_names: List of feature names.
-        param feature_stats: Dictionary of feature stats that were stored during the creation of the model endpoint
-                             object.
-        param current_stats: Dictionary of the latest stats that were stored during the last run of the model monitoring
-                             batch job.
-        return: List of feature objects. Each feature has a name, weight, expected values, and actual values. More info
-                can be found under `mlrun.common.schemas.Features`.
-        """
-        # Initialize feature and current stats dictionaries
-        safe_feature_stats = feature_stats or {}
-        safe_current_stats = current_stats or {}
-        # Create feature object and add it to a general features list
-        features = []
-        for name in feature_names:
-            if feature_stats is not None and name not in feature_stats:
-                logger.warn("Feature missing from 'feature_stats'", name=name)
-            if current_stats is not None and name not in current_stats:
-                logger.warn("Feature missing from 'current_stats'", name=name)
-            f = mlrun.common.schemas.Features.new(
-                name, safe_feature_stats.get(name), safe_current_stats.get(name)
-            )
-            features.append(f)
-        return features
-    @staticmethod
-    def _json_loads_if_not_none(field: typing.Any) -> typing.Any:
-        return (
-            json.loads(field)
-            if field and field != "null" and field is not None
-            else None
-        )
-    def deploy_monitoring_functions(
-        self,
-        project: str,
-        model_monitoring_access_key: str,
-        db_session: sqlalchemy.orm.Session,
-        auth_info: mlrun.common.schemas.AuthInfo,
-        tracking_policy: mlrun.utils.model_monitoring.TrackingPolicy,
-    ):
-        """
-        Invoking monitoring deploying functions.
-        :param project:                     The name of the project.
-        :param model_monitoring_access_key: Access key to apply the model monitoring process.
-        :param db_session:                  A session that manages the current dialog with the database.
-        :param auth_info:                   The auth info of the request.
-        :param tracking_policy:             Model monitoring configurations.
-        """
-        self.deploy_model_monitoring_stream_processing(
-            project=project,
-            model_monitoring_access_key=model_monitoring_access_key,
-            db_session=db_session,
-            auth_info=auth_info,
-            tracking_policy=tracking_policy,
-        )
-        self.deploy_model_monitoring_batch_processing(
-            project=project,
-            model_monitoring_access_key=model_monitoring_access_key,
-            db_session=db_session,
-            auth_info=auth_info,
-            tracking_policy=tracking_policy,
-        )
-    def verify_project_has_no_model_endpoints(self, project_name: str):
-        auth_info = mlrun.common.schemas.AuthInfo(
-            data_session=os.getenv("V3IO_ACCESS_KEY")
-        )
-        if not mlrun.mlconf.igz_version or not mlrun.mlconf.v3io_api:
-            return
-        endpoints = self.list_model_endpoints(auth_info, project_name)
-        if endpoints.endpoints:
-            raise mlrun.errors.MLRunPreconditionFailedError(
-                f"Project {project_name} can not be deleted since related resources found: model endpoints"
-            )
-    @staticmethod
-    def delete_model_endpoints_resources(project_name: str):
-        """
-        Delete all model endpoints resources.
-        :param project_name: The name of the project.
-        """
-        auth_info = mlrun.common.schemas.AuthInfo(
-            data_session=os.getenv("V3IO_ACCESS_KEY")
-        )
-        # We would ideally base on config.v3io_api but can't for backwards compatibility reasons,
-        # we're using the igz version heuristic
-        if not mlrun.mlconf.igz_version or not mlrun.mlconf.v3io_api:
-            return
-        # Generate a model endpoint store object and get a list of model endpoint dictionaries
-        endpoint_store = get_model_endpoint_store(
-            access_key=auth_info.data_session, project=project_name
-        )
-        endpoints = endpoint_store.list_model_endpoints()
-        # Delete model endpoints resources from databases using the model endpoint store object
-        endpoint_store.delete_model_endpoints_resources(endpoints)
-    def deploy_model_monitoring_stream_processing(
-        self,
-        project: str,
-        model_monitoring_access_key: str,
-        db_session: sqlalchemy.orm.Session,
-        auth_info: mlrun.common.schemas.AuthInfo,
-        tracking_policy: mlrun.utils.model_monitoring.TrackingPolicy,
-    ):
-        """
-        Deploying model monitoring stream real time nuclio function. The goal of this real time function is
-        to monitor the log of the data stream. It is triggered when a new log entry is detected.
-        It processes the new events into statistics that are then written to statistics databases.
-        :param project:                     The name of the project.
-        :param model_monitoring_access_key: Access key to apply the model monitoring process.
-        :param db_session:                  A session that manages the current dialog with the database.
-        :param auth_info:                   The auth info of the request.
-        :param tracking_policy:             Model monitoring configurations.
-        """
-        logger.info(
-            "Checking if model monitoring stream is already deployed",
-            project=project,
-        )
-        try:
-            # validate that the model monitoring stream has not yet been deployed
-            mlrun.api.crud.runtimes.nuclio.function.get_nuclio_deploy_status(
-                name="model-monitoring-stream",
-                project=project,
-                tag="",
-                auth_info=auth_info,
-            )
-            logger.info(
-                "Detected model monitoring stream processing function already deployed",
-                project=project,
-            )
-            return
-        except mlrun.errors.MLRunNotFoundError:
-            logger.info(
-                "Deploying model monitoring stream processing function", project=project
-            )
-        # Get parquet target value for model monitoring stream function
-        parquet_target = self._get_monitoring_parquet_path(
-            db_session=db_session, project=project
-        )
-        fn = mlrun.model_monitoring.helpers.initial_model_monitoring_stream_processing_function(
-            project=project,
-            model_monitoring_access_key=model_monitoring_access_key,
-            tracking_policy=tracking_policy,
-            auth_info=auth_info,
-            parquet_target=parquet_target,
-        )
-        mlrun.api.api.endpoints.functions._build_function(
-            db_session=db_session, auth_info=auth_info, function=fn
-        )
-    def deploy_model_monitoring_batch_processing(
-        self,
-        project: str,
-        model_monitoring_access_key: str,
-        db_session: sqlalchemy.orm.Session,
-        auth_info: mlrun.common.schemas.AuthInfo,
-        tracking_policy: mlrun.utils.model_monitoring.TrackingPolicy,
-    ):
-        """
-        Deploying model monitoring batch job. The goal of this job is to identify drift in the data
-        based on the latest batch of events. By default, this job is executed on the hour every hour.
-        Note that if the monitoring batch job was already deployed then you will have to delete the
-        old monitoring batch job before deploying a new one.
-        :param project:                     The name of the project.
-        :param model_monitoring_access_key: Access key to apply the model monitoring process.
-        :param db_session:                  A session that manages the current dialog with the database.
-        :param auth_info:                   The auth info of the request.
-        :param tracking_policy:             Model monitoring configurations.
-        """
-        logger.info(
-            "Checking if model monitoring batch processing function is already deployed",
-            project=project,
-        )
-        # Try to list functions that named model monitoring batch
-        # to make sure that this job has not yet been deployed
-        function_list = mlrun.api.utils.singletons.db.get_db().list_functions(
-            session=db_session, name="model-monitoring-batch", project=project
-        )
-        if function_list:
-            logger.info(
-                "Detected model monitoring batch processing function already deployed",
-                project=project,
-            )
-            return
-        # Create a monitoring batch job function object
-        fn = mlrun.model_monitoring.helpers.get_model_monitoring_batch_function(
-            project=project,
-            model_monitoring_access_key=model_monitoring_access_key,
-            db_session=db_session,
-            auth_info=auth_info,
-            tracking_policy=tracking_policy,
-        )
-        # Get the function uri
-        function_uri = fn.save(versioned=True)
-        function_uri = function_uri.replace("db://", "")
-        task = mlrun.new_task(name="model-monitoring-batch", project=project)
-        task.spec.function = function_uri
-        # Apply batching interval params
-        interval_list = [
-            tracking_policy.default_batch_intervals.minute,
-            tracking_policy.default_batch_intervals.hour,
-            tracking_policy.default_batch_intervals.day,
-        ]
-        minutes, hours, days = self._get_batching_interval_param(interval_list)
-        batch_dict = {"minutes": minutes, "hours": hours, "days": days}
-        task.spec.parameters[
-            model_monitoring_constants.EventFieldType.BATCH_INTERVALS_DICT
-        ] = batch_dict
-        data = {
-            "task": task.to_dict(),
-            "schedule": self._convert_to_cron_string(
-                tracking_policy.default_batch_intervals
-            ),
-        }
-        logger.info(
-            "Deploying model monitoring batch processing function", project=project
-        )
-        # Add job schedule policy (every hour by default)
-        mlrun.api.api.utils.submit_run_sync(
-            db_session=db_session, auth_info=auth_info, data=data
-        )
-    @staticmethod
-    def _clean_feature_name(feature_name):
-        return feature_name.replace(" ", "_").replace("(", "").replace(")", "")
-    @staticmethod
-    def get_access_key(auth_info: mlrun.common.schemas.AuthInfo):
-        """
-        Getting access key from the current data session. This method is usually used to verify that the session
-        is valid and contains an access key.
-        param auth_info: The auth info of the request.
-        :return: Access key as a string.
-        """
-        access_key = auth_info.data_session
-        if not access_key:
-            raise mlrun.errors.MLRunBadRequestError("Data session is missing")
-        return access_key
-    @staticmethod
-    def _get_batching_interval_param(intervals_list: typing.List):
-        """Converting each value in the intervals list into a float number. None
-        Values will be converted into 0.0.
-        param intervals_list: A list of values based on the ScheduleCronTrigger expression. Note that at the moment
-                              it supports minutes, hours, and days. e.g. [0, '*/1', None] represents on the hour
-                              every hour.
-        :return: A tuple of:
-                 [0] = minutes interval as a float
-                 [1] = hours interval as a float
-                 [2] = days interval as a float
-        """
-        return tuple(
-            [
-                0.0
-                if isinstance(interval, (float, int)) or interval is None
-                else float(f"0{interval.partition('/')[-1]}")
-                for interval in intervals_list
-            ]
-        )
-    @staticmethod
-    def _convert_to_cron_string(
-        cron_trigger: mlrun.common.schemas.schedule.ScheduleCronTrigger,
-    ):
-        """Converting the batch interval `ScheduleCronTrigger` into a cron trigger expression"""
-        return "{} {} {} * *".format(
-            cron_trigger.minute, cron_trigger.hour, cron_trigger.day
-        ).replace("None", "*")

mlrun 1.4.0rc25__py3-none-any.whl → 1.5.0rc2__py3-none-any.whl

Potentially problematic release.

mlrun 1.4.0rc25-py3-none-any.whl → 1.5.0rc2-py3-none-any.whl