PyPI - mlrun - Versions diffs - 1.7.0rc17__py3-none-any.whl → 1.7.0rc18__py3-none-any.whl - Mend

mlrun 1.7.0rc17__py3-none-any.whl → 1.7.0rc18__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of mlrun might be problematic. Click here for more details.

Files changed (55) hide show

mlrun/alerts/alert.py +1 -1
mlrun/artifacts/manager.py +5 -1
mlrun/common/runtimes/constants.py +3 -0
mlrun/common/schemas/__init__.py +1 -1
mlrun/common/schemas/alert.py +31 -9
mlrun/common/schemas/client_spec.py +1 -0
mlrun/common/schemas/function.py +4 -0
mlrun/common/schemas/model_monitoring/__init__.py +3 -1
mlrun/common/schemas/model_monitoring/constants.py +20 -1
mlrun/common/schemas/model_monitoring/grafana.py +9 -5
mlrun/common/schemas/model_monitoring/model_endpoints.py +17 -6
mlrun/config.py +2 -0
mlrun/data_types/to_pandas.py +5 -5
mlrun/datastore/datastore.py +6 -2
mlrun/datastore/redis.py +2 -2
mlrun/datastore/s3.py +5 -0
mlrun/datastore/sources.py +111 -6
mlrun/datastore/targets.py +2 -2
mlrun/db/base.py +5 -1
mlrun/db/httpdb.py +22 -3
mlrun/db/nopdb.py +5 -1
mlrun/errors.py +6 -0
mlrun/feature_store/retrieval/conversion.py +5 -5
mlrun/feature_store/retrieval/job.py +3 -2
mlrun/feature_store/retrieval/spark_merger.py +2 -1
mlrun/frameworks/_dl_common/loggers/tensorboard_logger.py +2 -2
mlrun/model_monitoring/db/stores/base/store.py +16 -3
mlrun/model_monitoring/db/stores/sqldb/sql_store.py +44 -43
mlrun/model_monitoring/db/stores/v3io_kv/kv_store.py +190 -91
mlrun/model_monitoring/db/tsdb/__init__.py +35 -6
mlrun/model_monitoring/db/tsdb/base.py +25 -18
mlrun/model_monitoring/db/tsdb/tdengine/__init__.py +15 -0
mlrun/model_monitoring/db/tsdb/tdengine/schemas.py +207 -0
mlrun/model_monitoring/db/tsdb/tdengine/stream_graph_steps.py +45 -0
mlrun/model_monitoring/db/tsdb/tdengine/tdengine_connector.py +231 -0
mlrun/model_monitoring/db/tsdb/v3io/v3io_connector.py +73 -72
mlrun/model_monitoring/db/v3io_tsdb_reader.py +217 -16
mlrun/model_monitoring/helpers.py +32 -0
mlrun/model_monitoring/stream_processing.py +7 -4
mlrun/model_monitoring/writer.py +18 -13
mlrun/package/utils/_formatter.py +2 -2
mlrun/projects/project.py +33 -8
mlrun/render.py +8 -5
mlrun/runtimes/databricks_job/databricks_wrapper.py +1 -1
mlrun/utils/async_http.py +25 -5
mlrun/utils/helpers.py +20 -1
mlrun/utils/notifications/notification/slack.py +27 -7
mlrun/utils/notifications/notification_pusher.py +38 -40
mlrun/utils/version/version.json +2 -2
{mlrun-1.7.0rc17.dist-info → mlrun-1.7.0rc18.dist-info}/METADATA +7 -2
{mlrun-1.7.0rc17.dist-info → mlrun-1.7.0rc18.dist-info}/RECORD +55 -51
{mlrun-1.7.0rc17.dist-info → mlrun-1.7.0rc18.dist-info}/LICENSE +0 -0
{mlrun-1.7.0rc17.dist-info → mlrun-1.7.0rc18.dist-info}/WHEEL +0 -0
{mlrun-1.7.0rc17.dist-info → mlrun-1.7.0rc18.dist-info}/entry_points.txt +0 -0
{mlrun-1.7.0rc17.dist-info → mlrun-1.7.0rc18.dist-info}/top_level.txt +0 -0

mlrun/model_monitoring/db/stores/v3io_kv/kv_store.py CHANGED Viewed

@@ -15,23 +15,79 @@
 import json
 import os
 import typing
+from dataclasses import dataclass
 from http import HTTPStatus
 import v3io.dataplane
+import v3io.dataplane.output
 import v3io.dataplane.response
 import mlrun.common.model_monitoring.helpers
-import mlrun.common.schemas.model_monitoring as mm_constants
+import mlrun.common.schemas.model_monitoring as mm_schemas
 import mlrun.model_monitoring.db
 import mlrun.utils.v3io_clients
 from mlrun.utils import logger
 # Fields to encode before storing in the KV table or to decode after retrieving
 fields_to_encode_decode = [
-    mm_constants.EventFieldType.FEATURE_STATS,
-    mm_constants.EventFieldType.CURRENT_STATS,
+    mm_schemas.EventFieldType.FEATURE_STATS,
+    mm_schemas.EventFieldType.CURRENT_STATS,
 ]
+_METRIC_FIELDS: list[str] = [
+    mm_schemas.WriterEvent.APPLICATION_NAME,
+    mm_schemas.MetricData.METRIC_NAME,
+    mm_schemas.MetricData.METRIC_VALUE,
+    mm_schemas.WriterEvent.START_INFER_TIME,
+    mm_schemas.WriterEvent.END_INFER_TIME,
+]
+class SchemaField(typing.TypedDict):
+    name: str
+    type: str
+    nullable: bool
+@dataclass
+class SchemaParams:
+    key: str
+    fields: list[SchemaField]
+_RESULT_SCHEMA: list[SchemaField] = [
+    SchemaField(
+        name=mm_schemas.ResultData.RESULT_NAME,
+        type=mm_schemas.GrafanaColumnType.STRING,
+        nullable=False,
+    )
+]
+_METRIC_SCHEMA: list[SchemaField] = [
+    SchemaField(
+        name=mm_schemas.WriterEvent.APPLICATION_NAME,
+        type=mm_schemas.GrafanaColumnType.STRING,
+        nullable=False,
+    ),
+    SchemaField(
+        name=mm_schemas.MetricData.METRIC_NAME,
+        type=mm_schemas.GrafanaColumnType.STRING,
+        nullable=False,
+    ),
+]
+_KIND_TO_SCHEMA_PARAMS: dict[mm_schemas.WriterEventKind, SchemaParams] = {
+    mm_schemas.WriterEventKind.RESULT: SchemaParams(
+        key=mm_schemas.WriterEvent.APPLICATION_NAME, fields=_RESULT_SCHEMA
+    ),
+    mm_schemas.WriterEventKind.METRIC: SchemaParams(
+        key="metric_id", fields=_METRIC_SCHEMA
+    ),
+}
+_EXCLUDE_SCHEMA_FILTER_EXPRESSION = '__name!=".#schema"'
 class KVStoreBase(mlrun.model_monitoring.db.StoreBase):
     """
@@ -64,7 +120,7 @@ class KVStoreBase(mlrun.model_monitoring.db.StoreBase):
         self.client.kv.put(
             container=self.container,
             table_path=self.path,
-            key=endpoint[mm_constants.EventFieldType.UID],
+            key=endpoint[mm_schemas.EventFieldType.UID],
             attributes=endpoint,
         )
@@ -151,7 +207,7 @@ class KVStoreBase(mlrun.model_monitoring.db.StoreBase):
         """Getting path and container based on the model monitoring configurations"""
         path = mlrun.mlconf.model_endpoint_monitoring.store_prefixes.default.format(
             project=self.project,
-            kind=mlrun.common.schemas.ModelMonitoringStoreKinds.ENDPOINTS,
+            kind=mm_schemas.ModelMonitoringStoreKinds.ENDPOINTS,
         )
         (
             _,
@@ -217,11 +273,11 @@ class KVStoreBase(mlrun.model_monitoring.db.StoreBase):
         if uids is None:
             uids = []
             for item in items:
-                if mm_constants.EventFieldType.UID not in item:
+                if mm_schemas.EventFieldType.UID not in item:
                     # This is kept for backwards compatibility - in old versions the key column named endpoint_id
-                    uids.append(item[mm_constants.EventFieldType.ENDPOINT_ID])
+                    uids.append(item[mm_schemas.EventFieldType.ENDPOINT_ID])
                 else:
-                    uids.append(item[mm_constants.EventFieldType.UID])
+                    uids.append(item[mm_schemas.EventFieldType.UID])
         # Add each relevant model endpoint to the model endpoints list
         for endpoint_id in uids:
@@ -241,11 +297,11 @@ class KVStoreBase(mlrun.model_monitoring.db.StoreBase):
         # Delete model endpoint record from KV table
         for endpoint_dict in endpoints:
-            if mm_constants.EventFieldType.UID not in endpoint_dict:
+            if mm_schemas.EventFieldType.UID not in endpoint_dict:
                 # This is kept for backwards compatibility - in old versions the key column named endpoint_id
-                endpoint_id = endpoint_dict[mm_constants.EventFieldType.ENDPOINT_ID]
+                endpoint_id = endpoint_dict[mm_schemas.EventFieldType.ENDPOINT_ID]
             else:
-                endpoint_id = endpoint_dict[mm_constants.EventFieldType.UID]
+                endpoint_id = endpoint_dict[mm_schemas.EventFieldType.UID]
             self.delete_model_endpoint(
                 endpoint_id,
             )
@@ -268,11 +324,19 @@ class KVStoreBase(mlrun.model_monitoring.db.StoreBase):
                 raise_for_status=v3io.dataplane.RaiseForStatus.never,
             )
+    @staticmethod
+    def _get_results_table_path(endpoint_id: str) -> str:
+        return endpoint_id
+    @staticmethod
+    def _get_metrics_table_path(endpoint_id: str) -> str:
+        return f"{endpoint_id}_metrics"
     def write_application_event(
         self,
         event: dict[str, typing.Any],
-        kind: mm_constants.WriterEventKind = mm_constants.WriterEventKind.RESULT,
-    ):
+        kind: mm_schemas.WriterEventKind = mm_schemas.WriterEventKind.RESULT,
+    ) -> None:
         """
         Write a new application event in the target table.
@@ -281,66 +345,63 @@ class KVStoreBase(mlrun.model_monitoring.db.StoreBase):
                       object.
         :param kind: The type of the event, can be either "result" or "metric".
         """
-        if kind == mm_constants.WriterEventKind.METRIC:
-            # TODO : Implement the logic for writing metrics to KV
-            return
-        endpoint_id = event.pop(mm_constants.WriterEvent.ENDPOINT_ID)
-        app_name = event.pop(mm_constants.WriterEvent.APPLICATION_NAME)
-        metric_name = event.pop(mm_constants.ResultData.RESULT_NAME)
-        attributes = {metric_name: json.dumps(event)}
-        v3io_monitoring_apps_container = self.get_v3io_monitoring_apps_container(
-            project_name=self.project
-        )
+        container = self.get_v3io_monitoring_apps_container(project_name=self.project)
+        endpoint_id = event.pop(mm_schemas.WriterEvent.ENDPOINT_ID)
+        if kind == mm_schemas.WriterEventKind.METRIC:
+            table_path = self._get_metrics_table_path(endpoint_id)
+            key = f"{event[mm_schemas.WriterEvent.APPLICATION_NAME]}.{event[mm_schemas.MetricData.METRIC_NAME]}"
+            attributes = {event_key: event[event_key] for event_key in _METRIC_FIELDS}
+        elif kind == mm_schemas.WriterEventKind.RESULT:
+            table_path = self._get_results_table_path(endpoint_id)
+            key = event.pop(mm_schemas.WriterEvent.APPLICATION_NAME)
+            metric_name = event.pop(mm_schemas.ResultData.RESULT_NAME)
+            attributes = {metric_name: json.dumps(event)}
+        else:
+            raise ValueError(f"Invalid {kind = }")
         self.client.kv.update(
-            container=v3io_monitoring_apps_container,
-            table_path=endpoint_id,
-            key=app_name,
+            container=container,
+            table_path=table_path,
+            key=key,
             attributes=attributes,
         )
         schema_file = self.client.kv.new_cursor(
-            container=v3io_monitoring_apps_container,
-            table_path=endpoint_id,
+            container=container,
+            table_path=table_path,
             filter_expression='__name==".#schema"',
         )
         if not schema_file.all():
             logger.info(
-                "Generate a new V3IO KV schema file",
-                container=v3io_monitoring_apps_container,
-                endpoint_id=endpoint_id,
+                "Generating a new V3IO KV schema file",
+                container=container,
+                table_path=table_path,
+            )
+            self._generate_kv_schema(
+                container=container, table_path=table_path, kind=kind
             )
-            self._generate_kv_schema(endpoint_id, v3io_monitoring_apps_container)
-        logger.info("Updated V3IO KV successfully", key=app_name)
+        logger.info("Updated V3IO KV successfully", key=key)
     def _generate_kv_schema(
-        self, endpoint_id: str, v3io_monitoring_apps_container: str
-    ):
+        self, *, container: str, table_path: str, kind: mm_schemas.WriterEventKind
+    ) -> None:
         """Generate V3IO KV schema file which will be used by the model monitoring applications dashboard in Grafana."""
-        fields = [
-            {
-                "name": mm_constants.ResultData.RESULT_NAME,
-                "type": "string",
-                "nullable": False,
-            }
-        ]
+        schema_params = _KIND_TO_SCHEMA_PARAMS[kind]
         res = self.client.kv.create_schema(
-            container=v3io_monitoring_apps_container,
-            table_path=endpoint_id,
-            key=mm_constants.WriterEvent.APPLICATION_NAME,
-            fields=fields,
+            container=container,
+            table_path=table_path,
+            key=schema_params.key,
+            fields=schema_params.fields,
         )
         if res.status_code != HTTPStatus.OK:
             raise mlrun.errors.MLRunBadRequestError(
-                f"Couldn't infer schema for endpoint {endpoint_id} which is required for Grafana dashboards"
+                f"Couldn't infer schema for endpoint {table_path} which is required for Grafana dashboards"
             )
         else:
-            logger.info(
-                "Generated V3IO KV schema successfully", endpoint_id=endpoint_id
-            )
+            logger.info("Generated V3IO KV schema successfully", table_path=table_path)
     def get_last_analyzed(self, endpoint_id: str, application_name: str) -> int:
         """
@@ -361,7 +422,7 @@ class KVStoreBase(mlrun.model_monitoring.db.StoreBase):
                 table_path=endpoint_id,
                 key=application_name,
             )
-            return data.output.item[mm_constants.SchedulingKeys.LAST_ANALYZED]
+            return data.output.item[mm_schemas.SchedulingKeys.LAST_ANALYZED]
         except v3io.dataplane.response.HttpResponseError as err:
             logger.debug("Error while getting last analyzed time", err=err)
             raise mlrun.errors.MLRunNotFoundError(
@@ -386,7 +447,7 @@ class KVStoreBase(mlrun.model_monitoring.db.StoreBase):
             ),
             table_path=endpoint_id,
             key=application_name,
-            attributes={mm_constants.SchedulingKeys.LAST_ANALYZED: last_analyzed},
+            attributes={mm_schemas.SchedulingKeys.LAST_ANALYZED: last_analyzed},
         )
     def _generate_tsdb_paths(self) -> tuple[str, str]:
@@ -399,7 +460,7 @@ class KVStoreBase(mlrun.model_monitoring.db.StoreBase):
         full_path = (
             mlrun.mlconf.model_endpoint_monitoring.store_prefixes.default.format(
                 project=self.project,
-                kind=mlrun.common.schemas.ModelMonitoringStoreKinds.EVENTS,
+                kind=mm_schemas.ModelMonitoringStoreKinds.EVENTS,
             )
         )
@@ -495,8 +556,8 @@ class KVStoreBase(mlrun.model_monitoring.db.StoreBase):
         # Apply top_level filter (remove endpoints that considered a child of a router)
         if top_level:
             filter_expression.append(
-                f"(endpoint_type=='{str(mm_constants.EndpointType.NODE_EP.value)}' "
-                f"OR  endpoint_type=='{str(mm_constants.EndpointType.ROUTER.value)}')"
+                f"(endpoint_type=='{str(mm_schemas.EndpointType.NODE_EP.value)}' "
+                f"OR  endpoint_type=='{str(mm_schemas.EndpointType.ROUTER.value)}')"
             )
         return " AND ".join(filter_expression)
@@ -516,30 +577,30 @@ class KVStoreBase(mlrun.model_monitoring.db.StoreBase):
         # Validate default value for `error_count`
         # For backwards compatibility reasons, we validate that the model endpoint includes the `error_count` key
         if (
-            mm_constants.EventFieldType.ERROR_COUNT in endpoint
-            and endpoint[mm_constants.EventFieldType.ERROR_COUNT] == "null"
+            mm_schemas.EventFieldType.ERROR_COUNT in endpoint
+            and endpoint[mm_schemas.EventFieldType.ERROR_COUNT] == "null"
         ):
-            endpoint[mm_constants.EventFieldType.ERROR_COUNT] = "0"
+            endpoint[mm_schemas.EventFieldType.ERROR_COUNT] = "0"
         # Validate default value for `metrics`
         # For backwards compatibility reasons, we validate that the model endpoint includes the `metrics` key
         if (
-            mm_constants.EventFieldType.METRICS in endpoint
-            and endpoint[mm_constants.EventFieldType.METRICS] == "null"
+            mm_schemas.EventFieldType.METRICS in endpoint
+            and endpoint[mm_schemas.EventFieldType.METRICS] == "null"
         ):
-            endpoint[mm_constants.EventFieldType.METRICS] = json.dumps(
+            endpoint[mm_schemas.EventFieldType.METRICS] = json.dumps(
                 {
-                    mm_constants.EventKeyMetrics.GENERIC: {
-                        mm_constants.EventLiveStats.LATENCY_AVG_1H: 0,
-                        mm_constants.EventLiveStats.PREDICTIONS_PER_SECOND: 0,
+                    mm_schemas.EventKeyMetrics.GENERIC: {
+                        mm_schemas.EventLiveStats.LATENCY_AVG_1H: 0,
+                        mm_schemas.EventLiveStats.PREDICTIONS_PER_SECOND: 0,
                     }
                 }
             )
         # Validate key `uid` instead of `endpoint_id`
         # For backwards compatibility reasons, we replace the `endpoint_id` with `uid` which is the updated key name
-        if mm_constants.EventFieldType.ENDPOINT_ID in endpoint:
-            endpoint[mm_constants.EventFieldType.UID] = endpoint[
-                mm_constants.EventFieldType.ENDPOINT_ID
+        if mm_schemas.EventFieldType.ENDPOINT_ID in endpoint:
+            endpoint[mm_schemas.EventFieldType.UID] = endpoint[
+                mm_schemas.EventFieldType.ENDPOINT_ID
             ]
     @staticmethod
@@ -566,57 +627,95 @@ class KVStoreBase(mlrun.model_monitoring.db.StoreBase):
     def _get_monitoring_schedules_container(project_name: str) -> str:
         return f"users/pipelines/{project_name}/monitoring-schedules/functions"
-    def _extract_metrics_from_items(
+    def _extract_results_from_items(
         self, app_items: list[dict[str, str]]
-    ) -> list[mm_constants.ModelEndpointMonitoringMetric]:
-        metrics: list[mm_constants.ModelEndpointMonitoringMetric] = []
+    ) -> list[mm_schemas.ModelEndpointMonitoringMetric]:
+        """Assuming .#schema items are filtered out"""
+        metrics: list[mm_schemas.ModelEndpointMonitoringMetric] = []
         for app_item in app_items:
-            # See https://www.iguazio.com/docs/latest-release/services/data-layer/reference/system-attributes/#sys-attr-__name
             app_name = app_item.pop("__name")
-            if app_name == ".#schema":
-                continue
             for result_name in app_item:
                 metrics.append(
-                    mm_constants.ModelEndpointMonitoringMetric(
+                    mm_schemas.ModelEndpointMonitoringMetric(
                         project=self.project,
                         app=app_name,
-                        type=mm_constants.ModelEndpointMonitoringMetricType.RESULT,
+                        type=mm_schemas.ModelEndpointMonitoringMetricType.RESULT,
                         name=result_name,
-                        full_name=mlrun.common.schemas.model_monitoring.model_endpoints._compose_full_name(
+                        full_name=mm_schemas.model_endpoints._compose_full_name(
                             project=self.project, app=app_name, name=result_name
                         ),
                     )
                 )
         return metrics
+    def _extract_metrics_from_items(
+        self, result_items: list[dict[str, str]]
+    ) -> list[mm_schemas.ModelEndpointMonitoringMetric]:
+        metrics: list[mm_schemas.ModelEndpointMonitoringMetric] = []
+        logger.debug("Result items", result_items=result_items)
+        for result_item in result_items:
+            app = result_item[mm_schemas.WriterEvent.APPLICATION_NAME]
+            name = result_item[mm_schemas.MetricData.METRIC_NAME]
+            metrics.append(
+                mm_schemas.ModelEndpointMonitoringMetric(
+                    project=self.project,
+                    app=app,
+                    type=mm_schemas.ModelEndpointMonitoringMetricType.METRIC,
+                    name=name,
+                    full_name=mm_schemas.model_endpoints._compose_full_name(
+                        project=self.project,
+                        app=app,
+                        name=name,
+                        type=mm_schemas.ModelEndpointMonitoringMetricType.METRIC,
+                    ),
+                )
+            )
+        return metrics
     def get_model_endpoint_metrics(
-        self, endpoint_id: str
-    ) -> list[mm_constants.ModelEndpointMonitoringMetric]:
+        self, endpoint_id: str, type: mm_schemas.ModelEndpointMonitoringMetricType
+    ) -> list[mm_schemas.ModelEndpointMonitoringMetric]:
         """Get model monitoring results and metrics on the endpoint"""
-        metrics: list[mm_constants.ModelEndpointMonitoringMetric] = []
+        metrics: list[mm_schemas.ModelEndpointMonitoringMetric] = []
         container = self.get_v3io_monitoring_apps_container(self.project)
+        if type == mm_schemas.ModelEndpointMonitoringMetricType.METRIC:
+            table_path = self._get_metrics_table_path(endpoint_id)
+            items_extractor = self._extract_metrics_from_items
+        elif type == mm_schemas.ModelEndpointMonitoringMetricType.RESULT:
+            table_path = self._get_results_table_path(endpoint_id)
+            items_extractor = self._extract_results_from_items
+        else:
+            raise ValueError(f"Invalid metric {type = }")
+        def scan(
+            marker: typing.Optional[str] = None,
+        ) -> v3io.dataplane.response.Response:
+            # TODO: Use AIO client: `v3io.aio.dataplane.client.Client`
+            return self.client.kv.scan(
+                container=container,
+                table_path=table_path,
+                marker=marker,
+                filter_expression=_EXCLUDE_SCHEMA_FILTER_EXPRESSION,
+            )
         try:
-            response = self.client.kv.scan(container=container, table_path=endpoint_id)
+            response = scan()
         except v3io.dataplane.response.HttpResponseError as err:
             if err.status_code == HTTPStatus.NOT_FOUND:
                 logger.warning(
-                    "Attempt getting metrics and results - no data. Check the "
+                    f"Attempt getting {type}s - no data. Check the "
                     "project name, endpoint, or wait for the applications to start.",
                     container=container,
-                    table_path=endpoint_id,
+                    table_path=table_path,
                 )
                 return []
             raise
         while True:
-            metrics.extend(self._extract_metrics_from_items(response.output.items))
-            if response.output.last:
+            output = typing.cast(v3io.dataplane.output.GetItemsOutput, response.output)
+            metrics.extend(items_extractor(output.items))
+            if output.last:
                 break
-            # TODO: Use AIO client: `v3io.aio.dataplane.client.Client`
-            response = self.client.kv.scan(
-                container=container,
-                table_path=endpoint_id,
-                marker=response.output.next_marker,
-            )
+            response = scan(marker=output.next_marker)
         return metrics

mlrun/model_monitoring/db/tsdb/__init__.py CHANGED Viewed

@@ -25,6 +25,7 @@ class ObjectTSDBFactory(enum.Enum):
     """Enum class to handle the different TSDB connector type values for storing real time metrics"""
     v3io_tsdb = "v3io-tsdb"
+    tdengine = "tdengine"
     def to_tsdb_connector(self, project: str, **kwargs) -> TSDBConnector:
         """
@@ -43,6 +44,13 @@ class ObjectTSDBFactory(enum.Enum):
             return V3IOTSDBConnector(project=project, **kwargs)
+        # Assuming TDEngine connector if connector type is not V3IO TSDB.
+        # Update these lines once there are more than two connector types.
+        from .tdengine.tdengine_connector import TDEngineConnector
+        return TDEngineConnector(project=project, **kwargs)
     @classmethod
     def _missing_(cls, value: typing.Any):
         """A lookup function to handle an invalid value.
@@ -54,18 +62,39 @@ class ObjectTSDBFactory(enum.Enum):
         )
-def get_tsdb_connector(project: str, **kwargs) -> TSDBConnector:
+def get_tsdb_connector(
+    project: str,
+    tsdb_connector_type: str = "",
+    secret_provider: typing.Callable = None,
+    **kwargs,
+) -> TSDBConnector:
     """
-    Get the TSDB connector type based on mlrun.config.model_endpoint_monitoring.tsdb_connector_type.
+    Get TSDB connector object.
     :param project: The name of the project.
+    :param tsdb_connector_type: The type of the TSDB connector. See mlrun.model_monitoring.db.tsdb.ObjectTSDBFactory
+                                for available options.
+    :param secret_provider: An optional secret provider to get the connection string secret.
     :return: `TSDBConnector` object. The main goal of this object is to handle different operations on the
              TSDB connector such as updating drift metrics or write application record result.
     """
-    # Get store type value from ObjectTSDBFactory enum class
-    tsdb_connector_type = ObjectTSDBFactory(
-        mlrun.mlconf.model_endpoint_monitoring.tsdb_connector_type
+    tsdb_connection_string = mlrun.model_monitoring.helpers.get_tsdb_connection_string(
+        secret_provider=secret_provider
     )
+    if tsdb_connection_string and tsdb_connection_string.startswith("taosws"):
+        tsdb_connector_type = mlrun.common.schemas.model_monitoring.TSDBTarget.TDEngine
+        kwargs["connection_string"] = tsdb_connection_string
+    # Set the default TSDB connector type if no connection has been set
+    tsdb_connector_type = (
+        tsdb_connector_type
+        or mlrun.mlconf.model_endpoint_monitoring.tsdb_connector_type
+    )
+    # Get connector type value from ObjectTSDBFactory enum class
+    tsdb_connector_factory = ObjectTSDBFactory(tsdb_connector_type)
     # Convert into TSDB connector object
-    return tsdb_connector_type.to_tsdb_connector(project=project, **kwargs)
+    return tsdb_connector_factory.to_tsdb_connector(project=project, **kwargs)

mlrun/model_monitoring/db/tsdb/base.py CHANGED Viewed

@@ -14,6 +14,7 @@
 #
+import typing
 from abc import ABC
 import pandas as pd
@@ -22,6 +23,8 @@ import mlrun.common.schemas.model_monitoring.constants as mm_constants
 class TSDBConnector(ABC):
+    type: str = ""
     def __init__(self, project: str):
         """
         Initialize a new TSDB connector. The connector is used to interact with the TSDB and store monitoring data.
@@ -57,13 +60,12 @@ class TSDBConnector(ABC):
         self,
         event: dict,
         kind: mm_constants.WriterEventKind = mm_constants.WriterEventKind.RESULT,
-    ):
+    ) -> None:
         """
         Write a single application or metric to TSDB.
         :raise mlrun.errors.MLRunRuntimeError: If an error occurred while writing the event.
         """
-        pass
     def delete_tsdb_resources(self):
         """
@@ -76,8 +78,8 @@ class TSDBConnector(ABC):
         self,
         endpoint_id: str,
         metrics: list[str],
-        start: str = "now-1h",
-        end: str = "now",
+        start: str,
+        end: str,
     ) -> dict[str, list[tuple[str, float]]]:
         """
         Getting real time metrics from the TSDB. There are pre-defined metrics for model endpoints such as
@@ -101,35 +103,40 @@ class TSDBConnector(ABC):
     def get_records(
         self,
         table: str,
-        columns: list[str] = None,
+        start: str,
+        end: str,
+        columns: typing.Optional[list[str]] = None,
         filter_query: str = "",
-        start: str = "now-1h",
-        end: str = "now",
     ) -> pd.DataFrame:
         """
         Getting records from TSDB data collection.
         :param table:            Table name, e.g. 'metrics', 'app_results'.
+        :param start:            The start time of the metrics.
+                                 If using V3IO, can be represented by a string containing an RFC 3339 time, a  Unix
+                                 timestamp in milliseconds, a relative time (`'now'` or `'now-[0-9]+[mhd]'`, where
+                                 `m` = minutes, `h` = hours, `'d'` = days, and `'s'` = seconds), or 0 for the earliest
+                                 time.
+                                 If using TDEngine, can be represented by datetime.
+        :param end:              The end time of the metrics.
+                                 If using V3IO, can be represented by a string containing an RFC 3339 time, a  Unix
+                                 timestamp in milliseconds, a relative time (`'now'` or `'now-[0-9]+[mhd]'`, where
+                                 `m` = minutes, `h` = hours, `'d'` = days, and `'s'` = seconds), or 0 for the earliest
+                                 time.
+                                 If using TDEngine, can be represented by datetime.
         :param columns:          Columns to include in the result.
         :param filter_query:     Optional filter expression as a string. The filter structure depends on the TSDB
                                  connector type.
-        :param start:            The start time of the metrics. Can be represented by a string containing an RFC
-                                 3339 time, a  Unix timestamp in milliseconds, a relative time (`'now'` or
-                                 `'now-[0-9]+[mhd]'`, where `m` = minutes, `h` = hours, `'d'` = days, and `'s'`
-                                 = seconds), or 0 for the earliest time.
-        :param end:              The end time of the metrics. Can be represented by a string containing an RFC
-                                 3339 time, a  Unix timestamp in milliseconds, a relative time (`'now'` or
-                                 `'now-[0-9]+[mhd]'`, where `m` = minutes, `h` = hours, `'d'` = days, and `'s'`
-                                 = seconds), or 0 for the earliest time.
         :return: DataFrame with the provided attributes from the data collection.
         :raise:  MLRunNotFoundError if the provided table wasn't found.
         """
         pass
-    def create_tsdb_application_tables(self):
+    def create_tables(self) -> None:
         """
-        Create the application tables using the TSDB connector. At the moment we support 2 types of application tables:
+        Create the TSDB tables using the TSDB connector. At the moment we support 3 types of tables:
         - app_results: a detailed result that includes status, kind, extra data, etc.
         - metrics: a basic key value that represents a numeric metric.
+        - predictions: latency of each prediction.
         """
-        pass

mlrun/model_monitoring/db/tsdb/tdengine/__init__.py ADDED Viewed

@@ -0,0 +1,15 @@
+# Copyright 2024 Iguazio
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+from .tdengine_connector import TDEngineConnector

mlrun 1.7.0rc17__py3-none-any.whl → 1.7.0rc18__py3-none-any.whl

Potentially problematic release.

mlrun 1.7.0rc17__py3-none-any.whl → 1.7.0rc18__py3-none-any.whl