PyPI - mlrun - Versions diffs - 1.3.2rc1__py3-none-any.whl → 1.3.2rc2__py3-none-any.whl - Mend

mlrun 1.3.2rc1__py3-none-any.whl → 1.3.2rc2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of mlrun might be problematic. Click here for more details.

Files changed (93) hide show

mlrun/api/api/deps.py +14 -1
mlrun/api/api/endpoints/frontend_spec.py +0 -2
mlrun/api/api/endpoints/functions.py +15 -27
mlrun/api/api/endpoints/grafana_proxy.py +435 -74
mlrun/api/api/endpoints/healthz.py +5 -18
mlrun/api/api/endpoints/model_endpoints.py +33 -37
mlrun/api/api/utils.py +6 -13
mlrun/api/crud/__init__.py +14 -16
mlrun/api/crud/logs.py +5 -7
mlrun/api/crud/model_monitoring/__init__.py +2 -2
mlrun/api/crud/model_monitoring/model_endpoint_store.py +847 -0
mlrun/api/crud/model_monitoring/model_endpoints.py +105 -328
mlrun/api/crud/pipelines.py +2 -3
mlrun/api/db/sqldb/models/models_mysql.py +52 -19
mlrun/api/db/sqldb/models/models_sqlite.py +52 -19
mlrun/api/db/sqldb/session.py +19 -26
mlrun/api/schemas/__init__.py +2 -0
mlrun/api/schemas/constants.py +0 -13
mlrun/api/schemas/frontend_spec.py +0 -1
mlrun/api/schemas/model_endpoints.py +38 -195
mlrun/api/schemas/schedule.py +2 -2
mlrun/api/utils/clients/log_collector.py +5 -0
mlrun/builder.py +9 -41
mlrun/config.py +1 -76
mlrun/data_types/__init__.py +1 -6
mlrun/data_types/data_types.py +1 -3
mlrun/datastore/__init__.py +2 -9
mlrun/datastore/sources.py +20 -25
mlrun/datastore/store_resources.py +1 -1
mlrun/datastore/targets.py +34 -67
mlrun/datastore/utils.py +4 -26
mlrun/db/base.py +2 -4
mlrun/db/filedb.py +5 -13
mlrun/db/httpdb.py +32 -64
mlrun/db/sqldb.py +2 -4
mlrun/errors.py +0 -5
mlrun/execution.py +0 -2
mlrun/feature_store/api.py +8 -24
mlrun/feature_store/feature_set.py +6 -28
mlrun/feature_store/feature_vector.py +0 -2
mlrun/feature_store/ingestion.py +11 -8
mlrun/feature_store/retrieval/base.py +43 -271
mlrun/feature_store/retrieval/dask_merger.py +153 -55
mlrun/feature_store/retrieval/job.py +3 -12
mlrun/feature_store/retrieval/local_merger.py +130 -48
mlrun/feature_store/retrieval/spark_merger.py +125 -126
mlrun/features.py +2 -7
mlrun/model_monitoring/constants.py +6 -48
mlrun/model_monitoring/helpers.py +35 -118
mlrun/model_monitoring/model_monitoring_batch.py +260 -293
mlrun/model_monitoring/stream_processing_fs.py +253 -220
mlrun/platforms/iguazio.py +0 -33
mlrun/projects/project.py +72 -34
mlrun/runtimes/base.py +0 -5
mlrun/runtimes/daskjob.py +0 -2
mlrun/runtimes/function.py +3 -29
mlrun/runtimes/kubejob.py +15 -39
mlrun/runtimes/local.py +45 -7
mlrun/runtimes/mpijob/abstract.py +0 -2
mlrun/runtimes/mpijob/v1.py +0 -2
mlrun/runtimes/pod.py +0 -2
mlrun/runtimes/remotesparkjob.py +0 -2
mlrun/runtimes/serving.py +0 -6
mlrun/runtimes/sparkjob/abstract.py +2 -39
mlrun/runtimes/sparkjob/spark3job.py +0 -2
mlrun/serving/__init__.py +1 -2
mlrun/serving/routers.py +35 -35
mlrun/serving/server.py +12 -22
mlrun/serving/states.py +30 -162
mlrun/serving/v2_serving.py +10 -13
mlrun/utils/clones.py +1 -1
mlrun/utils/model_monitoring.py +96 -122
mlrun/utils/version/version.json +2 -2
{mlrun-1.3.2rc1.dist-info → mlrun-1.3.2rc2.dist-info}/METADATA +27 -23
{mlrun-1.3.2rc1.dist-info → mlrun-1.3.2rc2.dist-info}/RECORD +79 -92
mlrun/api/crud/model_monitoring/grafana.py +0 -427
mlrun/datastore/spark_udf.py +0 -40
mlrun/model_monitoring/__init__.py +0 -44
mlrun/model_monitoring/common.py +0 -112
mlrun/model_monitoring/model_endpoint.py +0 -141
mlrun/model_monitoring/stores/__init__.py +0 -106
mlrun/model_monitoring/stores/kv_model_endpoint_store.py +0 -448
mlrun/model_monitoring/stores/model_endpoint_store.py +0 -147
mlrun/model_monitoring/stores/models/__init__.py +0 -23
mlrun/model_monitoring/stores/models/base.py +0 -18
mlrun/model_monitoring/stores/models/mysql.py +0 -100
mlrun/model_monitoring/stores/models/sqlite.py +0 -98
mlrun/model_monitoring/stores/sql_model_endpoint_store.py +0 -375
mlrun/utils/db.py +0 -52
{mlrun-1.3.2rc1.dist-info → mlrun-1.3.2rc2.dist-info}/LICENSE +0 -0
{mlrun-1.3.2rc1.dist-info → mlrun-1.3.2rc2.dist-info}/WHEEL +0 -0
{mlrun-1.3.2rc1.dist-info → mlrun-1.3.2rc2.dist-info}/entry_points.txt +0 -0
{mlrun-1.3.2rc1.dist-info → mlrun-1.3.2rc2.dist-info}/top_level.txt +0 -0

mlrun/api/api/deps.py CHANGED Viewed

@@ -70,7 +70,20 @@ def verify_api_state(request: Request):
             "memory-reports",
         ]
         if not any(enabled_endpoint in path for enabled_endpoint in enabled_endpoints):
-            message = mlrun.api.schemas.APIStates.description(mlrun.mlconf.httpdb.state)
+            message = (
+                "API is waiting for migrations to be triggered. Send POST request to /api/operations/migrations to"
+                " trigger it"
+            )
+            if (
+                mlrun.mlconf.httpdb.state
+                == mlrun.api.schemas.APIStates.migrations_in_progress
+            ):
+                message = "Migrations are in progress"
+            elif (
+                mlrun.mlconf.httpdb.state
+                == mlrun.api.schemas.APIStates.migrations_failed
+            ):
+                message = "Migrations failed, API can't be started"
             raise mlrun.errors.MLRunPreconditionFailedError(message)

mlrun/api/api/endpoints/frontend_spec.py CHANGED Viewed

@@ -24,7 +24,6 @@ import mlrun.builder
 import mlrun.runtimes
 import mlrun.runtimes.utils
 import mlrun.utils.helpers
-from mlrun.api.api.utils import get_allowed_path_prefixes_list
 from mlrun.config import config
 from mlrun.platforms import is_iguazio_session_cookie
@@ -83,7 +82,6 @@ def get_frontend_spec(
         default_function_pod_resources=mlrun.mlconf.default_function_pod_resources.to_dict(),
         default_function_preemption_mode=mlrun.mlconf.function_defaults.preemption_mode,
         feature_store_data_prefixes=config.feature_store.data_prefixes.to_dict(),
-        allowed_artifact_path_prefixes_list=get_allowed_path_prefixes_list(),
         # ce_mode is deprecated, we will use the full ce config instead and ce_mode will be removed in 1.6.0
         ce_mode=config.ce.mode,
         ce=config.ce.to_dict(),

mlrun/api/api/endpoints/functions.py CHANGED Viewed

@@ -40,7 +40,6 @@ import mlrun.api.utils.auth.verifier
 import mlrun.api.utils.background_tasks
 import mlrun.api.utils.clients.chief
 import mlrun.api.utils.singletons.project_member
-import mlrun.model_monitoring.constants
 from mlrun.api.api import deps
 from mlrun.api.api.utils import get_run_db_instance, log_and_raise, log_path
 from mlrun.api.crud.secrets import Secrets, SecretsClientType
@@ -631,33 +630,25 @@ def _build_function(
                 try:
                     if fn.spec.track_models:
                         logger.info("Tracking enabled, initializing model monitoring")
-                        # Generating model monitoring access key
-                        model_monitoring_access_key = None
-                        if not mlrun.mlconf.is_ce_mode():
-                            model_monitoring_access_key = _process_model_monitoring_secret(
-                                db_session,
-                                fn.metadata.project,
-                                mlrun.model_monitoring.constants.ProjectSecretKeys.ACCESS_KEY,
-                            )
-                            if mlrun.utils.model_monitoring.get_stream_path(
-                                project=fn.metadata.project
-                            ).startswith("v3io://"):
-                                # Initialize model monitoring V3IO stream
-                                _create_model_monitoring_stream(
-                                    project=fn.metadata.project,
-                                    function=fn,
-                                )
+                        _init_serving_function_stream_args(fn=fn)
+                        # get model monitoring access key
+                        model_monitoring_access_key = _process_model_monitoring_secret(
+                            db_session,
+                            fn.metadata.project,
+                            "MODEL_MONITORING_ACCESS_KEY",
+                        )
+                        # initialize model monitoring stream
+                        _create_model_monitoring_stream(project=fn.metadata.project)
                         if fn.spec.tracking_policy:
-                            # Convert to `TrackingPolicy` object as `fn.spec.tracking_policy` is provided as a dict
+                            # convert to `TrackingPolicy` object as `fn.spec.tracking_policy` is provided as a dict
                             fn.spec.tracking_policy = (
                                 mlrun.utils.model_monitoring.TrackingPolicy.from_dict(
                                     fn.spec.tracking_policy
                                 )
                             )
                         else:
-                            # Initialize tracking policy with default values
+                            # initialize tracking policy with default values
                             fn.spec.tracking_policy = (
                                 mlrun.utils.model_monitoring.TrackingPolicy()
                             )
@@ -665,10 +656,10 @@ def _build_function(
                         # deploy both model monitoring stream and model monitoring batch job
                         mlrun.api.crud.ModelEndpoints().deploy_monitoring_functions(
                             project=fn.metadata.project,
+                            model_monitoring_access_key=model_monitoring_access_key,
                             db_session=db_session,
                             auth_info=auth_info,
                             tracking_policy=fn.spec.tracking_policy,
-                            model_monitoring_access_key=model_monitoring_access_key,
                         )
                 except Exception as exc:
                     logger.warning(
@@ -819,12 +810,9 @@ async def _get_function_status(data, auth_info: mlrun.api.schemas.AuthInfo):
         )
-def _create_model_monitoring_stream(project: str, function):
-    _init_serving_function_stream_args(fn=function)
-    stream_path = mlrun.mlconf.get_model_monitoring_file_target_path(
-        project=project, kind="events"
+def _create_model_monitoring_stream(project: str):
+    stream_path = config.model_endpoint_monitoring.store_prefixes.default.format(
+        project=project, kind="stream"
     )
     _, container, stream_path = parse_model_endpoint_store_prefix(stream_path)

mlrun/api/api/endpoints/grafana_proxy.py CHANGED Viewed

@@ -13,37 +13,36 @@
 # limitations under the License.
 #
 import asyncio
-import warnings
+import json
 from http import HTTPStatus
-from typing import List, Union
+from typing import Any, Dict, List, Optional, Set, Union
+import numpy as np
+import pandas as pd
 from fastapi import APIRouter, Depends, Request, Response
 from fastapi.concurrency import run_in_threadpool
 from sqlalchemy.orm import Session
 import mlrun.api.crud
-import mlrun.api.crud.model_monitoring.grafana
 import mlrun.api.schemas
 import mlrun.api.utils.auth.verifier
-import mlrun.model_monitoring
 from mlrun.api.api import deps
-from mlrun.api.schemas import GrafanaTable, GrafanaTimeSeriesTarget
+from mlrun.api.schemas import (
+    GrafanaColumn,
+    GrafanaDataPoint,
+    GrafanaNumberColumn,
+    GrafanaTable,
+    GrafanaTimeSeriesTarget,
+    ProjectsFormat,
+)
+from mlrun.api.utils.singletons.project_member import get_project_member
+from mlrun.errors import MLRunBadRequestError
+from mlrun.utils import config, logger
+from mlrun.utils.model_monitoring import parse_model_endpoint_store_prefix
+from mlrun.utils.v3io_clients import get_frames_client
 router = APIRouter()
-NAME_TO_SEARCH_FUNCTION_DICTIONARY = {
-    "list_projects": mlrun.api.crud.model_monitoring.grafana.grafana_list_projects,
-}
-NAME_TO_QUERY_FUNCTION_DICTIONARY = {
-    "list_endpoints": mlrun.api.crud.model_monitoring.grafana.grafana_list_endpoints,
-    "individual_feature_analysis": mlrun.api.crud.model_monitoring.grafana.grafana_individual_feature_analysis,
-    "overall_feature_analysis": mlrun.api.crud.model_monitoring.grafana.grafana_overall_feature_analysis,
-    "incoming_features": mlrun.api.crud.model_monitoring.grafana.grafana_incoming_features,
-}
-SUPPORTED_QUERY_FUNCTIONS = set(NAME_TO_QUERY_FUNCTION_DICTIONARY.keys())
-SUPPORTED_SEARCH_FUNCTIONS = set(NAME_TO_SEARCH_FUNCTION_DICTIONARY)
 @router.get("/grafana-proxy/model-endpoints", status_code=HTTPStatus.OK.value)
 def grafana_proxy_model_endpoints_check_connection(
@@ -53,95 +52,457 @@ def grafana_proxy_model_endpoints_check_connection(
     Root of grafana proxy for the model-endpoints API, used for validating the model-endpoints data source
     connectivity.
     """
-    if not mlrun.mlconf.is_ce_mode():
-        mlrun.api.crud.ModelEndpoints().get_access_key(auth_info)
+    mlrun.api.crud.ModelEndpoints().get_access_key(auth_info)
     return Response(status_code=HTTPStatus.OK.value)
-@router.post("/grafana-proxy/model-endpoints/search", response_model=List[str])
-async def grafana_proxy_model_endpoints_search(
+@router.post(
+    "/grafana-proxy/model-endpoints/query",
+    response_model=List[Union[GrafanaTable, GrafanaTimeSeriesTarget]],
+)
+async def grafana_proxy_model_endpoints_query(
     request: Request,
     auth_info: mlrun.api.schemas.AuthInfo = Depends(deps.authenticate_request),
-    db_session: Session = Depends(deps.get_db_session),
-) -> List[str]:
+) -> List[Union[GrafanaTable, GrafanaTimeSeriesTarget]]:
     """
-    Search route for model-endpoints grafana proxy API, used for creating an interface between grafana queries and
+    Query route for model-endpoints grafana proxy API, used for creating an interface between grafana queries and
     model-endpoints logic.
     This implementation requires passing target_endpoint query parameter in order to dispatch different
     model-endpoint monitoring functions.
-    :param request:    An api request with the required target and parameters.
-    :param auth_info:  The auth info of the request.
-    :param db_session: A session that manages the current dialog with the database.
-    :return: List of results. e.g. list of available project names.
     """
-    if not mlrun.mlconf.is_ce_mode():
-        mlrun.api.crud.ModelEndpoints().get_access_key(auth_info)
     body = await request.json()
-    query_parameters = mlrun.api.crud.model_monitoring.grafana.parse_search_parameters(
-        body
-    )
-    mlrun.api.crud.model_monitoring.grafana.validate_query_parameters(
-        query_parameters, SUPPORTED_SEARCH_FUNCTIONS
-    )
+    query_parameters = _parse_query_parameters(body)
+    _validate_query_parameters(query_parameters, SUPPORTED_QUERY_FUNCTIONS)
+    query_parameters = _drop_grafana_escape_chars(query_parameters)
     # At this point everything is validated and we can access everything that is needed without performing all previous
     # checks again.
     target_endpoint = query_parameters["target_endpoint"]
-    function = NAME_TO_SEARCH_FUNCTION_DICTIONARY[target_endpoint]
+    function = NAME_TO_QUERY_FUNCTION_DICTIONARY[target_endpoint]
     if asyncio.iscoroutinefunction(function):
-        result = await function(db_session, auth_info, query_parameters)
-    else:
-        result = await run_in_threadpool(
-            function, db_session, auth_info, query_parameters
-        )
+        return await function(body, query_parameters, auth_info)
+    result = await run_in_threadpool(function, body, query_parameters, auth_info)
     return result
-@router.post(
-    "/grafana-proxy/model-endpoints/query",
-    response_model=List[Union[GrafanaTable, GrafanaTimeSeriesTarget]],
-)
-async def grafana_proxy_model_endpoints_query(
+@router.post("/grafana-proxy/model-endpoints/search", response_model=List[str])
+async def grafana_proxy_model_endpoints_search(
     request: Request,
     auth_info: mlrun.api.schemas.AuthInfo = Depends(deps.authenticate_request),
-) -> List[Union[GrafanaTable, GrafanaTimeSeriesTarget]]:
+    db_session: Session = Depends(deps.get_db_session),
+) -> List[str]:
     """
-    Query route for model-endpoints grafana proxy API, used for creating an interface between grafana queries and
+    Search route for model-endpoints grafana proxy API, used for creating an interface between grafana queries and
     model-endpoints logic.
     This implementation requires passing target_endpoint query parameter in order to dispatch different
     model-endpoint monitoring functions.
     """
+    mlrun.api.crud.ModelEndpoints().get_access_key(auth_info)
+    body = await request.json()
+    query_parameters = _parse_search_parameters(body)
+    _validate_query_parameters(query_parameters, SUPPORTED_SEARCH_FUNCTIONS)
+    # At this point everything is validated and we can access everything that is needed without performing all previous
+    # checks again.
+    target_endpoint = query_parameters["target_endpoint"]
+    function = NAME_TO_SEARCH_FUNCTION_DICTIONARY[target_endpoint]
+    if asyncio.iscoroutinefunction(function):
+        return await function(db_session, auth_info)
+    result = await run_in_threadpool(function, db_session, auth_info)
+    return result
-    warnings.warn(
-        "This api is deprecated in 1.3.1 and will be removed in 1.5.0. "
-        "Please update grafana model monitoring dashboards that use a different data source",
-        # TODO: remove in 1.5.0
-        FutureWarning,
+def grafana_list_projects(
+    db_session: Session, auth_info: mlrun.api.schemas.AuthInfo
+) -> List[str]:
+    projects_output = get_project_member().list_projects(
+        db_session, format_=ProjectsFormat.name_only, leader_session=auth_info.session
     )
+    return projects_output.projects
-    body = await request.json()
-    query_parameters = mlrun.api.crud.model_monitoring.grafana.parse_query_parameters(
-        body
+async def grafana_list_endpoints(
+    body: Dict[str, Any],
+    query_parameters: Dict[str, str],
+    auth_info: mlrun.api.schemas.AuthInfo,
+) -> List[GrafanaTable]:
+    project = query_parameters.get("project")
+    # Filters
+    model = query_parameters.get("model", None)
+    function = query_parameters.get("function", None)
+    labels = query_parameters.get("labels", "")
+    labels = labels.split(",") if labels else []
+    # Metrics to include
+    metrics = query_parameters.get("metrics", "")
+    metrics = metrics.split(",") if metrics else []
+    # Time range for metrics
+    start = body.get("rangeRaw", {}).get("start", "now-1h")
+    end = body.get("rangeRaw", {}).get("end", "now")
+    if project:
+        await mlrun.api.utils.auth.verifier.AuthVerifier().query_project_permissions(
+            project,
+            mlrun.api.schemas.AuthorizationAction.read,
+            auth_info,
+        )
+    endpoint_list = await run_in_threadpool(
+        mlrun.api.crud.ModelEndpoints().list_model_endpoints,
+        auth_info=auth_info,
+        project=project,
+        model=model,
+        function=function,
+        labels=labels,
+        metrics=metrics,
+        start=start,
+        end=end,
+    )
+    allowed_endpoints = await mlrun.api.utils.auth.verifier.AuthVerifier().filter_project_resources_by_permissions(
+        mlrun.api.schemas.AuthorizationResourceTypes.model_endpoint,
+        endpoint_list.endpoints,
+        lambda _endpoint: (
+            _endpoint.metadata.project,
+            _endpoint.metadata.uid,
+        ),
+        auth_info,
+    )
+    endpoint_list.endpoints = allowed_endpoints
+    columns = [
+        GrafanaColumn(text="endpoint_id", type="string"),
+        GrafanaColumn(text="endpoint_function", type="string"),
+        GrafanaColumn(text="endpoint_model", type="string"),
+        GrafanaColumn(text="endpoint_model_class", type="string"),
+        GrafanaColumn(text="first_request", type="time"),
+        GrafanaColumn(text="last_request", type="time"),
+        GrafanaColumn(text="accuracy", type="number"),
+        GrafanaColumn(text="error_count", type="number"),
+        GrafanaColumn(text="drift_status", type="number"),
+    ]
+    metric_columns = []
+    found_metrics = set()
+    for endpoint in endpoint_list.endpoints:
+        if endpoint.status.metrics is not None:
+            for key in endpoint.status.metrics.keys():
+                if key not in found_metrics:
+                    found_metrics.add(key)
+                    metric_columns.append(GrafanaColumn(text=key, type="number"))
+    columns = columns + metric_columns
+    table = GrafanaTable(columns=columns)
+    for endpoint in endpoint_list.endpoints:
+        row = [
+            endpoint.metadata.uid,
+            endpoint.spec.function_uri,
+            endpoint.spec.model,
+            endpoint.spec.model_class,
+            endpoint.status.first_request,
+            endpoint.status.last_request,
+            endpoint.status.accuracy,
+            endpoint.status.error_count,
+            endpoint.status.drift_status,
+        ]
+        if endpoint.status.metrics is not None and metric_columns:
+            for metric_column in metric_columns:
+                row.append(endpoint.status.metrics[metric_column.text])
+        table.add_row(*row)
+    return [table]
+async def grafana_individual_feature_analysis(
+    body: Dict[str, Any],
+    query_parameters: Dict[str, str],
+    auth_info: mlrun.api.schemas.AuthInfo,
+):
+    endpoint_id = query_parameters.get("endpoint_id")
+    project = query_parameters.get("project")
+    await mlrun.api.utils.auth.verifier.AuthVerifier().query_project_resource_permissions(
+        mlrun.api.schemas.AuthorizationResourceTypes.model_endpoint,
+        project,
+        endpoint_id,
+        mlrun.api.schemas.AuthorizationAction.read,
+        auth_info,
+    )
+    endpoint = await run_in_threadpool(
+        mlrun.api.crud.ModelEndpoints().get_model_endpoint,
+        auth_info=auth_info,
+        project=project,
+        endpoint_id=endpoint_id,
+        feature_analysis=True,
+    )
+    # Load JSON data from KV, make sure not to fail if a field is missing
+    feature_stats = endpoint.status.feature_stats or {}
+    current_stats = endpoint.status.current_stats or {}
+    drift_measures = endpoint.status.drift_measures or {}
+    table = GrafanaTable(
+        columns=[
+            GrafanaColumn(text="feature_name", type="string"),
+            GrafanaColumn(text="actual_min", type="number"),
+            GrafanaColumn(text="actual_mean", type="number"),
+            GrafanaColumn(text="actual_max", type="number"),
+            GrafanaColumn(text="expected_min", type="number"),
+            GrafanaColumn(text="expected_mean", type="number"),
+            GrafanaColumn(text="expected_max", type="number"),
+            GrafanaColumn(text="tvd", type="number"),
+            GrafanaColumn(text="hellinger", type="number"),
+            GrafanaColumn(text="kld", type="number"),
+        ]
     )
-    mlrun.api.crud.model_monitoring.grafana.validate_query_parameters(
-        query_parameters, SUPPORTED_QUERY_FUNCTIONS
+    for feature, base_stat in feature_stats.items():
+        current_stat = current_stats.get(feature, {})
+        drift_measure = drift_measures.get(feature, {})
+        table.add_row(
+            feature,
+            current_stat.get("min"),
+            current_stat.get("mean"),
+            current_stat.get("max"),
+            base_stat.get("min"),
+            base_stat.get("mean"),
+            base_stat.get("max"),
+            drift_measure.get("tvd"),
+            drift_measure.get("hellinger"),
+            drift_measure.get("kld"),
+        )
+    return [table]
+async def grafana_overall_feature_analysis(
+    body: Dict[str, Any],
+    query_parameters: Dict[str, str],
+    auth_info: mlrun.api.schemas.AuthInfo,
+):
+    endpoint_id = query_parameters.get("endpoint_id")
+    project = query_parameters.get("project")
+    await mlrun.api.utils.auth.verifier.AuthVerifier().query_project_resource_permissions(
+        mlrun.api.schemas.AuthorizationResourceTypes.model_endpoint,
+        project,
+        endpoint_id,
+        mlrun.api.schemas.AuthorizationAction.read,
+        auth_info,
+    )
+    endpoint = await run_in_threadpool(
+        mlrun.api.crud.ModelEndpoints().get_model_endpoint,
+        auth_info=auth_info,
+        project=project,
+        endpoint_id=endpoint_id,
+        feature_analysis=True,
+    )
+    table = GrafanaTable(
+        columns=[
+            GrafanaNumberColumn(text="tvd_sum"),
+            GrafanaNumberColumn(text="tvd_mean"),
+            GrafanaNumberColumn(text="hellinger_sum"),
+            GrafanaNumberColumn(text="hellinger_mean"),
+            GrafanaNumberColumn(text="kld_sum"),
+            GrafanaNumberColumn(text="kld_mean"),
+        ]
     )
-    query_parameters = (
-        mlrun.api.crud.model_monitoring.grafana.drop_grafana_escape_chars(
-            query_parameters
+    if endpoint.status.drift_measures:
+        table.add_row(
+            endpoint.status.drift_measures.get("tvd_sum"),
+            endpoint.status.drift_measures.get("tvd_mean"),
+            endpoint.status.drift_measures.get("hellinger_sum"),
+            endpoint.status.drift_measures.get("hellinger_mean"),
+            endpoint.status.drift_measures.get("kld_sum"),
+            endpoint.status.drift_measures.get("kld_mean"),
         )
+    return [table]
+async def grafana_incoming_features(
+    body: Dict[str, Any],
+    query_parameters: Dict[str, str],
+    auth_info: mlrun.api.schemas.AuthInfo,
+):
+    endpoint_id = query_parameters.get("endpoint_id")
+    project = query_parameters.get("project")
+    start = body.get("rangeRaw", {}).get("from", "now-1h")
+    end = body.get("rangeRaw", {}).get("to", "now")
+    await mlrun.api.utils.auth.verifier.AuthVerifier().query_project_resource_permissions(
+        mlrun.api.schemas.AuthorizationResourceTypes.model_endpoint,
+        project,
+        endpoint_id,
+        mlrun.api.schemas.AuthorizationAction.read,
+        auth_info,
     )
-    # At this point everything is validated and we can access everything that is needed without performing all previous
-    # checks again.
-    target_endpoint = query_parameters["target_endpoint"]
-    function = NAME_TO_QUERY_FUNCTION_DICTIONARY[target_endpoint]
-    if asyncio.iscoroutinefunction(function):
-        return await function(body, query_parameters, auth_info)
-    result = await run_in_threadpool(function, body, query_parameters, auth_info)
-    return result
+    endpoint = await run_in_threadpool(
+        mlrun.api.crud.ModelEndpoints().get_model_endpoint,
+        auth_info=auth_info,
+        project=project,
+        endpoint_id=endpoint_id,
+    )
+    time_series = []
+    feature_names = endpoint.spec.feature_names
+    if not feature_names:
+        logger.warn(
+            "'feature_names' is either missing or not initialized in endpoint record",
+            endpoint_id=endpoint.metadata.uid,
+        )
+        return time_series
+    path = config.model_endpoint_monitoring.store_prefixes.default.format(
+        project=project, kind=mlrun.api.schemas.ModelMonitoringStoreKinds.EVENTS
+    )
+    _, container, path = parse_model_endpoint_store_prefix(path)
+    client = get_frames_client(
+        token=auth_info.data_session,
+        address=config.v3io_framesd,
+        container=container,
+    )
+    data: pd.DataFrame = await run_in_threadpool(
+        client.read,
+        backend="tsdb",
+        table=path,
+        columns=feature_names,
+        filter=f"endpoint_id=='{endpoint_id}'",
+        start=start,
+        end=end,
+    )
+    data.drop(["endpoint_id"], axis=1, inplace=True, errors="ignore")
+    data.index = data.index.astype(np.int64) // 10**6
+    for feature, indexed_values in data.to_dict().items():
+        target = GrafanaTimeSeriesTarget(target=feature)
+        for index, value in indexed_values.items():
+            data_point = GrafanaDataPoint(value=float(value), timestamp=index)
+            target.add_data_point(data_point)
+        time_series.append(target)
+    return time_series
+def _parse_query_parameters(request_body: Dict[str, Any]) -> Dict[str, str]:
+    """
+    This function searches for the target field in Grafana's SimpleJson json. Once located, the target string is
+    parsed by splitting on semi-colons (;). Each part in the resulting list is then split by an equal sign (=) to be
+    read as key-value pairs.
+    """
+    # Try to get the target
+    targets = request_body.get("targets", [])
+    if len(targets) > 1:
+        logger.warn(
+            f"The 'targets' list contains more then one element ({len(targets)}), all targets except the first one are "
+            f"ignored."
+        )
+    target_obj = targets[0] if targets else {}
+    target_query = target_obj.get("target") if target_obj else ""
+    if not target_query:
+        raise MLRunBadRequestError(f"Target missing in request body:\n {request_body}")
+    parameters = _parse_parameters(target_query)
+    return parameters
+def _parse_search_parameters(request_body: Dict[str, Any]) -> Dict[str, str]:
+    """
+    This function searches for the target field in Grafana's SimpleJson json. Once located, the target string is
+    parsed by splitting on semi-colons (;). Each part in the resulting list is then split by an equal sign (=) to be
+    read as key-value pairs.
+    """
+    # Try to get the target
+    target = request_body.get("target")
+    if not target:
+        raise MLRunBadRequestError(f"Target missing in request body:\n {request_body}")
+    parameters = _parse_parameters(target)
+    return parameters
+def _parse_parameters(target_query):
+    parameters = {}
+    for query in filter(lambda q: q, target_query.split(";")):
+        query_parts = query.split("=")
+        if len(query_parts) < 2:
+            raise MLRunBadRequestError(
+                f"Query must contain both query key and query value. Expected query_key=query_value, found {query} "
+                f"instead."
+            )
+        parameters[query_parts[0]] = query_parts[1]
+    return parameters
+def _drop_grafana_escape_chars(query_parameters: Dict[str, str]):
+    query_parameters = dict(query_parameters)
+    endpoint_id = query_parameters.get("endpoint_id")
+    if endpoint_id is not None:
+        query_parameters["endpoint_id"] = endpoint_id.replace("\\", "")
+    return query_parameters
+def _validate_query_parameters(
+    query_parameters: Dict[str, str], supported_endpoints: Optional[Set[str]] = None
+):
+    """Validates the parameters sent via Grafana's SimpleJson query"""
+    if "target_endpoint" not in query_parameters:
+        raise MLRunBadRequestError(
+            f"Expected 'target_endpoint' field in query, found {query_parameters} instead"
+        )
+    if (
+        supported_endpoints is not None
+        and query_parameters["target_endpoint"] not in supported_endpoints
+    ):
+        raise MLRunBadRequestError(
+            f"{query_parameters['target_endpoint']} unsupported in query parameters: {query_parameters}. "
+            f"Currently supports: {','.join(supported_endpoints)}"
+        )
+def _json_loads_or_default(string: Optional[str], default: Any):
+    if string is None:
+        return default
+    obj = json.loads(string)
+    if not obj:
+        return default
+    return obj
+NAME_TO_QUERY_FUNCTION_DICTIONARY = {
+    "list_endpoints": grafana_list_endpoints,
+    "individual_feature_analysis": grafana_individual_feature_analysis,
+    "overall_feature_analysis": grafana_overall_feature_analysis,
+    "incoming_features": grafana_incoming_features,
+}
+NAME_TO_SEARCH_FUNCTION_DICTIONARY = {
+    "list_projects": grafana_list_projects,
+}
+SUPPORTED_QUERY_FUNCTIONS = set(NAME_TO_QUERY_FUNCTION_DICTIONARY.keys())
+SUPPORTED_SEARCH_FUNCTIONS = set(NAME_TO_SEARCH_FUNCTION_DICTIONARY)

mlrun 1.3.2rc1__py3-none-any.whl → 1.3.2rc2__py3-none-any.whl

Potentially problematic release.

mlrun 1.3.2rc1__py3-none-any.whl → 1.3.2rc2__py3-none-any.whl