PyPI - mlrun - Versions diffs - 1.3.3__py3-none-any.whl → 1.4.0__py3-none-any.whl - Mend

mlrun 1.3.3 (py3-none-any.whl) → 1.4.0 (py3-none-any.whl)

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of mlrun might be problematic. Click here for more details.

Files changed (444)

mlrun/__init__.py +3 -3
mlrun/__main__.py +79 -37
mlrun/api/__init__.py +1 -1
mlrun/api/api/__init__.py +1 -1
mlrun/api/api/api.py +4 -4
mlrun/api/api/deps.py +10 -21
mlrun/api/api/endpoints/__init__.py +1 -1
mlrun/api/api/endpoints/artifacts.py +64 -36
mlrun/api/api/endpoints/auth.py +4 -4
mlrun/api/api/endpoints/background_tasks.py +11 -11
mlrun/api/api/endpoints/client_spec.py +5 -5
mlrun/api/api/endpoints/clusterization_spec.py +6 -4
mlrun/api/api/endpoints/feature_store.py +124 -115
mlrun/api/api/endpoints/files.py +22 -14
mlrun/api/api/endpoints/frontend_spec.py +28 -21
mlrun/api/api/endpoints/functions.py +142 -87
mlrun/api/api/endpoints/grafana_proxy.py +89 -442
mlrun/api/api/endpoints/healthz.py +20 -7
mlrun/api/api/endpoints/hub.py +320 -0
mlrun/api/api/endpoints/internal/__init__.py +1 -1
mlrun/api/api/endpoints/internal/config.py +1 -1
mlrun/api/api/endpoints/internal/memory_reports.py +9 -9
mlrun/api/api/endpoints/logs.py +11 -11
mlrun/api/api/endpoints/model_endpoints.py +74 -70
mlrun/api/api/endpoints/operations.py +13 -9
mlrun/api/api/endpoints/pipelines.py +93 -88
mlrun/api/api/endpoints/projects.py +35 -35
mlrun/api/api/endpoints/runs.py +69 -27
mlrun/api/api/endpoints/runtime_resources.py +28 -28
mlrun/api/api/endpoints/schedules.py +98 -41
mlrun/api/api/endpoints/secrets.py +37 -32
mlrun/api/api/endpoints/submit.py +12 -12
mlrun/api/api/endpoints/tags.py +20 -22
mlrun/api/api/utils.py +251 -42
mlrun/api/constants.py +1 -1
mlrun/api/crud/__init__.py +18 -15
mlrun/api/crud/artifacts.py +10 -10
mlrun/api/crud/client_spec.py +4 -4
mlrun/api/crud/clusterization_spec.py +3 -3
mlrun/api/crud/feature_store.py +54 -46
mlrun/api/crud/functions.py +3 -3
mlrun/api/crud/hub.py +312 -0
mlrun/api/crud/logs.py +11 -9
mlrun/api/crud/model_monitoring/__init__.py +3 -3
mlrun/api/crud/model_monitoring/grafana.py +435 -0
mlrun/api/crud/model_monitoring/model_endpoints.py +352 -129
mlrun/api/crud/notifications.py +149 -0
mlrun/api/crud/pipelines.py +67 -52
mlrun/api/crud/projects.py +51 -23
mlrun/api/crud/runs.py +7 -5
mlrun/api/crud/runtime_resources.py +13 -13
mlrun/api/{db/filedb → crud/runtimes}/__init__.py +1 -1
mlrun/api/crud/runtimes/nuclio/__init__.py +14 -0
mlrun/api/crud/runtimes/nuclio/function.py +505 -0
mlrun/api/crud/runtimes/nuclio/helpers.py +310 -0
mlrun/api/crud/secrets.py +88 -46
mlrun/api/crud/tags.py +5 -5
mlrun/api/db/__init__.py +1 -1
mlrun/api/db/base.py +102 -54
mlrun/api/db/init_db.py +2 -3
mlrun/api/db/session.py +4 -12
mlrun/api/db/sqldb/__init__.py +1 -1
mlrun/api/db/sqldb/db.py +439 -196
mlrun/api/db/sqldb/helpers.py +1 -1
mlrun/api/db/sqldb/models/__init__.py +3 -3
mlrun/api/db/sqldb/models/models_mysql.py +82 -64
mlrun/api/db/sqldb/models/models_sqlite.py +76 -64
mlrun/api/db/sqldb/session.py +27 -20
mlrun/api/initial_data.py +82 -24
mlrun/api/launcher.py +196 -0
mlrun/api/main.py +91 -22
mlrun/api/middlewares.py +6 -5
mlrun/api/migrations_mysql/env.py +1 -1
mlrun/api/migrations_mysql/versions/28383af526f3_market_place_to_hub.py +40 -0
mlrun/api/migrations_mysql/versions/32bae1b0e29c_increase_timestamp_fields_precision.py +1 -1
mlrun/api/migrations_mysql/versions/4903aef6a91d_tag_foreign_key_and_cascades.py +1 -1
mlrun/api/migrations_mysql/versions/5f1351c88a19_adding_background_tasks_table.py +1 -1
mlrun/api/migrations_mysql/versions/88e656800d6a_add_requested_logs_column_and_index_to_.py +1 -1
mlrun/api/migrations_mysql/versions/9d16de5f03a7_adding_data_versions_table.py +1 -1
mlrun/api/migrations_mysql/versions/b86f5b53f3d7_adding_name_and_updated_to_runs_table.py +1 -1
mlrun/api/migrations_mysql/versions/c4af40b0bf61_init.py +1 -1
mlrun/api/migrations_mysql/versions/c905d15bd91d_notifications.py +72 -0
mlrun/api/migrations_mysql/versions/ee041e8fdaa0_adding_next_run_time_column_to_schedule_.py +1 -1
mlrun/api/migrations_sqlite/env.py +1 -1
mlrun/api/migrations_sqlite/versions/11f8dd2dc9fe_init.py +1 -1
mlrun/api/migrations_sqlite/versions/1c954f8cb32d_schedule_last_run_uri.py +1 -1
mlrun/api/migrations_sqlite/versions/2b6d23c715aa_adding_feature_sets.py +1 -1
mlrun/api/migrations_sqlite/versions/4acd9430b093_market_place_to_hub.py +77 -0
mlrun/api/migrations_sqlite/versions/6401142f2d7c_adding_next_run_time_column_to_schedule_.py +1 -1
mlrun/api/migrations_sqlite/versions/64d90a1a69bc_adding_background_tasks_table.py +1 -1
mlrun/api/migrations_sqlite/versions/803438ecd005_add_requested_logs_column_to_runs.py +1 -1
mlrun/api/migrations_sqlite/versions/863114f0c659_refactoring_feature_set.py +1 -1
mlrun/api/migrations_sqlite/versions/959ae00528ad_notifications.py +63 -0
mlrun/api/migrations_sqlite/versions/accf9fc83d38_adding_data_versions_table.py +1 -1
mlrun/api/migrations_sqlite/versions/b68e8e897a28_schedule_labels.py +1 -1
mlrun/api/migrations_sqlite/versions/bcd0c1f9720c_adding_project_labels.py +1 -1
mlrun/api/migrations_sqlite/versions/cf21882f938e_schedule_id.py +1 -1
mlrun/api/migrations_sqlite/versions/d781f58f607f_tag_object_name_string.py +1 -1
mlrun/api/migrations_sqlite/versions/deac06871ace_adding_marketplace_sources_table.py +1 -1
mlrun/api/migrations_sqlite/versions/e1dd5983c06b_schedule_concurrency_limit.py +1 -1
mlrun/api/migrations_sqlite/versions/e5594ed3ab53_adding_name_and_updated_to_runs_table.py +1 -1
mlrun/api/migrations_sqlite/versions/f4249b4ba6fa_adding_feature_vectors.py +1 -1
mlrun/api/migrations_sqlite/versions/f7b5a1a03629_adding_feature_labels.py +1 -1
mlrun/api/schemas/__init__.py +216 -138
mlrun/api/utils/__init__.py +1 -1
mlrun/api/utils/asyncio.py +1 -1
mlrun/api/utils/auth/__init__.py +1 -1
mlrun/api/utils/auth/providers/__init__.py +1 -1
mlrun/api/utils/auth/providers/base.py +7 -7
mlrun/api/utils/auth/providers/nop.py +6 -7
mlrun/api/utils/auth/providers/opa.py +17 -17
mlrun/api/utils/auth/verifier.py +36 -34
mlrun/api/utils/background_tasks.py +24 -24
mlrun/{builder.py → api/utils/builder.py} +216 -123
mlrun/api/utils/clients/__init__.py +1 -1
mlrun/api/utils/clients/chief.py +19 -4
mlrun/api/utils/clients/iguazio.py +106 -60
mlrun/api/utils/clients/log_collector.py +1 -1
mlrun/api/utils/clients/nuclio.py +23 -23
mlrun/api/utils/clients/protocols/grpc.py +2 -2
mlrun/api/utils/db/__init__.py +1 -1
mlrun/api/utils/db/alembic.py +1 -1
mlrun/api/utils/db/backup.py +1 -1
mlrun/api/utils/db/mysql.py +24 -25
mlrun/api/utils/db/sql_collation.py +1 -1
mlrun/api/utils/db/sqlite_migration.py +2 -2
mlrun/api/utils/events/__init__.py +14 -0
mlrun/api/utils/events/base.py +57 -0
mlrun/api/utils/events/events_factory.py +41 -0
mlrun/api/utils/events/iguazio.py +217 -0
mlrun/api/utils/events/nop.py +55 -0
mlrun/api/utils/helpers.py +16 -13
mlrun/api/utils/memory_reports.py +1 -1
mlrun/api/utils/periodic.py +6 -3
mlrun/api/utils/projects/__init__.py +1 -1
mlrun/api/utils/projects/follower.py +33 -33
mlrun/api/utils/projects/leader.py +36 -34
mlrun/api/utils/projects/member.py +27 -27
mlrun/api/utils/projects/remotes/__init__.py +1 -1
mlrun/api/utils/projects/remotes/follower.py +13 -13
mlrun/api/utils/projects/remotes/leader.py +10 -10
mlrun/api/utils/projects/remotes/nop_follower.py +27 -21
mlrun/api/utils/projects/remotes/nop_leader.py +17 -16
mlrun/api/utils/scheduler.py +140 -51
mlrun/api/utils/singletons/__init__.py +1 -1
mlrun/api/utils/singletons/db.py +9 -15
mlrun/api/utils/singletons/k8s.py +677 -5
mlrun/api/utils/singletons/logs_dir.py +1 -1
mlrun/api/utils/singletons/project_member.py +1 -1
mlrun/api/utils/singletons/scheduler.py +1 -1
mlrun/artifacts/__init__.py +2 -2
mlrun/artifacts/base.py +8 -2
mlrun/artifacts/dataset.py +5 -3
mlrun/artifacts/manager.py +7 -1
mlrun/artifacts/model.py +15 -4
mlrun/artifacts/plots.py +1 -1
mlrun/common/__init__.py +1 -1
mlrun/common/constants.py +15 -0
mlrun/common/model_monitoring.py +209 -0
mlrun/common/schemas/__init__.py +167 -0
mlrun/{api → common}/schemas/artifact.py +13 -14
mlrun/{api → common}/schemas/auth.py +10 -8
mlrun/{api → common}/schemas/background_task.py +3 -3
mlrun/{api → common}/schemas/client_spec.py +1 -1
mlrun/{api → common}/schemas/clusterization_spec.py +3 -3
mlrun/{api → common}/schemas/constants.py +21 -8
mlrun/common/schemas/events.py +36 -0
mlrun/{api → common}/schemas/feature_store.py +2 -1
mlrun/{api → common}/schemas/frontend_spec.py +7 -6
mlrun/{api → common}/schemas/function.py +5 -5
mlrun/{api → common}/schemas/http.py +3 -3
mlrun/common/schemas/hub.py +134 -0
mlrun/{api → common}/schemas/k8s.py +3 -3
mlrun/{api → common}/schemas/memory_reports.py +1 -1
mlrun/common/schemas/model_endpoints.py +342 -0
mlrun/common/schemas/notification.py +57 -0
mlrun/{api → common}/schemas/object.py +6 -6
mlrun/{api → common}/schemas/pipeline.py +3 -3
mlrun/{api → common}/schemas/project.py +6 -5
mlrun/common/schemas/regex.py +24 -0
mlrun/common/schemas/runs.py +30 -0
mlrun/{api → common}/schemas/runtime_resource.py +3 -3
mlrun/{api → common}/schemas/schedule.py +19 -7
mlrun/{api → common}/schemas/secret.py +3 -3
mlrun/{api → common}/schemas/tag.py +2 -2
mlrun/common/types.py +25 -0
mlrun/config.py +152 -20
mlrun/data_types/__init__.py +7 -2
mlrun/data_types/data_types.py +4 -2
mlrun/data_types/infer.py +1 -1
mlrun/data_types/spark.py +10 -3
mlrun/datastore/__init__.py +10 -3
mlrun/datastore/azure_blob.py +1 -1
mlrun/datastore/base.py +185 -53
mlrun/datastore/datastore.py +1 -1
mlrun/datastore/filestore.py +1 -1
mlrun/datastore/google_cloud_storage.py +1 -1
mlrun/datastore/inmem.py +4 -1
mlrun/datastore/redis.py +1 -1
mlrun/datastore/s3.py +1 -1
mlrun/datastore/sources.py +192 -70
mlrun/datastore/spark_udf.py +44 -0
mlrun/datastore/store_resources.py +4 -4
mlrun/datastore/targets.py +115 -45
mlrun/datastore/utils.py +127 -5
mlrun/datastore/v3io.py +1 -1
mlrun/datastore/wasbfs/__init__.py +1 -1
mlrun/datastore/wasbfs/fs.py +1 -1
mlrun/db/__init__.py +7 -5
mlrun/db/base.py +112 -68
mlrun/db/httpdb.py +445 -277
mlrun/db/nopdb.py +491 -0
mlrun/db/sqldb.py +112 -65
mlrun/errors.py +6 -1
mlrun/execution.py +44 -22
mlrun/feature_store/__init__.py +1 -1
mlrun/feature_store/api.py +143 -95
mlrun/feature_store/common.py +16 -20
mlrun/feature_store/feature_set.py +42 -12
mlrun/feature_store/feature_vector.py +32 -21
mlrun/feature_store/ingestion.py +9 -12
mlrun/feature_store/retrieval/__init__.py +3 -2
mlrun/feature_store/retrieval/base.py +388 -66
mlrun/feature_store/retrieval/dask_merger.py +63 -151
mlrun/feature_store/retrieval/job.py +30 -12
mlrun/feature_store/retrieval/local_merger.py +40 -133
mlrun/feature_store/retrieval/spark_merger.py +129 -127
mlrun/feature_store/retrieval/storey_merger.py +173 -0
mlrun/feature_store/steps.py +132 -15
mlrun/features.py +8 -3
mlrun/frameworks/__init__.py +1 -1
mlrun/frameworks/_common/__init__.py +1 -1
mlrun/frameworks/_common/artifacts_library.py +1 -1
mlrun/frameworks/_common/mlrun_interface.py +1 -1
mlrun/frameworks/_common/model_handler.py +1 -1
mlrun/frameworks/_common/plan.py +1 -1
mlrun/frameworks/_common/producer.py +1 -1
mlrun/frameworks/_common/utils.py +1 -1
mlrun/frameworks/_dl_common/__init__.py +1 -1
mlrun/frameworks/_dl_common/loggers/__init__.py +1 -1
mlrun/frameworks/_dl_common/loggers/logger.py +1 -1
mlrun/frameworks/_dl_common/loggers/mlrun_logger.py +1 -1
mlrun/frameworks/_dl_common/loggers/tensorboard_logger.py +1 -1
mlrun/frameworks/_dl_common/model_handler.py +1 -1
mlrun/frameworks/_dl_common/utils.py +1 -1
mlrun/frameworks/_ml_common/__init__.py +1 -1
mlrun/frameworks/_ml_common/artifacts_library.py +1 -1
mlrun/frameworks/_ml_common/loggers/__init__.py +1 -1
mlrun/frameworks/_ml_common/loggers/logger.py +1 -1
mlrun/frameworks/_ml_common/loggers/mlrun_logger.py +1 -1
mlrun/frameworks/_ml_common/model_handler.py +1 -1
mlrun/frameworks/_ml_common/pkl_model_server.py +13 -1
mlrun/frameworks/_ml_common/plan.py +1 -1
mlrun/frameworks/_ml_common/plans/__init__.py +1 -1
mlrun/frameworks/_ml_common/plans/calibration_curve_plan.py +1 -6
mlrun/frameworks/_ml_common/plans/confusion_matrix_plan.py +1 -1
mlrun/frameworks/_ml_common/plans/dataset_plan.py +1 -1
mlrun/frameworks/_ml_common/plans/feature_importance_plan.py +1 -1
mlrun/frameworks/_ml_common/plans/roc_curve_plan.py +1 -1
mlrun/frameworks/_ml_common/producer.py +1 -1
mlrun/frameworks/_ml_common/utils.py +1 -1
mlrun/frameworks/auto_mlrun/__init__.py +1 -1
mlrun/frameworks/auto_mlrun/auto_mlrun.py +1 -1
mlrun/frameworks/huggingface/__init__.py +1 -1
mlrun/frameworks/huggingface/model_server.py +1 -1
mlrun/frameworks/lgbm/__init__.py +1 -1
mlrun/frameworks/lgbm/callbacks/__init__.py +1 -1
mlrun/frameworks/lgbm/callbacks/callback.py +1 -1
mlrun/frameworks/lgbm/callbacks/logging_callback.py +1 -1
mlrun/frameworks/lgbm/callbacks/mlrun_logging_callback.py +1 -1
mlrun/frameworks/lgbm/mlrun_interfaces/__init__.py +1 -1
mlrun/frameworks/lgbm/mlrun_interfaces/booster_mlrun_interface.py +1 -1
mlrun/frameworks/lgbm/mlrun_interfaces/mlrun_interface.py +1 -1
mlrun/frameworks/lgbm/mlrun_interfaces/model_mlrun_interface.py +1 -1
mlrun/frameworks/lgbm/model_handler.py +1 -1
mlrun/frameworks/lgbm/model_server.py +1 -1
mlrun/frameworks/lgbm/utils.py +1 -1
mlrun/frameworks/onnx/__init__.py +1 -1
mlrun/frameworks/onnx/dataset.py +1 -1
mlrun/frameworks/onnx/mlrun_interface.py +1 -1
mlrun/frameworks/onnx/model_handler.py +1 -1
mlrun/frameworks/onnx/model_server.py +1 -1
mlrun/frameworks/parallel_coordinates.py +1 -1
mlrun/frameworks/pytorch/__init__.py +1 -1
mlrun/frameworks/pytorch/callbacks/__init__.py +1 -1
mlrun/frameworks/pytorch/callbacks/callback.py +1 -1
mlrun/frameworks/pytorch/callbacks/logging_callback.py +1 -1
mlrun/frameworks/pytorch/callbacks/mlrun_logging_callback.py +1 -1
mlrun/frameworks/pytorch/callbacks/tensorboard_logging_callback.py +1 -1
mlrun/frameworks/pytorch/callbacks_handler.py +1 -1
mlrun/frameworks/pytorch/mlrun_interface.py +1 -1
mlrun/frameworks/pytorch/model_handler.py +1 -1
mlrun/frameworks/pytorch/model_server.py +1 -1
mlrun/frameworks/pytorch/utils.py +1 -1
mlrun/frameworks/sklearn/__init__.py +1 -1
mlrun/frameworks/sklearn/estimator.py +1 -1
mlrun/frameworks/sklearn/metric.py +1 -1
mlrun/frameworks/sklearn/metrics_library.py +1 -1
mlrun/frameworks/sklearn/mlrun_interface.py +1 -1
mlrun/frameworks/sklearn/model_handler.py +1 -1
mlrun/frameworks/sklearn/utils.py +1 -1
mlrun/frameworks/tf_keras/__init__.py +1 -1
mlrun/frameworks/tf_keras/callbacks/__init__.py +1 -1
mlrun/frameworks/tf_keras/callbacks/logging_callback.py +1 -1
mlrun/frameworks/tf_keras/callbacks/mlrun_logging_callback.py +1 -1
mlrun/frameworks/tf_keras/callbacks/tensorboard_logging_callback.py +1 -1
mlrun/frameworks/tf_keras/mlrun_interface.py +1 -1
mlrun/frameworks/tf_keras/model_handler.py +1 -1
mlrun/frameworks/tf_keras/model_server.py +1 -1
mlrun/frameworks/tf_keras/utils.py +1 -1
mlrun/frameworks/xgboost/__init__.py +1 -1
mlrun/frameworks/xgboost/mlrun_interface.py +1 -1
mlrun/frameworks/xgboost/model_handler.py +1 -1
mlrun/frameworks/xgboost/utils.py +1 -1
mlrun/k8s_utils.py +14 -765
mlrun/kfpops.py +14 -17
mlrun/launcher/__init__.py +13 -0
mlrun/launcher/base.py +406 -0
mlrun/launcher/client.py +159 -0
mlrun/launcher/factory.py +50 -0
mlrun/launcher/local.py +276 -0
mlrun/launcher/remote.py +178 -0
mlrun/lists.py +10 -2
mlrun/mlutils/__init__.py +1 -1
mlrun/mlutils/data.py +1 -1
mlrun/mlutils/models.py +1 -1
mlrun/mlutils/plots.py +1 -1
mlrun/model.py +252 -14
mlrun/model_monitoring/__init__.py +41 -0
mlrun/model_monitoring/features_drift_table.py +1 -1
mlrun/model_monitoring/helpers.py +123 -38
mlrun/model_monitoring/model_endpoint.py +144 -0
mlrun/model_monitoring/model_monitoring_batch.py +310 -259
mlrun/model_monitoring/stores/__init__.py +106 -0
mlrun/model_monitoring/stores/kv_model_endpoint_store.py +448 -0
mlrun/model_monitoring/stores/model_endpoint_store.py +147 -0
mlrun/model_monitoring/stores/models/__init__.py +23 -0
mlrun/model_monitoring/stores/models/base.py +18 -0
mlrun/model_monitoring/stores/models/mysql.py +100 -0
mlrun/model_monitoring/stores/models/sqlite.py +98 -0
mlrun/model_monitoring/stores/sql_model_endpoint_store.py +370 -0
mlrun/model_monitoring/stream_processing_fs.py +239 -271
mlrun/package/__init__.py +163 -0
mlrun/package/context_handler.py +325 -0
mlrun/package/errors.py +47 -0
mlrun/package/packager.py +298 -0
mlrun/{runtimes/package → package/packagers}/__init__.py +3 -1
mlrun/package/packagers/default_packager.py +422 -0
mlrun/package/packagers/numpy_packagers.py +612 -0
mlrun/package/packagers/pandas_packagers.py +968 -0
mlrun/package/packagers/python_standard_library_packagers.py +616 -0
mlrun/package/packagers_manager.py +786 -0
mlrun/package/utils/__init__.py +53 -0
mlrun/package/utils/_archiver.py +226 -0
mlrun/package/utils/_formatter.py +211 -0
mlrun/package/utils/_pickler.py +234 -0
mlrun/package/utils/_supported_format.py +71 -0
mlrun/package/utils/log_hint_utils.py +93 -0
mlrun/package/utils/type_hint_utils.py +298 -0
mlrun/platforms/__init__.py +1 -1
mlrun/platforms/iguazio.py +34 -2
mlrun/platforms/other.py +1 -1
mlrun/projects/__init__.py +1 -1
mlrun/projects/operations.py +14 -9
mlrun/projects/pipelines.py +31 -13
mlrun/projects/project.py +762 -238
mlrun/render.py +49 -19
mlrun/run.py +57 -326
mlrun/runtimes/__init__.py +3 -9
mlrun/runtimes/base.py +247 -784
mlrun/runtimes/constants.py +1 -1
mlrun/runtimes/daskjob.py +45 -41
mlrun/runtimes/funcdoc.py +43 -7
mlrun/runtimes/function.py +66 -656
mlrun/runtimes/function_reference.py +1 -1
mlrun/runtimes/generators.py +1 -1
mlrun/runtimes/kubejob.py +99 -116
mlrun/runtimes/local.py +59 -66
mlrun/runtimes/mpijob/__init__.py +1 -1
mlrun/runtimes/mpijob/abstract.py +13 -15
mlrun/runtimes/mpijob/v1.py +3 -1
mlrun/runtimes/mpijob/v1alpha1.py +1 -1
mlrun/runtimes/nuclio.py +1 -1
mlrun/runtimes/pod.py +51 -26
mlrun/runtimes/remotesparkjob.py +3 -1
mlrun/runtimes/serving.py +12 -4
mlrun/runtimes/sparkjob/__init__.py +1 -2
mlrun/runtimes/sparkjob/abstract.py +44 -31
mlrun/runtimes/sparkjob/spark3job.py +11 -9
mlrun/runtimes/utils.py +61 -42
mlrun/secrets.py +16 -18
mlrun/serving/__init__.py +3 -2
mlrun/serving/merger.py +1 -1
mlrun/serving/remote.py +1 -1
mlrun/serving/routers.py +39 -42
mlrun/serving/server.py +23 -13
mlrun/serving/serving_wrapper.py +1 -1
mlrun/serving/states.py +172 -39
mlrun/serving/utils.py +1 -1
mlrun/serving/v1_serving.py +1 -1
mlrun/serving/v2_serving.py +29 -21
mlrun/utils/__init__.py +1 -2
mlrun/utils/async_http.py +8 -1
mlrun/utils/azure_vault.py +1 -1
mlrun/utils/clones.py +2 -2
mlrun/utils/condition_evaluator.py +65 -0
mlrun/utils/db.py +52 -0
mlrun/utils/helpers.py +188 -13
mlrun/utils/http.py +89 -54
mlrun/utils/logger.py +48 -8
mlrun/utils/model_monitoring.py +132 -100
mlrun/utils/notifications/__init__.py +1 -1
mlrun/utils/notifications/notification/__init__.py +8 -6
mlrun/utils/notifications/notification/base.py +20 -14
mlrun/utils/notifications/notification/console.py +7 -4
mlrun/utils/notifications/notification/git.py +36 -19
mlrun/utils/notifications/notification/ipython.py +10 -8
mlrun/utils/notifications/notification/slack.py +18 -13
mlrun/utils/notifications/notification_pusher.py +377 -56
mlrun/utils/regex.py +6 -1
mlrun/utils/singleton.py +1 -1
mlrun/utils/v3io_clients.py +1 -1
mlrun/utils/vault.py +270 -269
mlrun/utils/version/__init__.py +1 -1
mlrun/utils/version/version.json +2 -2
mlrun/utils/version/version.py +1 -1
{mlrun-1.3.3.dist-info → mlrun-1.4.0.dist-info}/METADATA +16 -10
mlrun-1.4.0.dist-info/RECORD +434 -0
mlrun/api/api/endpoints/marketplace.py +0 -257
mlrun/api/crud/marketplace.py +0 -221
mlrun/api/crud/model_monitoring/model_endpoint_store.py +0 -847
mlrun/api/db/filedb/db.py +0 -518
mlrun/api/schemas/marketplace.py +0 -128
mlrun/api/schemas/model_endpoints.py +0 -185
mlrun/db/filedb.py +0 -891
mlrun/feature_store/retrieval/online.py +0 -92
mlrun/model_monitoring/constants.py +0 -67
mlrun/runtimes/package/context_handler.py +0 -711
mlrun/runtimes/sparkjob/spark2job.py +0 -59
mlrun-1.3.3.dist-info/RECORD +0 -381
{mlrun-1.3.3.dist-info → mlrun-1.4.0.dist-info}/LICENSE +0 -0
{mlrun-1.3.3.dist-info → mlrun-1.4.0.dist-info}/WHEEL +0 -0
{mlrun-1.3.3.dist-info → mlrun-1.4.0.dist-info}/entry_points.txt +0 -0
{mlrun-1.3.3.dist-info → mlrun-1.4.0.dist-info}/top_level.txt +0 -0

mlrun/model_monitoring/stream_processing_fs.py CHANGED Viewed

@@ -1,4 +1,4 @@
-# Copyright 2018 Iguazio
+# Copyright 2023 Iguazio
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
@@ -19,23 +19,25 @@ import os
 import typing
 import pandas as pd
-# Constants
 import storey
-import v3io
-import v3io.dataplane
+import mlrun
+import mlrun.common.model_monitoring
 import mlrun.config
 import mlrun.datastore.targets
 import mlrun.feature_store.steps
 import mlrun.utils
 import mlrun.utils.model_monitoring
 import mlrun.utils.v3io_clients
-from mlrun.model_monitoring.constants import (
+from mlrun.common.model_monitoring import (
     EventFieldType,
     EventKeyMetrics,
     EventLiveStats,
+    FileTargetKind,
+    ModelEndpointTarget,
+    ProjectSecretKeys,
 )
+from mlrun.model_monitoring.stores import get_model_endpoint_store
 from mlrun.utils import logger
@@ -45,81 +47,90 @@ class EventStreamProcessor:
         self,
         project: str,
         parquet_batching_max_events: int,
+        parquet_target: str,
         sample_window: int = 10,
-        tsdb_batching_max_events: int = 10,
-        tsdb_batching_timeout_secs: int = 60 * 5,  # Default 5 minutes
         parquet_batching_timeout_secs: int = 30 * 60,  # Default 30 minutes
         aggregate_count_windows: typing.Optional[typing.List[str]] = None,
         aggregate_count_period: str = "30s",
         aggregate_avg_windows: typing.Optional[typing.List[str]] = None,
         aggregate_avg_period: str = "30s",
-        v3io_access_key: typing.Optional[str] = None,
-        v3io_framesd: typing.Optional[str] = None,
-        v3io_api: typing.Optional[str] = None,
         model_monitoring_access_key: str = None,
     ):
+        # General configurations, mainly used for the storey steps in the future serving graph
         self.project = project
         self.sample_window = sample_window
-        self.tsdb_batching_max_events = tsdb_batching_max_events
-        self.tsdb_batching_timeout_secs = tsdb_batching_timeout_secs
-        self.parquet_batching_max_events = parquet_batching_max_events
-        self.parquet_batching_timeout_secs = parquet_batching_timeout_secs
         self.aggregate_count_windows = aggregate_count_windows or ["5m", "1h"]
         self.aggregate_count_period = aggregate_count_period
         self.aggregate_avg_windows = aggregate_avg_windows or ["5m", "1h"]
         self.aggregate_avg_period = aggregate_avg_period
+        # Parquet path and configurations
+        self.parquet_path = parquet_target
+        self.parquet_batching_max_events = parquet_batching_max_events
+        self.parquet_batching_timeout_secs = parquet_batching_timeout_secs
+        self.model_endpoint_store_target = (
+            mlrun.mlconf.model_endpoint_monitoring.store_type
+        )
+        logger.info(
+            "Initializing model monitoring event stream processor",
+            parquet_path=self.parquet_path,
+            parquet_batching_max_events=self.parquet_batching_max_events,
+        )
+        self.storage_options = None
+        if not mlrun.mlconf.is_ce_mode():
+            self._initialize_v3io_configurations(
+                model_monitoring_access_key=model_monitoring_access_key
+            )
+    def _initialize_v3io_configurations(
+        self,
+        tsdb_batching_max_events: int = 10,
+        tsdb_batching_timeout_secs: int = 60 * 5,  # Default 5 minutes
+        v3io_access_key: typing.Optional[str] = None,
+        v3io_framesd: typing.Optional[str] = None,
+        v3io_api: typing.Optional[str] = None,
+        model_monitoring_access_key: str = None,
+    ):
+        # Get the V3IO configurations
         self.v3io_framesd = v3io_framesd or mlrun.mlconf.v3io_framesd
         self.v3io_api = v3io_api or mlrun.mlconf.v3io_api
         self.v3io_access_key = v3io_access_key or os.environ.get("V3IO_ACCESS_KEY")
         self.model_monitoring_access_key = (
             model_monitoring_access_key
-            or os.environ.get("MODEL_MONITORING_ACCESS_KEY")
+            or os.environ.get(ProjectSecretKeys.ACCESS_KEY)
             or self.v3io_access_key
         )
         self.storage_options = dict(
             v3io_access_key=self.model_monitoring_access_key, v3io_api=self.v3io_api
         )
-        template = mlrun.mlconf.model_endpoint_monitoring.store_prefixes.default
-        kv_path = template.format(project=project, kind="endpoints")
+        # KV path
+        kv_path = mlrun.mlconf.get_model_monitoring_file_target_path(
+            project=self.project, kind=FileTargetKind.ENDPOINTS
+        )
         (
             _,
             self.kv_container,
             self.kv_path,
         ) = mlrun.utils.model_monitoring.parse_model_endpoint_store_prefix(kv_path)
-        tsdb_path = template.format(project=project, kind="events")
+        # TSDB path and configurations
+        tsdb_path = mlrun.mlconf.get_model_monitoring_file_target_path(
+            project=self.project, kind=FileTargetKind.EVENTS
+        )
         (
             _,
             self.tsdb_container,
             self.tsdb_path,
         ) = mlrun.utils.model_monitoring.parse_model_endpoint_store_prefix(tsdb_path)
-        self.tsdb_path = f"{self.tsdb_container}/{self.tsdb_path}"
-        self.parquet_path = (
-            mlrun.mlconf.model_endpoint_monitoring.store_prefixes.user_space.format(
-                project=project, kind="parquet"
-            )
-        )
-        logger.info(
-            "Initializing model monitoring event stream processor",
-            parquet_batching_max_events=self.parquet_batching_max_events,
-            v3io_access_key=self.v3io_access_key,
-            model_monitoring_access_key=self.model_monitoring_access_key,
-            default_store_prefix=mlrun.mlconf.model_endpoint_monitoring.store_prefixes.default,
-            user_space_store_prefix=mlrun.mlconf.model_endpoint_monitoring.store_prefixes.user_space,
-            v3io_api=self.v3io_api,
-            v3io_framesd=self.v3io_framesd,
-            kv_container=self.kv_container,
-            kv_path=self.kv_path,
-            tsdb_container=self.tsdb_container,
-            tsdb_path=self.tsdb_path,
-            parquet_path=self.parquet_path,
-        )
+        self.tsdb_path = f"{self.tsdb_container}/{self.tsdb_path}"
+        self.tsdb_batching_max_events = tsdb_batching_max_events
+        self.tsdb_batching_timeout_secs = tsdb_batching_timeout_secs
     def apply_monitoring_serving_graph(self, fn):
         """
@@ -127,20 +138,23 @@ class EventStreamProcessor:
         of different operations that are executed on the events from the model server. Each event has
         metadata (function_uri, timestamp, class, etc.) but also inputs and predictions from the model server.
         Throughout the serving graph, the results are written to 3 different databases:
-        1. KV (steps 7-9): Stores metadata and stats about the average latency and the amount of predictions over time
-           per endpoint. for example the amount of predictions of endpoint x in the last 5 min. This data is used by
-           the monitoring dashboards in grafana. Please note that the KV table, which can be found under
-           v3io:///users/pipelines/project-name/model-endpoints/endpoints/ also contains data on the model endpoint
-            from other processes, such as current_stats that is being calculated by the monitoring batch job
-            process.
+        1. KV/SQL (steps 7-9): Stores metadata and stats about the average latency and the amount of predictions over
+           time per endpoint. for example the amount of predictions of endpoint x in the last 5 min. This data is used
+           by the monitoring dashboards in grafana. The model endpoints table also contains data on the model endpoint
+           from other processes, such as current_stats that is being calculated by the monitoring batch job
+           process. If the target is from type KV, then the model endpoints table can be found under
+           v3io:///users/pipelines/project-name/model-endpoints/endpoints/. If the target is SQL, then the table
+           is stored within the database that was defined in the provided connection string and can be found
+           under mlrun.mlconf.model_endpoint_monitoring.endpoint_store_connection.
         2. TSDB (steps 12-18): Stores live data of different key metric dictionaries in tsdb target. Results can be
            found under v3io:///users/pipelines/project-name/model-endpoints/events/. At the moment, this part supports
            3 different key metric dictionaries: base_metrics (average latency and predictions over time),
            endpoint_features (Prediction and feature names and values), and custom_metrics (user-defined metrics).
            This data is also being used by the monitoring dashboards in grafana.
         3. Parquet (steps 19-20): This Parquet file includes the required data for the model monitoring batch job
-           that run every hour by default. The parquet target can be found under
-           v3io:///projects/{project}/model-endpoints/.
+           that run every hour by default. If defined, the parquet target path can be found under
+           mlrun.mlconf.model_endpoint_monitoring.offline. Otherwise, the default parquet path is under
+           mlrun.mlconf.model_endpoint_monitoring.user_space.
         :param fn: A serving function.
         """
@@ -151,9 +165,6 @@ class EventStreamProcessor:
         def apply_process_endpoint_event():
             graph.add_step(
                 "ProcessEndpointEvent",
-                kv_container=self.kv_container,
-                kv_path=self.kv_path,
-                v3io_access_key=self.v3io_access_key,
                 full_event=True,
                 project=self.project,
             )
@@ -182,10 +193,8 @@ class EventStreamProcessor:
             graph.add_step(
                 "MapFeatureNames",
                 name="MapFeatureNames",
-                kv_container=self.kv_container,
-                kv_path=self.kv_path,
-                access_key=self.v3io_access_key,
                 infer_columns_from_data=True,
+                project=self.project,
                 after="flatten_events",
             )
@@ -209,7 +218,6 @@ class EventStreamProcessor:
                 after="MapFeatureNames",
                 step_name="Aggregates",
                 table=".",
-                v3io_access_key=self.v3io_access_key,
             )
             # Step 5.2 - Calculate average latency time for each window (5 min and 1 hour by default)
             graph.add_step(
@@ -226,7 +234,6 @@ class EventStreamProcessor:
                 name=EventFieldType.LATENCY,
                 after=EventFieldType.PREDICTIONS,
                 table=".",
-                v3io_access_key=self.v3io_access_key,
             )
         apply_storey_aggregations()
@@ -239,117 +246,122 @@ class EventStreamProcessor:
                 after=EventFieldType.LATENCY,
                 window_size=self.sample_window,
                 key=EventFieldType.ENDPOINT_ID,
-                v3io_access_key=self.v3io_access_key,
             )
         apply_storey_sample_window()
-        # Steps 7-9 - KV branch
-        # Step 7 - Filter relevant keys from the event before writing the data into KV
-        def apply_process_before_kv():
-            graph.add_step("ProcessBeforeKV", name="ProcessBeforeKV", after="sample")
+        # Steps 7-9 - KV/SQL branch
+        # Step 7 - Filter relevant keys from the event before writing the data into the database table
+        def apply_process_before_endpoint_update():
+            graph.add_step(
+                "ProcessBeforeEndpointUpdate",
+                name="ProcessBeforeEndpointUpdate",
+                after="sample",
+            )
-        apply_process_before_kv()
+        apply_process_before_endpoint_update()
-        # Step 8 - Write the filtered event to KV table. At this point, the serving graph updates the stats
+        # Step 8 - Write the filtered event to KV/SQL table. At this point, the serving graph updates the stats
         # about average latency and the amount of predictions over time
-        def apply_write_to_kv():
+        def apply_update_endpoint():
             graph.add_step(
-                "WriteToKV",
-                name="WriteToKV",
-                after="ProcessBeforeKV",
-                container=self.kv_container,
-                table=self.kv_path,
-                v3io_access_key=self.v3io_access_key,
+                "UpdateEndpoint",
+                name="UpdateEndpoint",
+                after="ProcessBeforeEndpointUpdate",
+                project=self.project,
+                model_endpoint_store_target=self.model_endpoint_store_target,
             )
-        apply_write_to_kv()
+        apply_update_endpoint()
-        # Step 9 - Apply infer_schema on the KB table for generating schema file
+        # Step 9 (only for KV target) - Apply infer_schema on the model endpoints table for generating schema file
         # which will be used by Grafana monitoring dashboards
         def apply_infer_schema():
             graph.add_step(
                 "InferSchema",
                 name="InferSchema",
-                after="WriteToKV",
-                v3io_access_key=self.v3io_access_key,
+                after="UpdateEndpoint",
                 v3io_framesd=self.v3io_framesd,
                 container=self.kv_container,
                 table=self.kv_path,
             )
-        apply_infer_schema()
+        if self.model_endpoint_store_target == ModelEndpointTarget.V3IO_NOSQL:
+            apply_infer_schema()
-        # Steps 11-18 - TSDB branch
-        # Step 11 - Before writing data to TSDB, create dictionary of 2-3 dictionaries that contains
-        # stats and details about the events
-        def apply_process_before_tsdb():
-            graph.add_step(
-                "ProcessBeforeTSDB", name="ProcessBeforeTSDB", after="sample"
-            )
+        # Steps 11-18 - TSDB branch (not supported in CE environment at the moment)
-        apply_process_before_tsdb()
+        if not mlrun.mlconf.is_ce_mode():
+            # Step 11 - Before writing data to TSDB, create dictionary of 2-3 dictionaries that contains
+            # stats and details about the events
+            def apply_process_before_tsdb():
+                graph.add_step(
+                    "ProcessBeforeTSDB", name="ProcessBeforeTSDB", after="sample"
+                )
-        # Steps 12-18: - Unpacked keys from each dictionary and write to TSDB target
-        def apply_filter_and_unpacked_keys(name, keys):
-            graph.add_step(
-                "FilterAndUnpackKeys",
-                name=name,
-                after="ProcessBeforeTSDB",
-                keys=[keys],
-            )
+            apply_process_before_tsdb()
-        def apply_tsdb_target(name, after):
-            graph.add_step(
-                "storey.TSDBTarget",
-                name=name,
-                after=after,
-                path=self.tsdb_path,
-                rate="10/m",
-                time_col=EventFieldType.TIMESTAMP,
-                container=self.tsdb_container,
-                access_key=self.v3io_access_key,
-                v3io_frames=self.v3io_framesd,
-                infer_columns_from_data=True,
-                index_cols=[
-                    EventFieldType.ENDPOINT_ID,
-                    EventFieldType.RECORD_TYPE,
-                ],
-                max_events=self.tsdb_batching_max_events,
-                flush_after_seconds=self.tsdb_batching_timeout_secs,
-                key=EventFieldType.ENDPOINT_ID,
-            )
+            # Steps 12-18 - Unpack keys from each dictionary and write to TSDB target
+            def apply_filter_and_unpacked_keys(name, keys):
+                graph.add_step(
+                    "FilterAndUnpackKeys",
+                    name=name,
+                    after="ProcessBeforeTSDB",
+                    keys=[keys],
+                )
-        # Steps 12-13 - unpacked base_metrics dictionary
-        apply_filter_and_unpacked_keys(
-            name="FilterAndUnpackKeys1",
-            keys=EventKeyMetrics.BASE_METRICS,
-        )
-        apply_tsdb_target(name="tsdb1", after="FilterAndUnpackKeys1")
+            def apply_tsdb_target(name, after):
+                graph.add_step(
+                    "storey.TSDBTarget",
+                    name=name,
+                    after=after,
+                    path=self.tsdb_path,
+                    rate="10/m",
+                    time_col=EventFieldType.TIMESTAMP,
+                    container=self.tsdb_container,
+                    access_key=self.v3io_access_key,
+                    v3io_frames=self.v3io_framesd,
+                    infer_columns_from_data=True,
+                    index_cols=[
+                        EventFieldType.ENDPOINT_ID,
+                        EventFieldType.RECORD_TYPE,
+                        EventFieldType.ENDPOINT_TYPE,
+                    ],
+                    max_events=self.tsdb_batching_max_events,
+                    flush_after_seconds=self.tsdb_batching_timeout_secs,
+                    key=EventFieldType.ENDPOINT_ID,
+                )
-        # Steps 14-15 - unpacked endpoint_features dictionary
-        apply_filter_and_unpacked_keys(
-            name="FilterAndUnpackKeys2",
-            keys=EventKeyMetrics.ENDPOINT_FEATURES,
-        )
-        apply_tsdb_target(name="tsdb2", after="FilterAndUnpackKeys2")
+            # Steps 12-13 - unpacked base_metrics dictionary
+            apply_filter_and_unpacked_keys(
+                name="FilterAndUnpackKeys1",
+                keys=EventKeyMetrics.BASE_METRICS,
+            )
+            apply_tsdb_target(name="tsdb1", after="FilterAndUnpackKeys1")
-        # Steps 16-18 - unpacked custom_metrics dictionary. In addition, use storey.Filter remove none values
-        apply_filter_and_unpacked_keys(
-            name="FilterAndUnpackKeys3",
-            keys=EventKeyMetrics.CUSTOM_METRICS,
-        )
+            # Steps 14-15 - unpacked endpoint_features dictionary
+            apply_filter_and_unpacked_keys(
+                name="FilterAndUnpackKeys2",
+                keys=EventKeyMetrics.ENDPOINT_FEATURES,
+            )
+            apply_tsdb_target(name="tsdb2", after="FilterAndUnpackKeys2")
-        def apply_storey_filter():
-            graph.add_step(
-                "storey.Filter",
-                "FilterNotNone",
-                after="FilterAndUnpackKeys3",
-                _fn="(event is not None)",
+            # Steps 16-18 - unpacked custom_metrics dictionary. In addition, use storey.Filter to remove None values
+            apply_filter_and_unpacked_keys(
+                name="FilterAndUnpackKeys3",
+                keys=EventKeyMetrics.CUSTOM_METRICS,
             )
-        apply_storey_filter()
-        apply_tsdb_target(name="tsdb3", after="FilterNotNone")
+            def apply_storey_filter():
+                graph.add_step(
+                    "storey.Filter",
+                    "FilterNotNone",
+                    after="FilterAndUnpackKeys3",
+                    _fn="(event is not None)",
+                )
+            apply_storey_filter()
+            apply_tsdb_target(name="tsdb3", after="FilterNotNone")
         # Steps 19-20 - Parquet branch
         # Step 19 - Filter and validate different keys before writing the data to Parquet target
@@ -384,19 +396,18 @@ class EventStreamProcessor:
         apply_parquet_target()
-class ProcessBeforeKV(mlrun.feature_store.steps.MapClass):
+class ProcessBeforeEndpointUpdate(mlrun.feature_store.steps.MapClass):
     def __init__(self, **kwargs):
         """
-        Filter relevant keys from the event before writing the data to KV table (in WriteToKV step). Note that in KV
-        we only keep metadata (function_uri, model_class, etc.) and stats about the average latency and the number
-        of predictions (per 5min and 1hour).
+        Filter relevant keys from the event before writing the data to the database table (in UpdateEndpoint step).
+        Note that in the endpoint table we only keep metadata (function_uri, model_class, etc.) and stats about the
+        average latency and the number of predictions (per 5min and 1hour).
-        :returns: A filtered event as a dictionary which will be written to KV table in the next step.
+        :returns: A filtered event as a dictionary which will be written to the endpoint table in the next step.
         """
         super().__init__(**kwargs)
     def do(self, event):
         # Compute prediction per second
         event[EventLiveStats.PREDICTIONS_PER_SECOND] = (
             float(event[EventLiveStats.PREDICTIONS_COUNT_5M]) / 300
@@ -408,26 +419,31 @@ class ProcessBeforeKV(mlrun.feature_store.steps.MapClass):
                 EventFieldType.FUNCTION_URI,
                 EventFieldType.MODEL,
                 EventFieldType.MODEL_CLASS,
-                EventFieldType.TIMESTAMP,
                 EventFieldType.ENDPOINT_ID,
                 EventFieldType.LABELS,
-                EventFieldType.UNPACKED_LABELS,
+                EventFieldType.FIRST_REQUEST,
+                EventFieldType.LAST_REQUEST,
+                EventFieldType.ERROR_COUNT,
+            ]
+        }
+        # Add generic metrics statistics
+        generic_metrics = {
+            k: event[k]
+            for k in [
                 EventLiveStats.LATENCY_AVG_5M,
                 EventLiveStats.LATENCY_AVG_1H,
                 EventLiveStats.PREDICTIONS_PER_SECOND,
                 EventLiveStats.PREDICTIONS_COUNT_5M,
                 EventLiveStats.PREDICTIONS_COUNT_1H,
-                EventFieldType.FIRST_REQUEST,
-                EventFieldType.LAST_REQUEST,
-                EventFieldType.ERROR_COUNT,
             ]
         }
-        # Unpack labels dictionary
-        e = {
-            **e.pop(EventFieldType.UNPACKED_LABELS, {}),
-            **e,
-        }
-        # Write labels to kv as json string to be presentable later
+        e[EventFieldType.METRICS] = json.dumps(
+            {EventKeyMetrics.GENERIC: generic_metrics}
+        )
+        # Write labels as json string as required by the DB format
         e[EventFieldType.LABELS] = json.dumps(e[EventFieldType.LABELS])
         return e
@@ -449,7 +465,6 @@ class ProcessBeforeTSDB(mlrun.feature_store.steps.MapClass):
         super().__init__(**kwargs)
     def do(self, event):
         # Compute prediction per second
         event[EventLiveStats.PREDICTIONS_PER_SECOND] = (
             float(event[EventLiveStats.PREDICTIONS_COUNT_5M]) / 300
@@ -457,6 +472,7 @@ class ProcessBeforeTSDB(mlrun.feature_store.steps.MapClass):
         base_fields = [
             EventFieldType.TIMESTAMP,
             EventFieldType.ENDPOINT_ID,
+            EventFieldType.ENDPOINT_TYPE,
         ]
         # Getting event timestamp and endpoint_id
@@ -519,11 +535,9 @@ class ProcessBeforeParquet(mlrun.feature_store.steps.MapClass):
         super().__init__(**kwargs)
     def do(self, event):
         logger.info("ProcessBeforeParquet1", event=event)
         # Remove the following keys from the event
         for key in [
-            EventFieldType.UNPACKED_LABELS,
             EventFieldType.FEATURES,
             EventFieldType.NAMED_FEATURES,
         ]:
@@ -549,32 +563,23 @@ class ProcessBeforeParquet(mlrun.feature_store.steps.MapClass):
 class ProcessEndpointEvent(mlrun.feature_store.steps.MapClass):
     def __init__(
         self,
-        kv_container: str,
-        kv_path: str,
-        v3io_access_key: str,
+        project: str,
         **kwargs,
     ):
         """
         Process event or batch of events as part of the first step of the monitoring serving graph. It includes
-        Adding important details to the event such as endpoint_id, handling errors coming from the stream, Validation
+        Adding important details to the event such as endpoint_id, handling errors coming from the stream, validation
         of event data such as inputs and outputs, and splitting model event into sub-events.
-        :param kv_container:    Name of the container that will be used to retrieve the endpoint id. For model
-                                endpoints it is usually 'users'.
-        :param kv_path:         KV table path that will be used to retrieve the endpoint id. For model endpoints
-                                it is usually pipelines/project-name/model-endpoints/endpoints/
-        :param v3io_access_key: Access key with permission to read from a KV table.
-        :param project:         Project name.
+        :param project: Project name.
         :returns: A Storey event object which is the basic unit of data in Storey. Note that the next steps of
                   the monitoring serving graph are based on Storey operations.
         """
         super().__init__(**kwargs)
-        self.kv_container: str = kv_container
-        self.kv_path: str = kv_path
-        self.v3io_access_key: str = v3io_access_key
+        self.project: str = project
         # First and last requests timestamps (value) of each endpoint (key)
         self.first_request: typing.Dict[str, str] = dict()
@@ -602,7 +607,7 @@ class ProcessEndpointEvent(mlrun.feature_store.steps.MapClass):
         version = event.get(EventFieldType.VERSION)
         versioned_model = f"{model}:{version}" if version else f"{model}:latest"
-        endpoint_id = mlrun.utils.model_monitoring.create_model_endpoint_id(
+        endpoint_id = mlrun.common.model_monitoring.create_model_endpoint_uid(
             function_uri=function_uri,
             versioned_model=versioned_model,
         )
@@ -615,10 +620,12 @@ class ProcessEndpointEvent(mlrun.feature_store.steps.MapClass):
         # In case this process fails, resume state from existing record
         self.resume_state(endpoint_id)
-        # Handle errors coming from stream
-        found_errors = self.handle_errors(endpoint_id, event)
-        if found_errors:
-            return None
+        # If error key has been found in the current event,
+        # increase the error counter by 1 and raise the error description
+        error = event.get("error")
+        if error:
+            self.error_count[endpoint_id] += 1
+            raise mlrun.errors.MLRunInvalidArgumentError(str(error))
         # Validate event fields
         model_class = event.get("model_class") or event.get("class")
@@ -679,11 +686,6 @@ class ProcessEndpointEvent(mlrun.feature_store.steps.MapClass):
         ):
             return None
-        # Get labels from event (if exist)
-        unpacked_labels = {
-            f"_{k}": v for k, v in event.get(EventFieldType.LABELS, {}).items()
-        }
         # Adjust timestamp format
         timestamp = datetime.datetime.strptime(timestamp[:-6], "%Y-%m-%d %H:%M:%S.%f")
@@ -722,7 +724,6 @@ class ProcessEndpointEvent(mlrun.feature_store.steps.MapClass):
                     EventFieldType.ENTITIES: event.get("request", {}).get(
                         EventFieldType.ENTITIES, {}
                     ),
-                    EventFieldType.UNPACKED_LABELS: unpacked_labels,
                 }
             )
@@ -745,14 +746,13 @@ class ProcessEndpointEvent(mlrun.feature_store.steps.MapClass):
             endpoint_id in self.last_request
             and self.last_request[endpoint_id] > timestamp
         ):
             logger.error(
                 f"current event request time {timestamp} is earlier than the last request time "
                 f"{self.last_request[endpoint_id]} - write to TSDB will be rejected"
             )
+    @staticmethod
     def is_list_of_numerics(
-        self,
         field: typing.List[typing.Union[int, float, dict, list]],
         dict_path: typing.List[str],
     ):
@@ -769,10 +769,8 @@ class ProcessEndpointEvent(mlrun.feature_store.steps.MapClass):
         if endpoint_id not in self.endpoints:
             logger.info("Trying to resume state", endpoint_id=endpoint_id)
             endpoint_record = get_endpoint_record(
-                kv_container=self.kv_container,
-                kv_path=self.kv_path,
+                project=self.project,
                 endpoint_id=endpoint_id,
-                access_key=self.v3io_access_key,
             )
             # If model endpoint found, get first_request, last_request and error_count values
@@ -784,13 +782,12 @@ class ProcessEndpointEvent(mlrun.feature_store.steps.MapClass):
                 last_request = endpoint_record.get(EventFieldType.LAST_REQUEST)
                 if last_request:
                     self.last_request[endpoint_id] = last_request
                 error_count = endpoint_record.get(EventFieldType.ERROR_COUNT)
                 if error_count:
-                    self.error_count[endpoint_id] = error_count
+                    self.error_count[endpoint_id] = int(error_count)
             # add endpoint to endpoints set
             self.endpoints.add(endpoint_id)
@@ -807,13 +804,6 @@ class ProcessEndpointEvent(mlrun.feature_store.steps.MapClass):
         self.error_count[endpoint_id] += 1
         return False
-    def handle_errors(self, endpoint_id, event) -> bool:
-        if "error" in event:
-            self.error_count[endpoint_id] += 1
-            return True
-        return False
 def is_not_none(field: typing.Any, dict_path: typing.List[str]):
     if field is not None:
@@ -857,9 +847,7 @@ class FilterAndUnpackKeys(mlrun.feature_store.steps.MapClass):
 class MapFeatureNames(mlrun.feature_store.steps.MapClass):
     def __init__(
         self,
-        kv_container: str,
-        kv_path: str,
-        access_key: str,
+        project: str,
         infer_columns_from_data: bool = False,
         **kwargs,
     ):
@@ -867,11 +855,7 @@ class MapFeatureNames(mlrun.feature_store.steps.MapClass):
         Validating feature names and label columns and map each feature to its value. In the end of this step,
         the event should have key-value pairs of (feature name: feature value).
-        :param kv_container:            Name of the container that will be used to retrieve the endpoint id. For model
-                                        endpoints it is usually 'users'.
-        :param kv_path:                 KV table path that will be used to retrieve the endpoint id. For model endpoints
-                                        it is usually pipelines/project-name/model-endpoints/endpoints/
-        :param v3io_access_key:         Access key with permission to read from a KV table.
+        :param project:                 Project name.
         :param infer_columns_from_data: If true and features or labels names were not found, then try to
                                         retrieve them from data that was stored in the previous events of
                                         the current process. This data can be found under self.feature_names and
@@ -882,16 +866,18 @@ class MapFeatureNames(mlrun.feature_store.steps.MapClass):
                   feature names and values (as well as the prediction results).
         """
         super().__init__(**kwargs)
-        self.kv_container = kv_container
-        self.kv_path = kv_path
-        self.access_key = access_key
         self._infer_columns_from_data = infer_columns_from_data
+        self.project = project
         # Dictionaries that will be used in case features names
         # and labels columns were not found in the current event
         self.feature_names = {}
         self.label_columns = {}
+        # Dictionary to manage the model endpoint types - important for the V3IO TSDB
+        self.endpoint_type = {}
     def _infer_feature_names_from_data(self, event):
         for endpoint_id in self.feature_names:
             if len(self.feature_names[endpoint_id]) >= len(
@@ -914,10 +900,8 @@ class MapFeatureNames(mlrun.feature_store.steps.MapClass):
         # Get feature names and label columns
         if endpoint_id not in self.feature_names:
             endpoint_record = get_endpoint_record(
-                kv_container=self.kv_container,
-                kv_path=self.kv_path,
+                project=self.project,
                 endpoint_id=endpoint_id,
-                access_key=self.access_key,
             )
             feature_names = endpoint_record.get(EventFieldType.FEATURE_NAMES)
             feature_names = json.loads(feature_names) if feature_names else None
@@ -925,7 +909,7 @@ class MapFeatureNames(mlrun.feature_store.steps.MapClass):
             label_columns = endpoint_record.get(EventFieldType.LABEL_NAMES)
             label_columns = json.loads(label_columns) if label_columns else None
-            # Ff feature names were not found,
+            # If feature names were not found,
             # try to retrieve them from the previous events of the current process
             if not feature_names and self._infer_columns_from_data:
                 feature_names = self._infer_feature_names_from_data(event)
@@ -940,15 +924,12 @@ class MapFeatureNames(mlrun.feature_store.steps.MapClass):
                 ]
                 # Update the endpoint record with the generated features
-                mlrun.utils.v3io_clients.get_v3io_client().kv.update(
-                    container=self.kv_container,
-                    table_path=self.kv_path,
-                    access_key=self.access_key,
-                    key=event[EventFieldType.ENDPOINT_ID],
+                update_endpoint_record(
+                    project=self.project,
+                    endpoint_id=endpoint_id,
                     attributes={
                         EventFieldType.FEATURE_NAMES: json.dumps(feature_names)
                     },
-                    raise_for_status=v3io.dataplane.RaiseForStatus.always,
                 )
             # Similar process with label columns
@@ -963,15 +944,11 @@ class MapFeatureNames(mlrun.feature_store.steps.MapClass):
                 label_columns = [
                     f"p{i}" for i, _ in enumerate(event[EventFieldType.PREDICTION])
                 ]
-                mlrun.utils.v3io_clients.get_v3io_client().kv.update(
-                    container=self.kv_container,
-                    table_path=self.kv_path,
-                    access_key=self.access_key,
-                    key=event[EventFieldType.ENDPOINT_ID],
-                    attributes={
-                        EventFieldType.LABEL_COLUMNS: json.dumps(label_columns)
-                    },
-                    raise_for_status=v3io.dataplane.RaiseForStatus.always,
+                update_endpoint_record(
+                    project=self.project,
+                    endpoint_id=endpoint_id,
+                    attributes={EventFieldType.LABEL_NAMES: json.dumps(label_columns)},
                 )
             self.label_columns[endpoint_id] = label_columns
@@ -984,6 +961,10 @@ class MapFeatureNames(mlrun.feature_store.steps.MapClass):
                 "Feature names", endpoint_id=endpoint_id, feature_names=feature_names
             )
+            # Update the endpoint type within the endpoint types dictionary
+            endpoint_type = int(endpoint_record.get(EventFieldType.ENDPOINT_TYPE))
+            self.endpoint_type[endpoint_id] = endpoint_type
         # Add feature_name:value pairs along with a mapping dictionary of all of these pairs
         feature_names = self.feature_names[endpoint_id]
         feature_values = event[EventFieldType.FEATURES]
@@ -1004,6 +985,9 @@ class MapFeatureNames(mlrun.feature_store.steps.MapClass):
             mapping_dictionary=EventFieldType.NAMED_PREDICTIONS,
         )
+        # Add endpoint type to the event
+        event[EventFieldType.ENDPOINT_TYPE] = self.endpoint_type[endpoint_id]
         logger.info("Mapped event", event=event)
         return event
@@ -1033,33 +1017,24 @@ class MapFeatureNames(mlrun.feature_store.steps.MapClass):
             event[mapping_dictionary][name] = value
-class WriteToKV(mlrun.feature_store.steps.MapClass):
-    def __init__(self, container: str, table: str, v3io_access_key: str, **kwargs):
+class UpdateEndpoint(mlrun.feature_store.steps.MapClass):
+    def __init__(self, project: str, model_endpoint_store_target: str, **kwargs):
         """
-        Writes the event to KV table. Note that the event at this point includes metadata and stats about the
-        average latency and the amount of predictions over time. This data will be used in the monitoring dashboards
+        Update the model endpoint record in the DB. Note that the event at this point includes metadata and stats about
+        the average latency and the amount of predictions over time. This data will be used in the monitoring dashboards
         such as "Model Monitoring - Performance" which can be found in Grafana.
-        :param kv_container:            Name of the container that will be used to retrieve the endpoint id. For model
-                                        endpoints it is usually 'users'.
-        :param table:                   KV table path that will be used to retrieve the endpoint id. For model endpoints
-                                        it is usually pipelines/project-name/model-endpoints/endpoints/.
-        :param v3io_access_key:         Access key with permission to read from a KV table.
         :returns: Event as a dictionary (without any changes) for the next step (InferSchema).
         """
         super().__init__(**kwargs)
-        self.container = container
-        self.table = table
-        self.v3io_access_key = v3io_access_key
+        self.project = project
+        self.model_endpoint_store_target = model_endpoint_store_target
     def do(self, event: typing.Dict):
-        mlrun.utils.v3io_clients.get_v3io_client().kv.update(
-            container=self.container,
-            table_path=self.table,
-            key=event[EventFieldType.ENDPOINT_ID],
+        update_endpoint_record(
+            project=self.project,
+            endpoint_id=event.pop(EventFieldType.ENDPOINT_ID),
             attributes=event,
-            access_key=self.v3io_access_key,
         )
         return event
@@ -1067,7 +1042,6 @@ class WriteToKV(mlrun.feature_store.steps.MapClass):
 class InferSchema(mlrun.feature_store.steps.MapClass):
     def __init__(
         self,
-        v3io_access_key: str,
         v3io_framesd: str,
         container: str,
         table: str,
@@ -1087,7 +1061,6 @@ class InferSchema(mlrun.feature_store.steps.MapClass):
         """
         super().__init__(**kwargs)
         self.container = container
-        self.v3io_access_key = v3io_access_key
         self.v3io_framesd = v3io_framesd
         self.table = table
         self.keys = set()
@@ -1098,34 +1071,29 @@ class InferSchema(mlrun.feature_store.steps.MapClass):
             self.keys.update(key_set)
             # Apply infer_schema on the kv table for generating the schema file
             mlrun.utils.v3io_clients.get_frames_client(
-                token=self.v3io_access_key,
                 container=self.container,
                 address=self.v3io_framesd,
             ).execute(backend="kv", table=self.table, command="infer_schema")
         return event
-def get_endpoint_record(
-    kv_container: str, kv_path: str, endpoint_id: str, access_key: str
-) -> typing.Optional[dict]:
-    logger.info(
-        "Grabbing endpoint data",
-        container=kv_container,
-        table_path=kv_path,
-        key=endpoint_id,
+def update_endpoint_record(
+    project: str,
+    endpoint_id: str,
+    attributes: dict,
+):
+    model_endpoint_store = get_model_endpoint_store(
+        project=project,
     )
-    try:
-        endpoint_record = (
-            mlrun.utils.v3io_clients.get_v3io_client()
-            .kv.get(
-                container=kv_container,
-                table_path=kv_path,
-                key=endpoint_id,
-                access_key=access_key,
-                raise_for_status=v3io.dataplane.RaiseForStatus.always,
-            )
-            .output.item
-        )
-        return endpoint_record
-    except Exception:
-        return None
+    model_endpoint_store.update_model_endpoint(
+        endpoint_id=endpoint_id, attributes=attributes
+    )
+def get_endpoint_record(project: str, endpoint_id: str):
+    model_endpoint_store = get_model_endpoint_store(
+        project=project,
+    )
+    return model_endpoint_store.get_model_endpoint(endpoint_id=endpoint_id)

mlrun 1.3.3__py3-none-any.whl → 1.4.0__py3-none-any.whl

Potentially problematic release.

mlrun 1.3.3py3-none-any.whl → 1.4.0py3-none-any.whl