genesis-flow 1.0.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- genesis_flow-1.0.0.dist-info/METADATA +822 -0
- genesis_flow-1.0.0.dist-info/RECORD +645 -0
- genesis_flow-1.0.0.dist-info/WHEEL +5 -0
- genesis_flow-1.0.0.dist-info/entry_points.txt +19 -0
- genesis_flow-1.0.0.dist-info/licenses/LICENSE.txt +202 -0
- genesis_flow-1.0.0.dist-info/top_level.txt +1 -0
- mlflow/__init__.py +367 -0
- mlflow/__main__.py +3 -0
- mlflow/ag2/__init__.py +56 -0
- mlflow/ag2/ag2_logger.py +294 -0
- mlflow/anthropic/__init__.py +40 -0
- mlflow/anthropic/autolog.py +129 -0
- mlflow/anthropic/chat.py +144 -0
- mlflow/artifacts/__init__.py +268 -0
- mlflow/autogen/__init__.py +144 -0
- mlflow/autogen/chat.py +142 -0
- mlflow/azure/__init__.py +26 -0
- mlflow/azure/auth_handler.py +257 -0
- mlflow/azure/client.py +319 -0
- mlflow/azure/config.py +120 -0
- mlflow/azure/connection_factory.py +340 -0
- mlflow/azure/exceptions.py +27 -0
- mlflow/azure/stores.py +327 -0
- mlflow/azure/utils.py +183 -0
- mlflow/bedrock/__init__.py +45 -0
- mlflow/bedrock/_autolog.py +202 -0
- mlflow/bedrock/chat.py +122 -0
- mlflow/bedrock/stream.py +160 -0
- mlflow/bedrock/utils.py +43 -0
- mlflow/cli.py +707 -0
- mlflow/client.py +12 -0
- mlflow/config/__init__.py +56 -0
- mlflow/crewai/__init__.py +79 -0
- mlflow/crewai/autolog.py +253 -0
- mlflow/crewai/chat.py +29 -0
- mlflow/data/__init__.py +75 -0
- mlflow/data/artifact_dataset_sources.py +170 -0
- mlflow/data/code_dataset_source.py +40 -0
- mlflow/data/dataset.py +123 -0
- mlflow/data/dataset_registry.py +168 -0
- mlflow/data/dataset_source.py +110 -0
- mlflow/data/dataset_source_registry.py +219 -0
- mlflow/data/delta_dataset_source.py +167 -0
- mlflow/data/digest_utils.py +108 -0
- mlflow/data/evaluation_dataset.py +562 -0
- mlflow/data/filesystem_dataset_source.py +81 -0
- mlflow/data/http_dataset_source.py +145 -0
- mlflow/data/huggingface_dataset.py +258 -0
- mlflow/data/huggingface_dataset_source.py +118 -0
- mlflow/data/meta_dataset.py +104 -0
- mlflow/data/numpy_dataset.py +223 -0
- mlflow/data/pandas_dataset.py +231 -0
- mlflow/data/polars_dataset.py +352 -0
- mlflow/data/pyfunc_dataset_mixin.py +31 -0
- mlflow/data/schema.py +76 -0
- mlflow/data/sources.py +1 -0
- mlflow/data/spark_dataset.py +406 -0
- mlflow/data/spark_dataset_source.py +74 -0
- mlflow/data/spark_delta_utils.py +118 -0
- mlflow/data/tensorflow_dataset.py +350 -0
- mlflow/data/uc_volume_dataset_source.py +81 -0
- mlflow/db.py +27 -0
- mlflow/dspy/__init__.py +17 -0
- mlflow/dspy/autolog.py +197 -0
- mlflow/dspy/callback.py +398 -0
- mlflow/dspy/constant.py +1 -0
- mlflow/dspy/load.py +93 -0
- mlflow/dspy/save.py +393 -0
- mlflow/dspy/util.py +109 -0
- mlflow/dspy/wrapper.py +226 -0
- mlflow/entities/__init__.py +104 -0
- mlflow/entities/_mlflow_object.py +52 -0
- mlflow/entities/assessment.py +545 -0
- mlflow/entities/assessment_error.py +80 -0
- mlflow/entities/assessment_source.py +141 -0
- mlflow/entities/dataset.py +92 -0
- mlflow/entities/dataset_input.py +51 -0
- mlflow/entities/dataset_summary.py +62 -0
- mlflow/entities/document.py +48 -0
- mlflow/entities/experiment.py +109 -0
- mlflow/entities/experiment_tag.py +35 -0
- mlflow/entities/file_info.py +45 -0
- mlflow/entities/input_tag.py +35 -0
- mlflow/entities/lifecycle_stage.py +35 -0
- mlflow/entities/logged_model.py +228 -0
- mlflow/entities/logged_model_input.py +26 -0
- mlflow/entities/logged_model_output.py +32 -0
- mlflow/entities/logged_model_parameter.py +46 -0
- mlflow/entities/logged_model_status.py +74 -0
- mlflow/entities/logged_model_tag.py +33 -0
- mlflow/entities/metric.py +200 -0
- mlflow/entities/model_registry/__init__.py +29 -0
- mlflow/entities/model_registry/_model_registry_entity.py +13 -0
- mlflow/entities/model_registry/model_version.py +243 -0
- mlflow/entities/model_registry/model_version_deployment_job_run_state.py +44 -0
- mlflow/entities/model_registry/model_version_deployment_job_state.py +70 -0
- mlflow/entities/model_registry/model_version_search.py +25 -0
- mlflow/entities/model_registry/model_version_stages.py +25 -0
- mlflow/entities/model_registry/model_version_status.py +35 -0
- mlflow/entities/model_registry/model_version_tag.py +35 -0
- mlflow/entities/model_registry/prompt.py +73 -0
- mlflow/entities/model_registry/prompt_version.py +244 -0
- mlflow/entities/model_registry/registered_model.py +175 -0
- mlflow/entities/model_registry/registered_model_alias.py +35 -0
- mlflow/entities/model_registry/registered_model_deployment_job_state.py +39 -0
- mlflow/entities/model_registry/registered_model_search.py +25 -0
- mlflow/entities/model_registry/registered_model_tag.py +35 -0
- mlflow/entities/multipart_upload.py +74 -0
- mlflow/entities/param.py +49 -0
- mlflow/entities/run.py +97 -0
- mlflow/entities/run_data.py +84 -0
- mlflow/entities/run_info.py +188 -0
- mlflow/entities/run_inputs.py +59 -0
- mlflow/entities/run_outputs.py +43 -0
- mlflow/entities/run_status.py +41 -0
- mlflow/entities/run_tag.py +36 -0
- mlflow/entities/source_type.py +31 -0
- mlflow/entities/span.py +774 -0
- mlflow/entities/span_event.py +96 -0
- mlflow/entities/span_status.py +102 -0
- mlflow/entities/trace.py +317 -0
- mlflow/entities/trace_data.py +71 -0
- mlflow/entities/trace_info.py +220 -0
- mlflow/entities/trace_info_v2.py +162 -0
- mlflow/entities/trace_location.py +173 -0
- mlflow/entities/trace_state.py +39 -0
- mlflow/entities/trace_status.py +68 -0
- mlflow/entities/view_type.py +51 -0
- mlflow/environment_variables.py +866 -0
- mlflow/evaluation/__init__.py +16 -0
- mlflow/evaluation/assessment.py +369 -0
- mlflow/evaluation/evaluation.py +411 -0
- mlflow/evaluation/evaluation_tag.py +61 -0
- mlflow/evaluation/fluent.py +48 -0
- mlflow/evaluation/utils.py +201 -0
- mlflow/exceptions.py +213 -0
- mlflow/experiments.py +140 -0
- mlflow/gemini/__init__.py +81 -0
- mlflow/gemini/autolog.py +186 -0
- mlflow/gemini/chat.py +261 -0
- mlflow/genai/__init__.py +71 -0
- mlflow/genai/datasets/__init__.py +67 -0
- mlflow/genai/datasets/evaluation_dataset.py +131 -0
- mlflow/genai/evaluation/__init__.py +3 -0
- mlflow/genai/evaluation/base.py +411 -0
- mlflow/genai/evaluation/constant.py +23 -0
- mlflow/genai/evaluation/utils.py +244 -0
- mlflow/genai/judges/__init__.py +21 -0
- mlflow/genai/judges/databricks.py +404 -0
- mlflow/genai/label_schemas/__init__.py +153 -0
- mlflow/genai/label_schemas/label_schemas.py +209 -0
- mlflow/genai/labeling/__init__.py +159 -0
- mlflow/genai/labeling/labeling.py +250 -0
- mlflow/genai/optimize/__init__.py +13 -0
- mlflow/genai/optimize/base.py +198 -0
- mlflow/genai/optimize/optimizers/__init__.py +4 -0
- mlflow/genai/optimize/optimizers/base_optimizer.py +38 -0
- mlflow/genai/optimize/optimizers/dspy_mipro_optimizer.py +221 -0
- mlflow/genai/optimize/optimizers/dspy_optimizer.py +91 -0
- mlflow/genai/optimize/optimizers/utils/dspy_mipro_callback.py +76 -0
- mlflow/genai/optimize/optimizers/utils/dspy_mipro_utils.py +18 -0
- mlflow/genai/optimize/types.py +75 -0
- mlflow/genai/optimize/util.py +30 -0
- mlflow/genai/prompts/__init__.py +206 -0
- mlflow/genai/scheduled_scorers.py +431 -0
- mlflow/genai/scorers/__init__.py +26 -0
- mlflow/genai/scorers/base.py +492 -0
- mlflow/genai/scorers/builtin_scorers.py +765 -0
- mlflow/genai/scorers/scorer_utils.py +138 -0
- mlflow/genai/scorers/validation.py +165 -0
- mlflow/genai/utils/data_validation.py +146 -0
- mlflow/genai/utils/enum_utils.py +23 -0
- mlflow/genai/utils/trace_utils.py +211 -0
- mlflow/groq/__init__.py +42 -0
- mlflow/groq/_groq_autolog.py +74 -0
- mlflow/johnsnowlabs/__init__.py +888 -0
- mlflow/langchain/__init__.py +24 -0
- mlflow/langchain/api_request_parallel_processor.py +330 -0
- mlflow/langchain/autolog.py +147 -0
- mlflow/langchain/chat_agent_langgraph.py +340 -0
- mlflow/langchain/constant.py +1 -0
- mlflow/langchain/constants.py +1 -0
- mlflow/langchain/databricks_dependencies.py +444 -0
- mlflow/langchain/langchain_tracer.py +597 -0
- mlflow/langchain/model.py +919 -0
- mlflow/langchain/output_parsers.py +142 -0
- mlflow/langchain/retriever_chain.py +153 -0
- mlflow/langchain/runnables.py +527 -0
- mlflow/langchain/utils/chat.py +402 -0
- mlflow/langchain/utils/logging.py +671 -0
- mlflow/langchain/utils/serialization.py +36 -0
- mlflow/legacy_databricks_cli/__init__.py +0 -0
- mlflow/legacy_databricks_cli/configure/__init__.py +0 -0
- mlflow/legacy_databricks_cli/configure/provider.py +482 -0
- mlflow/litellm/__init__.py +175 -0
- mlflow/llama_index/__init__.py +22 -0
- mlflow/llama_index/autolog.py +55 -0
- mlflow/llama_index/chat.py +43 -0
- mlflow/llama_index/constant.py +1 -0
- mlflow/llama_index/model.py +577 -0
- mlflow/llama_index/pyfunc_wrapper.py +332 -0
- mlflow/llama_index/serialize_objects.py +188 -0
- mlflow/llama_index/tracer.py +561 -0
- mlflow/metrics/__init__.py +479 -0
- mlflow/metrics/base.py +39 -0
- mlflow/metrics/genai/__init__.py +25 -0
- mlflow/metrics/genai/base.py +101 -0
- mlflow/metrics/genai/genai_metric.py +771 -0
- mlflow/metrics/genai/metric_definitions.py +450 -0
- mlflow/metrics/genai/model_utils.py +371 -0
- mlflow/metrics/genai/prompt_template.py +68 -0
- mlflow/metrics/genai/prompts/__init__.py +0 -0
- mlflow/metrics/genai/prompts/v1.py +422 -0
- mlflow/metrics/genai/utils.py +6 -0
- mlflow/metrics/metric_definitions.py +619 -0
- mlflow/mismatch.py +34 -0
- mlflow/mistral/__init__.py +34 -0
- mlflow/mistral/autolog.py +71 -0
- mlflow/mistral/chat.py +135 -0
- mlflow/ml_package_versions.py +452 -0
- mlflow/models/__init__.py +97 -0
- mlflow/models/auth_policy.py +83 -0
- mlflow/models/cli.py +354 -0
- mlflow/models/container/__init__.py +294 -0
- mlflow/models/container/scoring_server/__init__.py +0 -0
- mlflow/models/container/scoring_server/nginx.conf +39 -0
- mlflow/models/dependencies_schemas.py +287 -0
- mlflow/models/display_utils.py +158 -0
- mlflow/models/docker_utils.py +211 -0
- mlflow/models/evaluation/__init__.py +23 -0
- mlflow/models/evaluation/_shap_patch.py +64 -0
- mlflow/models/evaluation/artifacts.py +194 -0
- mlflow/models/evaluation/base.py +1811 -0
- mlflow/models/evaluation/calibration_curve.py +109 -0
- mlflow/models/evaluation/default_evaluator.py +996 -0
- mlflow/models/evaluation/deprecated.py +23 -0
- mlflow/models/evaluation/evaluator_registry.py +80 -0
- mlflow/models/evaluation/evaluators/classifier.py +704 -0
- mlflow/models/evaluation/evaluators/default.py +233 -0
- mlflow/models/evaluation/evaluators/regressor.py +96 -0
- mlflow/models/evaluation/evaluators/shap.py +296 -0
- mlflow/models/evaluation/lift_curve.py +178 -0
- mlflow/models/evaluation/utils/metric.py +123 -0
- mlflow/models/evaluation/utils/trace.py +179 -0
- mlflow/models/evaluation/validation.py +434 -0
- mlflow/models/flavor_backend.py +93 -0
- mlflow/models/flavor_backend_registry.py +53 -0
- mlflow/models/model.py +1639 -0
- mlflow/models/model_config.py +150 -0
- mlflow/models/notebook_resources/agent_evaluation_template.html +235 -0
- mlflow/models/notebook_resources/eval_with_dataset_example.py +22 -0
- mlflow/models/notebook_resources/eval_with_synthetic_example.py +22 -0
- mlflow/models/python_api.py +369 -0
- mlflow/models/rag_signatures.py +128 -0
- mlflow/models/resources.py +321 -0
- mlflow/models/signature.py +662 -0
- mlflow/models/utils.py +2054 -0
- mlflow/models/wheeled_model.py +280 -0
- mlflow/openai/__init__.py +57 -0
- mlflow/openai/_agent_tracer.py +364 -0
- mlflow/openai/api_request_parallel_processor.py +131 -0
- mlflow/openai/autolog.py +509 -0
- mlflow/openai/constant.py +1 -0
- mlflow/openai/model.py +824 -0
- mlflow/openai/utils/chat_schema.py +367 -0
- mlflow/optuna/__init__.py +3 -0
- mlflow/optuna/storage.py +646 -0
- mlflow/plugins/__init__.py +72 -0
- mlflow/plugins/base.py +358 -0
- mlflow/plugins/builtin/__init__.py +24 -0
- mlflow/plugins/builtin/pytorch_plugin.py +150 -0
- mlflow/plugins/builtin/sklearn_plugin.py +158 -0
- mlflow/plugins/builtin/transformers_plugin.py +187 -0
- mlflow/plugins/cli.py +321 -0
- mlflow/plugins/discovery.py +340 -0
- mlflow/plugins/manager.py +465 -0
- mlflow/plugins/registry.py +316 -0
- mlflow/plugins/templates/framework_plugin_template.py +329 -0
- mlflow/prompt/constants.py +20 -0
- mlflow/prompt/promptlab_model.py +197 -0
- mlflow/prompt/registry_utils.py +248 -0
- mlflow/promptflow/__init__.py +495 -0
- mlflow/protos/__init__.py +0 -0
- mlflow/protos/assessments_pb2.py +174 -0
- mlflow/protos/databricks_artifacts_pb2.py +489 -0
- mlflow/protos/databricks_filesystem_service_pb2.py +196 -0
- mlflow/protos/databricks_managed_catalog_messages_pb2.py +95 -0
- mlflow/protos/databricks_managed_catalog_service_pb2.py +86 -0
- mlflow/protos/databricks_pb2.py +267 -0
- mlflow/protos/databricks_trace_server_pb2.py +374 -0
- mlflow/protos/databricks_uc_registry_messages_pb2.py +1249 -0
- mlflow/protos/databricks_uc_registry_service_pb2.py +170 -0
- mlflow/protos/facet_feature_statistics_pb2.py +296 -0
- mlflow/protos/internal_pb2.py +77 -0
- mlflow/protos/mlflow_artifacts_pb2.py +336 -0
- mlflow/protos/model_registry_pb2.py +1073 -0
- mlflow/protos/scalapb/__init__.py +0 -0
- mlflow/protos/scalapb/scalapb_pb2.py +104 -0
- mlflow/protos/service_pb2.py +2600 -0
- mlflow/protos/unity_catalog_oss_messages_pb2.py +457 -0
- mlflow/protos/unity_catalog_oss_service_pb2.py +130 -0
- mlflow/protos/unity_catalog_prompt_messages_pb2.py +447 -0
- mlflow/protos/unity_catalog_prompt_messages_pb2_grpc.py +24 -0
- mlflow/protos/unity_catalog_prompt_service_pb2.py +164 -0
- mlflow/protos/unity_catalog_prompt_service_pb2_grpc.py +785 -0
- mlflow/py.typed +0 -0
- mlflow/pydantic_ai/__init__.py +57 -0
- mlflow/pydantic_ai/autolog.py +173 -0
- mlflow/pyfunc/__init__.py +3844 -0
- mlflow/pyfunc/_mlflow_pyfunc_backend_predict.py +61 -0
- mlflow/pyfunc/backend.py +523 -0
- mlflow/pyfunc/context.py +78 -0
- mlflow/pyfunc/dbconnect_artifact_cache.py +144 -0
- mlflow/pyfunc/loaders/__init__.py +7 -0
- mlflow/pyfunc/loaders/chat_agent.py +117 -0
- mlflow/pyfunc/loaders/chat_model.py +125 -0
- mlflow/pyfunc/loaders/code_model.py +31 -0
- mlflow/pyfunc/loaders/responses_agent.py +112 -0
- mlflow/pyfunc/mlserver.py +46 -0
- mlflow/pyfunc/model.py +1473 -0
- mlflow/pyfunc/scoring_server/__init__.py +604 -0
- mlflow/pyfunc/scoring_server/app.py +7 -0
- mlflow/pyfunc/scoring_server/client.py +146 -0
- mlflow/pyfunc/spark_model_cache.py +48 -0
- mlflow/pyfunc/stdin_server.py +44 -0
- mlflow/pyfunc/utils/__init__.py +3 -0
- mlflow/pyfunc/utils/data_validation.py +224 -0
- mlflow/pyfunc/utils/environment.py +22 -0
- mlflow/pyfunc/utils/input_converter.py +47 -0
- mlflow/pyfunc/utils/serving_data_parser.py +11 -0
- mlflow/pytorch/__init__.py +1171 -0
- mlflow/pytorch/_lightning_autolog.py +580 -0
- mlflow/pytorch/_pytorch_autolog.py +50 -0
- mlflow/pytorch/pickle_module.py +35 -0
- mlflow/rfunc/__init__.py +42 -0
- mlflow/rfunc/backend.py +134 -0
- mlflow/runs.py +89 -0
- mlflow/server/__init__.py +302 -0
- mlflow/server/auth/__init__.py +1224 -0
- mlflow/server/auth/__main__.py +4 -0
- mlflow/server/auth/basic_auth.ini +6 -0
- mlflow/server/auth/cli.py +11 -0
- mlflow/server/auth/client.py +537 -0
- mlflow/server/auth/config.py +34 -0
- mlflow/server/auth/db/__init__.py +0 -0
- mlflow/server/auth/db/cli.py +18 -0
- mlflow/server/auth/db/migrations/__init__.py +0 -0
- mlflow/server/auth/db/migrations/alembic.ini +110 -0
- mlflow/server/auth/db/migrations/env.py +76 -0
- mlflow/server/auth/db/migrations/versions/8606fa83a998_initial_migration.py +51 -0
- mlflow/server/auth/db/migrations/versions/__init__.py +0 -0
- mlflow/server/auth/db/models.py +67 -0
- mlflow/server/auth/db/utils.py +37 -0
- mlflow/server/auth/entities.py +165 -0
- mlflow/server/auth/logo.py +14 -0
- mlflow/server/auth/permissions.py +65 -0
- mlflow/server/auth/routes.py +18 -0
- mlflow/server/auth/sqlalchemy_store.py +263 -0
- mlflow/server/graphql/__init__.py +0 -0
- mlflow/server/graphql/autogenerated_graphql_schema.py +353 -0
- mlflow/server/graphql/graphql_custom_scalars.py +24 -0
- mlflow/server/graphql/graphql_errors.py +15 -0
- mlflow/server/graphql/graphql_no_batching.py +89 -0
- mlflow/server/graphql/graphql_schema_extensions.py +74 -0
- mlflow/server/handlers.py +3217 -0
- mlflow/server/prometheus_exporter.py +17 -0
- mlflow/server/validation.py +30 -0
- mlflow/shap/__init__.py +691 -0
- mlflow/sklearn/__init__.py +1994 -0
- mlflow/sklearn/utils.py +1041 -0
- mlflow/smolagents/__init__.py +66 -0
- mlflow/smolagents/autolog.py +139 -0
- mlflow/smolagents/chat.py +29 -0
- mlflow/store/__init__.py +10 -0
- mlflow/store/_unity_catalog/__init__.py +1 -0
- mlflow/store/_unity_catalog/lineage/__init__.py +1 -0
- mlflow/store/_unity_catalog/lineage/constants.py +2 -0
- mlflow/store/_unity_catalog/registry/__init__.py +6 -0
- mlflow/store/_unity_catalog/registry/prompt_info.py +75 -0
- mlflow/store/_unity_catalog/registry/rest_store.py +1740 -0
- mlflow/store/_unity_catalog/registry/uc_oss_rest_store.py +507 -0
- mlflow/store/_unity_catalog/registry/utils.py +121 -0
- mlflow/store/artifact/__init__.py +0 -0
- mlflow/store/artifact/artifact_repo.py +472 -0
- mlflow/store/artifact/artifact_repository_registry.py +154 -0
- mlflow/store/artifact/azure_blob_artifact_repo.py +275 -0
- mlflow/store/artifact/azure_data_lake_artifact_repo.py +295 -0
- mlflow/store/artifact/cli.py +141 -0
- mlflow/store/artifact/cloud_artifact_repo.py +332 -0
- mlflow/store/artifact/databricks_artifact_repo.py +729 -0
- mlflow/store/artifact/databricks_artifact_repo_resources.py +301 -0
- mlflow/store/artifact/databricks_logged_model_artifact_repo.py +93 -0
- mlflow/store/artifact/databricks_models_artifact_repo.py +216 -0
- mlflow/store/artifact/databricks_sdk_artifact_repo.py +134 -0
- mlflow/store/artifact/databricks_sdk_models_artifact_repo.py +97 -0
- mlflow/store/artifact/dbfs_artifact_repo.py +240 -0
- mlflow/store/artifact/ftp_artifact_repo.py +132 -0
- mlflow/store/artifact/gcs_artifact_repo.py +296 -0
- mlflow/store/artifact/hdfs_artifact_repo.py +209 -0
- mlflow/store/artifact/http_artifact_repo.py +218 -0
- mlflow/store/artifact/local_artifact_repo.py +142 -0
- mlflow/store/artifact/mlflow_artifacts_repo.py +94 -0
- mlflow/store/artifact/models_artifact_repo.py +259 -0
- mlflow/store/artifact/optimized_s3_artifact_repo.py +356 -0
- mlflow/store/artifact/presigned_url_artifact_repo.py +173 -0
- mlflow/store/artifact/r2_artifact_repo.py +70 -0
- mlflow/store/artifact/runs_artifact_repo.py +265 -0
- mlflow/store/artifact/s3_artifact_repo.py +330 -0
- mlflow/store/artifact/sftp_artifact_repo.py +141 -0
- mlflow/store/artifact/uc_volume_artifact_repo.py +76 -0
- mlflow/store/artifact/unity_catalog_models_artifact_repo.py +168 -0
- mlflow/store/artifact/unity_catalog_oss_models_artifact_repo.py +168 -0
- mlflow/store/artifact/utils/__init__.py +0 -0
- mlflow/store/artifact/utils/models.py +148 -0
- mlflow/store/db/__init__.py +0 -0
- mlflow/store/db/base_sql_model.py +3 -0
- mlflow/store/db/db_types.py +10 -0
- mlflow/store/db/utils.py +314 -0
- mlflow/store/db_migrations/__init__.py +0 -0
- mlflow/store/db_migrations/alembic.ini +74 -0
- mlflow/store/db_migrations/env.py +84 -0
- mlflow/store/db_migrations/versions/0584bdc529eb_add_cascading_deletion_to_datasets_from_experiments.py +88 -0
- mlflow/store/db_migrations/versions/0a8213491aaa_drop_duplicate_killed_constraint.py +49 -0
- mlflow/store/db_migrations/versions/0c779009ac13_add_deleted_time_field_to_runs_table.py +24 -0
- mlflow/store/db_migrations/versions/181f10493468_allow_nulls_for_metric_values.py +35 -0
- mlflow/store/db_migrations/versions/27a6a02d2cf1_add_model_version_tags_table.py +38 -0
- mlflow/store/db_migrations/versions/2b4d017a5e9b_add_model_registry_tables_to_db.py +77 -0
- mlflow/store/db_migrations/versions/2d6e25af4d3e_increase_max_param_val_length.py +33 -0
- mlflow/store/db_migrations/versions/3500859a5d39_add_model_aliases_table.py +50 -0
- mlflow/store/db_migrations/versions/39d1c3be5f05_add_is_nan_constraint_for_metrics_tables_if_necessary.py +41 -0
- mlflow/store/db_migrations/versions/400f98739977_add_logged_model_tables.py +123 -0
- mlflow/store/db_migrations/versions/4465047574b1_increase_max_dataset_schema_size.py +38 -0
- mlflow/store/db_migrations/versions/451aebb31d03_add_metric_step.py +35 -0
- mlflow/store/db_migrations/versions/5b0e9adcef9c_add_cascade_deletion_to_trace_tables_fk.py +40 -0
- mlflow/store/db_migrations/versions/6953534de441_add_step_to_inputs_table.py +25 -0
- mlflow/store/db_migrations/versions/728d730b5ebd_add_registered_model_tags_table.py +38 -0
- mlflow/store/db_migrations/versions/7ac759974ad8_update_run_tags_with_larger_limit.py +36 -0
- mlflow/store/db_migrations/versions/7f2a7d5fae7d_add_datasets_inputs_input_tags_tables.py +82 -0
- mlflow/store/db_migrations/versions/84291f40a231_add_run_link_to_model_version.py +26 -0
- mlflow/store/db_migrations/versions/867495a8f9d4_add_trace_tables.py +90 -0
- mlflow/store/db_migrations/versions/89d4b8295536_create_latest_metrics_table.py +169 -0
- mlflow/store/db_migrations/versions/90e64c465722_migrate_user_column_to_tags.py +64 -0
- mlflow/store/db_migrations/versions/97727af70f4d_creation_time_last_update_time_experiments.py +25 -0
- mlflow/store/db_migrations/versions/__init__.py +0 -0
- mlflow/store/db_migrations/versions/a8c4a736bde6_allow_nulls_for_run_id.py +27 -0
- mlflow/store/db_migrations/versions/acf3f17fdcc7_add_storage_location_field_to_model_.py +29 -0
- mlflow/store/db_migrations/versions/bd07f7e963c5_create_index_on_run_uuid.py +26 -0
- mlflow/store/db_migrations/versions/bda7b8c39065_increase_model_version_tag_value_limit.py +38 -0
- mlflow/store/db_migrations/versions/c48cb773bb87_reset_default_value_for_is_nan_in_metrics_table_for_mysql.py +41 -0
- mlflow/store/db_migrations/versions/cbc13b556ace_add_v3_trace_schema_columns.py +31 -0
- mlflow/store/db_migrations/versions/cc1f77228345_change_param_value_length_to_500.py +34 -0
- mlflow/store/db_migrations/versions/cfd24bdc0731_update_run_status_constraint_with_killed.py +78 -0
- mlflow/store/db_migrations/versions/df50e92ffc5e_add_experiment_tags_table.py +38 -0
- mlflow/store/db_migrations/versions/f5a4f2784254_increase_run_tag_value_limit.py +36 -0
- mlflow/store/entities/__init__.py +3 -0
- mlflow/store/entities/paged_list.py +18 -0
- mlflow/store/model_registry/__init__.py +10 -0
- mlflow/store/model_registry/abstract_store.py +1081 -0
- mlflow/store/model_registry/base_rest_store.py +44 -0
- mlflow/store/model_registry/databricks_workspace_model_registry_rest_store.py +37 -0
- mlflow/store/model_registry/dbmodels/__init__.py +0 -0
- mlflow/store/model_registry/dbmodels/models.py +206 -0
- mlflow/store/model_registry/file_store.py +1091 -0
- mlflow/store/model_registry/rest_store.py +481 -0
- mlflow/store/model_registry/sqlalchemy_store.py +1286 -0
- mlflow/store/tracking/__init__.py +23 -0
- mlflow/store/tracking/abstract_store.py +816 -0
- mlflow/store/tracking/dbmodels/__init__.py +0 -0
- mlflow/store/tracking/dbmodels/initial_models.py +243 -0
- mlflow/store/tracking/dbmodels/models.py +1073 -0
- mlflow/store/tracking/file_store.py +2438 -0
- mlflow/store/tracking/postgres_managed_identity.py +146 -0
- mlflow/store/tracking/rest_store.py +1131 -0
- mlflow/store/tracking/sqlalchemy_store.py +2785 -0
- mlflow/system_metrics/__init__.py +61 -0
- mlflow/system_metrics/metrics/__init__.py +0 -0
- mlflow/system_metrics/metrics/base_metrics_monitor.py +32 -0
- mlflow/system_metrics/metrics/cpu_monitor.py +23 -0
- mlflow/system_metrics/metrics/disk_monitor.py +21 -0
- mlflow/system_metrics/metrics/gpu_monitor.py +71 -0
- mlflow/system_metrics/metrics/network_monitor.py +34 -0
- mlflow/system_metrics/metrics/rocm_monitor.py +123 -0
- mlflow/system_metrics/system_metrics_monitor.py +198 -0
- mlflow/tracing/__init__.py +16 -0
- mlflow/tracing/assessment.py +356 -0
- mlflow/tracing/client.py +531 -0
- mlflow/tracing/config.py +125 -0
- mlflow/tracing/constant.py +105 -0
- mlflow/tracing/destination.py +81 -0
- mlflow/tracing/display/__init__.py +40 -0
- mlflow/tracing/display/display_handler.py +196 -0
- mlflow/tracing/export/async_export_queue.py +186 -0
- mlflow/tracing/export/inference_table.py +138 -0
- mlflow/tracing/export/mlflow_v3.py +137 -0
- mlflow/tracing/export/utils.py +70 -0
- mlflow/tracing/fluent.py +1417 -0
- mlflow/tracing/processor/base_mlflow.py +199 -0
- mlflow/tracing/processor/inference_table.py +175 -0
- mlflow/tracing/processor/mlflow_v3.py +47 -0
- mlflow/tracing/processor/otel.py +73 -0
- mlflow/tracing/provider.py +487 -0
- mlflow/tracing/trace_manager.py +200 -0
- mlflow/tracing/utils/__init__.py +616 -0
- mlflow/tracing/utils/artifact_utils.py +28 -0
- mlflow/tracing/utils/copy.py +55 -0
- mlflow/tracing/utils/environment.py +55 -0
- mlflow/tracing/utils/exception.py +21 -0
- mlflow/tracing/utils/once.py +35 -0
- mlflow/tracing/utils/otlp.py +63 -0
- mlflow/tracing/utils/processor.py +54 -0
- mlflow/tracing/utils/search.py +292 -0
- mlflow/tracing/utils/timeout.py +250 -0
- mlflow/tracing/utils/token.py +19 -0
- mlflow/tracing/utils/truncation.py +124 -0
- mlflow/tracing/utils/warning.py +76 -0
- mlflow/tracking/__init__.py +39 -0
- mlflow/tracking/_model_registry/__init__.py +1 -0
- mlflow/tracking/_model_registry/client.py +764 -0
- mlflow/tracking/_model_registry/fluent.py +853 -0
- mlflow/tracking/_model_registry/registry.py +67 -0
- mlflow/tracking/_model_registry/utils.py +251 -0
- mlflow/tracking/_tracking_service/__init__.py +0 -0
- mlflow/tracking/_tracking_service/client.py +883 -0
- mlflow/tracking/_tracking_service/registry.py +56 -0
- mlflow/tracking/_tracking_service/utils.py +275 -0
- mlflow/tracking/artifact_utils.py +179 -0
- mlflow/tracking/client.py +5900 -0
- mlflow/tracking/context/__init__.py +0 -0
- mlflow/tracking/context/abstract_context.py +35 -0
- mlflow/tracking/context/databricks_cluster_context.py +15 -0
- mlflow/tracking/context/databricks_command_context.py +15 -0
- mlflow/tracking/context/databricks_job_context.py +49 -0
- mlflow/tracking/context/databricks_notebook_context.py +41 -0
- mlflow/tracking/context/databricks_repo_context.py +43 -0
- mlflow/tracking/context/default_context.py +51 -0
- mlflow/tracking/context/git_context.py +32 -0
- mlflow/tracking/context/registry.py +98 -0
- mlflow/tracking/context/system_environment_context.py +15 -0
- mlflow/tracking/default_experiment/__init__.py +1 -0
- mlflow/tracking/default_experiment/abstract_context.py +43 -0
- mlflow/tracking/default_experiment/databricks_notebook_experiment_provider.py +44 -0
- mlflow/tracking/default_experiment/registry.py +75 -0
- mlflow/tracking/fluent.py +3595 -0
- mlflow/tracking/metric_value_conversion_utils.py +93 -0
- mlflow/tracking/multimedia.py +206 -0
- mlflow/tracking/registry.py +86 -0
- mlflow/tracking/request_auth/__init__.py +0 -0
- mlflow/tracking/request_auth/abstract_request_auth_provider.py +34 -0
- mlflow/tracking/request_auth/registry.py +60 -0
- mlflow/tracking/request_header/__init__.py +0 -0
- mlflow/tracking/request_header/abstract_request_header_provider.py +36 -0
- mlflow/tracking/request_header/databricks_request_header_provider.py +38 -0
- mlflow/tracking/request_header/default_request_header_provider.py +17 -0
- mlflow/tracking/request_header/registry.py +79 -0
- mlflow/transformers/__init__.py +2982 -0
- mlflow/transformers/flavor_config.py +258 -0
- mlflow/transformers/hub_utils.py +83 -0
- mlflow/transformers/llm_inference_utils.py +468 -0
- mlflow/transformers/model_io.py +301 -0
- mlflow/transformers/peft.py +51 -0
- mlflow/transformers/signature.py +183 -0
- mlflow/transformers/torch_utils.py +55 -0
- mlflow/types/__init__.py +21 -0
- mlflow/types/agent.py +270 -0
- mlflow/types/chat.py +240 -0
- mlflow/types/llm.py +935 -0
- mlflow/types/responses.py +139 -0
- mlflow/types/responses_helpers.py +416 -0
- mlflow/types/schema.py +1505 -0
- mlflow/types/type_hints.py +647 -0
- mlflow/types/utils.py +753 -0
- mlflow/utils/__init__.py +283 -0
- mlflow/utils/_capture_modules.py +256 -0
- mlflow/utils/_capture_transformers_modules.py +75 -0
- mlflow/utils/_spark_utils.py +201 -0
- mlflow/utils/_unity_catalog_oss_utils.py +97 -0
- mlflow/utils/_unity_catalog_utils.py +479 -0
- mlflow/utils/annotations.py +218 -0
- mlflow/utils/arguments_utils.py +16 -0
- mlflow/utils/async_logging/__init__.py +1 -0
- mlflow/utils/async_logging/async_artifacts_logging_queue.py +258 -0
- mlflow/utils/async_logging/async_logging_queue.py +366 -0
- mlflow/utils/async_logging/run_artifact.py +38 -0
- mlflow/utils/async_logging/run_batch.py +58 -0
- mlflow/utils/async_logging/run_operations.py +49 -0
- mlflow/utils/autologging_utils/__init__.py +737 -0
- mlflow/utils/autologging_utils/client.py +432 -0
- mlflow/utils/autologging_utils/config.py +33 -0
- mlflow/utils/autologging_utils/events.py +294 -0
- mlflow/utils/autologging_utils/logging_and_warnings.py +328 -0
- mlflow/utils/autologging_utils/metrics_queue.py +71 -0
- mlflow/utils/autologging_utils/safety.py +1104 -0
- mlflow/utils/autologging_utils/versioning.py +95 -0
- mlflow/utils/checkpoint_utils.py +206 -0
- mlflow/utils/class_utils.py +6 -0
- mlflow/utils/cli_args.py +257 -0
- mlflow/utils/conda.py +354 -0
- mlflow/utils/credentials.py +231 -0
- mlflow/utils/data_utils.py +17 -0
- mlflow/utils/databricks_utils.py +1436 -0
- mlflow/utils/docstring_utils.py +477 -0
- mlflow/utils/doctor.py +133 -0
- mlflow/utils/download_cloud_file_chunk.py +43 -0
- mlflow/utils/env_manager.py +16 -0
- mlflow/utils/env_pack.py +131 -0
- mlflow/utils/environment.py +1009 -0
- mlflow/utils/exception_utils.py +14 -0
- mlflow/utils/file_utils.py +978 -0
- mlflow/utils/git_utils.py +77 -0
- mlflow/utils/gorilla.py +797 -0
- mlflow/utils/import_hooks/__init__.py +363 -0
- mlflow/utils/lazy_load.py +51 -0
- mlflow/utils/logging_utils.py +168 -0
- mlflow/utils/mime_type_utils.py +58 -0
- mlflow/utils/mlflow_tags.py +103 -0
- mlflow/utils/model_utils.py +486 -0
- mlflow/utils/name_utils.py +346 -0
- mlflow/utils/nfs_on_spark.py +62 -0
- mlflow/utils/openai_utils.py +164 -0
- mlflow/utils/os.py +12 -0
- mlflow/utils/oss_registry_utils.py +29 -0
- mlflow/utils/plugins.py +17 -0
- mlflow/utils/process.py +182 -0
- mlflow/utils/promptlab_utils.py +146 -0
- mlflow/utils/proto_json_utils.py +743 -0
- mlflow/utils/pydantic_utils.py +54 -0
- mlflow/utils/request_utils.py +279 -0
- mlflow/utils/requirements_utils.py +704 -0
- mlflow/utils/rest_utils.py +673 -0
- mlflow/utils/search_logged_model_utils.py +127 -0
- mlflow/utils/search_utils.py +2111 -0
- mlflow/utils/secure_loading.py +221 -0
- mlflow/utils/security_validation.py +384 -0
- mlflow/utils/server_cli_utils.py +61 -0
- mlflow/utils/spark_utils.py +15 -0
- mlflow/utils/string_utils.py +138 -0
- mlflow/utils/thread_utils.py +63 -0
- mlflow/utils/time.py +54 -0
- mlflow/utils/timeout.py +42 -0
- mlflow/utils/uri.py +572 -0
- mlflow/utils/validation.py +662 -0
- mlflow/utils/virtualenv.py +458 -0
- mlflow/utils/warnings_utils.py +25 -0
- mlflow/utils/yaml_utils.py +179 -0
- mlflow/version.py +24 -0
@@ -0,0 +1,275 @@
|
|
1
|
+
import base64
|
2
|
+
import datetime
|
3
|
+
import os
|
4
|
+
import posixpath
|
5
|
+
import re
|
6
|
+
import urllib.parse
|
7
|
+
from typing import Optional, Union
|
8
|
+
|
9
|
+
from mlflow.entities import FileInfo
|
10
|
+
from mlflow.entities.multipart_upload import (
|
11
|
+
CreateMultipartUploadResponse,
|
12
|
+
MultipartUploadCredential,
|
13
|
+
)
|
14
|
+
from mlflow.environment_variables import MLFLOW_ARTIFACT_UPLOAD_DOWNLOAD_TIMEOUT
|
15
|
+
from mlflow.exceptions import MlflowException
|
16
|
+
from mlflow.store.artifact.artifact_repo import ArtifactRepository, MultipartUploadMixin
|
17
|
+
from mlflow.utils.credentials import get_default_host_creds
|
18
|
+
|
19
|
+
|
20
|
+
def encode_base64(data: Union[str, bytes]) -> str:
    """Return the Base64 representation of ``data`` as text.

    Args:
        data: Payload to encode. A ``str`` is converted to UTF-8 bytes first;
            any other value is handed to ``base64.b64encode`` unchanged.

    Returns:
        The Base64-encoded payload decoded as a UTF-8 string.
    """
    raw = data.encode("utf-8") if isinstance(data, str) else data
    return base64.b64encode(raw).decode("utf-8")
|
25
|
+
|
26
|
+
|
27
|
+
def decode_base64(encoded: str) -> str:
    """Decode a Base64 string and return the payload as UTF-8 text.

    Args:
        encoded: Base64-encoded text.

    Returns:
        The decoded bytes interpreted as a UTF-8 string.
    """
    return base64.b64decode(encoded).decode("utf-8")
|
30
|
+
|
31
|
+
|
32
|
+
class AzureBlobArtifactRepository(ArtifactRepository, MultipartUploadMixin):
    """
    Stores artifacts on Azure Blob Storage.

    This repository is used with URIs of the form
    ``wasbs://<container-name>@<storage-account-name>.blob.core.windows.net/<path>``,
    following the same URI scheme as Hadoop on Azure blob storage. It requires either that:
    - Azure storage connection string is in the env var ``AZURE_STORAGE_CONNECTION_STRING``
    - Azure storage access key is in the env var ``AZURE_STORAGE_ACCESS_KEY``
    - DefaultAzureCredential is configured
    """

    def __init__(self, artifact_uri: str, tracking_uri: Optional[str] = None, client=None) -> None:
        """Create the repository and the ``BlobServiceClient`` it talks through.

        Args:
            artifact_uri: ``wasbs://`` URI of the artifact root.
            tracking_uri: Forwarded to the base class constructor.
            client: Optional pre-built client. When truthy it is used as-is and no
                Azure SDK import or credential lookup takes place (testing hook).

        Raises:
            ImportError: If ``DefaultAzureCredential`` is needed but ``azure-identity``
                is not installed.
        """
        super().__init__(artifact_uri, tracking_uri)

        _DEFAULT_TIMEOUT = 600  # 10 minutes
        self.write_timeout = MLFLOW_ARTIFACT_UPLOAD_DOWNLOAD_TIMEOUT.get() or _DEFAULT_TIMEOUT

        # Allow override for testing
        if client:
            self.client = client
            return

        from azure.storage.blob import BlobServiceClient

        (_, account, _, api_uri_suffix) = AzureBlobArtifactRepository.parse_wasbs_uri(artifact_uri)
        # Credential precedence: connection string, then access key, then
        # DefaultAzureCredential.
        if "AZURE_STORAGE_CONNECTION_STRING" in os.environ:
            self.client = BlobServiceClient.from_connection_string(
                conn_str=os.environ.get("AZURE_STORAGE_CONNECTION_STRING"),
                connection_verify=get_default_host_creds(artifact_uri).verify,
            )
        elif "AZURE_STORAGE_ACCESS_KEY" in os.environ:
            account_url = f"https://{account}.{api_uri_suffix}"
            self.client = BlobServiceClient(
                account_url=account_url,
                credential=os.environ.get("AZURE_STORAGE_ACCESS_KEY"),
                connection_verify=get_default_host_creds(artifact_uri).verify,
            )
        else:
            try:
                from azure.identity import DefaultAzureCredential
            except ImportError as exc:
                raise ImportError(
                    "Using DefaultAzureCredential requires the azure-identity package. "
                    "Please install it via: pip install azure-identity"
                ) from exc

            account_url = f"https://{account}.{api_uri_suffix}"
            self.client = BlobServiceClient(
                account_url=account_url,
                credential=DefaultAzureCredential(),
                connection_verify=get_default_host_creds(artifact_uri).verify,
            )

    @staticmethod
    def parse_wasbs_uri(uri):
        """Parse a wasbs:// URI, returning (container, storage_account, path, api_uri_suffix).

        The returned path has a single leading ``/`` removed.

        Raises:
            MlflowException: If the scheme is not ``wasbs`` or the network location is
                not ``<container>@<account>.blob.core.(windows.net|chinacloudapi.cn)``.
                ``MlflowException`` derives from ``Exception``, so callers that catch
                ``Exception`` keep working.
        """
        parsed = urllib.parse.urlparse(uri)
        if parsed.scheme != "wasbs":
            raise MlflowException(f"Not a WASBS URI: {uri}")

        match = re.match(
            r"([^@]+)@([^.]+)\.(blob\.core\.(windows\.net|chinacloudapi\.cn))", parsed.netloc
        )

        if match is None:
            raise MlflowException(
                "WASBS URI must be of the form "
                "<container>@<account>.blob.core.windows.net"
                " or <container>@<account>.blob.core.chinacloudapi.cn"
            )
        container = match.group(1)
        storage_account = match.group(2)
        api_uri_suffix = match.group(3)
        path = parsed.path
        if path.startswith("/"):
            path = path[1:]
        return container, storage_account, path, api_uri_suffix

    def log_artifact(self, local_file, artifact_path=None):
        """Upload ``local_file`` as a blob, overwriting any existing blob of that name.

        Args:
            local_file: Path of the local file to upload.
            artifact_path: Optional sub-path under the artifact root; the blob is
                named ``<root>/<artifact_path>/<basename of local_file>``.
        """
        (container, _, dest_path, _) = self.parse_wasbs_uri(self.artifact_uri)
        container_client = self.client.get_container_client(container)
        if artifact_path:
            dest_path = posixpath.join(dest_path, artifact_path)
        dest_path = posixpath.join(dest_path, os.path.basename(local_file))
        with open(local_file, "rb") as file:
            container_client.upload_blob(
                dest_path, file, overwrite=True, timeout=self.write_timeout
            )

    def log_artifacts(self, local_dir, artifact_path=None):
        """Upload every file found under ``local_dir``, preserving the directory layout.

        Args:
            local_dir: Local directory that is walked recursively.
            artifact_path: Optional sub-path under the artifact root to upload into.
        """
        (container, _, dest_path, _) = self.parse_wasbs_uri(self.artifact_uri)
        container_client = self.client.get_container_client(container)
        if artifact_path:
            dest_path = posixpath.join(dest_path, artifact_path)
        local_dir = os.path.abspath(local_dir)
        for root, _, filenames in os.walk(local_dir):
            upload_path = dest_path
            if root != local_dir:
                rel_path = os.path.relpath(root, local_dir)
                # ``os.path.relpath`` uses the OS separator; blob names are built with
                # posixpath, so normalise to "/" (a no-op on POSIX systems).
                rel_path = rel_path.replace(os.sep, posixpath.sep)
                upload_path = posixpath.join(dest_path, rel_path)
            for f in filenames:
                remote_file_path = posixpath.join(upload_path, f)
                local_file_path = os.path.join(root, f)
                with open(local_file_path, "rb") as file:
                    container_client.upload_blob(
                        remote_file_path, file, overwrite=True, timeout=self.write_timeout
                    )

    def list_artifacts(self, path=None):
        """List the entries directly under ``path`` (or under the artifact root).

        Args:
            path: Optional path relative to the artifact root.

        Returns:
            ``FileInfo`` objects sorted by path, with paths relative to the artifact
            root. An empty list is returned when ``path`` refers to a single file.

        Raises:
            MlflowException: If a listed blob name does not start with the artifact
                root path.
        """
        # Newer versions of `azure-storage-blob` (>= 12.4.0) provide a public
        # `azure.storage.blob.BlobPrefix` object to signify that a blob is a directory,
        # while older versions only expose this API internally as
        # `azure.storage.blob._models.BlobPrefix`
        try:
            from azure.storage.blob import BlobPrefix
        except ImportError:
            from azure.storage.blob._models import BlobPrefix

        def is_dir(result):
            return isinstance(result, BlobPrefix)

        (container, _, artifact_path, _) = self.parse_wasbs_uri(self.artifact_uri)
        container_client = self.client.get_container_client(container)
        dest_path = artifact_path
        if path:
            dest_path = posixpath.join(dest_path, path)
        infos = []
        prefix = dest_path if dest_path.endswith("/") else dest_path + "/"
        results = container_client.walk_blobs(name_starts_with=prefix)

        for result in results:
            if (
                dest_path == result.name
            ):  # result isn't actually a child of the path we're interested in, so skip it
                continue

            if not result.name.startswith(artifact_path):
                raise MlflowException(
                    "The name of the listed Azure blob does not begin with the specified"
                    f" artifact path. Artifact path: {artifact_path}. Blob name: {result.name}"
                )

            if is_dir(result):
                subdir = posixpath.relpath(path=result.name, start=artifact_path)
                if subdir.endswith("/"):
                    subdir = subdir[:-1]
                infos.append(FileInfo(subdir, is_dir=True, file_size=None))
            else:  # Just a plain old blob
                file_name = posixpath.relpath(path=result.name, start=artifact_path)
                infos.append(FileInfo(file_name, is_dir=False, file_size=result.size))

        # The list_artifacts API expects us to return an empty list if
        # the path references a single file.
        rel_path = dest_path[len(artifact_path) + 1 :]
        if (len(infos) == 1) and not infos[0].is_dir and (infos[0].path == rel_path):
            return []
        return sorted(infos, key=lambda f: f.path)

    def _download_file(self, remote_file_path, local_path):
        """Download the blob at ``remote_file_path`` (relative to the root) to ``local_path``."""
        (container, _, remote_root_path, _) = self.parse_wasbs_uri(self.artifact_uri)
        container_client = self.client.get_container_client(container)
        remote_full_path = posixpath.join(remote_root_path, remote_file_path)
        blob = container_client.download_blob(remote_full_path)
        with open(local_path, "wb") as file:
            blob.readinto(file)

    def delete_artifacts(self, artifact_path=None):
        """Delete the blob at ``artifact_path`` or every blob beneath it.

        Args:
            artifact_path: Optional path relative to the artifact root. When omitted,
                everything under the artifact root is deleted.

        Raises:
            MlflowException: If nothing exists at the requested location.
        """
        from azure.core.exceptions import ResourceNotFoundError

        (container, _, dest_path, _) = self.parse_wasbs_uri(self.artifact_uri)
        container_client = self.client.get_container_client(container)
        if artifact_path:
            dest_path = posixpath.join(dest_path, artifact_path)

        # ``name_starts_with`` is a plain string prefix, so "foo" would also match the
        # sibling "foobar/...". Only keep the exact blob or blobs below "<dest_path>/".
        if dest_path and not dest_path.endswith("/"):
            dir_prefix = dest_path + "/"
        else:
            dir_prefix = dest_path

        try:
            blob_list = [
                blob
                for blob in container_client.list_blobs(name_starts_with=dest_path)
                if blob.name == dest_path or blob.name.startswith(dir_prefix)
            ]
            if not blob_list:
                raise MlflowException(f"No such file or directory: '{dest_path}'")

            for blob in blob_list:
                container_client.delete_blob(blob.name)
        except ResourceNotFoundError as exc:
            raise MlflowException(f"No such file or directory: '{dest_path}'") from exc

    def create_multipart_upload(self, local_file, num_parts=1, artifact_path=None):
        """Create SAS-signed "Put Block" URLs for uploading ``local_file`` in parts.

        Args:
            local_file: Local file path; only its basename is used for the blob name.
            num_parts: Number of block URLs to generate.
            artifact_path: Optional sub-path under the artifact root.

        Returns:
            A ``CreateMultipartUploadResponse`` with one credential per part and
            ``upload_id=None``.

        Raises:
            MlflowException: If the client's credential exposes no ``account_key``,
                which is required to sign the SAS token.
        """
        from azure.storage.blob import BlobSasPermissions, generate_blob_sas

        (container, _, dest_path, _) = self.parse_wasbs_uri(self.artifact_uri)
        if artifact_path:
            dest_path = posixpath.join(dest_path, artifact_path)
        dest_path = posixpath.join(dest_path, os.path.basename(local_file))

        # Signing a SAS token needs the shared account key; fail with a clear message
        # instead of an AttributeError when the credential does not carry one.
        account_key = getattr(self.client.credential, "account_key", None)
        if account_key is None:
            raise MlflowException(
                "Multipart upload to Azure Blob Storage requires a storage account key "
                "(set AZURE_STORAGE_CONNECTION_STRING or AZURE_STORAGE_ACCESS_KEY) to "
                "generate SAS tokens."
            )

        # Put Block: https://learn.microsoft.com/en-us/rest/api/storageservices/put-block?tabs=microsoft-entra-id
        # SDK: https://learn.microsoft.com/en-us/python/api/azure-storage-blob/azure.storage.blob.blobclient?view=azure-python#azure-storage-blob-blobclient-stage-block
        blob_url = posixpath.join(self.client.url, container, dest_path)
        sas_token = generate_blob_sas(
            account_name=self.client.account_name,
            container_name=container,
            blob_name=dest_path,
            account_key=account_key,
            permission=BlobSasPermissions(read=True, write=True),
            # Timezone-aware replacement for the deprecated ``datetime.utcnow()``.
            expiry=datetime.datetime.now(datetime.timezone.utc) + datetime.timedelta(hours=1),
        )
        credentials = []
        for i in range(1, num_parts + 1):
            block_id = f"mlflow_block_{i}"
            # see https://github.com/Azure/azure-sdk-for-python/blob/18a66ef98c6f2153491489d3d7d2fe4a5849e4ac/sdk/storage/azure-storage-blob/azure/storage/blob/_blob_client.py#L2468
            safe_block_id = urllib.parse.quote(encode_base64(block_id), safe="")
            url = f"{blob_url}?comp=block&blockid={safe_block_id}&{sas_token}"
            credentials.append(
                MultipartUploadCredential(
                    url=url,
                    part_number=i,
                    headers={},
                )
            )
        return CreateMultipartUploadResponse(
            credentials=credentials,
            upload_id=None,
        )

    def complete_multipart_upload(self, local_file, upload_id, parts=None, artifact_path=None):
        """Commit the uploaded blocks so that they form the final blob.

        Args:
            local_file: Local file path; only its basename is used for the blob name.
            upload_id: Not used by this implementation.
            parts: Iterable of objects with a ``url`` attribute whose query string
                contains the ``blockid`` written by ``create_multipart_upload``.
            artifact_path: Optional sub-path under the artifact root.
        """
        (container, _, dest_path, _) = self.parse_wasbs_uri(self.artifact_uri)
        if artifact_path:
            dest_path = posixpath.join(dest_path, artifact_path)
        dest_path = posixpath.join(dest_path, os.path.basename(local_file))

        block_ids = []
        for part in parts:
            # Recover the plain block id that was Base64-encoded and URL-quoted into
            # the part URL.
            qs = urllib.parse.urlparse(part.url).query
            block_id = urllib.parse.parse_qs(qs)["blockid"][0]
            block_id = decode_base64(urllib.parse.unquote(block_id))
            block_ids.append(block_id)
        blob_client = self.client.get_blob_client(container, dest_path)
        blob_client.commit_block_list(block_ids)

    def abort_multipart_upload(self, local_file, upload_id, artifact_path=None):
        """Intentionally a no-op; see the comments below."""
        # There is no way to delete uncommitted blocks in Azure Blob Storage.
        # Instead, they are garbage collected within 7 days.
        # See https://docs.microsoft.com/en-us/rest/api/storageservices/put-block-list#remarks
        # The blob may already exist so we cannot delete it either.
        pass
|
@@ -0,0 +1,295 @@
|
|
1
|
+
import os
|
2
|
+
import posixpath
|
3
|
+
import re
|
4
|
+
import urllib.parse
|
5
|
+
from typing import Optional
|
6
|
+
|
7
|
+
import requests
|
8
|
+
|
9
|
+
from mlflow.azure.client import patch_adls_file_upload, patch_adls_flush, put_adls_file_creation
|
10
|
+
from mlflow.entities import FileInfo
|
11
|
+
from mlflow.environment_variables import (
|
12
|
+
MLFLOW_ARTIFACT_UPLOAD_DOWNLOAD_TIMEOUT,
|
13
|
+
MLFLOW_ENABLE_MULTIPART_UPLOAD,
|
14
|
+
MLFLOW_MULTIPART_UPLOAD_CHUNK_SIZE,
|
15
|
+
)
|
16
|
+
from mlflow.exceptions import MlflowException
|
17
|
+
from mlflow.protos.databricks_artifacts_pb2 import ArtifactCredentialInfo
|
18
|
+
from mlflow.store.artifact.artifact_repo import _retry_with_new_creds
|
19
|
+
from mlflow.store.artifact.cloud_artifact_repo import (
|
20
|
+
CloudArtifactRepository,
|
21
|
+
_complete_futures,
|
22
|
+
_compute_num_chunks,
|
23
|
+
)
|
24
|
+
|
25
|
+
|
26
|
+
def _parse_abfss_uri(uri):
|
27
|
+
"""
|
28
|
+
Parse an ABFSS URI in the format
|
29
|
+
"abfss://<file_system>@<account_name>.<domain_suffix>/<path>",
|
30
|
+
returning a tuple consisting of the filesystem, account name, domain suffix, and path
|
31
|
+
|
32
|
+
See more details about ABFSS URIs at
|
33
|
+
https://learn.microsoft.com/en-us/azure/storage/blobs/data-lake-storage-abfs-driver#uri-scheme-to-reference-data.
|
34
|
+
Also, see different domain suffixes for:
|
35
|
+
* Azure China: https://learn.microsoft.com/en-us/azure/china/resources-developer-guide
|
36
|
+
* Azure Government: https://learn.microsoft.com/en-us/azure/azure-government/compare-azure-government-global-azure#guidance-for-developers
|
37
|
+
* Azure Private Link: https://learn.microsoft.com/en-us/azure/private-link/private-endpoint-dns#government
|
38
|
+
Args:
|
39
|
+
uri: ABFSS URI to parse
|
40
|
+
|
41
|
+
Returns:
|
42
|
+
A tuple containing the name of the filesystem, account name, domain suffix,
|
43
|
+
and path
|
44
|
+
"""
|
45
|
+
parsed = urllib.parse.urlparse(uri)
|
46
|
+
if parsed.scheme != "abfss":
|
47
|
+
raise MlflowException(f"Not an ABFSS URI: {uri}")
|
48
|
+
|
49
|
+
match = re.match(r"([^@]+)@([^.]+)\.(.*)", parsed.netloc)
|
50
|
+
|
51
|
+
if match is None:
|
52
|
+
raise MlflowException(
|
53
|
+
"ABFSS URI must be of the form abfss://<filesystem>@<account>.<domain_suffix>"
|
54
|
+
)
|
55
|
+
filesystem = match.group(1)
|
56
|
+
account_name = match.group(2)
|
57
|
+
domain_suffix = match.group(3)
|
58
|
+
path = parsed.path
|
59
|
+
if path.startswith("/"):
|
60
|
+
path = path[1:]
|
61
|
+
return filesystem, account_name, domain_suffix, path
|
62
|
+
|
63
|
+
|
64
|
+
def _get_data_lake_client(account_url, credential):
    """Construct a ``DataLakeServiceClient`` for ``account_url`` with ``credential``.

    The Azure SDK is imported inside the function, so importing this module does
    not itself require ``azure-storage-file-datalake``.
    """
    from azure.storage.filedatalake import DataLakeServiceClient

    service_client = DataLakeServiceClient(account_url, credential)
    return service_client
|
68
|
+
|
69
|
+
|
70
|
+
class AzureDataLakeArtifactRepository(CloudArtifactRepository):
    """
    Stores artifacts on Azure Data Lake Storage Gen2.

    This repository is used with URIs of the form
    ``abfss://file_system@account_name.dfs.core.windows.net/<path>/<path>``.

    Args:
        credential: Azure credential (see options in https://learn.microsoft.com/en-us/python/api/azure-core/azure.core.credentials?view=azure-python)
            to use to authenticate to storage
    """

    def __init__(
        self,
        artifact_uri: str,
        tracking_uri: Optional[str] = None,
        credential=None,
        credential_refresh_def=None,
    ) -> None:
        """Create the repository and its file system client.

        Args:
            artifact_uri: ``abfss://`` URI of the artifact root.
            tracking_uri: Forwarded to the base class constructor.
            credential: Optional Azure credential; see ``_parse_credentials`` for the
                fallback used when it is ``None``.
            credential_refresh_def: Optional zero-argument callable returning a
                mapping with a ``"credential"`` key, used to refresh credentials.
        """
        super().__init__(artifact_uri, tracking_uri)
        _DEFAULT_TIMEOUT = 600  # 10 minutes
        self.write_timeout = MLFLOW_ARTIFACT_UPLOAD_DOWNLOAD_TIMEOUT.get() or _DEFAULT_TIMEOUT
        self._parse_credentials(credential)
        self._credential_refresh_def = credential_refresh_def

    def _parse_credentials(self, credential):
        """Resolve the credential and (re)build the file system client.

        When ``credential`` is ``None`` the ``AZURE_STORAGE_SAS_TOKEN`` environment
        variable is used if set (appended to the account URL); otherwise a
        ``DefaultAzureCredential`` is created.

        Raises:
            ImportError: If ``DefaultAzureCredential`` is needed but ``azure-identity``
                is not installed.
        """
        (filesystem, account_name, domain_suffix, path) = _parse_abfss_uri(self.artifact_uri)
        account_url = f"https://{account_name}.{domain_suffix}"
        self.sas_token = ""
        if credential is None:
            if sas_token := os.environ.get("AZURE_STORAGE_SAS_TOKEN"):
                self.sas_token = f"?{sas_token}"
                account_url += self.sas_token
            else:
                try:
                    from azure.identity import DefaultAzureCredential
                except ImportError as exc:
                    raise ImportError(
                        "Using DefaultAzureCredential requires the azure-identity package. "
                        "Please install it via: pip install azure-identity"
                    ) from exc

                credential = DefaultAzureCredential()
        self.credential = credential
        data_lake_client = _get_data_lake_client(
            account_url=account_url, credential=self.credential
        )
        self.fs_client = data_lake_client.get_file_system_client(filesystem)
        self.domain_suffix = domain_suffix
        self.base_data_lake_directory = path
        self.account_name = account_name
        self.container = filesystem

    def _refresh_credentials(self):
        """Return the file system client, rebuilt from refreshed credentials if possible.

        Without a ``credential_refresh_def`` the existing client is returned unchanged.
        """
        if not self._credential_refresh_def:
            return self.fs_client
        new_creds = self._credential_refresh_def()
        self._parse_credentials(new_creds["credential"])
        return self.fs_client

    def log_artifact(self, local_file, artifact_path=None):
        """Upload ``local_file`` into the artifact root (or ``artifact_path`` below it).

        The upload runs through ``_retry_with_new_creds`` with
        ``_refresh_credentials`` as the credential source.
        """
        dest_path = self.base_data_lake_directory
        if artifact_path:
            dest_path = posixpath.join(dest_path, artifact_path)
        local_file_path = os.path.abspath(local_file)
        file_name = os.path.basename(local_file_path)

        def try_func(creds):
            dir_client = creds.get_directory_client(dest_path)
            file_client = dir_client.get_file_client(file_name)
            # Zero-byte files are created explicitly instead of being uploaded.
            if os.path.getsize(local_file_path) == 0:
                file_client.create_file()
            else:
                with open(local_file_path, "rb") as file:
                    file_client.upload_data(data=file, overwrite=True)

        _retry_with_new_creds(
            try_func=try_func, creds_func=self._refresh_credentials, orig_creds=self.fs_client
        )

    def list_artifacts(self, path=None):
        """List the entries directly under ``path`` (or under the artifact root).

        Returns:
            ``FileInfo`` objects sorted by path, with paths relative to the artifact
            root. An empty list is returned when ``path`` refers to a single file.
        """
        directory_to_list = self.base_data_lake_directory
        if path:
            directory_to_list = posixpath.join(directory_to_list, path)
        infos = []
        for result in self.fs_client.get_paths(path=directory_to_list, recursive=False):
            if (
                directory_to_list == result.name
            ):  # result isn't actually a child of the path we're interested in, so skip it
                continue
            if result.is_directory:
                subdir = posixpath.relpath(path=result.name, start=self.base_data_lake_directory)
                if subdir.endswith("/"):
                    subdir = subdir[:-1]
                infos.append(FileInfo(subdir, is_dir=True, file_size=None))
            else:
                file_name = posixpath.relpath(path=result.name, start=self.base_data_lake_directory)
                infos.append(FileInfo(file_name, is_dir=False, file_size=result.content_length))

        # The list_artifacts API expects us to return an empty list if
        # the path references a single file.
        rel_path = directory_to_list[len(self.base_data_lake_directory) + 1 :]
        if (len(infos) == 1) and not infos[0].is_dir and (infos[0].path == rel_path):
            return []
        return sorted(infos, key=lambda f: f.path)

    def _download_from_cloud(self, remote_file_path, local_path):
        """Download ``remote_file_path`` (relative to the artifact root) to ``local_path``."""
        remote_full_path = posixpath.join(self.base_data_lake_directory, remote_file_path)
        base_dir = posixpath.dirname(remote_full_path)

        def try_func(creds):
            dir_client = creds.get_directory_client(base_dir)
            filename = posixpath.basename(remote_full_path)
            file_client = dir_client.get_file_client(filename)
            with open(local_path, "wb") as file:
                file_client.download_file().readinto(file)

        _retry_with_new_creds(
            try_func=try_func, creds_func=self._refresh_credentials, orig_creds=self.fs_client
        )

    def delete_artifacts(self, artifact_path=None):
        """Not supported by this repository; always raises ``NotImplementedError``."""
        raise NotImplementedError("This artifact repository does not support deleting artifacts")

    def _upload_to_cloud(self, cloud_credential_info, src_file_path, artifact_file_path):
        """Upload one file, using multipart upload only for files above the chunk size.

        Multipart upload is used when ``MLFLOW_ENABLE_MULTIPART_UPLOAD`` is set and the
        file is larger than ``MLFLOW_MULTIPART_UPLOAD_CHUNK_SIZE``; otherwise the file
        goes through ``log_artifact``.
        """
        if (
            MLFLOW_ENABLE_MULTIPART_UPLOAD.get()
            and os.path.getsize(src_file_path) > MLFLOW_MULTIPART_UPLOAD_CHUNK_SIZE.get()
        ):
            self._multipart_upload(cloud_credential_info, src_file_path, artifact_file_path)
        else:
            artifact_subdir = posixpath.dirname(artifact_file_path)
            self.log_artifact(src_file_path, artifact_subdir)

    def _retryable_adls_function(self, func, artifact_file_path, **kwargs):
        """Call ``func(**kwargs)``, retrying once with a fresh SAS URL on HTTP 403.

        Args:
            func: Callable invoked with ``kwargs``.
            artifact_file_path: Path used to request new write credentials on retry.
            **kwargs: Arguments for ``func``; ``sas_url`` is replaced before the retry.

        Raises:
            requests.HTTPError: Re-raised unchanged when the status is not 403 or the
                error carries no response.
        """
        # Attempt to call the passed function. Retry if the credentials have expired
        try:
            func(**kwargs)
        except requests.HTTPError as e:
            # ``response`` may be None on an HTTPError; only a 403 triggers a retry.
            if e.response is None or e.response.status_code != 403:
                raise
            new_credentials = self._get_write_credential_infos([artifact_file_path])[0]
            kwargs["sas_url"] = new_credentials.signed_uri
            func(**kwargs)

    def _multipart_upload(self, credentials, src_file_path, artifact_file_path):
        """
        Uploads a file to a given Azure storage location using the ADLS gen2 API.

        The file is created, its chunks are appended through ``chunk_thread_pool``,
        and, unless a single chunk sufficed, the file is flushed at its final size.

        Raises:
            MlflowException: If any step fails; the original error is chained as the
                cause.
        """
        try:
            headers = self._extract_headers_from_credentials(credentials.headers)
            # try to create the file
            self._retryable_adls_function(
                func=put_adls_file_creation,
                artifact_file_path=artifact_file_path,
                sas_url=credentials.signed_uri,
                headers=headers,
            )
            # next try to append the file
            futures = {}
            file_size = os.path.getsize(src_file_path)
            # Read the chunk size once so every chunk uses the same value.
            chunk_size = MLFLOW_MULTIPART_UPLOAD_CHUNK_SIZE.get()
            num_chunks = _compute_num_chunks(src_file_path, chunk_size)
            use_single_part_upload = num_chunks == 1
            for index in range(num_chunks):
                start_byte = index * chunk_size
                future = self.chunk_thread_pool.submit(
                    self._retryable_adls_function,
                    func=patch_adls_file_upload,
                    artifact_file_path=artifact_file_path,
                    sas_url=credentials.signed_uri,
                    local_file=src_file_path,
                    start_byte=start_byte,
                    size=chunk_size,
                    position=start_byte,
                    headers=headers,
                    is_single=use_single_part_upload,
                )
                futures[future] = index

            _, errors = _complete_futures(futures, src_file_path)
            if errors:
                raise MlflowException(
                    f"Failed to upload at least one part of {artifact_file_path}. Errors: {errors}"
                )

            # finally try to flush the file
            if not use_single_part_upload:
                self._retryable_adls_function(
                    func=patch_adls_flush,
                    artifact_file_path=artifact_file_path,
                    sas_url=credentials.signed_uri,
                    position=file_size,
                    headers=headers,
                )
        except Exception as err:
            raise MlflowException(err) from err

    def _get_presigned_uri(self, artifact_file_path):
        """
        Gets the presigned URL required to upload a file to or download a file from a given Azure
        storage location.

        Args:
            artifact_file_path: Path of the file relative to the artifact repository root.

        Returns:
            a string presigned URL.
        """
        # Prefer the credential's own signature when it has one; otherwise use the
        # SAS token taken from the environment (possibly empty).
        sas_token = (
            f"?{self.credential.signature}"
            if hasattr(self.credential, "signature")
            else self.sas_token
        )
        return (
            f"https://{self.account_name}.{self.domain_suffix}/{self.container}/"
            f"{self.base_data_lake_directory}/{artifact_file_path}{sas_token}"
        )

    def _get_write_credential_infos(self, remote_file_paths) -> list[ArtifactCredentialInfo]:
        """Return one ``ArtifactCredentialInfo`` with a presigned URI per path."""
        return [
            ArtifactCredentialInfo(signed_uri=self._get_presigned_uri(path))
            for path in remote_file_paths
        ]

    def _get_read_credential_infos(self, remote_file_paths) -> list[ArtifactCredentialInfo]:
        """Return one ``ArtifactCredentialInfo`` with a presigned URI per path."""
        return [
            ArtifactCredentialInfo(signed_uri=self._get_presigned_uri(path))
            for path in remote_file_paths
        ]
|