PyPI - snowflake-ml-python - Versions diffs - 1.1.2__py3-none-any.whl → 1.2.1__py3-none-any.whl - Mend

snowflake-ml-python: 1.1.2 (py3-none-any.whl) → 1.2.1 (py3-none-any.whl)

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (215)

snowflake/ml/{model/_deploy_client/utils → _internal/container_services/image_registry}/imagelib.py +3 -1
snowflake/ml/{model/_deploy_client/utils/image_registry_client.py → _internal/container_services/image_registry/registry_client.py} +4 -2
snowflake/ml/_internal/env_utils.py +31 -52
snowflake/ml/_internal/file_utils.py +17 -0
snowflake/ml/_internal/telemetry.py +19 -0
snowflake/ml/_internal/utils/query_result_checker.py +8 -5
snowflake/ml/_internal/utils/snowflake_env.py +95 -0
snowflake/ml/fileset/parquet_parser.py +31 -1
snowflake/ml/model/__init__.py +6 -0
snowflake/ml/model/_client/model/model_impl.py +172 -13
snowflake/ml/model/_client/model/model_version_impl.py +96 -52
snowflake/ml/model/_client/ops/metadata_ops.py +1 -3
snowflake/ml/model/_client/ops/model_ops.py +155 -9
snowflake/ml/model/_client/sql/model.py +55 -10
snowflake/ml/model/_client/sql/model_version.py +72 -61
snowflake/ml/model/_client/sql/stage.py +10 -4
snowflake/ml/model/_client/sql/tag.py +118 -0
snowflake/ml/model/_deploy_client/image_builds/client_image_builder.py +2 -2
snowflake/ml/model/_deploy_client/image_builds/docker_context.py +8 -8
snowflake/ml/model/_deploy_client/image_builds/inference_server/main.py +4 -6
snowflake/ml/model/_deploy_client/image_builds/server_image_builder.py +6 -7
snowflake/ml/model/_deploy_client/snowservice/deploy.py +4 -5
snowflake/ml/model/_deploy_client/snowservice/instance_types.py +9 -1
snowflake/ml/model/_deploy_client/warehouse/deploy.py +20 -11
snowflake/ml/model/_model_composer/model_manifest/model_manifest.py +45 -1
snowflake/ml/model/_model_composer/model_manifest/model_manifest_schema.py +30 -0
snowflake/ml/model/_model_composer/model_method/function_generator.py +2 -1
snowflake/ml/model/_model_composer/model_runtime/_runtime_requirements.py +10 -1
snowflake/ml/model/_model_composer/model_runtime/model_runtime.py +10 -7
snowflake/ml/model/_packager/model_handlers/huggingface_pipeline.py +1 -1
snowflake/ml/model/_packager/model_handlers/xgboost.py +13 -2
snowflake/ml/model/_packager/model_meta/_core_requirements.py +11 -1
snowflake/ml/model/_packager/model_meta/_packaging_requirements.py +3 -0
snowflake/ml/model/_packager/model_meta/model_meta.py +17 -3
snowflake/ml/model/_signatures/core.py +20 -17
snowflake/ml/model/custom_model.py +30 -27
snowflake/ml/model/model_signature.py +16 -17
snowflake/ml/model/type_hints.py +3 -0
snowflake/ml/modeling/_internal/distributed_hpo_trainer.py +185 -98
snowflake/ml/modeling/_internal/estimator_utils.py +21 -0
snowflake/ml/modeling/_internal/model_specifications.py +3 -10
snowflake/ml/modeling/_internal/model_trainer_builder.py +55 -11
snowflake/ml/modeling/_internal/snowpark_handlers.py +9 -6
snowflake/ml/modeling/_internal/snowpark_trainer.py +10 -2
snowflake/ml/modeling/_internal/xgboost_external_memory_trainer.py +444 -0
snowflake/ml/modeling/calibration/calibrated_classifier_cv.py +51 -16
snowflake/ml/modeling/cluster/affinity_propagation.py +51 -16
snowflake/ml/modeling/cluster/agglomerative_clustering.py +51 -16
snowflake/ml/modeling/cluster/birch.py +51 -16
snowflake/ml/modeling/cluster/bisecting_k_means.py +51 -16
snowflake/ml/modeling/cluster/dbscan.py +51 -16
snowflake/ml/modeling/cluster/feature_agglomeration.py +51 -16
snowflake/ml/modeling/cluster/k_means.py +51 -16
snowflake/ml/modeling/cluster/mean_shift.py +51 -16
snowflake/ml/modeling/cluster/mini_batch_k_means.py +51 -16
snowflake/ml/modeling/cluster/optics.py +51 -16
snowflake/ml/modeling/cluster/spectral_biclustering.py +51 -16
snowflake/ml/modeling/cluster/spectral_clustering.py +51 -16
snowflake/ml/modeling/cluster/spectral_coclustering.py +51 -16
snowflake/ml/modeling/compose/column_transformer.py +51 -16
snowflake/ml/modeling/compose/transformed_target_regressor.py +51 -16
snowflake/ml/modeling/covariance/elliptic_envelope.py +51 -16
snowflake/ml/modeling/covariance/empirical_covariance.py +51 -16
snowflake/ml/modeling/covariance/graphical_lasso.py +51 -16
snowflake/ml/modeling/covariance/graphical_lasso_cv.py +51 -16
snowflake/ml/modeling/covariance/ledoit_wolf.py +51 -16
snowflake/ml/modeling/covariance/min_cov_det.py +51 -16
snowflake/ml/modeling/covariance/oas.py +51 -16
snowflake/ml/modeling/covariance/shrunk_covariance.py +51 -16
snowflake/ml/modeling/decomposition/dictionary_learning.py +51 -16
snowflake/ml/modeling/decomposition/factor_analysis.py +51 -16
snowflake/ml/modeling/decomposition/fast_ica.py +51 -16
snowflake/ml/modeling/decomposition/incremental_pca.py +51 -16
snowflake/ml/modeling/decomposition/kernel_pca.py +51 -16
snowflake/ml/modeling/decomposition/mini_batch_dictionary_learning.py +51 -16
snowflake/ml/modeling/decomposition/mini_batch_sparse_pca.py +51 -16
snowflake/ml/modeling/decomposition/pca.py +51 -16
snowflake/ml/modeling/decomposition/sparse_pca.py +51 -16
snowflake/ml/modeling/decomposition/truncated_svd.py +51 -16
snowflake/ml/modeling/discriminant_analysis/linear_discriminant_analysis.py +51 -16
snowflake/ml/modeling/discriminant_analysis/quadratic_discriminant_analysis.py +51 -16
snowflake/ml/modeling/ensemble/ada_boost_classifier.py +51 -16
snowflake/ml/modeling/ensemble/ada_boost_regressor.py +51 -16
snowflake/ml/modeling/ensemble/bagging_classifier.py +51 -16
snowflake/ml/modeling/ensemble/bagging_regressor.py +51 -16
snowflake/ml/modeling/ensemble/extra_trees_classifier.py +51 -16
snowflake/ml/modeling/ensemble/extra_trees_regressor.py +51 -16
snowflake/ml/modeling/ensemble/gradient_boosting_classifier.py +51 -16
snowflake/ml/modeling/ensemble/gradient_boosting_regressor.py +51 -16
snowflake/ml/modeling/ensemble/hist_gradient_boosting_classifier.py +51 -16
snowflake/ml/modeling/ensemble/hist_gradient_boosting_regressor.py +51 -16
snowflake/ml/modeling/ensemble/isolation_forest.py +51 -16
snowflake/ml/modeling/ensemble/random_forest_classifier.py +51 -16
snowflake/ml/modeling/ensemble/random_forest_regressor.py +51 -16
snowflake/ml/modeling/ensemble/stacking_regressor.py +51 -16
snowflake/ml/modeling/ensemble/voting_classifier.py +51 -16
snowflake/ml/modeling/ensemble/voting_regressor.py +51 -16
snowflake/ml/modeling/feature_selection/generic_univariate_select.py +51 -16
snowflake/ml/modeling/feature_selection/select_fdr.py +51 -16
snowflake/ml/modeling/feature_selection/select_fpr.py +51 -16
snowflake/ml/modeling/feature_selection/select_fwe.py +51 -16
snowflake/ml/modeling/feature_selection/select_k_best.py +51 -16
snowflake/ml/modeling/feature_selection/select_percentile.py +51 -16
snowflake/ml/modeling/feature_selection/sequential_feature_selector.py +51 -16
snowflake/ml/modeling/feature_selection/variance_threshold.py +51 -16
snowflake/ml/modeling/gaussian_process/gaussian_process_classifier.py +51 -16
snowflake/ml/modeling/gaussian_process/gaussian_process_regressor.py +51 -16
snowflake/ml/modeling/impute/iterative_imputer.py +51 -16
snowflake/ml/modeling/impute/knn_imputer.py +51 -16
snowflake/ml/modeling/impute/missing_indicator.py +51 -16
snowflake/ml/modeling/kernel_approximation/additive_chi2_sampler.py +51 -16
snowflake/ml/modeling/kernel_approximation/nystroem.py +51 -16
snowflake/ml/modeling/kernel_approximation/polynomial_count_sketch.py +51 -16
snowflake/ml/modeling/kernel_approximation/rbf_sampler.py +51 -16
snowflake/ml/modeling/kernel_approximation/skewed_chi2_sampler.py +51 -16
snowflake/ml/modeling/kernel_ridge/kernel_ridge.py +51 -16
snowflake/ml/modeling/lightgbm/lgbm_classifier.py +51 -16
snowflake/ml/modeling/lightgbm/lgbm_regressor.py +51 -16
snowflake/ml/modeling/linear_model/ard_regression.py +51 -16
snowflake/ml/modeling/linear_model/bayesian_ridge.py +51 -16
snowflake/ml/modeling/linear_model/elastic_net.py +51 -16
snowflake/ml/modeling/linear_model/elastic_net_cv.py +51 -16
snowflake/ml/modeling/linear_model/gamma_regressor.py +51 -16
snowflake/ml/modeling/linear_model/huber_regressor.py +51 -16
snowflake/ml/modeling/linear_model/lars.py +51 -16
snowflake/ml/modeling/linear_model/lars_cv.py +51 -16
snowflake/ml/modeling/linear_model/lasso.py +51 -16
snowflake/ml/modeling/linear_model/lasso_cv.py +51 -16
snowflake/ml/modeling/linear_model/lasso_lars.py +51 -16
snowflake/ml/modeling/linear_model/lasso_lars_cv.py +51 -16
snowflake/ml/modeling/linear_model/lasso_lars_ic.py +51 -16
snowflake/ml/modeling/linear_model/linear_regression.py +51 -16
snowflake/ml/modeling/linear_model/logistic_regression.py +51 -16
snowflake/ml/modeling/linear_model/logistic_regression_cv.py +51 -16
snowflake/ml/modeling/linear_model/multi_task_elastic_net.py +51 -16
snowflake/ml/modeling/linear_model/multi_task_elastic_net_cv.py +51 -16
snowflake/ml/modeling/linear_model/multi_task_lasso.py +51 -16
snowflake/ml/modeling/linear_model/multi_task_lasso_cv.py +51 -16
snowflake/ml/modeling/linear_model/orthogonal_matching_pursuit.py +51 -16
snowflake/ml/modeling/linear_model/passive_aggressive_classifier.py +51 -16
snowflake/ml/modeling/linear_model/passive_aggressive_regressor.py +51 -16
snowflake/ml/modeling/linear_model/perceptron.py +51 -16
snowflake/ml/modeling/linear_model/poisson_regressor.py +51 -16
snowflake/ml/modeling/linear_model/ransac_regressor.py +51 -16
snowflake/ml/modeling/linear_model/ridge.py +51 -16
snowflake/ml/modeling/linear_model/ridge_classifier.py +51 -16
snowflake/ml/modeling/linear_model/ridge_classifier_cv.py +51 -16
snowflake/ml/modeling/linear_model/ridge_cv.py +51 -16
snowflake/ml/modeling/linear_model/sgd_classifier.py +51 -16
snowflake/ml/modeling/linear_model/sgd_one_class_svm.py +51 -16
snowflake/ml/modeling/linear_model/sgd_regressor.py +51 -16
snowflake/ml/modeling/linear_model/theil_sen_regressor.py +51 -16
snowflake/ml/modeling/linear_model/tweedie_regressor.py +51 -16
snowflake/ml/modeling/manifold/isomap.py +51 -16
snowflake/ml/modeling/manifold/mds.py +51 -16
snowflake/ml/modeling/manifold/spectral_embedding.py +51 -16
snowflake/ml/modeling/manifold/tsne.py +51 -16
snowflake/ml/modeling/metrics/classification.py +5 -6
snowflake/ml/modeling/metrics/metrics_utils.py +5 -3
snowflake/ml/modeling/metrics/ranking.py +7 -3
snowflake/ml/modeling/metrics/regression.py +6 -3
snowflake/ml/modeling/mixture/bayesian_gaussian_mixture.py +51 -16
snowflake/ml/modeling/mixture/gaussian_mixture.py +51 -16
snowflake/ml/modeling/multiclass/one_vs_one_classifier.py +51 -16
snowflake/ml/modeling/multiclass/one_vs_rest_classifier.py +51 -16
snowflake/ml/modeling/multiclass/output_code_classifier.py +51 -16
snowflake/ml/modeling/naive_bayes/bernoulli_nb.py +51 -16
snowflake/ml/modeling/naive_bayes/categorical_nb.py +51 -16
snowflake/ml/modeling/naive_bayes/complement_nb.py +51 -16
snowflake/ml/modeling/naive_bayes/gaussian_nb.py +51 -16
snowflake/ml/modeling/naive_bayes/multinomial_nb.py +51 -16
snowflake/ml/modeling/neighbors/k_neighbors_classifier.py +51 -16
snowflake/ml/modeling/neighbors/k_neighbors_regressor.py +51 -16
snowflake/ml/modeling/neighbors/kernel_density.py +51 -16
snowflake/ml/modeling/neighbors/local_outlier_factor.py +51 -16
snowflake/ml/modeling/neighbors/nearest_centroid.py +51 -16
snowflake/ml/modeling/neighbors/nearest_neighbors.py +51 -16
snowflake/ml/modeling/neighbors/neighborhood_components_analysis.py +51 -16
snowflake/ml/modeling/neighbors/radius_neighbors_classifier.py +51 -16
snowflake/ml/modeling/neighbors/radius_neighbors_regressor.py +51 -16
snowflake/ml/modeling/neural_network/bernoulli_rbm.py +51 -16
snowflake/ml/modeling/neural_network/mlp_classifier.py +51 -16
snowflake/ml/modeling/neural_network/mlp_regressor.py +51 -16
snowflake/ml/modeling/preprocessing/min_max_scaler.py +15 -1
snowflake/ml/modeling/preprocessing/polynomial_features.py +51 -16
snowflake/ml/modeling/semi_supervised/label_propagation.py +51 -16
snowflake/ml/modeling/semi_supervised/label_spreading.py +51 -16
snowflake/ml/modeling/svm/linear_svc.py +51 -16
snowflake/ml/modeling/svm/linear_svr.py +51 -16
snowflake/ml/modeling/svm/nu_svc.py +51 -16
snowflake/ml/modeling/svm/nu_svr.py +51 -16
snowflake/ml/modeling/svm/svc.py +51 -16
snowflake/ml/modeling/svm/svr.py +51 -16
snowflake/ml/modeling/tree/decision_tree_classifier.py +51 -16
snowflake/ml/modeling/tree/decision_tree_regressor.py +51 -16
snowflake/ml/modeling/tree/extra_tree_classifier.py +51 -16
snowflake/ml/modeling/tree/extra_tree_regressor.py +51 -16
snowflake/ml/modeling/xgboost/xgb_classifier.py +69 -16
snowflake/ml/modeling/xgboost/xgb_regressor.py +69 -16
snowflake/ml/modeling/xgboost/xgbrf_classifier.py +69 -16
snowflake/ml/modeling/xgboost/xgbrf_regressor.py +69 -16
snowflake/ml/registry/__init__.py +3 -0
snowflake/ml/registry/_manager/model_manager.py +163 -0
snowflake/ml/registry/model_registry.py +12 -0
snowflake/ml/registry/registry.py +100 -90
snowflake/ml/version.py +1 -1
snowflake_ml_python-1.2.1.dist-info/LICENSE.txt +202 -0
{snowflake_ml_python-1.1.2.dist-info → snowflake_ml_python-1.2.1.dist-info}/METADATA +295 -60
snowflake_ml_python-1.2.1.dist-info/RECORD +355 -0
{snowflake_ml_python-1.1.2.dist-info → snowflake_ml_python-1.2.1.dist-info}/WHEEL +2 -1
snowflake_ml_python-1.2.1.dist-info/top_level.txt +1 -0
snowflake/ml/model/_client/model/model_method_info.py +0 -19
snowflake_ml_python-1.1.2.dist-info/RECORD +0 -347
/snowflake/ml/_internal/{utils/spcs_image_registry.py → container_services/image_registry/credential.py} +0 -0
/snowflake/ml/_internal/{utils/image_registry_http_client.py → container_services/image_registry/http_client.py} +0 -0

snowflake/ml/{model/_deploy_client/utils → _internal/container_services/image_registry}/imagelib.py RENAMED Viewed

@@ -23,7 +23,9 @@ from typing import Dict, List, Optional, Tuple
 import requests
-from snowflake.ml._internal.utils import image_registry_http_client
+from snowflake.ml._internal.container_services.image_registry import (
+    http_client as image_registry_http_client,
+)
 # Common HTTP headers
 _CONTENT_LENGTH_HEADER = "content-length"

snowflake/ml/{model/_deploy_client/utils/image_registry_client.py → _internal/container_services/image_registry/registry_client.py} RENAMED Viewed

@@ -3,12 +3,14 @@ import logging
 from typing import Dict, Optional, cast
 from urllib.parse import urlunparse
+from snowflake.ml._internal.container_services.image_registry import (
+    http_client as image_registry_http_client,
+    imagelib,
+)
 from snowflake.ml._internal.exceptions import (
     error_codes,
     exceptions as snowml_exceptions,
 )
-from snowflake.ml._internal.utils import image_registry_http_client
-from snowflake.ml.model._deploy_client.utils import imagelib
 from snowflake.snowpark import Session
 from snowflake.snowpark._internal import utils as snowpark_utils

snowflake/ml/_internal/env_utils.py CHANGED Viewed

@@ -33,7 +33,6 @@ class CONDA_OS(Enum):
 _SNOWFLAKE_CONDA_CHANNEL_URL = "https://repo.anaconda.com/pkgs/snowflake"
 _NODEFAULTS = "nodefaults"
-_INFO_SCHEMA_PACKAGES_HAS_RUNTIME_VERSION: Optional[bool] = None
 _SNOWFLAKE_INFO_SCHEMA_PACKAGE_CACHE: Dict[str, List[version.Version]] = {}
 _SNOWFLAKE_CONDA_PACKAGE_CACHE: Dict[str, List[version.Version]] = {}
@@ -267,18 +266,6 @@ def relax_requirement_version(req: requirements.Requirement) -> requirements.Req
     return new_req
-def _check_runtime_version_column_existence(session: session.Session) -> bool:
-    sql = textwrap.dedent(
-        """
-        SHOW COLUMNS
-        LIKE 'runtime_version'
-        IN TABLE information_schema.packages;
-        """
-    )
-    result = session.sql(sql).count()
-    return result == 1
 def get_matched_package_versions_in_snowflake_conda_channel(
     req: requirements.Requirement,
     python_version: str = snowml_env.PYTHON_VERSION,
@@ -325,9 +312,9 @@ def get_matched_package_versions_in_snowflake_conda_channel(
     return matched_versions
-def validate_requirements_in_information_schema(
+def get_matched_package_versions_in_information_schema(
     session: session.Session, reqs: List[requirements.Requirement], python_version: str
-) -> Optional[List[str]]:
+) -> Dict[str, List[version.Version]]:
     """Look up the information_schema table to check if a package with the specified specifier exists in the Snowflake
     Conda channel. Note that this is not the source of truth due to the potential delay caused by a package that might
     exist in the information_schema table but has not yet become available in the Snowflake Conda channel.
@@ -338,42 +325,35 @@ def validate_requirements_in_information_schema(
         python_version: A string of python version where model is run.
     Returns:
-        A list of pinned latest version that available in Snowflake anaconda channel and meet the version specifier.
+        A Dict, whose key is the package name, and value is a list of versions match the requirements.
     """
-    global _INFO_SCHEMA_PACKAGES_HAS_RUNTIME_VERSION
-    if _INFO_SCHEMA_PACKAGES_HAS_RUNTIME_VERSION is None:
-        _INFO_SCHEMA_PACKAGES_HAS_RUNTIME_VERSION = _check_runtime_version_column_existence(session)
-    ret_list = []
-    reqs_to_request = []
+    ret_dict: Dict[str, List[version.Version]] = {}
+    reqs_to_request: List[requirements.Requirement] = []
     for req in reqs:
-        if req.name not in _SNOWFLAKE_INFO_SCHEMA_PACKAGE_CACHE:
+        if req.name in _SNOWFLAKE_INFO_SCHEMA_PACKAGE_CACHE:
+            available_versions = list(
+                sorted(req.specifier.filter(set(_SNOWFLAKE_INFO_SCHEMA_PACKAGE_CACHE.get(req.name, []))))
+            )
+            ret_dict[req.name] = available_versions
+        else:
             reqs_to_request.append(req)
     if reqs_to_request:
         pkg_names_str = " OR ".join(
             f"package_name = '{req_name}'" for req_name in sorted(req.name for req in reqs_to_request)
         )
-        if _INFO_SCHEMA_PACKAGES_HAS_RUNTIME_VERSION:
-            parsed_python_version = version.Version(python_version)
-            sql = textwrap.dedent(
-                f"""
-                SELECT PACKAGE_NAME, VERSION
-                FROM information_schema.packages
-                WHERE ({pkg_names_str})
-                AND language = 'python'
-                AND (runtime_version = '{parsed_python_version.major}.{parsed_python_version.minor}'
-                    OR runtime_version is null);
-                """
-            )
-        else:
-            sql = textwrap.dedent(
-                f"""
-                SELECT PACKAGE_NAME, VERSION
-                FROM information_schema.packages
-                WHERE ({pkg_names_str})
-                AND language = 'python';
-                """
-            )
+        parsed_python_version = version.Version(python_version)
+        sql = textwrap.dedent(
+            f"""
+            SELECT PACKAGE_NAME, VERSION
+            FROM information_schema.packages
+            WHERE ({pkg_names_str})
+            AND language = 'python'
+            AND (runtime_version = '{parsed_python_version.major}.{parsed_python_version.minor}'
+                OR runtime_version is null);
+            """
+        )
         try:
             result = (
@@ -392,14 +372,13 @@ def validate_requirements_in_information_schema(
                 cached_req_ver_list.append(req_ver)
                 _SNOWFLAKE_INFO_SCHEMA_PACKAGE_CACHE[req_name] = cached_req_ver_list
         except snowflake.connector.DataError:
-            return None
-    for req in reqs:
-        available_versions = list(req.specifier.filter(set(_SNOWFLAKE_INFO_SCHEMA_PACKAGE_CACHE.get(req.name, []))))
-        if not available_versions:
-            return None
-        else:
-            ret_list.append(str(req))
-    return sorted(ret_list)
+            return ret_dict
+    for req in reqs_to_request:
+        available_versions = list(
+            sorted(req.specifier.filter(set(_SNOWFLAKE_INFO_SCHEMA_PACKAGE_CACHE.get(req.name, []))))
+        )
+        ret_dict[req.name] = available_versions
+    return ret_dict
 def save_conda_env_file(

snowflake/ml/_internal/file_utils.py CHANGED Viewed

@@ -362,3 +362,20 @@ def download_directory_from_stage(
             wait_exponential_multiplier=100,
             wait_exponential_max=10000,
         )(file_operation.get)(str(stage_file_path), str(local_file_dir), statement_params=statement_params)
+def open_file(path: str, *args: Any, **kwargs: Any) -> Any:
+    """This function is a wrapper on top of the Python built-in "open" function, with a few added default values
+    to ensure successful execution across different platforms.
+    Args:
+        path: file path
+        *args: arguments.
+        **kwargs: key arguments.
+    Returns:
+        Open file and return a stream.
+    """
+    kwargs.setdefault("newline", "\n")
+    kwargs.setdefault("encoding", "utf-8")
+    return open(path, *args, **kwargs)

snowflake/ml/_internal/telemetry.py CHANGED Viewed

@@ -584,3 +584,22 @@ class _SourceTelemetryClient:
         """Send the telemetry data batch immediately."""
         if self._telemetry:
             self._telemetry.send_batch()
+def get_sproc_statement_params_kwargs(sproc: Callable[..., Any], statement_params: Dict[str, Any]) -> Dict[str, Any]:
+    """
+    Get statement_params keyword argument for sproc call.
+    Args:
+        sproc: sproc function
+        statement_params: dictionary to be passed as statement params, if possible
+    Returns:
+        Keyword arguments dict
+    """
+    sproc_argspec = inspect.getfullargspec(sproc)
+    kwargs = {}
+    if "statement_params" in sproc_argspec.args:
+        kwargs["statement_params"] = statement_params
+    return kwargs

snowflake/ml/_internal/utils/query_result_checker.py CHANGED Viewed

@@ -60,9 +60,13 @@ def result_dimension_matcher(
     return True
-def column_name_matcher(expected_col_name: str, result: list[snowpark.Row], sql: str | None = None) -> bool:
+def column_name_matcher(
+    expected_col_name: str, allow_empty: bool, result: list[snowpark.Row], sql: str | None = None
+) -> bool:
     """Returns true if `expected_col_name` is found. Raise exception otherwise."""
     if not result:
+        if allow_empty:
+            return True
         raise connector.DataError(f"Query Result is empty.{_query_log(sql)}")
     if expected_col_name not in result[0]:
         raise connector.DataError(
@@ -159,16 +163,17 @@ class ResultValidator:
         self._success_matchers.append(partial(result_dimension_matcher, expected_rows, expected_cols))
         return self
-    def has_column(self, expected_col_name: str) -> ResultValidator:
+    def has_column(self, expected_col_name: str, allow_empty: bool = False) -> ResultValidator:
         """Validate that the a column with the name `expected_column_name` exists in the result.
         Args:
             expected_col_name: Name of the column that is expected to be present in the result (case sensitive).
+            allow_empty: If the check will fail if the result is empty.
         Returns:
             ResultValidator object (self)
         """
-        self._success_matchers.append(partial(column_name_matcher, expected_col_name))
+        self._success_matchers.append(partial(column_name_matcher, expected_col_name, allow_empty))
         return self
     def has_named_value_match(self, row_idx: int, col_name: str, expected_value: Any) -> ResultValidator:
@@ -224,8 +229,6 @@ class ResultValidator:
         Returns:
             Query result.
         """
-        if len(self._success_matchers) == 0:
-            self._success_matchers = _DEFAULT_MATCHERS
         result = self._get_result()
         for matcher in self._success_matchers:
             assert matcher(result, self._query)

snowflake/ml/_internal/utils/snowflake_env.py ADDED Viewed

@@ -0,0 +1,95 @@
+import enum
+from typing import Any, Dict, Optional, TypedDict, cast
+from packaging import version
+from typing_extensions import Required
+from snowflake.ml._internal.utils import query_result_checker
+from snowflake.snowpark import session
+def get_current_snowflake_version(
+    sess: session.Session, *, statement_params: Optional[Dict[str, Any]] = None
+) -> version.Version:
+    """Get Snowflake Version as a version.Version object follow PEP way of versioning, that is to say:
+        "7.44.2 b202312132139364eb71238" to <Version('7.44.2+b202312132139364eb71238')>
+    Args:
+        sess: Snowpark Session.
+        statement_params: Statement params. Defaults to None.
+    Returns:
+        The version of Snowflake Version.
+    """
+    res = (
+        query_result_checker.SqlResultValidator(
+            sess, "SELECT CURRENT_VERSION() AS CURRENT_VERSION", statement_params=statement_params
+        )
+        .has_dimensions(expected_rows=1, expected_cols=1)
+        .validate()[0]
+    )
+    version_str = res.CURRENT_VERSION
+    assert isinstance(version_str, str)
+    version_str = "+".join(version_str.split())
+    return version.parse(version_str)
+class SnowflakeCloudType(enum.Enum):
+    AWS = "aws"
+    AZURE = "azure"
+    GCP = "gcp"
+    @classmethod
+    def from_value(cls, value: str) -> "SnowflakeCloudType":
+        assert value
+        for k in cls:
+            if k.value == value.lower():
+                return k
+        else:
+            raise ValueError(f"'{cls.__name__}' enum not found for '{value}'")
+class SnowflakeRegion(TypedDict):
+    region_group: Required[str]
+    snowflake_region: Required[str]
+    cloud: Required[SnowflakeCloudType]
+    region: Required[str]
+    display_name: Required[str]
+def get_regions(
+    sess: session.Session, *, statement_params: Optional[Dict[str, Any]] = None
+) -> Dict[str, SnowflakeRegion]:
+    res = (
+        query_result_checker.SqlResultValidator(sess, "SHOW REGIONS", statement_params=statement_params)
+        .has_column("region_group")
+        .has_column("snowflake_region")
+        .has_column("cloud")
+        .has_column("region")
+        .has_column("display_name")
+        .validate()
+    )
+    return {
+        f"{r.region_group}.{r.snowflake_region}": SnowflakeRegion(
+            region_group=r.region_group,
+            snowflake_region=r.snowflake_region,
+            cloud=SnowflakeCloudType.from_value(r.cloud),
+            region=r.region,
+            display_name=r.display_name,
+        )
+        for r in res
+    }
+def get_current_region_id(sess: session.Session, *, statement_params: Optional[Dict[str, Any]] = None) -> str:
+    res = (
+        query_result_checker.SqlResultValidator(
+            sess, "SELECT CURRENT_REGION() AS CURRENT_REGION", statement_params=statement_params
+        )
+        .has_dimensions(expected_rows=1, expected_cols=1)
+        .validate()[0]
+    )
+    return cast(str, res.CURRENT_REGION)

snowflake/ml/fileset/parquet_parser.py CHANGED Viewed

@@ -1,4 +1,6 @@
 import collections
+import logging
+import time
 from typing import Any, Deque, Dict, Iterator, List
 import fsspec
@@ -83,7 +85,7 @@ class ParquetParser:
             np.random.shuffle(files)
         pa_dataset: ds.Dataset = ds.dataset(files, format="parquet", filesystem=self._fs)
-        for rb in pa_dataset.to_batches(batch_size=self._dataset_batch_size):
+        for rb in _retryable_batches(pa_dataset, batch_size=self._dataset_batch_size):
             if self._shuffle:
                 rb = rb.take(np.random.permutation(rb.num_rows))
             self._rb_buffer.append(rb)
@@ -138,3 +140,31 @@ def _record_batch_to_arrays(rb: pa.RecordBatch) -> Dict[str, npt.NDArray[Any]]:
         array = column.to_numpy(zero_copy_only=False)
         batch_dict[column_schema.name] = array
     return batch_dict
+def _retryable_batches(
+    dataset: ds.Dataset, batch_size: int, max_retries: int = 3, delay: int = 0
+) -> Iterator[pa.RecordBatch]:
+    """Make the Dataset to_batches retryable."""
+    retries = 0
+    current_batch_index = 0
+    while True:
+        try:
+            for batch_index, batch in enumerate(dataset.to_batches(batch_size=batch_size)):
+                if batch_index < current_batch_index:
+                    # Skip batches that have already been processed
+                    continue
+                yield batch
+                current_batch_index = batch_index + 1
+            # Exit the loop once all batches are processed
+            break
+        except Exception as e:
+            if retries < max_retries:
+                retries += 1
+                logging.info(f"Error encountered: {e}. Retrying {retries}/{max_retries}...")
+                time.sleep(delay)
+            else:
+                raise e

snowflake/ml/model/__init__.py ADDED Viewed

@@ -0,0 +1,6 @@
+from snowflake.ml.model._client.model.model_impl import Model
+from snowflake.ml.model._client.model.model_version_impl import ModelVersion
+from snowflake.ml.model.models.huggingface_pipeline import HuggingFacePipelineModel
+from snowflake.ml.model.models.llm import LLM, LLMOptions
+__all__ = ["Model", "ModelVersion", "HuggingFacePipelineModel", "LLM", "LLMOptions"]

snowflake/ml/model/_client/model/model_impl.py CHANGED Viewed

@@ -1,7 +1,9 @@
-from typing import List, Union
+from typing import Dict, List, Optional, Tuple, Union
+import pandas as pd
 from snowflake.ml._internal import telemetry
-from snowflake.ml._internal.utils import sql_identifier
+from snowflake.ml._internal.utils import identifier, sql_identifier
 from snowflake.ml.model._client.model import model_version_impl
 from snowflake.ml.model._client.ops import model_ops
@@ -37,10 +39,12 @@ class Model:
     @property
     def name(self) -> str:
+        """Return the name of the model that can be used to refer to it in SQL."""
         return self._model_name.identifier()
     @property
     def fully_qualified_name(self) -> str:
+        """Return the fully qualified name of the model that can be used to refer to it in SQL."""
         return self._model_ops._model_version_client.fully_qualified_model_name(self._model_name)
     @property
@@ -49,6 +53,24 @@ class Model:
         subproject=_TELEMETRY_SUBPROJECT,
     )
     def description(self) -> str:
+        """The description for the model. This is an alias of `comment`."""
+        return self.comment
+    @description.setter
+    @telemetry.send_api_usage_telemetry(
+        project=_TELEMETRY_PROJECT,
+        subproject=_TELEMETRY_SUBPROJECT,
+    )
+    def description(self, description: str) -> None:
+        self.comment = description
+    @property
+    @telemetry.send_api_usage_telemetry(
+        project=_TELEMETRY_PROJECT,
+        subproject=_TELEMETRY_SUBPROJECT,
+    )
+    def comment(self) -> str:
+        """The comment to the model."""
         statement_params = telemetry.get_statement_params(
             project=_TELEMETRY_PROJECT,
             subproject=_TELEMETRY_SUBPROJECT,
@@ -58,18 +80,18 @@ class Model:
             statement_params=statement_params,
         )
-    @description.setter
+    @comment.setter
     @telemetry.send_api_usage_telemetry(
         project=_TELEMETRY_PROJECT,
         subproject=_TELEMETRY_SUBPROJECT,
     )
-    def description(self, description: str) -> None:
+    def comment(self, comment: str) -> None:
         statement_params = telemetry.get_statement_params(
             project=_TELEMETRY_PROJECT,
             subproject=_TELEMETRY_SUBPROJECT,
         )
         return self._model_ops.set_comment(
-            comment=description,
+            comment=comment,
             model_name=self._model_name,
             statement_params=statement_params,
         )
@@ -80,12 +102,13 @@ class Model:
         subproject=_TELEMETRY_SUBPROJECT,
     )
     def default(self) -> model_version_impl.ModelVersion:
+        """The default version of the model."""
         statement_params = telemetry.get_statement_params(
             project=_TELEMETRY_PROJECT,
             subproject=_TELEMETRY_SUBPROJECT,
             class_name=self.__class__.__name__,
         )
-        default_version_name = self._model_ops._model_version_client.get_default_version(
+        default_version_name = self._model_ops.get_default_version(
             model_name=self._model_name, statement_params=statement_params
         )
         return self.version(default_version_name)
@@ -105,7 +128,7 @@ class Model:
             version_name = sql_identifier.SqlIdentifier(version)
         else:
             version_name = version._version_name
-        self._model_ops._model_version_client.set_default_version(
+        self._model_ops.set_default_version(
             model_name=self._model_name, version_name=version_name, statement_params=statement_params
         )
@@ -114,13 +137,14 @@ class Model:
         subproject=_TELEMETRY_SUBPROJECT,
     )
     def version(self, version_name: str) -> model_version_impl.ModelVersion:
-        """Get a model version object given a version name in the model.
+        """
+        Get a model version object given a version name in the model.
         Args:
-            version_name: The name of version
+            version_name: The name of the version.
         Raises:
-            ValueError: Raised when the version requested does not exist.
+            ValueError: When the requested version does not exist.
         Returns:
             The model version object.
@@ -149,11 +173,11 @@ class Model:
         project=_TELEMETRY_PROJECT,
         subproject=_TELEMETRY_SUBPROJECT,
     )
-    def list_versions(self) -> List[model_version_impl.ModelVersion]:
-        """List all versions in the model.
+    def versions(self) -> List[model_version_impl.ModelVersion]:
+        """Get all versions in the model.
         Returns:
-            A List of ModelVersion object representing all versions in the model.
+            A list of ModelVersion objects representing all versions in the model.
         """
         statement_params = telemetry.get_statement_params(
             project=_TELEMETRY_PROJECT,
@@ -172,5 +196,140 @@ class Model:
             for version_name in version_names
         ]
+    @telemetry.send_api_usage_telemetry(project=_TELEMETRY_PROJECT, subproject=_TELEMETRY_SUBPROJECT)
+    def show_versions(self) -> pd.DataFrame:
+        """Return a table describing every version of this model.
+        Returns:
+            A Pandas DataFrame built from the rows returned by `show_models_or_versions`, one dictionary per row.
+        """
+        telemetry_params = telemetry.get_statement_params(
+            project=_TELEMETRY_PROJECT, subproject=_TELEMETRY_SUBPROJECT
+        )
+        # Convert each returned row to a plain dictionary before handing the batch to pandas.
+        version_records = [
+            version_row.as_dict()
+            for version_row in self._model_ops.show_models_or_versions(
+                model_name=self._model_name, statement_params=telemetry_params
+            )
+        ]
+        return pd.DataFrame(version_records)
     def delete_version(self, version_name: str) -> None:
+        """Delete a version of the model. Not supported yet: this method always raises.
+        Args:
+            version_name: The name of the version to delete. Currently unused.
+        Raises:
+            NotImplementedError: Always, because deleting a version has not been supported yet.
+        """
         raise NotImplementedError("Deleting version has not been supported yet.")
+    @telemetry.send_api_usage_telemetry(
+        project=_TELEMETRY_PROJECT,
+        subproject=_TELEMETRY_SUBPROJECT,
+    )
+    def show_tags(self) -> Dict[str, str]:
+        """Get a dictionary showing the tags attached to the model and their values.
+        Returns:
+            A dictionary of tags and their values, as returned by `self._model_ops.show_tags` for this model.
+        """
+        statement_params = telemetry.get_statement_params(
+            project=_TELEMETRY_PROJECT,
+            subproject=_TELEMETRY_SUBPROJECT,
+        )
+        return self._model_ops.show_tags(model_name=self._model_name, statement_params=statement_params)
+    def _parse_tag_name(
+        self,
+        tag_name: str,
+    ) -> Tuple[sql_identifier.SqlIdentifier, sql_identifier.SqlIdentifier, sql_identifier.SqlIdentifier]:
+        """Split a tag name into database, schema and tag identifiers.
+        Args:
+            tag_name: The name of the tag, can be fully qualified. A missing database or schema part falls back to
+                the database or schema name held by `self._model_ops._model_client`.
+        Raises:
+            ValueError: When no tag name could be parsed out of `tag_name`.
+        Returns:
+            A tuple of (database identifier, schema identifier, tag identifier).
+        """
+        _tag_db, _tag_schema, _tag_name, _ = identifier.parse_schema_level_object_identifier(tag_name)
+        # Fall back to the model client's database when the tag name does not carry one.
+        if _tag_db is None:
+            tag_db_id = self._model_ops._model_client._database_name
+        else:
+            tag_db_id = sql_identifier.SqlIdentifier(_tag_db)
+        # Same fallback for the schema part.
+        if _tag_schema is None:
+            tag_schema_id = self._model_ops._model_client._schema_name
+        else:
+            tag_schema_id = sql_identifier.SqlIdentifier(_tag_schema)
+        if _tag_name is None:
+            raise ValueError(f"Unable to parse the tag name `{tag_name}` you input.")
+        tag_name_id = sql_identifier.SqlIdentifier(_tag_name)
+        return tag_db_id, tag_schema_id, tag_name_id
+    @telemetry.send_api_usage_telemetry(project=_TELEMETRY_PROJECT, subproject=_TELEMETRY_SUBPROJECT)
+    def get_tag(self, tag_name: str) -> Optional[str]:
+        """Look up the value of a tag attached to the model.
+        Args:
+            tag_name: The name of the tag, can be fully qualified. If not fully qualified, the database or schema of
+                the model will be used.
+        Returns:
+            The tag value as a string if the tag is attached, otherwise None.
+        """
+        telemetry_params = telemetry.get_statement_params(
+            project=_TELEMETRY_PROJECT, subproject=_TELEMETRY_SUBPROJECT
+        )
+        db_id, schema_id, name_id = self._parse_tag_name(tag_name)
+        tag_value = self._model_ops.get_tag_value(
+            model_name=self._model_name,
+            tag_database_name=db_id,
+            tag_schema_name=schema_id,
+            tag_name=name_id,
+            statement_params=telemetry_params,
+        )
+        return tag_value
+    @telemetry.send_api_usage_telemetry(project=_TELEMETRY_PROJECT, subproject=_TELEMETRY_SUBPROJECT)
+    def set_tag(self, tag_name: str, tag_value: str) -> None:
+        """Set the value of a tag on the model, attaching the tag if it is not attached yet.
+        Args:
+            tag_name: The name of the tag, can be fully qualified. If not fully qualified, the database or schema of
+                the model will be used.
+            tag_value: The value of the tag.
+        """
+        telemetry_params = telemetry.get_statement_params(
+            project=_TELEMETRY_PROJECT, subproject=_TELEMETRY_SUBPROJECT
+        )
+        db_id, schema_id, name_id = self._parse_tag_name(tag_name)
+        self._model_ops.set_tag(
+            model_name=self._model_name,
+            tag_database_name=db_id,
+            tag_schema_name=schema_id,
+            tag_name=name_id,
+            tag_value=tag_value,
+            statement_params=telemetry_params,
+        )
+    @telemetry.send_api_usage_telemetry(project=_TELEMETRY_PROJECT, subproject=_TELEMETRY_SUBPROJECT)
+    def unset_tag(self, tag_name: str) -> None:
+        """Remove a tag from the model.
+        Args:
+            tag_name: The name of the tag, can be fully qualified. If not fully qualified, the database or schema of
+                the model will be used.
+        """
+        telemetry_params = telemetry.get_statement_params(
+            project=_TELEMETRY_PROJECT, subproject=_TELEMETRY_SUBPROJECT
+        )
+        db_id, schema_id, name_id = self._parse_tag_name(tag_name)
+        self._model_ops.unset_tag(
+            model_name=self._model_name,
+            tag_database_name=db_id,
+            tag_schema_name=schema_id,
+            tag_name=name_id,
+            statement_params=telemetry_params,
+        )

snowflake-ml-python 1.1.2__py3-none-any.whl → 1.2.1__py3-none-any.whl

snowflake-ml-python 1.1.2py3-none-any.whl → 1.2.1py3-none-any.whl