PyPI - snowflake-ml-python - Versions diffs - 1.1.0__py3-none-any.whl → 1.1.2__py3-none-any.whl - Mend

snowflake-ml-python 1.1.0-py3-none-any.whl → 1.1.2-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (225)

snowflake/cortex/_complete.py +1 -1
snowflake/cortex/_extract_answer.py +1 -1
snowflake/cortex/_sentiment.py +1 -1
snowflake/cortex/_summarize.py +1 -1
snowflake/cortex/_translate.py +1 -1
snowflake/ml/_internal/env_utils.py +68 -6
snowflake/ml/_internal/file_utils.py +34 -4
snowflake/ml/_internal/telemetry.py +79 -91
snowflake/ml/_internal/utils/identifier.py +78 -72
snowflake/ml/_internal/utils/retryable_http.py +16 -4
snowflake/ml/_internal/utils/spcs_attribution_utils.py +122 -0
snowflake/ml/dataset/dataset.py +1 -1
snowflake/ml/model/_api.py +21 -14
snowflake/ml/model/_client/model/model_impl.py +176 -0
snowflake/ml/model/_client/model/model_method_info.py +19 -0
snowflake/ml/model/_client/model/model_version_impl.py +291 -0
snowflake/ml/model/_client/ops/metadata_ops.py +107 -0
snowflake/ml/model/_client/ops/model_ops.py +308 -0
snowflake/ml/model/_client/sql/model.py +75 -0
snowflake/ml/model/_client/sql/model_version.py +213 -0
snowflake/ml/model/_client/sql/stage.py +40 -0
snowflake/ml/model/_deploy_client/image_builds/server_image_builder.py +3 -4
snowflake/ml/model/_deploy_client/image_builds/templates/image_build_job_spec_template +24 -8
snowflake/ml/model/_deploy_client/image_builds/templates/kaniko_shell_script_template +23 -0
snowflake/ml/model/_deploy_client/snowservice/deploy.py +14 -2
snowflake/ml/model/_deploy_client/utils/constants.py +1 -0
snowflake/ml/model/_deploy_client/warehouse/deploy.py +2 -2
snowflake/ml/model/_model_composer/model_composer.py +31 -9
snowflake/ml/model/_model_composer/model_manifest/model_manifest.py +25 -10
snowflake/ml/model/_model_composer/model_manifest/model_manifest_schema.py +2 -2
snowflake/ml/model/_model_composer/model_method/infer_function.py_template +2 -1
snowflake/ml/model/_model_composer/model_method/model_method.py +34 -3
snowflake/ml/model/_model_composer/model_runtime/model_runtime.py +1 -1
snowflake/ml/model/_packager/model_handlers/huggingface_pipeline.py +3 -1
snowflake/ml/model/_packager/model_handlers/snowmlmodel.py +10 -28
snowflake/ml/model/_packager/model_meta/model_meta.py +18 -16
snowflake/ml/model/_signatures/snowpark_handler.py +1 -1
snowflake/ml/model/model_signature.py +108 -53
snowflake/ml/model/type_hints.py +1 -0
snowflake/ml/modeling/_internal/distributed_hpo_trainer.py +554 -0
snowflake/ml/modeling/_internal/estimator_protocols.py +1 -60
snowflake/ml/modeling/_internal/model_specifications.py +146 -0
snowflake/ml/modeling/_internal/model_trainer.py +13 -0
snowflake/ml/modeling/_internal/model_trainer_builder.py +78 -0
snowflake/ml/modeling/_internal/pandas_trainer.py +54 -0
snowflake/ml/modeling/_internal/snowpark_handlers.py +6 -760
snowflake/ml/modeling/_internal/snowpark_trainer.py +331 -0
snowflake/ml/modeling/calibration/calibrated_classifier_cv.py +108 -135
snowflake/ml/modeling/cluster/affinity_propagation.py +106 -135
snowflake/ml/modeling/cluster/agglomerative_clustering.py +106 -135
snowflake/ml/modeling/cluster/birch.py +106 -135
snowflake/ml/modeling/cluster/bisecting_k_means.py +106 -135
snowflake/ml/modeling/cluster/dbscan.py +106 -135
snowflake/ml/modeling/cluster/feature_agglomeration.py +106 -135
snowflake/ml/modeling/cluster/k_means.py +105 -135
snowflake/ml/modeling/cluster/mean_shift.py +106 -135
snowflake/ml/modeling/cluster/mini_batch_k_means.py +105 -135
snowflake/ml/modeling/cluster/optics.py +106 -135
snowflake/ml/modeling/cluster/spectral_biclustering.py +106 -135
snowflake/ml/modeling/cluster/spectral_clustering.py +106 -135
snowflake/ml/modeling/cluster/spectral_coclustering.py +106 -135
snowflake/ml/modeling/compose/column_transformer.py +106 -135
snowflake/ml/modeling/compose/transformed_target_regressor.py +108 -135
snowflake/ml/modeling/covariance/elliptic_envelope.py +106 -135
snowflake/ml/modeling/covariance/empirical_covariance.py +99 -128
snowflake/ml/modeling/covariance/graphical_lasso.py +106 -135
snowflake/ml/modeling/covariance/graphical_lasso_cv.py +106 -135
snowflake/ml/modeling/covariance/ledoit_wolf.py +104 -133
snowflake/ml/modeling/covariance/min_cov_det.py +106 -135
snowflake/ml/modeling/covariance/oas.py +99 -128
snowflake/ml/modeling/covariance/shrunk_covariance.py +103 -132
snowflake/ml/modeling/decomposition/dictionary_learning.py +106 -135
snowflake/ml/modeling/decomposition/factor_analysis.py +106 -135
snowflake/ml/modeling/decomposition/fast_ica.py +106 -135
snowflake/ml/modeling/decomposition/incremental_pca.py +106 -135
snowflake/ml/modeling/decomposition/kernel_pca.py +106 -135
snowflake/ml/modeling/decomposition/mini_batch_dictionary_learning.py +106 -135
snowflake/ml/modeling/decomposition/mini_batch_sparse_pca.py +106 -135
snowflake/ml/modeling/decomposition/pca.py +106 -135
snowflake/ml/modeling/decomposition/sparse_pca.py +106 -135
snowflake/ml/modeling/decomposition/truncated_svd.py +106 -135
snowflake/ml/modeling/discriminant_analysis/linear_discriminant_analysis.py +108 -135
snowflake/ml/modeling/discriminant_analysis/quadratic_discriminant_analysis.py +108 -135
snowflake/ml/modeling/ensemble/ada_boost_classifier.py +108 -135
snowflake/ml/modeling/ensemble/ada_boost_regressor.py +108 -135
snowflake/ml/modeling/ensemble/bagging_classifier.py +108 -135
snowflake/ml/modeling/ensemble/bagging_regressor.py +108 -135
snowflake/ml/modeling/ensemble/extra_trees_classifier.py +108 -135
snowflake/ml/modeling/ensemble/extra_trees_regressor.py +108 -135
snowflake/ml/modeling/ensemble/gradient_boosting_classifier.py +108 -135
snowflake/ml/modeling/ensemble/gradient_boosting_regressor.py +108 -135
snowflake/ml/modeling/ensemble/hist_gradient_boosting_classifier.py +108 -135
snowflake/ml/modeling/ensemble/hist_gradient_boosting_regressor.py +108 -135
snowflake/ml/modeling/ensemble/isolation_forest.py +106 -135
snowflake/ml/modeling/ensemble/random_forest_classifier.py +108 -135
snowflake/ml/modeling/ensemble/random_forest_regressor.py +108 -135
snowflake/ml/modeling/ensemble/stacking_regressor.py +108 -135
snowflake/ml/modeling/ensemble/voting_classifier.py +108 -135
snowflake/ml/modeling/ensemble/voting_regressor.py +108 -135
snowflake/ml/modeling/feature_selection/generic_univariate_select.py +101 -128
snowflake/ml/modeling/feature_selection/select_fdr.py +99 -126
snowflake/ml/modeling/feature_selection/select_fpr.py +99 -126
snowflake/ml/modeling/feature_selection/select_fwe.py +99 -126
snowflake/ml/modeling/feature_selection/select_k_best.py +100 -127
snowflake/ml/modeling/feature_selection/select_percentile.py +99 -126
snowflake/ml/modeling/feature_selection/sequential_feature_selector.py +106 -135
snowflake/ml/modeling/feature_selection/variance_threshold.py +95 -124
snowflake/ml/modeling/framework/base.py +83 -1
snowflake/ml/modeling/gaussian_process/gaussian_process_classifier.py +108 -135
snowflake/ml/modeling/gaussian_process/gaussian_process_regressor.py +108 -135
snowflake/ml/modeling/impute/iterative_imputer.py +106 -135
snowflake/ml/modeling/impute/knn_imputer.py +106 -135
snowflake/ml/modeling/impute/missing_indicator.py +106 -135
snowflake/ml/modeling/impute/simple_imputer.py +9 -1
snowflake/ml/modeling/kernel_approximation/additive_chi2_sampler.py +96 -125
snowflake/ml/modeling/kernel_approximation/nystroem.py +106 -135
snowflake/ml/modeling/kernel_approximation/polynomial_count_sketch.py +106 -135
snowflake/ml/modeling/kernel_approximation/rbf_sampler.py +105 -134
snowflake/ml/modeling/kernel_approximation/skewed_chi2_sampler.py +103 -132
snowflake/ml/modeling/kernel_ridge/kernel_ridge.py +108 -135
snowflake/ml/modeling/lightgbm/lgbm_classifier.py +90 -118
snowflake/ml/modeling/lightgbm/lgbm_regressor.py +90 -118
snowflake/ml/modeling/linear_model/ard_regression.py +108 -135
snowflake/ml/modeling/linear_model/bayesian_ridge.py +108 -135
snowflake/ml/modeling/linear_model/elastic_net.py +108 -135
snowflake/ml/modeling/linear_model/elastic_net_cv.py +108 -135
snowflake/ml/modeling/linear_model/gamma_regressor.py +108 -135
snowflake/ml/modeling/linear_model/huber_regressor.py +108 -135
snowflake/ml/modeling/linear_model/lars.py +108 -135
snowflake/ml/modeling/linear_model/lars_cv.py +108 -135
snowflake/ml/modeling/linear_model/lasso.py +108 -135
snowflake/ml/modeling/linear_model/lasso_cv.py +108 -135
snowflake/ml/modeling/linear_model/lasso_lars.py +108 -135
snowflake/ml/modeling/linear_model/lasso_lars_cv.py +108 -135
snowflake/ml/modeling/linear_model/lasso_lars_ic.py +108 -135
snowflake/ml/modeling/linear_model/linear_regression.py +108 -135
snowflake/ml/modeling/linear_model/logistic_regression.py +108 -135
snowflake/ml/modeling/linear_model/logistic_regression_cv.py +108 -135
snowflake/ml/modeling/linear_model/multi_task_elastic_net.py +108 -135
snowflake/ml/modeling/linear_model/multi_task_elastic_net_cv.py +108 -135
snowflake/ml/modeling/linear_model/multi_task_lasso.py +108 -135
snowflake/ml/modeling/linear_model/multi_task_lasso_cv.py +108 -135
snowflake/ml/modeling/linear_model/orthogonal_matching_pursuit.py +108 -135
snowflake/ml/modeling/linear_model/passive_aggressive_classifier.py +108 -135
snowflake/ml/modeling/linear_model/passive_aggressive_regressor.py +107 -135
snowflake/ml/modeling/linear_model/perceptron.py +107 -135
snowflake/ml/modeling/linear_model/poisson_regressor.py +108 -135
snowflake/ml/modeling/linear_model/ransac_regressor.py +108 -135
snowflake/ml/modeling/linear_model/ridge.py +108 -135
snowflake/ml/modeling/linear_model/ridge_classifier.py +108 -135
snowflake/ml/modeling/linear_model/ridge_classifier_cv.py +108 -135
snowflake/ml/modeling/linear_model/ridge_cv.py +108 -135
snowflake/ml/modeling/linear_model/sgd_classifier.py +108 -135
snowflake/ml/modeling/linear_model/sgd_one_class_svm.py +106 -135
snowflake/ml/modeling/linear_model/sgd_regressor.py +108 -135
snowflake/ml/modeling/linear_model/theil_sen_regressor.py +108 -135
snowflake/ml/modeling/linear_model/tweedie_regressor.py +108 -135
snowflake/ml/modeling/manifold/isomap.py +106 -135
snowflake/ml/modeling/manifold/mds.py +106 -135
snowflake/ml/modeling/manifold/spectral_embedding.py +106 -135
snowflake/ml/modeling/manifold/tsne.py +106 -135
snowflake/ml/modeling/metrics/classification.py +196 -55
snowflake/ml/modeling/metrics/correlation.py +4 -2
snowflake/ml/modeling/metrics/covariance.py +7 -4
snowflake/ml/modeling/metrics/ranking.py +32 -16
snowflake/ml/modeling/metrics/regression.py +60 -32
snowflake/ml/modeling/mixture/bayesian_gaussian_mixture.py +106 -135
snowflake/ml/modeling/mixture/gaussian_mixture.py +106 -135
snowflake/ml/modeling/model_selection/grid_search_cv.py +91 -148
snowflake/ml/modeling/model_selection/randomized_search_cv.py +93 -154
snowflake/ml/modeling/multiclass/one_vs_one_classifier.py +105 -132
snowflake/ml/modeling/multiclass/one_vs_rest_classifier.py +108 -135
snowflake/ml/modeling/multiclass/output_code_classifier.py +108 -135
snowflake/ml/modeling/naive_bayes/bernoulli_nb.py +108 -135
snowflake/ml/modeling/naive_bayes/categorical_nb.py +108 -135
snowflake/ml/modeling/naive_bayes/complement_nb.py +108 -135
snowflake/ml/modeling/naive_bayes/gaussian_nb.py +98 -125
snowflake/ml/modeling/naive_bayes/multinomial_nb.py +107 -134
snowflake/ml/modeling/neighbors/k_neighbors_classifier.py +108 -135
snowflake/ml/modeling/neighbors/k_neighbors_regressor.py +108 -135
snowflake/ml/modeling/neighbors/kernel_density.py +106 -135
snowflake/ml/modeling/neighbors/local_outlier_factor.py +106 -135
snowflake/ml/modeling/neighbors/nearest_centroid.py +108 -135
snowflake/ml/modeling/neighbors/nearest_neighbors.py +106 -135
snowflake/ml/modeling/neighbors/neighborhood_components_analysis.py +108 -135
snowflake/ml/modeling/neighbors/radius_neighbors_classifier.py +108 -135
snowflake/ml/modeling/neighbors/radius_neighbors_regressor.py +108 -135
snowflake/ml/modeling/neural_network/bernoulli_rbm.py +106 -135
snowflake/ml/modeling/neural_network/mlp_classifier.py +108 -135
snowflake/ml/modeling/neural_network/mlp_regressor.py +108 -135
snowflake/ml/modeling/parameters/disable_distributed_hpo.py +2 -6
snowflake/ml/modeling/preprocessing/binarizer.py +25 -8
snowflake/ml/modeling/preprocessing/k_bins_discretizer.py +9 -4
snowflake/ml/modeling/preprocessing/label_encoder.py +31 -11
snowflake/ml/modeling/preprocessing/max_abs_scaler.py +27 -9
snowflake/ml/modeling/preprocessing/min_max_scaler.py +42 -14
snowflake/ml/modeling/preprocessing/normalizer.py +9 -4
snowflake/ml/modeling/preprocessing/one_hot_encoder.py +26 -10
snowflake/ml/modeling/preprocessing/ordinal_encoder.py +37 -13
snowflake/ml/modeling/preprocessing/polynomial_features.py +106 -135
snowflake/ml/modeling/preprocessing/robust_scaler.py +39 -13
snowflake/ml/modeling/preprocessing/standard_scaler.py +36 -12
snowflake/ml/modeling/semi_supervised/label_propagation.py +108 -135
snowflake/ml/modeling/semi_supervised/label_spreading.py +108 -135
snowflake/ml/modeling/svm/linear_svc.py +108 -135
snowflake/ml/modeling/svm/linear_svr.py +108 -135
snowflake/ml/modeling/svm/nu_svc.py +108 -135
snowflake/ml/modeling/svm/nu_svr.py +108 -135
snowflake/ml/modeling/svm/svc.py +108 -135
snowflake/ml/modeling/svm/svr.py +108 -135
snowflake/ml/modeling/tree/decision_tree_classifier.py +108 -135
snowflake/ml/modeling/tree/decision_tree_regressor.py +108 -135
snowflake/ml/modeling/tree/extra_tree_classifier.py +108 -135
snowflake/ml/modeling/tree/extra_tree_regressor.py +108 -135
snowflake/ml/modeling/xgboost/xgb_classifier.py +108 -136
snowflake/ml/modeling/xgboost/xgb_regressor.py +108 -136
snowflake/ml/modeling/xgboost/xgbrf_classifier.py +108 -136
snowflake/ml/modeling/xgboost/xgbrf_regressor.py +108 -136
snowflake/ml/registry/model_registry.py +2 -0
snowflake/ml/registry/registry.py +215 -0
snowflake/ml/version.py +1 -1
{snowflake_ml_python-1.1.0.dist-info → snowflake_ml_python-1.1.2.dist-info}/METADATA +34 -1
snowflake_ml_python-1.1.2.dist-info/RECORD +347 -0
snowflake_ml_python-1.1.0.dist-info/RECORD +0 -331
{snowflake_ml_python-1.1.0.dist-info → snowflake_ml_python-1.1.2.dist-info}/WHEEL +0 -0

snowflake/ml/_internal/utils/identifier.py CHANGED Viewed

@@ -23,7 +23,7 @@ quote_name_without_upper_casing = analyzer_utils.quote_name_without_upper_casing
 def _is_quoted(id: str) -> bool:
-    """Checks if input is quoted.
+    """Checks if input *identifier* is quoted.
     NOTE: Snowflake treats all identifiers as UPPERCASE by default. That is 'Hello' would become 'HELLO'. To preserve
     case, one needs to use quoted identifiers, e.g. "Hello" (note the double quote). Callers must take care of that
@@ -40,23 +40,21 @@ def _is_quoted(id: str) -> bool:
         ValueError: If the id is invalid.
     """
     if not id:
-        raise ValueError("Invalid id passed.")
-    if len(id) < 2:
-        return False
-    if id[0] == '"' and id[-1] == '"':
+        raise ValueError(f"Invalid id {id} passed. ID is empty.")
+    if len(id) >= 2 and id[0] == '"' and id[-1] == '"':
         if len(id) == 2:
-            raise ValueError("Invalid id passed.")
+            raise ValueError(f"Invalid id {id} passed. ID is empty.")
         if not QUOTED_IDENTIFIER_RE.match(id):
-            raise ValueError("Invalid id passed.")
+            raise ValueError(f"Invalid id {id} passed. ID is quoted but does not match the quoted rule.")
         return True
-    if not UNQUOTED_CASE_INSENSITIVE_RE.match(id):
-        raise ValueError("Invalid id passed.")
-    return False  # To keep mypy happy
+    if not UNQUOTED_CASE_SENSITIVE_RE.match(id):
+        raise ValueError(f"Invalid id {id} passed. ID is unquoted but does not match the unquoted rule.")
+    return False
 def _get_unescaped_name(id: str) -> str:
     """Remove double quotes and unescape quotes between them from id if quoted.
-        Uppercase if not quoted.
+        Return as it is otherwise
     NOTE: See note in :meth:`_is_quoted`.
@@ -67,7 +65,7 @@ def _get_unescaped_name(id: str) -> str:
         String with quotes removed if quoted; original string otherwise.
     """
     if not _is_quoted(id):
-        return id.upper()
+        return id
     unquoted_id = id[1:-1]
     return unquoted_id.replace(DOUBLE_QUOTE + DOUBLE_QUOTE, DOUBLE_QUOTE)
@@ -88,9 +86,9 @@ def _get_escaped_name(id: str) -> str:
     return DOUBLE_QUOTE + escape_quotes + DOUBLE_QUOTE
-def get_inferred_name(id: str) -> str:
-    """Double quote id when it is case-sensitive and can start with and
-    contain any valid characters; unquote otherwise.
+def get_inferred_name(name: str) -> str:
+    """Double quote name when it is case-sensitive and can start with and
+    contain any valid characters; otherwise, keep it as it is.
     Examples:
         COL1 -> COL1
@@ -100,42 +98,38 @@ def get_inferred_name(id: str) -> str:
         COL 1 -> "COL 1"
     Args:
-        id: The string to be checked & treated.
+        name: The string to be checked & treated.
     Returns:
         Double quoted identifier if necessary; unquoted string otherwise.
     """
-    if UNQUOTED_CASE_SENSITIVE_RE.match(id):
-        return id
-    escaped_id = get_escaped_names(id)
+    if UNQUOTED_CASE_SENSITIVE_RE.match(name):
+        return name
+    escaped_id = _get_escaped_name(name)
     assert isinstance(escaped_id, str)
     return escaped_id
-def concat_names(ids: List[str]) -> str:
-    """Concatenates `ids` to form one valid id.
+def concat_names(names: List[str]) -> str:
+    """Concatenates `names` to form one valid id.
-    NOTE: See note in :meth:`_is_quoted`.
     Args:
-        ids: List of identifiers to be concatenated.
+        names: List of identifiers to be concatenated.
     Returns:
         Concatenated identifier.
     """
-    quotes_needed = False
     parts = []
-    for id in ids:
-        if _is_quoted(id):
-            # If any part is quoted, the user cares about case.
-            quotes_needed = True
-            # Remove quotes before using it.
-            id = _get_unescaped_name(id)
-        parts.append(id)
+    for name in names:
+        if QUOTED_IDENTIFIER_RE.match(name):
+            # If any part is quoted identifier, we need to remove the quotes
+            unescaped_name: str = _get_unescaped_name(name)
+            parts.append(unescaped_name)
+        else:
+            parts.append(name)
     final_id = "".join(parts)
-    if quotes_needed:
-        return _get_escaped_name(final_id)
-    return final_id
+    return get_inferred_name(final_id)
 def rename_to_valid_snowflake_identifier(name: str) -> str:
@@ -222,6 +216,14 @@ def get_unescaped_names(ids: Optional[Union[str, List[str]]]) -> Optional[Union[
     response pandas dataframe(i.e., in the response of snowpark_df.to_pandas()) using the rules defined here
     https://docs.snowflake.com/en/sql-reference/identifiers-syntax.
+    This function will mimic the behavior of Snowpark's `to_pandas()` from Snowpark DataFrame.
+    Examples:
+        COL1 -> COL1
+        "Col" -> Col
+        \"""COL""\" -> "COL"  (ignore '\')
+        "COL 1" -> COL 1
     Args:
         ids: User provided column name identifier(s).
@@ -243,27 +245,36 @@ def get_unescaped_names(ids: Optional[Union[str, List[str]]]) -> Optional[Union[
 @overload
-def get_escaped_names(ids: None) -> None:
+def get_inferred_names(names: None) -> None:
     ...
 @overload
-def get_escaped_names(ids: str) -> str:
+def get_inferred_names(names: str) -> str:
     ...
 @overload
-def get_escaped_names(ids: List[str]) -> List[str]:
+def get_inferred_names(names: List[str]) -> List[str]:
     ...
-def get_escaped_names(ids: Optional[Union[str, List[str]]]) -> Optional[Union[str, List[str]]]:
-    """Given a user provided identifier(s), this method will compute the equivalent column name identifier(s)
+def get_inferred_names(names: Optional[Union[str, List[str]]]) -> Optional[Union[str, List[str]]]:
+    """Given a user provided *string(s)*, this method will compute the equivalent column name identifier(s)
     in case of column name contains special characters, and maintains case-sensitivity
     https://docs.snowflake.com/en/sql-reference/identifiers-syntax.
+    This function will mimic the behavior of Snowpark's `create_dataframe` from pandas DataFrame.
+    Examples:
+        COL1 -> COL1
+        1COL -> "1COL"
+        Col -> "Col"
+        "COL" -> \"""COL""\"  (ignore '\')
+        COL 1 -> "COL 1"
     Args:
-        ids: User provided column name identifier(s).
+        names: User provided column name identifier(s).
     Returns:
         Double-quoted Identifiers for column names, to make sure that column names are case sensitive
@@ -272,12 +283,12 @@ def get_escaped_names(ids: Optional[Union[str, List[str]]]) -> Optional[Union[st
         ValueError: if input types is unsupported or column name identifiers are invalid.
     """
-    if ids is None:
+    if names is None:
         return None
-    elif type(ids) is list:
-        return [_get_escaped_name(id) for id in ids]
-    elif type(ids) is str:
-        return _get_escaped_name(ids)
+    elif type(names) is list:
+        return [get_inferred_name(id) for id in names]
+    elif type(names) is str:
+        return get_inferred_name(names)
     else:
         raise ValueError("Unsupported type. Only string or list of string are supported for selecting columns.")
@@ -297,39 +308,34 @@ def remove_prefix(s: str, prefix: str) -> str:
     return s
-def resolve_identifier(id: str) -> str:
-    """Following Snowflake identifier resolution strategies:
+def resolve_identifier(name: str) -> str:
+    """Given a user provided *string*, resolve following Snowflake identifier resolution strategies:
         https://docs.snowflake.com/en/sql-reference/identifiers-syntax#label-identifier-casing
-        If identifier is unquoted, it will return upper case.
-        Otherwise return exactly as it is.
-    Args:
-        id: identifier string
-    Returns:
-        Resolved identifier
-    """
-    if _is_quoted(id):
-        if UNQUOTED_CASE_SENSITIVE_RE.match(id[1:-1]):
-            return id[1:-1]
-        else:
-            return id
-    else:
-        return id.upper()
+        This function will mimic the behavior of the SQL parser.
-def strip_wrapping_quotes(id: str) -> str:
-    """Remove wrapping quotes if the identifier is quoted.
-    This is mainly used for keywords like `warehouse` which doesn't like wrapping quotes when being used.
+    Examples:
+        COL1 -> COL1
+        1COL -> Raise Error
+        Col -> COL
+        "COL" -> COL
+        COL 1 -> Raise Error
     Args:
-        id: identifier string
+        name: the string to be resolved.
+    Raises:
+        ValueError: if input would not be accepted by SQL parser.
     Returns:
-        Identifier with wrapping quotes removed
+        Resolved identifier
     """
-    if _is_quoted(id):
-        return id[1:-1]
+    if QUOTED_IDENTIFIER_RE.match(name):
+        unescaped = _get_unescaped_name(name)
+        if UNQUOTED_CASE_SENSITIVE_RE.match(unescaped):
+            return unescaped
+        return name
+    elif UNQUOTED_CASE_INSENSITIVE_RE.match(name):
+        return name.upper()
     else:
-        return id
+        raise ValueError(f"Invalid name {name} passed. ID is not quoted and cannot normalized.")

snowflake/ml/_internal/utils/retryable_http.py CHANGED Viewed

@@ -5,11 +5,23 @@ from requests import adapters
 from urllib3.util import retry
-def get_http_client() -> requests.Session:
-    # Set up a retry policy for requests
+def get_http_client(total_retries: int = 5, backoff_factor: float = 0.1) -> requests.Session:
+    """Construct retryable http client.
+    Args:
+        total_retries: Total number of retries to allow.
+        backoff_factor: A backoff factor to apply between attempts after the second try. Time to sleep is calculated by
+            {backoff factor} * (2 ** ({number of previous retries})). For example, with default retries of 5 and backoff
+            factor set to 0.1, each subsequent retry will sleep [0.2s, 0.4s, 0.8s, 1.6s, 3.2s] respectively.
+    Returns:
+        requests.Session object.
+    """
     retry_strategy = retry.Retry(
-        total=3,  # total number of retries
-        backoff_factor=0.1,  # 100ms initial delay
+        total=total_retries,
+        backoff_factor=backoff_factor,
         status_forcelist=[
             http.HTTPStatus.TOO_MANY_REQUESTS,
             http.HTTPStatus.INTERNAL_SERVER_ERROR,

snowflake/ml/_internal/utils/spcs_attribution_utils.py ADDED Viewed

@@ -0,0 +1,122 @@
+import logging
+from datetime import datetime
+from typing import Any, Dict, Optional
+from snowflake import snowpark
+from snowflake.ml._internal import telemetry
+from snowflake.ml._internal.utils import query_result_checker
+logger = logging.getLogger(__name__)
+_DATETIME_FORMAT = "%Y-%m-%d %H:%M:%S.%f %z"
+_COMPUTE_POOL = "compute_pool"
+_CREATED_ON = "created_on"
+_INSTANCE_FAMILY = "instance_family"
+_NAME = "name"
+_TELEMETRY_PROJECT = "MLOps"
+_TELEMETRY_SUBPROJECT = "SpcsDeployment"
+_SERVICE_START = "SPCS_SERVICE_START"
+_SERVICE_END = "SPCS_SERVICE_END"
+def _desc_compute_pool(session: snowpark.Session, compute_pool_name: str) -> Dict[str, Any]:
+    sql = f"DESC COMPUTE POOL {compute_pool_name}"
+    result = (
+        query_result_checker.SqlResultValidator(
+            session=session,
+            query=sql,
+        )
+        .has_column(_INSTANCE_FAMILY)
+        .has_column(_NAME)
+        .has_dimensions(expected_rows=1)
+        .validate()
+    )
+    return result[0].as_dict()
+def _desc_service(session: snowpark.Session, fully_qualified_name: str) -> Dict[str, Any]:
+    sql = f"DESC SERVICE {fully_qualified_name}"
+    result = (
+        query_result_checker.SqlResultValidator(
+            session=session,
+            query=sql,
+        )
+        .has_column(_COMPUTE_POOL)
+        .has_dimensions(expected_rows=1)
+        .validate()
+    )
+    return result[0].as_dict()
+def _get_current_time() -> datetime:
+    """
+    This method exists to make it easier to mock datetime in test.
+    Returns:
+        current datetime
+    """
+    return datetime.now()
+def _send_service_telemetry(
+    fully_qualified_name: Optional[str] = None,
+    compute_pool_name: Optional[str] = None,
+    service_details: Optional[Dict[str, Any]] = None,
+    compute_pool_details: Optional[Dict[str, Any]] = None,
+    duration_in_seconds: Optional[int] = None,
+    kwargs: Optional[Dict[str, Any]] = None,
+) -> None:
+    try:
+        telemetry.send_custom_usage(
+            project=_TELEMETRY_PROJECT,
+            subproject=_TELEMETRY_SUBPROJECT,
+            telemetry_type=telemetry.TelemetryField.TYPE_SNOWML_SPCS_USAGE.value,
+            data={
+                "service_name": fully_qualified_name,
+                "compute_pool_name": compute_pool_name,
+                "service_details": service_details,
+                "compute_pool_details": compute_pool_details,
+                "duration_in_seconds": duration_in_seconds,
+            },
+            kwargs=kwargs,
+        )
+    except Exception as e:
+        logger.error(f"Failed to send service telemetry: {e}")
+def record_service_start(session: snowpark.Session, fully_qualified_name: str) -> None:
+    service_details = _desc_service(session, fully_qualified_name)
+    compute_pool_name = service_details[_COMPUTE_POOL]
+    compute_pool_details = _desc_compute_pool(session, compute_pool_name)
+    _send_service_telemetry(
+        fully_qualified_name=fully_qualified_name,
+        compute_pool_name=compute_pool_name,
+        service_details=service_details,
+        compute_pool_details=compute_pool_details,
+        kwargs={telemetry.TelemetryField.KEY_CUSTOM_TAGS.value: _SERVICE_START},
+    )
+    logger.info(f"Service {fully_qualified_name} created with compute pool {compute_pool_name}.")
+def record_service_end(session: snowpark.Session, fully_qualified_name: str) -> None:
+    service_details = _desc_service(session, fully_qualified_name)
+    compute_pool_details = _desc_compute_pool(session, service_details[_COMPUTE_POOL])
+    compute_pool_name = service_details[_COMPUTE_POOL]
+    created_on_datetime: datetime = service_details[_CREATED_ON]
+    current_time: datetime = _get_current_time()
+    current_time = current_time.replace(tzinfo=created_on_datetime.tzinfo)
+    duration_in_seconds = int((current_time - created_on_datetime).total_seconds())
+    _send_service_telemetry(
+        fully_qualified_name=fully_qualified_name,
+        compute_pool_name=compute_pool_name,
+        service_details=service_details,
+        compute_pool_details=compute_pool_details,
+        duration_in_seconds=duration_in_seconds,
+        kwargs={telemetry.TelemetryField.KEY_CUSTOM_TAGS.value: _SERVICE_END},
+    )
+    logger.info(f"Service {fully_qualified_name} deleted from compute pool {compute_pool_name}")

snowflake/ml/dataset/dataset.py CHANGED Viewed

@@ -140,7 +140,7 @@ Got {len(self.df.queries['queries'])}: {self.df.queries['queries']}
     @classmethod
     def from_json(cls, json_str: str, session: Session) -> "Dataset":
-        json_dict = json.loads(json_str)
+        json_dict = json.loads(json_str, strict=False)
         json_dict["df"] = session.sql(json_dict.pop("df_query"))
         fs_meta_json = json_dict["feature_store_metadata"]

snowflake/ml/model/_api.py CHANGED Viewed

@@ -7,7 +7,6 @@ from snowflake.ml._internal.exceptions import (
     error_codes,
     exceptions as snowml_exceptions,
 )
-from snowflake.ml._internal.utils import identifier
 from snowflake.ml.model import (
     deploy_platforms,
     model_signature,
@@ -188,6 +187,10 @@ def save_model(
     Returns:
         Model
     """
+    if options is None:
+        options = {}
+    options["_legacy_save"] = True
     m = model_composer.ModelComposer(session=session, stage_path=stage_path)
     m.save(
         name=name,
@@ -481,6 +484,7 @@ def predict(
     # Get options
     INTERMEDIATE_OBJ_NAME = "tmp_result"
     sig = deployment["signature"]
+    identifier_rule = model_signature.SnowparkIdentifierRule.INFERRED
     # Validate and prepare input
     if not isinstance(X, SnowparkDataFrame):
@@ -491,7 +495,7 @@ def predict(
     else:
         keep_order = False
         output_with_input_features = True
-        model_signature._validate_snowpark_data(X, sig.inputs)
+        identifier_rule = model_signature._validate_snowpark_data(X, sig.inputs)
         s_df = X
     if statement_params:
@@ -500,10 +504,14 @@ def predict(
         else:
             s_df._statement_params = statement_params  # type: ignore[assignment]
+    original_cols = s_df.columns
     # Infer and get intermediate result
     input_cols = []
-    for col_name in s_df.columns:
-        literal_col_name = identifier.get_unescaped_names(col_name)
+    for input_feature in sig.inputs:
+        literal_col_name = input_feature.name
+        col_name = identifier_rule.get_identifier_from_feature(input_feature.name)
         input_cols.extend(
             [
                 F.lit(literal_col_name),
@@ -511,29 +519,28 @@ def predict(
             ]
         )
-    # TODO[shchen]: SNOW-870032, For SnowService, external function name cannot be double quoted, else it results in
-    # external function no found.
     udf_name = deployment["name"]
-    output_obj = F.call_udf(udf_name, F.object_construct(*input_cols))
-    if output_with_input_features:
-        df_res = s_df.with_column(INTERMEDIATE_OBJ_NAME, output_obj)
-    else:
-        df_res = s_df.select(output_obj.alias(INTERMEDIATE_OBJ_NAME))
+    output_obj = F.call_udf(udf_name, F.object_construct_keep_null(*input_cols))
+    df_res = s_df.with_column(INTERMEDIATE_OBJ_NAME, output_obj)
     if keep_order:
         df_res = df_res.order_by(
-            F.col(INTERMEDIATE_OBJ_NAME)[infer_template._KEEP_ORDER_COL_NAME],
+            F.col(infer_template._KEEP_ORDER_COL_NAME),
             ascending=True,
         )
+    if not output_with_input_features:
+        df_res = df_res.drop(*original_cols)
     # Prepare the output
     output_cols = []
+    output_col_names = []
     for output_feature in sig.outputs:
         output_cols.append(F.col(INTERMEDIATE_OBJ_NAME)[output_feature.name].astype(output_feature.as_snowpark_type()))
+        output_col_names.append(identifier_rule.get_identifier_from_feature(output_feature.name))
     df_res = df_res.with_columns(
-        [identifier.get_inferred_name(output_feature.name) for output_feature in sig.outputs],
+        output_col_names,
         output_cols,
     ).drop(INTERMEDIATE_OBJ_NAME)

snowflake/ml/model/_client/model/model_impl.py ADDED Viewed

@@ -0,0 +1,176 @@
+from typing import List, Union
+from snowflake.ml._internal import telemetry
+from snowflake.ml._internal.utils import sql_identifier
+from snowflake.ml.model._client.model import model_version_impl
+from snowflake.ml.model._client.ops import model_ops
+_TELEMETRY_PROJECT = "MLOps"
+_TELEMETRY_SUBPROJECT = "ModelManagement"
+class Model:
+    """Model Object containing multiple versions. Mapping to SQL's MODEL object."""
+    _model_ops: model_ops.ModelOperator
+    _model_name: sql_identifier.SqlIdentifier
+    def __init__(self) -> None:
+        raise RuntimeError("Model's initializer is not meant to be used. Use `get_model` from registry instead.")
+    @classmethod
+    def _ref(
+        cls,
+        model_ops: model_ops.ModelOperator,
+        *,
+        model_name: sql_identifier.SqlIdentifier,
+    ) -> "Model":
+        self: "Model" = object.__new__(cls)
+        self._model_ops = model_ops
+        self._model_name = model_name
+        return self
+    def __eq__(self, __value: object) -> bool:
+        if not isinstance(__value, Model):
+            return False
+        return self._model_ops == __value._model_ops and self._model_name == __value._model_name
+    @property
+    def name(self) -> str:
+        return self._model_name.identifier()
+    @property
+    def fully_qualified_name(self) -> str:
+        return self._model_ops._model_version_client.fully_qualified_model_name(self._model_name)
+    @property
+    @telemetry.send_api_usage_telemetry(
+        project=_TELEMETRY_PROJECT,
+        subproject=_TELEMETRY_SUBPROJECT,
+    )
+    def description(self) -> str:
+        statement_params = telemetry.get_statement_params(
+            project=_TELEMETRY_PROJECT,
+            subproject=_TELEMETRY_SUBPROJECT,
+        )
+        return self._model_ops.get_comment(
+            model_name=self._model_name,
+            statement_params=statement_params,
+        )
+    @description.setter
+    @telemetry.send_api_usage_telemetry(
+        project=_TELEMETRY_PROJECT,
+        subproject=_TELEMETRY_SUBPROJECT,
+    )
+    def description(self, description: str) -> None:
+        statement_params = telemetry.get_statement_params(
+            project=_TELEMETRY_PROJECT,
+            subproject=_TELEMETRY_SUBPROJECT,
+        )
+        return self._model_ops.set_comment(
+            comment=description,
+            model_name=self._model_name,
+            statement_params=statement_params,
+        )
+    @property
+    @telemetry.send_api_usage_telemetry(
+        project=_TELEMETRY_PROJECT,
+        subproject=_TELEMETRY_SUBPROJECT,
+    )
+    def default(self) -> model_version_impl.ModelVersion:
+        statement_params = telemetry.get_statement_params(
+            project=_TELEMETRY_PROJECT,
+            subproject=_TELEMETRY_SUBPROJECT,
+            class_name=self.__class__.__name__,
+        )
+        default_version_name = self._model_ops._model_version_client.get_default_version(
+            model_name=self._model_name, statement_params=statement_params
+        )
+        return self.version(default_version_name)
+    @default.setter
+    @telemetry.send_api_usage_telemetry(
+        project=_TELEMETRY_PROJECT,
+        subproject=_TELEMETRY_SUBPROJECT,
+    )
+    def default(self, version: Union[str, model_version_impl.ModelVersion]) -> None:
+        statement_params = telemetry.get_statement_params(
+            project=_TELEMETRY_PROJECT,
+            subproject=_TELEMETRY_SUBPROJECT,
+            class_name=self.__class__.__name__,
+        )
+        if isinstance(version, str):
+            version_name = sql_identifier.SqlIdentifier(version)
+        else:
+            version_name = version._version_name
+        self._model_ops._model_version_client.set_default_version(
+            model_name=self._model_name, version_name=version_name, statement_params=statement_params
+        )
+    @telemetry.send_api_usage_telemetry(
+        project=_TELEMETRY_PROJECT,
+        subproject=_TELEMETRY_SUBPROJECT,
+    )
+    def version(self, version_name: str) -> model_version_impl.ModelVersion:
+        """Get a model version object given a version name in the model.
+        Args:
+            version_name: The name of version
+        Raises:
+            ValueError: Raised when the version requested does not exist.
+        Returns:
+            The model version object.
+        """
+        statement_params = telemetry.get_statement_params(
+            project=_TELEMETRY_PROJECT,
+            subproject=_TELEMETRY_SUBPROJECT,
+        )
+        version_id = sql_identifier.SqlIdentifier(version_name)
+        if self._model_ops.validate_existence(
+            model_name=self._model_name,
+            version_name=version_id,
+            statement_params=statement_params,
+        ):
+            return model_version_impl.ModelVersion._ref(
+                self._model_ops,
+                model_name=self._model_name,
+                version_name=version_id,
+            )
+        else:
+            raise ValueError(
+                f"Unable to find version with name {version_id.identifier()} in model {self.fully_qualified_name}"
+            )
+    @telemetry.send_api_usage_telemetry(
+        project=_TELEMETRY_PROJECT,
+        subproject=_TELEMETRY_SUBPROJECT,
+    )
+    def list_versions(self) -> List[model_version_impl.ModelVersion]:
+        """List all versions in the model.
+        Returns:
+            A List of ModelVersion object representing all versions in the model.
+        """
+        statement_params = telemetry.get_statement_params(
+            project=_TELEMETRY_PROJECT,
+            subproject=_TELEMETRY_SUBPROJECT,
+        )
+        version_names = self._model_ops.list_models_or_versions(
+            model_name=self._model_name,
+            statement_params=statement_params,
+        )
+        return [
+            model_version_impl.ModelVersion._ref(
+                self._model_ops,
+                model_name=self._model_name,
+                version_name=version_name,
+            )
+            for version_name in version_names
+        ]
+    def delete_version(self, version_name: str) -> None:
+        raise NotImplementedError("Deleting version has not been supported yet.")

snowflake-ml-python 1.1.0__py3-none-any.whl → 1.1.2__py3-none-any.whl

snowflake-ml-python 1.1.0__py3-none-any.whl → 1.1.2__py3-none-any.whl