PyPI - scikit-learn-intelex - Versions diffs - 2024.0.1__py311-none-manylinux1_x86_64.whl → 2024.4.0__py311-none-manylinux1_x86_64.whl - Mend

scikit-learn-intelex 2024.0.1__py311-none-manylinux1_x86_64.whl → 2024.4.0__py311-none-manylinux1_x86_64.whl

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of scikit-learn-intelex might be problematic. Click here for more details.

Files changed (89)

{scikit_learn_intelex-2024.0.1.dist-info → scikit_learn_intelex-2024.4.0.dist-info}/METADATA +2 -2
scikit_learn_intelex-2024.4.0.dist-info/RECORD +101 -0
sklearnex/__init__.py +11 -7
sklearnex/__main__.py +0 -1
sklearnex/_device_offload.py +31 -4
sklearnex/_utils.py +15 -1
sklearnex/basic_statistics/__init__.py +2 -2
sklearnex/basic_statistics/incremental_basic_statistics.py +288 -0
sklearnex/basic_statistics/tests/test_incremental_basic_statistics.py +386 -0
sklearnex/cluster/__init__.py +0 -1
sklearnex/cluster/dbscan.py +5 -2
sklearnex/cluster/k_means.py +0 -1
sklearnex/cluster/tests/test_dbscan.py +0 -1
sklearnex/cluster/tests/test_kmeans.py +0 -1
sklearnex/conftest.py +63 -0
sklearnex/covariance/__init__.py +19 -0
sklearnex/covariance/incremental_covariance.py +130 -0
sklearnex/covariance/tests/test_incremental_covariance.py +143 -0
sklearnex/decomposition/__init__.py +0 -1
sklearnex/decomposition/pca.py +319 -2
sklearnex/decomposition/tests/test_pca.py +34 -6
sklearnex/dispatcher.py +93 -28
sklearnex/ensemble/__init__.py +0 -1
sklearnex/ensemble/_forest.py +93 -89
sklearnex/ensemble/tests/test_forest.py +15 -20
sklearnex/glob/__main__.py +0 -1
sklearnex/glob/dispatcher.py +0 -1
sklearnex/linear_model/__init__.py +1 -3
sklearnex/linear_model/coordinate_descent.py +0 -1
sklearnex/linear_model/linear.py +275 -332
sklearnex/linear_model/logistic_path.py +0 -1
sklearnex/linear_model/logistic_regression.py +385 -0
sklearnex/linear_model/ridge.py +0 -1
sklearnex/linear_model/tests/test_linear.py +47 -7
sklearnex/linear_model/tests/test_logreg.py +70 -8
sklearnex/manifold/__init__.py +0 -1
sklearnex/manifold/t_sne.py +0 -1
sklearnex/manifold/tests/test_tsne.py +0 -1
sklearnex/metrics/__init__.py +0 -1
sklearnex/metrics/pairwise.py +0 -1
sklearnex/metrics/ranking.py +0 -1
sklearnex/metrics/tests/test_metrics.py +0 -1
sklearnex/model_selection/__init__.py +0 -1
sklearnex/model_selection/split.py +0 -1
sklearnex/model_selection/tests/test_model_selection.py +0 -1
sklearnex/neighbors/__init__.py +1 -2
sklearnex/neighbors/_lof.py +221 -0
sklearnex/neighbors/common.py +5 -3
sklearnex/neighbors/knn_classification.py +47 -133
sklearnex/neighbors/knn_regression.py +20 -129
sklearnex/neighbors/knn_unsupervised.py +15 -89
sklearnex/neighbors/tests/test_neighbors.py +12 -17
sklearnex/preview/__init__.py +1 -2
sklearnex/preview/cluster/__init__.py +0 -1
sklearnex/preview/cluster/k_means.py +7 -74
sklearnex/preview/{decomposition → covariance}/__init__.py +19 -20
sklearnex/preview/covariance/covariance.py +133 -0
sklearnex/preview/covariance/tests/test_covariance.py +66 -0
sklearnex/spmd/__init__.py +1 -0
sklearnex/spmd/covariance/__init__.py +19 -0
sklearnex/spmd/covariance/covariance.py +21 -0
sklearnex/spmd/ensemble/forest.py +4 -12
sklearnex/spmd/linear_model/__init__.py +2 -1
sklearnex/spmd/linear_model/logistic_regression.py +21 -0
sklearnex/svm/__init__.py +0 -1
sklearnex/svm/_common.py +4 -7
sklearnex/svm/nusvc.py +73 -49
sklearnex/svm/nusvr.py +8 -52
sklearnex/svm/svc.py +74 -51
sklearnex/svm/svr.py +5 -49
sklearnex/svm/tests/test_svm.py +0 -1
sklearnex/tests/_utils.py +164 -0
sklearnex/tests/test_memory_usage.py +9 -7
sklearnex/tests/test_monkeypatch.py +192 -134
sklearnex/tests/test_n_jobs_support.py +99 -0
sklearnex/tests/test_parallel.py +6 -8
sklearnex/tests/test_patching.py +338 -89
sklearnex/utils/__init__.py +2 -1
sklearnex/utils/_namespace.py +97 -0
sklearnex/utils/validation.py +0 -1
scikit_learn_intelex-2024.0.1.dist-info/RECORD +0 -90
sklearnex/neighbors/lof.py +0 -437
sklearnex/preview/decomposition/pca.py +0 -376
sklearnex/preview/decomposition/tests/test_preview_pca.py +0 -38
sklearnex/tests/_models_info.py +0 -170
sklearnex/tests/utils/_launch_algorithms.py +0 -118
{scikit_learn_intelex-2024.0.1.dist-info → scikit_learn_intelex-2024.4.0.dist-info}/LICENSE.txt +0 -0
{scikit_learn_intelex-2024.0.1.dist-info → scikit_learn_intelex-2024.4.0.dist-info}/WHEEL +0 -0
{scikit_learn_intelex-2024.0.1.dist-info → scikit_learn_intelex-2024.4.0.dist-info}/top_level.txt +0 -0

sklearnex/neighbors/knn_unsupervised.py CHANGED Viewed

@@ -1,4 +1,3 @@
-#!/usr/bin/env python
 # ===============================================================================
 # Copyright 2021 Intel Corporation
 #
@@ -15,90 +14,22 @@
 # limitations under the License.
 # ===============================================================================
-try:
-    from packaging.version import Version
-except ImportError:
-    from distutils.version import LooseVersion as Version
-import warnings
-import numpy as np
-from sklearn import __version__ as sklearn_version
-from sklearn.neighbors._ball_tree import BallTree
-from sklearn.neighbors._base import VALID_METRICS
-from sklearn.neighbors._base import NeighborsBase as sklearn_NeighborsBase
-from sklearn.neighbors._kd_tree import KDTree
 from sklearn.neighbors._unsupervised import NearestNeighbors as sklearn_NearestNeighbors
 from sklearn.utils.validation import _deprecate_positional_args, check_is_fitted
+from daal4py.sklearn._n_jobs_support import control_n_jobs
 from daal4py.sklearn._utils import sklearn_check_version
 from onedal.neighbors import NearestNeighbors as onedal_NearestNeighbors
-from onedal.utils import _check_array, _num_features, _num_samples
 from .._device_offload import dispatch, wrap_output_data
 from .common import KNeighborsDispatchingBase
-if sklearn_check_version("0.22") and Version(sklearn_version) < Version("0.23"):
-    class NearestNeighbors_(sklearn_NearestNeighbors):
-        def __init__(
-            self,
-            n_neighbors=5,
-            radius=1.0,
-            algorithm="auto",
-            leaf_size=30,
-            metric="minkowski",
-            p=2,
-            metric_params=None,
-            n_jobs=None,
-        ):
-            super().__init__(
-                n_neighbors=n_neighbors,
-                radius=radius,
-                algorithm=algorithm,
-                leaf_size=leaf_size,
-                metric=metric,
-                p=p,
-                metric_params=metric_params,
-                n_jobs=n_jobs,
-            )
-else:
-    class NearestNeighbors_(sklearn_NearestNeighbors):
-        if sklearn_check_version("1.2"):
-            _parameter_constraints: dict = {
-                **sklearn_NearestNeighbors._parameter_constraints
-            }
-        @_deprecate_positional_args
-        def __init__(
-            self,
-            *,
-            n_neighbors=5,
-            radius=1.0,
-            algorithm="auto",
-            leaf_size=30,
-            metric="minkowski",
-            p=2,
-            metric_params=None,
-            n_jobs=None,
-        ):
-            super().__init__(
-                n_neighbors=n_neighbors,
-                radius=radius,
-                algorithm=algorithm,
-                leaf_size=leaf_size,
-                metric=metric,
-                p=p,
-                metric_params=metric_params,
-                n_jobs=n_jobs,
-            )
-class NearestNeighbors(NearestNeighbors_, KNeighborsDispatchingBase):
+@control_n_jobs(decorated_methods=["fit", "kneighbors"])
+class NearestNeighbors(sklearn_NearestNeighbors, KNeighborsDispatchingBase):
+    __doc__ = sklearn_NearestNeighbors.__doc__
     if sklearn_check_version("1.2"):
-        _parameter_constraints: dict = {**NearestNeighbors_._parameter_constraints}
+        _parameter_constraints: dict = {**sklearn_NearestNeighbors._parameter_constraints}
     @_deprecate_positional_args
     def __init__(
@@ -124,7 +55,6 @@ class NearestNeighbors(NearestNeighbors_, KNeighborsDispatchingBase):
         )
     def fit(self, X, y=None):
-        self._fit_validation(X, y)
         dispatch(
             self,
             "fit",
@@ -150,8 +80,8 @@ class NearestNeighbors(NearestNeighbors_, KNeighborsDispatchingBase):
                 "sklearn": sklearn_NearestNeighbors.kneighbors,
             },
             X,
-            n_neighbors,
-            return_distance,
+            n_neighbors=n_neighbors,
+            return_distance=return_distance,
         )
     @wrap_output_data
@@ -165,18 +95,10 @@ class NearestNeighbors(NearestNeighbors_, KNeighborsDispatchingBase):
             or getattr(self, "_tree", 0) is None
             and self._fit_method == "kd_tree"
         ):
-            if sklearn_check_version("0.24"):
-                sklearn_NearestNeighbors.fit(self, self._fit_X, getattr(self, "_y", None))
-            else:
-                sklearn_NearestNeighbors.fit(self, self._fit_X)
-        if sklearn_check_version("0.22"):
-            result = sklearn_NearestNeighbors.radius_neighbors(
-                self, X, radius, return_distance, sort_results
-            )
-        else:
-            result = sklearn_NearestNeighbors.radius_neighbors(
-                self, X, radius, return_distance
-            )
+            sklearn_NearestNeighbors.fit(self, self._fit_X, getattr(self, "_y", None))
+        result = sklearn_NearestNeighbors.radius_neighbors(
+            self, X, radius, return_distance, sort_results
+        )
         return result
@@ -218,3 +140,7 @@ class NearestNeighbors(NearestNeighbors_, KNeighborsDispatchingBase):
         self._fit_X = self._onedal_estimator._fit_X
         self._fit_method = self._onedal_estimator._fit_method
         self._tree = self._onedal_estimator._tree
+    fit.__doc__ = sklearn_NearestNeighbors.__doc__
+    kneighbors.__doc__ = sklearn_NearestNeighbors.kneighbors.__doc__
+    radius_neighbors.__doc__ = sklearn_NearestNeighbors.radius_neighbors.__doc__

sklearnex/neighbors/tests/test_neighbors.py CHANGED Viewed

@@ -1,4 +1,3 @@
-#!/usr/bin/env python
 # ===============================================================================
 # Copyright 2021 Intel Corporation
 #
@@ -15,7 +14,6 @@
 # limitations under the License.
 # ===============================================================================
-import numpy as np
 import pytest
 from numpy.testing import assert_allclose
@@ -24,12 +22,16 @@ from onedal.tests.utils._dataframes_support import (
     _convert_to_dataframe,
     get_dataframes_and_queues,
 )
+from sklearnex.neighbors import (
+    KNeighborsClassifier,
+    KNeighborsRegressor,
+    LocalOutlierFactor,
+    NearestNeighbors,
+)
 @pytest.mark.parametrize("dataframe,queue", get_dataframes_and_queues())
 def test_sklearnex_import_knn_classifier(dataframe, queue):
-    from sklearnex.neighbors import KNeighborsClassifier
     X = _convert_to_dataframe([[0], [1], [2], [3]], sycl_queue=queue, target_df=dataframe)
     y = _convert_to_dataframe([0, 0, 1, 1], sycl_queue=queue, target_df=dataframe)
     neigh = KNeighborsClassifier(n_neighbors=3).fit(X, y)
@@ -41,8 +43,6 @@ def test_sklearnex_import_knn_classifier(dataframe, queue):
 @pytest.mark.parametrize("dataframe,queue", get_dataframes_and_queues())
 def test_sklearnex_import_knn_regression(dataframe, queue):
-    from sklearnex.neighbors import KNeighborsRegressor
     X = _convert_to_dataframe([[0], [1], [2], [3]], sycl_queue=queue, target_df=dataframe)
     y = _convert_to_dataframe([0, 0, 1, 1], sycl_queue=queue, target_df=dataframe)
     neigh = KNeighborsRegressor(n_neighbors=2).fit(X, y)
@@ -52,18 +52,16 @@ def test_sklearnex_import_knn_regression(dataframe, queue):
     assert_allclose(pred, [0.5])
-# TODO:
-# investigate failure for `dpnp.ndarrays` and `dpctl.tensors`.
+@pytest.mark.parametrize("dataframe,queue", get_dataframes_and_queues())
 @pytest.mark.parametrize(
-    "dataframe,queue", get_dataframes_and_queues(dataframe_filter_="numpy")
+    "estimator",
+    [LocalOutlierFactor, NearestNeighbors],
 )
-def test_sklearnex_import_nn(dataframe, queue):
-    from sklearnex.neighbors import NearestNeighbors
+def test_sklearnex_kneighbors(estimator, dataframe, queue):
     X = [[0, 0, 2], [1, 0, 0], [0, 0, 1]]
     X = _convert_to_dataframe(X, sycl_queue=queue, target_df=dataframe)
     test = _convert_to_dataframe([[0, 0, 1.3]], sycl_queue=queue, target_df=dataframe)
-    neigh = NearestNeighbors(n_neighbors=2).fit(X)
+    neigh = estimator(n_neighbors=2).fit(X)
     result = neigh.kneighbors(test, 2, return_distance=False)
     result = _as_numpy(result)
     assert "sklearnex" in neigh.__module__
@@ -72,14 +70,11 @@ def test_sklearnex_import_nn(dataframe, queue):
 @pytest.mark.parametrize("dataframe,queue", get_dataframes_and_queues())
 def test_sklearnex_import_lof(dataframe, queue):
-    from sklearnex.neighbors import LocalOutlierFactor
     X = [[7, 7, 7], [1, 0, 0], [0, 0, 1], [0, 0, 1]]
     X = _convert_to_dataframe(X, sycl_queue=queue, target_df=dataframe)
     lof = LocalOutlierFactor(n_neighbors=2)
     result = lof.fit_predict(X)
     result = _as_numpy(result)
-    assert hasattr(lof, "_knn")
+    assert hasattr(lof, "_onedal_estimator")
     assert "sklearnex" in lof.__module__
-    assert "sklearnex" in lof._knn.__module__
     assert_allclose(result, [-1, 1, 1, 1])

sklearnex/preview/__init__.py CHANGED Viewed

@@ -1,4 +1,3 @@
-#!/usr/bin/env python
 # ==============================================================================
 # Copyright 2023 Intel Corporation
 #
@@ -15,4 +14,4 @@
 # limitations under the License.
 # ==============================================================================
-__all__ = ["cluster", "decomposition"]
+__all__ = ["cluster", "covariance"]

sklearnex/preview/cluster/__init__.py CHANGED Viewed

@@ -1,4 +1,3 @@
-#!/usr/bin/env python
 # ==============================================================================
 # Copyright 2023 Intel Corporation
 #

sklearnex/preview/cluster/k_means.py CHANGED Viewed

@@ -1,4 +1,3 @@
-#!/usr/bin/env python
 # ==============================================================================
 # Copyright 2023 Intel Corporation
 #
@@ -30,6 +29,7 @@ if daal_check_version((2023, "P", 200)):
         check_is_fitted,
     )
+    from daal4py.sklearn._n_jobs_support import control_n_jobs
     from daal4py.sklearn._utils import sklearn_check_version
     from onedal.cluster import KMeans as onedal_KMeans
@@ -37,6 +37,7 @@ if daal_check_version((2023, "P", 200)):
     from ..._utils import PatchingConditionsChain
     from ._common import BaseKMeans
+    @control_n_jobs(decorated_methods=["fit", "predict"])
     class KMeans(sklearn_KMeans, BaseKMeans):
         __doc__ = sklearn_KMeans.__doc__
         n_iter_, inertia_ = None, None
@@ -171,24 +172,6 @@ if daal_check_version((2023, "P", 200)):
             return patching_status
         def fit(self, X, y=None, sample_weight=None):
-            """Compute k-means clustering.
-            Parameters
-            ----------
-            X : array-like or sparse matrix, shape=(n_samples, n_features)
-                Training instances to cluster. It must be noted that the data
-                will be converted to C ordering, which will cause a memory
-                copy if the given data is not C-contiguous.
-            y : Ignored
-                not used, present here for API consistency by convention.
-            sample_weight : array-like, shape (n_samples,), optional
-                The weights for each observation in X. If None, all observations
-                are assigned equal weight (default: None)
-            """
             if sklearn_check_version("1.0"):
                 self._check_feature_names(X, reset=True)
             if sklearn_check_version("1.2"):
@@ -256,24 +239,6 @@ if daal_check_version((2023, "P", 200)):
         @wrap_output_data
         def predict(self, X):
-            """Compute k-means clustering.
-            Parameters
-            ----------
-            X : array-like or sparse matrix, shape=(n_samples, n_features)
-                Training instances to cluster. It must be noted that the data
-                will be converted to C ordering, which will cause a memory
-                copy if the given data is not C-contiguous.
-            y : Ignored
-                not used, present here for API consistency by convention.
-            sample_weight : array-like, shape (n_samples,), optional
-                The weights for each observation in X. If None, all observations
-                are assigned equal weight (default: None)
-            """
             if sklearn_check_version("1.0"):
                 self._check_feature_names(X, reset=True)
             if sklearn_check_version("1.2"):
@@ -316,52 +281,20 @@ if daal_check_version((2023, "P", 200)):
         @wrap_output_data
         def fit_transform(self, X, y=None, sample_weight=None):
-            """Compute clustering and transform X to cluster-distance space.
-            Equivalent to fit(X).transform(X), but more efficiently implemented.
-            Parameters
-            ----------
-            X : {array-like, sparse matrix} of shape (n_samples, n_features)
-                New data to transform.
-            y : Ignored
-                Not used, present here for API consistency by convention.
-            sample_weight : array-like of shape (n_samples,), default=None
-                The weights for each observation in X. If None, all observations
-                are assigned equal weight.
-            Returns
-            -------
-            X_new : ndarray of shape (n_samples, n_clusters)
-                X transformed in the new space.
-            """
             return self.fit(X, sample_weight=sample_weight)._transform(X)
         @wrap_output_data
         def transform(self, X):
-            """Transform X to a cluster-distance space.
-            In the new space, each dimension is the distance to the cluster
-            centers. Note that even if X is sparse, the array returned by
-            `transform` will typically be dense.
-            Parameters
-            ----------
-            X : {array-like, sparse matrix} of shape (n_samples, n_features)
-                New data to transform.
-            Returns
-            -------
-            X_new : ndarray of shape (n_samples, n_clusters)
-                X transformed in the new space.
-            """
             check_is_fitted(self)
             X = self._check_test_data(X)
             return self._transform(X)
+        fit.__doc__ = sklearn_KMeans.fit.__doc__
+        predict.__doc__ = sklearn_KMeans.predict.__doc__
+        transform.__doc__ = sklearn_KMeans.transform.__doc__
+        fit_transform.__doc__ = sklearn_KMeans.fit_transform.__doc__
 else:
     from daal4py.sklearn.cluster import KMeans

sklearnex/preview/{decomposition → covariance}/__init__.py RENAMED Viewed

@@ -1,20 +1,19 @@
-#!/usr/bin/env python
-# ===============================================================================
-# Copyright 2023 Intel Corporation
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#     http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-# ===============================================================================
-from .pca import PCA
-__all__ = ["PCA"]
+# ===============================================================================
+# Copyright 2023 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ===============================================================================
+from .covariance import EmpiricalCovariance
+__all__ = ["EmpiricalCovariance"]

sklearnex/preview/covariance/covariance.py ADDED Viewed

@@ -0,0 +1,133 @@
+# ===============================================================================
+# Copyright 2023 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ===============================================================================
+import warnings
+import numpy as np
+from scipy import sparse as sp
+from sklearn.covariance import EmpiricalCovariance as sklearn_EmpiricalCovariance
+from sklearn.utils import check_array
+from daal4py.sklearn._n_jobs_support import control_n_jobs
+from daal4py.sklearn._utils import daal_check_version, sklearn_check_version
+from onedal.common.hyperparameters import get_hyperparameters
+from onedal.covariance import EmpiricalCovariance as onedal_EmpiricalCovariance
+from sklearnex import config_context
+from sklearnex.metrics import pairwise_distances
+from ..._device_offload import dispatch, wrap_output_data
+from ..._utils import PatchingConditionsChain, register_hyperparameters
+@register_hyperparameters({"fit": get_hyperparameters("covariance", "compute")})
+@control_n_jobs(decorated_methods=["fit", "mahalanobis"])
+class EmpiricalCovariance(sklearn_EmpiricalCovariance):
+    __doc__ = sklearn_EmpiricalCovariance.__doc__
+    if sklearn_check_version("1.2"):
+        _parameter_constraints: dict = {
+            **sklearn_EmpiricalCovariance._parameter_constraints,
+        }
+    def _save_attributes(self):
+        assert hasattr(self, "_onedal_estimator")
+        if not daal_check_version((2024, "P", 400)) and self.assume_centered:
+            location = self._onedal_estimator.location_[None, :]
+            self._onedal_estimator.covariance_ += np.dot(location.T, location)
+            self._onedal_estimator.location_ = np.zeros_like(np.squeeze(location))
+        self._set_covariance(self._onedal_estimator.covariance_)
+        self.location_ = self._onedal_estimator.location_
+    _onedal_covariance = staticmethod(onedal_EmpiricalCovariance)
+    def _onedal_fit(self, X, queue=None):
+        if X.shape[0] == 1:
+            warnings.warn(
+                "Only one sample available. You may want to reshape your data array"
+            )
+        onedal_params = {
+            "method": "dense",
+            "bias": True,
+            "assume_centered": self.assume_centered,
+        }
+        self._onedal_estimator = self._onedal_covariance(**onedal_params)
+        self._onedal_estimator.fit(X, queue=queue)
+        self._save_attributes()
+    def _onedal_supported(self, method_name, *data):
+        class_name = self.__class__.__name__
+        patching_status = PatchingConditionsChain(
+            f"sklearn.covariance.{class_name}.{method_name}"
+        )
+        if method_name in ["fit", "mahalanobis"]:
+            (X,) = data
+            patching_status.and_conditions(
+                [
+                    (not sp.issparse(X), "X is sparse. Sparse input is not supported."),
+                ]
+            )
+            return patching_status
+        raise RuntimeError(f"Unknown method {method_name} in {self.__class__.__name__}")
+    _onedal_cpu_supported = _onedal_supported
+    _onedal_gpu_supported = _onedal_supported
+    def fit(self, X, y=None):
+        if sklearn_check_version("1.2"):
+            self._validate_params()
+        if sklearn_check_version("0.23"):
+            X = self._validate_data(X, force_all_finite=False)
+        else:
+            X = check_array(X, force_all_finite=False)
+        dispatch(
+            self,
+            "fit",
+            {
+                "onedal": self.__class__._onedal_fit,
+                "sklearn": sklearn_EmpiricalCovariance.fit,
+            },
+            X,
+        )
+        return self
+    # expose sklearnex pairwise_distances if mahalanobis distance eventually supported
+    @wrap_output_data
+    def mahalanobis(self, X):
+        if sklearn_check_version("1.0"):
+            X = self._validate_data(X, reset=False)
+        else:
+            X = check_array(X)
+        precision = self.get_precision()
+        with config_context(assume_finite=True):
+            # compute mahalanobis distances
+            dist = pairwise_distances(
+                X, self.location_[np.newaxis, :], metric="mahalanobis", VI=precision
+            )
+        return np.reshape(dist, (len(X),)) ** 2
+    error_norm = wrap_output_data(sklearn_EmpiricalCovariance.error_norm)
+    score = wrap_output_data(sklearn_EmpiricalCovariance.score)
+    fit.__doc__ = sklearn_EmpiricalCovariance.fit.__doc__
+    mahalanobis.__doc__ = sklearn_EmpiricalCovariance.mahalanobis
+    error_norm.__doc__ = sklearn_EmpiricalCovariance.error_norm.__doc__
+    score.__doc__ = sklearn_EmpiricalCovariance.score.__doc__

sklearnex/preview/covariance/tests/test_covariance.py ADDED Viewed

@@ -0,0 +1,66 @@
+# ===============================================================================
+# Copyright 2023 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ===============================================================================
+import numpy as np
+import pytest
+from numpy.testing import assert_allclose
+from daal4py.sklearn._utils import daal_check_version
+from onedal.tests.utils._dataframes_support import (
+    _convert_to_dataframe,
+    get_dataframes_and_queues,
+)
+@pytest.mark.parametrize("dataframe,queue", get_dataframes_and_queues())
+@pytest.mark.parametrize("macro_block", [None, 1024])
+@pytest.mark.parametrize("assume_centered", [True, False])
+def test_sklearnex_import_covariance(dataframe, queue, macro_block, assume_centered):
+    from sklearnex.preview.covariance import EmpiricalCovariance
+    X = np.array([[0, 1], [0, 1]])
+    X = _convert_to_dataframe(X, sycl_queue=queue, target_df=dataframe)
+    empcov = EmpiricalCovariance(assume_centered=assume_centered)
+    if daal_check_version((2024, "P", 0)) and macro_block is not None:
+        hparams = empcov.get_hyperparameters("fit")
+        hparams.cpu_macro_block = macro_block
+    result = empcov.fit(X)
+    expected_covariance = np.array([[0, 0], [0, 0]])
+    expected_means = np.array([0, 0])
+    if assume_centered:
+        expected_covariance = np.array([[0, 0], [0, 1]])
+    else:
+        expected_means = np.array([0, 1])
+    assert_allclose(expected_covariance, result.covariance_)
+    assert_allclose(expected_means, result.location_)
+    X = np.array([[1, 2], [3, 6]])
+    X = _convert_to_dataframe(X, sycl_queue=queue, target_df=dataframe)
+    result = empcov.fit(X)
+    if assume_centered:
+        expected_covariance = np.array([[5, 10], [10, 20]])
+    else:
+        expected_covariance = np.array([[1, 2], [2, 4]])
+        expected_means = np.array([2, 4])
+    assert_allclose(expected_covariance, result.covariance_)
+    assert_allclose(expected_means, result.location_)

sklearnex/spmd/__init__.py CHANGED Viewed

@@ -17,6 +17,7 @@
 __all__ = [
     "basic_statistics",
     "cluster",
+    "covariance",
     "decomposition",
     "ensemble",
     "linear_model",

sklearnex/spmd/covariance/__init__.py ADDED Viewed

@@ -0,0 +1,19 @@
+# ==============================================================================
+# Copyright 2024 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ==============================================================================
+from .covariance import EmpiricalCovariance
+__all__ = ["EmpiricalCovariance"]

sklearnex/spmd/covariance/covariance.py ADDED Viewed

@@ -0,0 +1,21 @@
+# ==============================================================================
+# Copyright 2024 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ==============================================================================
+from onedal.spmd.covariance import EmpiricalCovariance
+# TODO:
+# Currently it uses `onedal` module interface.
+# Add sklearnex dispatching.