scikit-learn-intelex 2024.3.0__py39-none-manylinux1_x86_64.whl → 2024.5.0__py39-none-manylinux1_x86_64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release: this version of scikit-learn-intelex might be problematic.
Files changed (43)
  1. {scikit_learn_intelex-2024.3.0.dist-info → scikit_learn_intelex-2024.5.0.dist-info}/METADATA +2 -2
  2. {scikit_learn_intelex-2024.3.0.dist-info → scikit_learn_intelex-2024.5.0.dist-info}/RECORD +43 -37
  3. sklearnex/_device_offload.py +39 -5
  4. sklearnex/basic_statistics/__init__.py +2 -1
  5. sklearnex/basic_statistics/incremental_basic_statistics.py +288 -0
  6. sklearnex/basic_statistics/tests/test_incremental_basic_statistics.py +384 -0
  7. sklearnex/covariance/incremental_covariance.py +217 -30
  8. sklearnex/covariance/tests/test_incremental_covariance.py +54 -17
  9. sklearnex/decomposition/pca.py +71 -19
  10. sklearnex/decomposition/tests/test_pca.py +2 -2
  11. sklearnex/dispatcher.py +33 -2
  12. sklearnex/ensemble/_forest.py +73 -79
  13. sklearnex/linear_model/__init__.py +5 -3
  14. sklearnex/linear_model/incremental_linear.py +387 -0
  15. sklearnex/linear_model/linear.py +275 -340
  16. sklearnex/linear_model/logistic_regression.py +50 -9
  17. sklearnex/linear_model/tests/test_incremental_linear.py +200 -0
  18. sklearnex/linear_model/tests/test_linear.py +40 -5
  19. sklearnex/neighbors/_lof.py +53 -36
  20. sklearnex/neighbors/common.py +4 -1
  21. sklearnex/neighbors/knn_classification.py +37 -122
  22. sklearnex/neighbors/knn_regression.py +10 -117
  23. sklearnex/neighbors/knn_unsupervised.py +6 -78
  24. sklearnex/neighbors/tests/test_neighbors.py +2 -2
  25. sklearnex/preview/cluster/k_means.py +5 -73
  26. sklearnex/preview/covariance/covariance.py +6 -5
  27. sklearnex/preview/covariance/tests/test_covariance.py +18 -5
  28. sklearnex/svm/_common.py +4 -7
  29. sklearnex/svm/nusvc.py +66 -50
  30. sklearnex/svm/nusvr.py +3 -49
  31. sklearnex/svm/svc.py +66 -51
  32. sklearnex/svm/svr.py +3 -49
  33. sklearnex/tests/_utils.py +34 -16
  34. sklearnex/tests/test_memory_usage.py +5 -1
  35. sklearnex/tests/test_n_jobs_support.py +12 -2
  36. sklearnex/tests/test_patching.py +87 -58
  37. sklearnex/tests/test_run_to_run_stability_tests.py +1 -1
  38. sklearnex/utils/__init__.py +2 -1
  39. sklearnex/utils/_namespace.py +97 -0
  40. sklearnex/utils/tests/test_finite.py +89 -0
  41. {scikit_learn_intelex-2024.3.0.dist-info → scikit_learn_intelex-2024.5.0.dist-info}/LICENSE.txt +0 -0
  42. {scikit_learn_intelex-2024.3.0.dist-info → scikit_learn_intelex-2024.5.0.dist-info}/WHEEL +0 -0
  43. {scikit_learn_intelex-2024.3.0.dist-info → scikit_learn_intelex-2024.5.0.dist-info}/top_level.txt +0 -0
sklearnex/linear_model/logistic_regression.py
@@ -38,19 +38,27 @@ if daal_check_version((2024, "P", 1)):
     import numpy as np
     from scipy.sparse import issparse
     from sklearn.linear_model import LogisticRegression as sklearn_LogisticRegression
+    from sklearn.metrics import accuracy_score
+    from sklearn.utils.multiclass import type_of_target
     from sklearn.utils.validation import check_X_y
 
     from daal4py.sklearn._n_jobs_support import control_n_jobs
     from daal4py.sklearn._utils import sklearn_check_version
     from onedal.linear_model import LogisticRegression as onedal_LogisticRegression
-    from onedal.utils import _num_features, _num_samples
+    from onedal.utils import _num_samples
 
     from .._device_offload import dispatch, wrap_output_data
     from .._utils import PatchingConditionsChain, get_patch_message
     from ..utils.validation import _assert_all_finite
 
     @control_n_jobs(
-        decorated_methods=["fit", "predict", "predict_proba", "predict_log_proba"]
+        decorated_methods=[
+            "fit",
+            "predict",
+            "predict_proba",
+            "predict_log_proba",
+            "score",
+        ]
     )
     class LogisticRegression(sklearn_LogisticRegression, BaseLogisticRegression):
         __doc__ = sklearn_LogisticRegression.__doc__
@@ -72,9 +80,9 @@ if daal_check_version((2024, "P", 1)):
             intercept_scaling=1,
             class_weight=None,
             random_state=None,
-            solver="lbfgs" if sklearn_check_version("0.22") else "liblinear",
+            solver="lbfgs",
             max_iter=100,
-            multi_class="auto" if sklearn_check_version("0.22") else "ovr",
+            multi_class="auto",
             verbose=0,
             warm_start=False,
             n_jobs=None,
@@ -160,6 +168,27 @@ if daal_check_version((2024, "P", 1)):
                 X,
             )
 
+        @wrap_output_data
+        def score(self, X, y, sample_weight=None):
+            if sklearn_check_version("1.0"):
+                self._check_feature_names(X, reset=False)
+            return dispatch(
+                self,
+                "score",
+                {
+                    "onedal": self.__class__._onedal_score,
+                    "sklearn": sklearn_LogisticRegression.score,
+                },
+                X,
+                y,
+                sample_weight=sample_weight,
+            )
+
+        def _onedal_score(self, X, y, sample_weight=None, queue=None):
+            return accuracy_score(
+                y, self._onedal_predict(X, queue=queue), sample_weight=sample_weight
+            )
+
         def _test_type_and_finiteness(self, X_in):
             X = np.asarray(X_in)
 
@@ -198,6 +227,10 @@ if daal_check_version((2024, "P", 1)):
                     (self.warm_start == False, "Warm start is not supported."),
                     (self.l1_ratio is None, "l1 ratio is not supported."),
                     (sample_weight is None, "Sample weight is not supported."),
+                    (
+                        type_of_target(y) == "binary",
+                        "Only binary classification is supported",
+                    ),
                 ]
             )
 
@@ -216,22 +249,29 @@ if daal_check_version((2024, "P", 1)):
             return patching_status
 
         def _onedal_gpu_predict_supported(self, method_name, *data):
-            assert method_name in ["predict", "predict_proba", "predict_log_proba"]
-            assert len(data) == 1
+            assert method_name in [
+                "predict",
+                "predict_proba",
+                "predict_log_proba",
+                "score",
+            ]
 
             class_name = self.__class__.__name__
             patching_status = PatchingConditionsChain(
                 f"sklearn.linear_model.{class_name}.{method_name}"
             )
 
-            n_samples = _num_samples(*data)
+            n_samples = _num_samples(data[0])
             model_is_sparse = issparse(self.coef_) or (
                 self.fit_intercept and issparse(self.intercept_)
             )
             dal_ready = patching_status.and_conditions(
                 [
                     (n_samples > 0, "Number of samples is less than 1."),
-                    (not issparse(*data), "Sparse input is not supported."),
+                    (
+                        not any([issparse(i) for i in data]),
+                        "Sparse input is not supported.",
+                    ),
                     (not model_is_sparse, "Sparse coefficients are not supported."),
                     (
                         hasattr(self, "_onedal_estimator"),
@@ -251,7 +291,7 @@ if daal_check_version((2024, "P", 1)):
         def _onedal_gpu_supported(self, method_name, *data):
             if method_name == "fit":
                 return self._onedal_gpu_fit_supported(method_name, *data)
-            if method_name in ["predict", "predict_proba", "predict_log_proba"]:
+            if method_name in ["predict", "predict_proba", "predict_log_proba", "score"]:
                 return self._onedal_gpu_predict_supported(method_name, *data)
             raise RuntimeError(
                 f"Unknown method {method_name} in {self.__class__.__name__}"
@@ -334,6 +374,7 @@ if daal_check_version((2024, "P", 1)):
         predict.__doc__ = sklearn_LogisticRegression.predict.__doc__
         predict_proba.__doc__ = sklearn_LogisticRegression.predict_proba.__doc__
         predict_log_proba.__doc__ = sklearn_LogisticRegression.predict_log_proba.__doc__
+        score.__doc__ = sklearn_LogisticRegression.score.__doc__
 
 else:
     LogisticRegression = LogisticRegression_daal4py
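
Taken together, the logistic_regression.py hunks add a dispatched score method. The assert len(data) == 1 is dropped because score passes both X and y, which is also why the GPU checks switch to _num_samples(data[0]) and any([issparse(i) for i in data]). A minimal usage sketch, assuming scikit-learn-intelex 2024.5.0; the config_context(target_offload=...) line needs dpctl and a SYCL GPU, so drop the context manager on CPU-only machines:

import numpy as np

from sklearnex import config_context
from sklearnex.linear_model import LogisticRegression

rng = np.random.default_rng(0)
X = rng.random((200, 4))
y = (X[:, 0] > 0.5).astype(int)  # binary target, the only case oneDAL accepts on GPU

clf = LogisticRegression(solver="lbfgs").fit(X, y)

# score() is now routed through dispatch(); on the oneDAL branch it is
# accuracy_score over _onedal_predict, so evaluation stays on the device.
with config_context(target_offload="gpu:0"):
    print(clf.score(X, y))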
sklearnex/linear_model/tests/test_incremental_linear.py (new file)
@@ -0,0 +1,200 @@
+# ===============================================================================
+# Copyright 2024 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ===============================================================================
+
+import numpy as np
+import pytest
+from numpy.testing import assert_allclose
+
+from onedal.tests.utils._dataframes_support import (
+    _as_numpy,
+    _convert_to_dataframe,
+    get_dataframes_and_queues,
+)
+from sklearnex.linear_model import IncrementalLinearRegression
+
+
+@pytest.mark.parametrize("dataframe,queue", get_dataframes_and_queues())
+@pytest.mark.parametrize("fit_intercept", [True, False])
+@pytest.mark.parametrize("macro_block", [None, 1024])
+@pytest.mark.parametrize("dtype", [np.float32, np.float64])
+def test_sklearnex_fit_on_gold_data(dataframe, queue, fit_intercept, macro_block, dtype):
+    X = np.array([[1], [2]])
+    X = X.astype(dtype=dtype)
+    X_df = _convert_to_dataframe(X, sycl_queue=queue, target_df=dataframe)
+    y = np.array([1, 2])
+    y = y.astype(dtype=dtype)
+    y_df = _convert_to_dataframe(y, sycl_queue=queue, target_df=dataframe)
+
+    inclin = IncrementalLinearRegression(fit_intercept=fit_intercept)
+    if macro_block is not None:
+        hparams = inclin.get_hyperparameters("fit")
+        hparams.cpu_macro_block = macro_block
+        hparams.gpu_macro_block = macro_block
+    inclin.fit(X_df, y_df)
+
+    y_pred = inclin.predict(X_df)
+
+    tol = 2e-6 if dtype == np.float32 else 1e-7
+    assert_allclose(inclin.coef_, [1], atol=tol)
+    if fit_intercept:
+        assert_allclose(inclin.intercept_, [0], atol=tol)
+    assert_allclose(_as_numpy(y_pred), y, atol=tol)
+
+
+@pytest.mark.parametrize("dataframe,queue", get_dataframes_and_queues())
+@pytest.mark.parametrize("fit_intercept", [True, False])
+@pytest.mark.parametrize("macro_block", [None, 1024])
+@pytest.mark.parametrize("dtype", [np.float32, np.float64])
+def test_sklearnex_partial_fit_on_gold_data(
+    dataframe, queue, fit_intercept, macro_block, dtype
+):
+    X = np.array([[1], [2], [3], [4]])
+    X = X.astype(dtype=dtype)
+    y = X + 3
+    y = y.astype(dtype=dtype)
+    X_split = np.array_split(X, 2)
+    y_split = np.array_split(y, 2)
+
+    inclin = IncrementalLinearRegression()
+    if macro_block is not None:
+        hparams = inclin.get_hyperparameters("fit")
+        hparams.cpu_macro_block = macro_block
+        hparams.gpu_macro_block = macro_block
+    for i in range(2):
+        X_split_df = _convert_to_dataframe(
+            X_split[i], sycl_queue=queue, target_df=dataframe
+        )
+        y_split_df = _convert_to_dataframe(
+            y_split[i], sycl_queue=queue, target_df=dataframe
+        )
+        inclin.partial_fit(X_split_df, y_split_df)
+
+    assert inclin.n_features_in_ == 1
+    tol = 2e-6 if dtype == np.float32 else 1e-7
+    assert_allclose(inclin.coef_, [[1]], atol=tol)
+    if fit_intercept:
+        assert_allclose(inclin.intercept_, 3, atol=tol)
+
+    X_df = _convert_to_dataframe(X, sycl_queue=queue, target_df=dataframe)
+    y_pred = inclin.predict(X_df)
+
+    assert_allclose(_as_numpy(y_pred), y, atol=tol)
+
+
+@pytest.mark.parametrize("dataframe,queue", get_dataframes_and_queues())
+@pytest.mark.parametrize("fit_intercept", [True, False])
+@pytest.mark.parametrize("macro_block", [None, 1024])
+@pytest.mark.parametrize("dtype", [np.float32, np.float64])
+def test_sklearnex_partial_fit_multitarget_on_gold_data(
+    dataframe, queue, fit_intercept, macro_block, dtype
+):
+    X = np.array([[1, 1], [1, 2], [2, 2], [2, 3]])
+    X = X.astype(dtype=dtype)
+    y = np.dot(X, [1, 2]) + 3
+    y = y.astype(dtype=dtype)
+    X_split = np.array_split(X, 2)
+    y_split = np.array_split(y, 2)
+
+    inclin = IncrementalLinearRegression()
+    if macro_block is not None:
+        hparams = inclin.get_hyperparameters("fit")
+        hparams.cpu_macro_block = macro_block
+        hparams.gpu_macro_block = macro_block
+    for i in range(2):
+        X_split_df = _convert_to_dataframe(
+            X_split[i], sycl_queue=queue, target_df=dataframe
+        )
+        y_split_df = _convert_to_dataframe(
+            y_split[i], sycl_queue=queue, target_df=dataframe
+        )
+        inclin.partial_fit(X_split_df, y_split_df)
+
+    assert inclin.n_features_in_ == 2
+    tol = 7e-6 if dtype == np.float32 else 1e-7
+    assert_allclose(inclin.coef_, [1.0, 2.0], atol=tol)
+    if fit_intercept:
+        assert_allclose(inclin.intercept_, 3.0, atol=tol)
+
+    X_df = _convert_to_dataframe(X, sycl_queue=queue, target_df=dataframe)
+    y_pred = inclin.predict(X_df)
+
+    assert_allclose(_as_numpy(y_pred), y, atol=tol)
+
+
+@pytest.mark.parametrize("dataframe,queue", get_dataframes_and_queues())
+@pytest.mark.parametrize("fit_intercept", [True, False])
+@pytest.mark.parametrize("num_samples", [100, 1000])
+@pytest.mark.parametrize("num_features", [5, 10])
+@pytest.mark.parametrize("num_targets", [1, 2])
+@pytest.mark.parametrize("num_blocks", [1, 10])
+@pytest.mark.parametrize("macro_block", [None, 1024])
+@pytest.mark.parametrize("dtype", [np.float32, np.float64])
+def test_sklearnex_partial_fit_on_random_data(
+    dataframe,
+    queue,
+    fit_intercept,
+    num_samples,
+    num_features,
+    num_targets,
+    num_blocks,
+    macro_block,
+    dtype,
+):
+    seed = 42
+    gen = np.random.default_rng(seed)
+    intercept = gen.random(size=num_targets, dtype=dtype)
+    coef = gen.random(size=(num_targets, num_features), dtype=dtype).T
+
+    X = gen.random(size=(num_samples, num_features), dtype=dtype)
+    if fit_intercept:
+        y = X @ coef + intercept[np.newaxis, :]
+    else:
+        y = X @ coef
+
+    X_split = np.array_split(X, num_blocks)
+    y_split = np.array_split(y, num_blocks)
+
+    inclin = IncrementalLinearRegression(fit_intercept=fit_intercept)
+    if macro_block is not None:
+        hparams = inclin.get_hyperparameters("fit")
+        hparams.cpu_macro_block = macro_block
+        hparams.gpu_macro_block = macro_block
+    for i in range(num_blocks):
+        X_split_df = _convert_to_dataframe(
+            X_split[i], sycl_queue=queue, target_df=dataframe
+        )
+        y_split_df = _convert_to_dataframe(
+            y_split[i], sycl_queue=queue, target_df=dataframe
+        )
+        inclin.partial_fit(X_split_df, y_split_df)
+
+    tol = 1e-4 if dtype == np.float32 else 1e-7
+    assert_allclose(coef, inclin.coef_.T, atol=tol)
+
+    if fit_intercept:
+        assert_allclose(intercept, inclin.intercept_, atol=tol)
+
+    X_test = gen.random(size=(num_samples, num_features), dtype=dtype)
+    if fit_intercept:
+        expected_y_pred = X_test @ coef + intercept[np.newaxis, :]
+    else:
+        expected_y_pred = X_test @ coef
+
+    X_test_df = _convert_to_dataframe(X_test, sycl_queue=queue, target_df=dataframe)
+
+    y_pred = inclin.predict(X_test_df)
+
+    assert_allclose(expected_y_pred, _as_numpy(y_pred), atol=tol)
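
The file above exercises the new IncrementalLinearRegression estimator (sklearnex/linear_model/incremental_linear.py, +387 lines in this release). Stripped of the dataframe/queue test harness, the streaming pattern it validates looks roughly like this; a sketch assuming only the partial_fit/predict surface shown in the tests:

import numpy as np

from sklearnex.linear_model import IncrementalLinearRegression

gen = np.random.default_rng(42)
X = gen.random((1000, 5))
y = X @ gen.random(5) + 3.0

inclin = IncrementalLinearRegression(fit_intercept=True)
for X_batch, y_batch in zip(np.array_split(X, 10), np.array_split(y, 10)):
    inclin.partial_fit(X_batch, y_batch)  # each block updates the partial result

# Recovers the generating coefficients and the 3.0 intercept.
print(inclin.coef_, inclin.intercept_)
print(inclin.predict(X[:5]))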
sklearnex/linear_model/tests/test_linear.py
@@ -28,26 +28,33 @@ from onedal.tests.utils._dataframes_support import (
 
 
 @pytest.mark.parametrize("dataframe,queue", get_dataframes_and_queues())
+@pytest.mark.parametrize("dtype", [np.float32, np.float64])
 @pytest.mark.parametrize("macro_block", [None, 1024])
-def test_sklearnex_import_linear(dataframe, queue, macro_block):
+def test_sklearnex_import_linear(dataframe, queue, dtype, macro_block):
     from sklearnex.linear_model import LinearRegression
 
     X = np.array([[1, 1], [1, 2], [2, 2], [2, 3]])
     y = np.dot(X, np.array([1, 2])) + 3
+    X = X.astype(dtype=dtype)
+    y = y.astype(dtype=dtype)
     X = _convert_to_dataframe(X, sycl_queue=queue, target_df=dataframe)
     y = _convert_to_dataframe(y, sycl_queue=queue, target_df=dataframe)
+
     linreg = LinearRegression()
     if daal_check_version((2024, "P", 0)) and macro_block is not None:
         hparams = linreg.get_hyperparameters("fit")
         hparams.cpu_macro_block = macro_block
         hparams.gpu_macro_block = macro_block
+
     linreg.fit(X, y)
-    if daal_check_version((2023, "P", 100)):
-        assert hasattr(linreg, "_onedal_estimator")
+
+    assert hasattr(linreg, "_onedal_estimator")
     assert "sklearnex" in linreg.__module__
     assert linreg.n_features_in_ == 2
-    assert_allclose(_as_numpy(linreg.intercept_), 3.0)
-    assert_allclose(_as_numpy(linreg.coef_), [1.0, 2.0])
+
+    tol = 1e-5 if dtype == np.float32 else 1e-7
+    assert_allclose(_as_numpy(linreg.intercept_), 3.0, rtol=tol)
+    assert_allclose(_as_numpy(linreg.coef_), [1.0, 2.0], rtol=tol)
 
 
 def test_sklearnex_import_ridge():
@@ -80,3 +87,31 @@ def test_sklearnex_import_elastic():
     assert "daal4py" in elasticnet.__module__
     assert_allclose(elasticnet.intercept_, 1.451, atol=1e-3)
     assert_allclose(elasticnet.coef_, [18.838, 64.559], atol=1e-3)
+
+
+@pytest.mark.parametrize("dataframe,queue", get_dataframes_and_queues())
+@pytest.mark.parametrize("dtype", [np.float32, np.float64])
+def test_sklearnex_reconstruct_model(dataframe, queue, dtype):
+    from sklearnex.linear_model import LinearRegression
+
+    seed = 42
+    num_samples = 3500
+    num_features, num_targets = 14, 9
+
+    gen = np.random.default_rng(seed)
+    intercept = gen.random(size=num_targets, dtype=dtype)
+    coef = gen.random(size=(num_targets, num_features), dtype=dtype).T
+
+    X = gen.random(size=(num_samples, num_features), dtype=dtype)
+    gtr = X @ coef + intercept[np.newaxis, :]
+
+    X = _convert_to_dataframe(X, sycl_queue=queue, target_df=dataframe)
+
+    linreg = LinearRegression(fit_intercept=True)
+    linreg.coef_ = coef.T
+    linreg.intercept_ = intercept
+
+    y_pred = linreg.predict(X)
+
+    tol = 1e-5 if dtype == np.float32 else 1e-7
+    assert_allclose(gtr, _as_numpy(y_pred), rtol=tol)
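
test_sklearnex_reconstruct_model checks a less obvious property: predict works on an estimator that was never fitted, as long as coef_ and intercept_ are assigned by hand. In isolation that pattern looks like the sketch below (single target for brevity; assumes the patched predict path accepts hand-assigned attributes, which is what the test asserts for the multi-target case):

import numpy as np

from sklearnex.linear_model import LinearRegression

linreg = LinearRegression(fit_intercept=True)
linreg.coef_ = np.array([1.0, 2.0])  # fit() is never called
linreg.intercept_ = 3.0

print(linreg.predict(np.array([[1.0, 1.0], [2.0, 3.0]])))  # [6. 11.]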
sklearnex/neighbors/_lof.py
@@ -23,13 +23,13 @@ from sklearn.utils.validation import check_is_fitted
 
 from daal4py.sklearn._n_jobs_support import control_n_jobs
 from daal4py.sklearn._utils import sklearn_check_version
+from sklearnex._device_offload import dispatch, wrap_output_data
+from sklearnex.neighbors.common import KNeighborsDispatchingBase
+from sklearnex.neighbors.knn_unsupervised import NearestNeighbors
+from sklearnex.utils import get_namespace
 
-from .._device_offload import dispatch, wrap_output_data
-from .common import KNeighborsDispatchingBase
-from .knn_unsupervised import NearestNeighbors
 
-
-@control_n_jobs(decorated_methods=["fit", "kneighbors"])
+@control_n_jobs(decorated_methods=["fit", "_kneighbors"])
 class LocalOutlierFactor(KNeighborsDispatchingBase, sklearn_LocalOutlierFactor):
     __doc__ = (
         sklearn_LocalOutlierFactor.__doc__
@@ -100,7 +100,6 @@ class LocalOutlierFactor(KNeighborsDispatchingBase, sklearn_LocalOutlierFactor):
         return self
 
     def fit(self, X, y=None):
-        self._fit_validation(X, y)
         result = dispatch(
             self,
             "fit",
@@ -113,16 +112,13 @@ class LocalOutlierFactor(KNeighborsDispatchingBase, sklearn_LocalOutlierFactor):
         )
         return result
 
-    # Subtle order change to remove check_array and preserve dpnp and
-    # dpctl conformance. decision_function will return a dpnp or dpctl
-    # instance via kneighbors and an equivalent check_array exists in
-    # that call already in sklearn so no loss of functionality occurs
     def _predict(self, X=None):
         check_is_fitted(self)
 
         if X is not None:
+            xp, _ = get_namespace(X)
             output = self.decision_function(X) < 0
-            is_inlier = np.ones(output.shape[0], dtype=int)
+            is_inlier = xp.ones_like(output, dtype=int)
             is_inlier[output] = -1
         else:
             is_inlier = np.ones(self.n_samples_fit_, dtype=int)
@@ -159,16 +155,40 @@ class LocalOutlierFactor(KNeighborsDispatchingBase, sklearn_LocalOutlierFactor):
         """
         return self.fit(X)._predict()
 
-    @available_if(sklearn_LocalOutlierFactor._check_novelty_predict)
+    def _kneighbors(self, X=None, n_neighbors=None, return_distance=True):
+        check_is_fitted(self)
+        if sklearn_check_version("1.0") and X is not None:
+            self._check_feature_names(X, reset=False)
+        return dispatch(
+            self,
+            "kneighbors",
+            {
+                "onedal": self.__class__._onedal_kneighbors,
+                "sklearn": sklearn_LocalOutlierFactor.kneighbors,
+            },
+            X,
+            n_neighbors=n_neighbors,
+            return_distance=return_distance,
+        )
+
+    kneighbors = wrap_output_data(_kneighbors)
+
+    @available_if(sklearn_LocalOutlierFactor._check_novelty_score_samples)
     @wrap_output_data
-    def predict(self, X=None):
-        """Predict the labels (1 inlier, -1 outlier) of X according to LOF.
+    def score_samples(self, X):
+        """Opposite of the Local Outlier Factor of X.
+
+        It is the opposite as bigger is better, i.e. large values correspond
+        to inliers.
 
         **Only available for novelty detection (when novelty is set to True).**
-        This method allows to generalize prediction to *new observations* (not
-        in the training set). Note that the result of ``clf.fit(X)`` then
-        ``clf.predict(X)`` with ``novelty=True`` may differ from the result
-        obtained by ``clf.fit_predict(X)`` with ``novelty=False``.
+        The argument X is supposed to contain *new data*: if X contains a
+        point from training, it considers the later in its own neighborhood.
+        Also, the samples in X are not considered in the neighborhood of any
+        point. Because of this, the scores obtained via ``score_samples`` may
+        differ from the standard LOF scores.
+        The standard LOF scores for the training data is available via the
+        ``negative_outlier_factor_`` attribute.
 
         Parameters
         ----------
@@ -178,27 +198,24 @@ class LocalOutlierFactor(KNeighborsDispatchingBase, sklearn_LocalOutlierFactor):
 
         Returns
         -------
-        is_inlier : ndarray of shape (n_samples,)
-            Returns -1 for anomalies/outliers and +1 for inliers.
+        opposite_lof_scores : ndarray of shape (n_samples,)
+            The opposite of the Local Outlier Factor of each input samples.
+            The lower, the more abnormal.
         """
-        return self._predict(X)
-
-    @wrap_output_data
-    def kneighbors(self, X=None, n_neighbors=None, return_distance=True):
         check_is_fitted(self)
-        if sklearn_check_version("1.0") and X is not None:
-            self._check_feature_names(X, reset=False)
-        return dispatch(
-            self,
-            "kneighbors",
-            {
-                "onedal": self.__class__._onedal_kneighbors,
-                "sklearn": sklearn_LocalOutlierFactor.kneighbors,
-            },
-            X,
-            n_neighbors=n_neighbors,
-            return_distance=return_distance,
+
+        distances_X, neighbors_indices_X = self._kneighbors(
+            X, n_neighbors=self.n_neighbors_
         )
 
+        X_lrd = self._local_reachability_density(
+            distances_X,
+            neighbors_indices_X,
+        )
+
+        lrd_ratios_array = self._lrd[neighbors_indices_X] / X_lrd[:, np.newaxis]
+
+        return -np.mean(lrd_ratios_array, axis=1)
+
     fit.__doc__ = sklearn_LocalOutlierFactor.fit.__doc__
     kneighbors.__doc__ = sklearn_LocalOutlierFactor.kneighbors.__doc__
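
The net effect of the _lof.py hunks: kneighbors dispatching moves into a private _kneighbors (so control_n_jobs decorates the unwrapped body), fit validation moves into the dispatcher (see the common.py hunks below), and a dispatched score_samples is added for the novelty path. A short sketch of that novelty usage, assuming scikit-learn-intelex 2024.5.0:

import numpy as np

from sklearnex.neighbors import LocalOutlierFactor

gen = np.random.default_rng(0)
X_train = gen.normal(size=(500, 2))
X_new = np.vstack([gen.normal(size=(5, 2)), [[8.0, 8.0]]])  # last row is far out

lof = LocalOutlierFactor(n_neighbors=20, novelty=True).fit(X_train)
# score_samples now reuses the dispatched _kneighbors; it returns the
# opposite LOF, so the outlying last row gets a much more negative score.
print(lof.score_samples(X_new))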
sklearnex/neighbors/common.py
@@ -137,6 +137,9 @@ class KNeighborsDispatchingBase:
             self.n_features_in_ = X.data.shape[1]
 
     def _onedal_supported(self, device, method_name, *data):
+        if method_name == "fit":
+            self._fit_validation(data[0], data[1])
+
         class_name = self.__class__.__name__
         is_classifier = "Classifier" in class_name
         is_regressor = "Regressor" in class_name
@@ -249,7 +252,7 @@ class KNeighborsDispatchingBase:
                 class_count >= 2, "One-class case is not supported."
             )
             return patching_status
-        if method_name in ["predict", "predict_proba", "kneighbors"]:
+        if method_name in ["predict", "predict_proba", "kneighbors", "score"]:
            patching_status.and_condition(
                hasattr(self, "_onedal_estimator"), "oneDAL model was not trained."
            )
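
With "score" added to the dispatchable method list in KNeighborsDispatchingBase, score calls on the patched neighbors estimators can stay on the oneDAL branch once a model is trained. A hedged sketch; whether score itself is dispatched depends on the estimator, and KNeighborsClassifier.score computes plain accuracy either way:

import numpy as np

from sklearnex.neighbors import KNeighborsClassifier

gen = np.random.default_rng(0)
X = gen.random((300, 3))
y = (X.sum(axis=1) > 1.5).astype(int)

knn = KNeighborsClassifier(n_neighbors=5).fit(X, y)
print(knn.score(X, y))  # evaluated against the oneDAL-trained model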