scikit-learn-intelex 2025.1.0__py39-none-manylinux_2_28_x86_64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of scikit-learn-intelex might be problematic. Click here for more details.

Files changed (280) hide show
  1. daal4py/__init__.py +73 -0
  2. daal4py/__main__.py +58 -0
  3. daal4py/_daal4py.cpython-39-x86_64-linux-gnu.so +0 -0
  4. daal4py/doc/third-party-programs.txt +424 -0
  5. daal4py/mb/__init__.py +19 -0
  6. daal4py/mb/model_builders.py +377 -0
  7. daal4py/mpi_transceiver.cpython-39-x86_64-linux-gnu.so +0 -0
  8. daal4py/sklearn/__init__.py +40 -0
  9. daal4py/sklearn/_n_jobs_support.py +248 -0
  10. daal4py/sklearn/_utils.py +245 -0
  11. daal4py/sklearn/cluster/__init__.py +20 -0
  12. daal4py/sklearn/cluster/dbscan.py +165 -0
  13. daal4py/sklearn/cluster/k_means.py +597 -0
  14. daal4py/sklearn/cluster/tests/test_dbscan.py +109 -0
  15. daal4py/sklearn/decomposition/__init__.py +19 -0
  16. daal4py/sklearn/decomposition/_pca.py +524 -0
  17. daal4py/sklearn/ensemble/AdaBoostClassifier.py +196 -0
  18. daal4py/sklearn/ensemble/GBTDAAL.py +337 -0
  19. daal4py/sklearn/ensemble/__init__.py +27 -0
  20. daal4py/sklearn/ensemble/_forest.py +1397 -0
  21. daal4py/sklearn/ensemble/tests/test_decision_forest.py +206 -0
  22. daal4py/sklearn/linear_model/__init__.py +29 -0
  23. daal4py/sklearn/linear_model/_coordinate_descent.py +848 -0
  24. daal4py/sklearn/linear_model/_linear.py +272 -0
  25. daal4py/sklearn/linear_model/_ridge.py +325 -0
  26. daal4py/sklearn/linear_model/coordinate_descent.py +17 -0
  27. daal4py/sklearn/linear_model/linear.py +17 -0
  28. daal4py/sklearn/linear_model/logistic_loss.py +195 -0
  29. daal4py/sklearn/linear_model/logistic_path.py +1026 -0
  30. daal4py/sklearn/linear_model/ridge.py +17 -0
  31. daal4py/sklearn/linear_model/tests/test_linear.py +208 -0
  32. daal4py/sklearn/linear_model/tests/test_ridge.py +69 -0
  33. daal4py/sklearn/manifold/__init__.py +19 -0
  34. daal4py/sklearn/manifold/_t_sne.py +405 -0
  35. daal4py/sklearn/metrics/__init__.py +20 -0
  36. daal4py/sklearn/metrics/_pairwise.py +236 -0
  37. daal4py/sklearn/metrics/_ranking.py +210 -0
  38. daal4py/sklearn/model_selection/__init__.py +19 -0
  39. daal4py/sklearn/model_selection/_split.py +309 -0
  40. daal4py/sklearn/model_selection/tests/test_split.py +56 -0
  41. daal4py/sklearn/monkeypatch/__init__.py +0 -0
  42. daal4py/sklearn/monkeypatch/dispatcher.py +232 -0
  43. daal4py/sklearn/monkeypatch/tests/_models_info.py +161 -0
  44. daal4py/sklearn/monkeypatch/tests/test_monkeypatch.py +71 -0
  45. daal4py/sklearn/monkeypatch/tests/test_patching.py +90 -0
  46. daal4py/sklearn/monkeypatch/tests/utils/_launch_algorithms.py +117 -0
  47. daal4py/sklearn/neighbors/__init__.py +21 -0
  48. daal4py/sklearn/neighbors/_base.py +503 -0
  49. daal4py/sklearn/neighbors/_classification.py +139 -0
  50. daal4py/sklearn/neighbors/_regression.py +74 -0
  51. daal4py/sklearn/neighbors/_unsupervised.py +55 -0
  52. daal4py/sklearn/neighbors/tests/test_kneighbors.py +113 -0
  53. daal4py/sklearn/svm/__init__.py +19 -0
  54. daal4py/sklearn/svm/svm.py +734 -0
  55. daal4py/sklearn/utils/__init__.py +21 -0
  56. daal4py/sklearn/utils/base.py +75 -0
  57. daal4py/sklearn/utils/tests/test_utils.py +51 -0
  58. daal4py/sklearn/utils/validation.py +693 -0
  59. onedal/__init__.py +83 -0
  60. onedal/_config.py +54 -0
  61. onedal/_device_offload.py +222 -0
  62. onedal/_onedal_py_dpc.cpython-39-x86_64-linux-gnu.so +0 -0
  63. onedal/_onedal_py_host.cpython-39-x86_64-linux-gnu.so +0 -0
  64. onedal/_onedal_py_spmd_dpc.cpython-39-x86_64-linux-gnu.so +0 -0
  65. onedal/basic_statistics/__init__.py +20 -0
  66. onedal/basic_statistics/basic_statistics.py +107 -0
  67. onedal/basic_statistics/incremental_basic_statistics.py +160 -0
  68. onedal/basic_statistics/tests/test_basic_statistics.py +298 -0
  69. onedal/basic_statistics/tests/test_incremental_basic_statistics.py +196 -0
  70. onedal/cluster/__init__.py +27 -0
  71. onedal/cluster/dbscan.py +110 -0
  72. onedal/cluster/kmeans.py +564 -0
  73. onedal/cluster/kmeans_init.py +115 -0
  74. onedal/cluster/tests/test_dbscan.py +125 -0
  75. onedal/cluster/tests/test_kmeans.py +88 -0
  76. onedal/cluster/tests/test_kmeans_init.py +93 -0
  77. onedal/common/_base.py +38 -0
  78. onedal/common/_estimator_checks.py +47 -0
  79. onedal/common/_mixin.py +62 -0
  80. onedal/common/_policy.py +59 -0
  81. onedal/common/_spmd_policy.py +30 -0
  82. onedal/common/hyperparameters.py +125 -0
  83. onedal/common/tests/test_policy.py +76 -0
  84. onedal/covariance/__init__.py +20 -0
  85. onedal/covariance/covariance.py +125 -0
  86. onedal/covariance/incremental_covariance.py +146 -0
  87. onedal/covariance/tests/test_covariance.py +50 -0
  88. onedal/covariance/tests/test_incremental_covariance.py +122 -0
  89. onedal/datatypes/__init__.py +19 -0
  90. onedal/datatypes/_data_conversion.py +154 -0
  91. onedal/datatypes/tests/common.py +126 -0
  92. onedal/datatypes/tests/test_data.py +414 -0
  93. onedal/decomposition/__init__.py +20 -0
  94. onedal/decomposition/incremental_pca.py +204 -0
  95. onedal/decomposition/pca.py +186 -0
  96. onedal/decomposition/tests/test_incremental_pca.py +198 -0
  97. onedal/ensemble/__init__.py +29 -0
  98. onedal/ensemble/forest.py +727 -0
  99. onedal/ensemble/tests/test_random_forest.py +97 -0
  100. onedal/linear_model/__init__.py +27 -0
  101. onedal/linear_model/incremental_linear_model.py +258 -0
  102. onedal/linear_model/linear_model.py +329 -0
  103. onedal/linear_model/logistic_regression.py +249 -0
  104. onedal/linear_model/tests/test_incremental_linear_regression.py +168 -0
  105. onedal/linear_model/tests/test_incremental_ridge_regression.py +107 -0
  106. onedal/linear_model/tests/test_linear_regression.py +250 -0
  107. onedal/linear_model/tests/test_logistic_regression.py +95 -0
  108. onedal/linear_model/tests/test_ridge.py +95 -0
  109. onedal/neighbors/__init__.py +19 -0
  110. onedal/neighbors/neighbors.py +767 -0
  111. onedal/neighbors/tests/test_knn_classification.py +49 -0
  112. onedal/primitives/__init__.py +27 -0
  113. onedal/primitives/get_tree.py +25 -0
  114. onedal/primitives/kernel_functions.py +153 -0
  115. onedal/primitives/tests/test_kernel_functions.py +159 -0
  116. onedal/spmd/__init__.py +25 -0
  117. onedal/spmd/_base.py +30 -0
  118. onedal/spmd/basic_statistics/__init__.py +20 -0
  119. onedal/spmd/basic_statistics/basic_statistics.py +30 -0
  120. onedal/spmd/basic_statistics/incremental_basic_statistics.py +69 -0
  121. onedal/spmd/cluster/__init__.py +28 -0
  122. onedal/spmd/cluster/dbscan.py +23 -0
  123. onedal/spmd/cluster/kmeans.py +56 -0
  124. onedal/spmd/covariance/__init__.py +20 -0
  125. onedal/spmd/covariance/covariance.py +26 -0
  126. onedal/spmd/covariance/incremental_covariance.py +82 -0
  127. onedal/spmd/decomposition/__init__.py +20 -0
  128. onedal/spmd/decomposition/incremental_pca.py +117 -0
  129. onedal/spmd/decomposition/pca.py +26 -0
  130. onedal/spmd/ensemble/__init__.py +19 -0
  131. onedal/spmd/ensemble/forest.py +28 -0
  132. onedal/spmd/linear_model/__init__.py +21 -0
  133. onedal/spmd/linear_model/incremental_linear_model.py +97 -0
  134. onedal/spmd/linear_model/linear_model.py +30 -0
  135. onedal/spmd/linear_model/logistic_regression.py +38 -0
  136. onedal/spmd/neighbors/__init__.py +19 -0
  137. onedal/spmd/neighbors/neighbors.py +75 -0
  138. onedal/svm/__init__.py +19 -0
  139. onedal/svm/svm.py +556 -0
  140. onedal/svm/tests/test_csr_svm.py +351 -0
  141. onedal/svm/tests/test_nusvc.py +204 -0
  142. onedal/svm/tests/test_nusvr.py +210 -0
  143. onedal/svm/tests/test_svc.py +176 -0
  144. onedal/svm/tests/test_svr.py +243 -0
  145. onedal/tests/test_common.py +57 -0
  146. onedal/tests/utils/_dataframes_support.py +162 -0
  147. onedal/tests/utils/_device_selection.py +102 -0
  148. onedal/utils/__init__.py +49 -0
  149. onedal/utils/_array_api.py +81 -0
  150. onedal/utils/_dpep_helpers.py +56 -0
  151. onedal/utils/validation.py +440 -0
  152. scikit_learn_intelex-2025.1.0.dist-info/LICENSE.txt +202 -0
  153. scikit_learn_intelex-2025.1.0.dist-info/METADATA +231 -0
  154. scikit_learn_intelex-2025.1.0.dist-info/RECORD +280 -0
  155. scikit_learn_intelex-2025.1.0.dist-info/WHEEL +5 -0
  156. scikit_learn_intelex-2025.1.0.dist-info/top_level.txt +3 -0
  157. sklearnex/__init__.py +66 -0
  158. sklearnex/__main__.py +58 -0
  159. sklearnex/_config.py +116 -0
  160. sklearnex/_device_offload.py +126 -0
  161. sklearnex/_utils.py +132 -0
  162. sklearnex/basic_statistics/__init__.py +20 -0
  163. sklearnex/basic_statistics/basic_statistics.py +230 -0
  164. sklearnex/basic_statistics/incremental_basic_statistics.py +345 -0
  165. sklearnex/basic_statistics/tests/test_basic_statistics.py +270 -0
  166. sklearnex/basic_statistics/tests/test_incremental_basic_statistics.py +404 -0
  167. sklearnex/cluster/__init__.py +20 -0
  168. sklearnex/cluster/dbscan.py +197 -0
  169. sklearnex/cluster/k_means.py +395 -0
  170. sklearnex/cluster/tests/test_dbscan.py +38 -0
  171. sklearnex/cluster/tests/test_kmeans.py +159 -0
  172. sklearnex/conftest.py +82 -0
  173. sklearnex/covariance/__init__.py +19 -0
  174. sklearnex/covariance/incremental_covariance.py +398 -0
  175. sklearnex/covariance/tests/test_incremental_covariance.py +237 -0
  176. sklearnex/decomposition/__init__.py +19 -0
  177. sklearnex/decomposition/pca.py +425 -0
  178. sklearnex/decomposition/tests/test_pca.py +58 -0
  179. sklearnex/dispatcher.py +543 -0
  180. sklearnex/doc/third-party-programs.txt +424 -0
  181. sklearnex/ensemble/__init__.py +29 -0
  182. sklearnex/ensemble/_forest.py +2029 -0
  183. sklearnex/ensemble/tests/test_forest.py +135 -0
  184. sklearnex/glob/__main__.py +72 -0
  185. sklearnex/glob/dispatcher.py +101 -0
  186. sklearnex/linear_model/__init__.py +32 -0
  187. sklearnex/linear_model/coordinate_descent.py +30 -0
  188. sklearnex/linear_model/incremental_linear.py +482 -0
  189. sklearnex/linear_model/incremental_ridge.py +425 -0
  190. sklearnex/linear_model/linear.py +341 -0
  191. sklearnex/linear_model/logistic_regression.py +413 -0
  192. sklearnex/linear_model/ridge.py +24 -0
  193. sklearnex/linear_model/tests/test_incremental_linear.py +207 -0
  194. sklearnex/linear_model/tests/test_incremental_ridge.py +153 -0
  195. sklearnex/linear_model/tests/test_linear.py +167 -0
  196. sklearnex/linear_model/tests/test_logreg.py +134 -0
  197. sklearnex/manifold/__init__.py +19 -0
  198. sklearnex/manifold/t_sne.py +21 -0
  199. sklearnex/manifold/tests/test_tsne.py +26 -0
  200. sklearnex/metrics/__init__.py +23 -0
  201. sklearnex/metrics/pairwise.py +22 -0
  202. sklearnex/metrics/ranking.py +20 -0
  203. sklearnex/metrics/tests/test_metrics.py +39 -0
  204. sklearnex/model_selection/__init__.py +21 -0
  205. sklearnex/model_selection/split.py +22 -0
  206. sklearnex/model_selection/tests/test_model_selection.py +34 -0
  207. sklearnex/neighbors/__init__.py +27 -0
  208. sklearnex/neighbors/_lof.py +236 -0
  209. sklearnex/neighbors/common.py +310 -0
  210. sklearnex/neighbors/knn_classification.py +231 -0
  211. sklearnex/neighbors/knn_regression.py +207 -0
  212. sklearnex/neighbors/knn_unsupervised.py +178 -0
  213. sklearnex/neighbors/tests/test_neighbors.py +82 -0
  214. sklearnex/preview/__init__.py +17 -0
  215. sklearnex/preview/covariance/__init__.py +19 -0
  216. sklearnex/preview/covariance/covariance.py +138 -0
  217. sklearnex/preview/covariance/tests/test_covariance.py +66 -0
  218. sklearnex/preview/decomposition/__init__.py +19 -0
  219. sklearnex/preview/decomposition/incremental_pca.py +233 -0
  220. sklearnex/preview/decomposition/tests/test_incremental_pca.py +266 -0
  221. sklearnex/preview/linear_model/__init__.py +19 -0
  222. sklearnex/preview/linear_model/ridge.py +424 -0
  223. sklearnex/preview/linear_model/tests/test_ridge.py +102 -0
  224. sklearnex/spmd/__init__.py +25 -0
  225. sklearnex/spmd/basic_statistics/__init__.py +20 -0
  226. sklearnex/spmd/basic_statistics/basic_statistics.py +21 -0
  227. sklearnex/spmd/basic_statistics/incremental_basic_statistics.py +30 -0
  228. sklearnex/spmd/basic_statistics/tests/test_basic_statistics_spmd.py +107 -0
  229. sklearnex/spmd/basic_statistics/tests/test_incremental_basic_statistics_spmd.py +307 -0
  230. sklearnex/spmd/cluster/__init__.py +30 -0
  231. sklearnex/spmd/cluster/dbscan.py +50 -0
  232. sklearnex/spmd/cluster/kmeans.py +21 -0
  233. sklearnex/spmd/cluster/tests/test_dbscan_spmd.py +97 -0
  234. sklearnex/spmd/cluster/tests/test_kmeans_spmd.py +172 -0
  235. sklearnex/spmd/covariance/__init__.py +20 -0
  236. sklearnex/spmd/covariance/covariance.py +21 -0
  237. sklearnex/spmd/covariance/incremental_covariance.py +37 -0
  238. sklearnex/spmd/covariance/tests/test_covariance_spmd.py +107 -0
  239. sklearnex/spmd/covariance/tests/test_incremental_covariance_spmd.py +184 -0
  240. sklearnex/spmd/decomposition/__init__.py +20 -0
  241. sklearnex/spmd/decomposition/incremental_pca.py +30 -0
  242. sklearnex/spmd/decomposition/pca.py +21 -0
  243. sklearnex/spmd/decomposition/tests/test_incremental_pca_spmd.py +269 -0
  244. sklearnex/spmd/decomposition/tests/test_pca_spmd.py +128 -0
  245. sklearnex/spmd/ensemble/__init__.py +19 -0
  246. sklearnex/spmd/ensemble/forest.py +71 -0
  247. sklearnex/spmd/ensemble/tests/test_forest_spmd.py +265 -0
  248. sklearnex/spmd/linear_model/__init__.py +21 -0
  249. sklearnex/spmd/linear_model/incremental_linear_model.py +35 -0
  250. sklearnex/spmd/linear_model/linear_model.py +21 -0
  251. sklearnex/spmd/linear_model/logistic_regression.py +21 -0
  252. sklearnex/spmd/linear_model/tests/test_incremental_linear_spmd.py +329 -0
  253. sklearnex/spmd/linear_model/tests/test_linear_regression_spmd.py +145 -0
  254. sklearnex/spmd/linear_model/tests/test_logistic_regression_spmd.py +162 -0
  255. sklearnex/spmd/neighbors/__init__.py +19 -0
  256. sklearnex/spmd/neighbors/neighbors.py +25 -0
  257. sklearnex/spmd/neighbors/tests/test_neighbors_spmd.py +288 -0
  258. sklearnex/svm/__init__.py +29 -0
  259. sklearnex/svm/_common.py +339 -0
  260. sklearnex/svm/nusvc.py +371 -0
  261. sklearnex/svm/nusvr.py +170 -0
  262. sklearnex/svm/svc.py +399 -0
  263. sklearnex/svm/svr.py +167 -0
  264. sklearnex/svm/tests/test_svm.py +93 -0
  265. sklearnex/tests/test_common.py +390 -0
  266. sklearnex/tests/test_config.py +123 -0
  267. sklearnex/tests/test_memory_usage.py +379 -0
  268. sklearnex/tests/test_monkeypatch.py +276 -0
  269. sklearnex/tests/test_n_jobs_support.py +108 -0
  270. sklearnex/tests/test_parallel.py +48 -0
  271. sklearnex/tests/test_patching.py +385 -0
  272. sklearnex/tests/test_run_to_run_stability.py +321 -0
  273. sklearnex/tests/utils/__init__.py +44 -0
  274. sklearnex/tests/utils/base.py +371 -0
  275. sklearnex/tests/utils/spmd.py +198 -0
  276. sklearnex/utils/__init__.py +19 -0
  277. sklearnex/utils/_array_api.py +82 -0
  278. sklearnex/utils/parallel.py +59 -0
  279. sklearnex/utils/tests/test_finite.py +89 -0
  280. sklearnex/utils/validation.py +17 -0
sklearnex/__main__.py ADDED
@@ -0,0 +1,58 @@
1
+ # ==============================================================================
2
+ # Copyright 2021 Intel Corporation
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+ # ==============================================================================
16
+
17
+ import sys
18
+
19
+ from sklearnex import patch_sklearn
20
+
21
+
22
def _main():
    """Patch scikit-learn, then run the requested script or module.

    Command-line arguments are parsed from ``sys.argv``:

    * ``-m``   -- treat ``name`` as a module name instead of a file path.
    * ``name`` -- script path or module name to execute.
    * ``args`` -- everything after ``name``; forwarded to the target.

    If this module defines a global called ``"_" + name``, that callable is
    invoked with ``args`` and its result is returned. Otherwise the target is
    executed through :mod:`runpy` with ``run_name="__main__"`` and ``None``
    is returned.
    """
    import argparse

    cli = argparse.ArgumentParser(
        prog="python -m sklearnex",
        description="""
            Run your Python script with Intel(R) Extension for
            scikit-learn, optimizing solvers of
            scikit-learn with Intel(R) oneAPI Data Analytics Library.
            """,
        formatter_class=argparse.ArgumentDefaultsHelpFormatter,
    )
    cli.add_argument(
        "-m", action="store_true", dest="module", help="Executes following as a module"
    )
    cli.add_argument("name", help="Script or module name")
    cli.add_argument("args", nargs=argparse.REMAINDER, help="Command line arguments")
    parsed = cli.parse_args()

    try:
        # The import is only a probe: patching is attempted solely when
        # scikit-learn itself can be imported.
        import sklearn  # noqa: F401

        patch_sklearn()
    except ImportError:
        print("Scikit-learn could not be imported. Nothing to patch")

    # Make the target see its own name and arguments, as if run directly.
    sys.argv = [parsed.name, *parsed.args]

    module_globals = globals()
    hook_name = "_" + parsed.name
    if hook_name in module_globals:
        return module_globals[hook_name](*parsed.args)

    import runpy

    if parsed.module:
        runpy.run_module(parsed.name, run_name="__main__")
    else:
        runpy.run_path(parsed.name, run_name="__main__")
56
+
57
+
58
+ sys.exit(_main())
sklearnex/_config.py ADDED
@@ -0,0 +1,116 @@
1
+ # ==============================================================================
2
+ # Copyright 2021 Intel Corporation
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+ # ==============================================================================
16
+
17
+ from contextlib import contextmanager
18
+ from os import environ
19
+
20
+ from sklearn import get_config as skl_get_config
21
+ from sklearn import set_config as skl_set_config
22
+
23
+ from daal4py.sklearn._utils import sklearn_check_version
24
+ from onedal._config import _get_config as onedal_get_config
25
+
26
+
27
def get_config():
    """Retrieve current values for configuration set by :func:`set_config`.

    The scikit-learn configuration and the oneDAL configuration are merged
    into a single new dictionary; on a key collision the oneDAL value wins.

    Returns
    -------
    config : dict
        Keys are parameter names that can be passed to :func:`set_config`.

    See Also
    --------
    config_context : Context manager for global configuration.
    set_config : Set global configuration.
    """
    merged = dict(skl_get_config())
    merged.update(onedal_get_config())
    return merged
41
+
42
+
43
def set_config(
    target_offload=None,
    allow_fallback_to_host=None,
    allow_sklearn_after_onedal=None,
    **sklearn_configs,
):
    """Set global configuration.

    Parameters
    ----------
    target_offload : string or dpctl.SyclQueue, default=None
        The device primarily used to perform computations.
        If string, expected to be "auto" (the execution context
        is deduced from input data location),
        or SYCL* filter selector string. Global default: "auto".
    allow_fallback_to_host : bool, default=None
        If True, allows to fallback computation to host device
        in case particular estimator does not support the selected one.
        Global default: False.
    allow_sklearn_after_onedal : bool, default=None
        If True, allows to fallback computation to sklearn after onedal
        backend in case of runtime error on onedal backend computations.
        Global default: True.
    **sklearn_configs
        Any remaining keyword arguments are forwarded unchanged to
        scikit-learn's own ``set_config``.

    Notes
    -----
    A value of ``None`` for one of the three named parameters leaves the
    corresponding setting untouched. When ``array_api_dispatch`` is passed
    with a truthy value and ``sklearn_check_version("1.6")`` holds, the
    environment variable ``SCIPY_ARRAY_API`` is set to ``"1"``.

    See Also
    --------
    config_context : Context manager for global configuration.
    get_config : Retrieve current values of the global configuration.
    """
    if sklearn_configs.get("array_api_dispatch", False) and sklearn_check_version(
        "1.6"
    ):
        environ["SCIPY_ARRAY_API"] = "1"

    skl_set_config(**sklearn_configs)

    # copy=False hands back the live configuration mapping, so the writes
    # below take effect globally.
    onedal_state = onedal_get_config(copy=False)

    requested = (
        ("target_offload", target_offload),
        ("allow_fallback_to_host", allow_fallback_to_host),
        ("allow_sklearn_after_onedal", allow_sklearn_after_onedal),
    )
    for option, value in requested:
        if value is not None:
            onedal_state[option] = value
85
+
86
+
87
@contextmanager
def config_context(**new_config):
    """Context manager for global scikit-learn configuration.

    Parameters
    ----------
    target_offload : string or dpctl.SyclQueue, default=None
        The device primarily used to perform computations.
        If string, expected to be "auto" (the execution context
        is deduced from input data location),
        or SYCL* filter selector string. Global default: "auto".
    allow_fallback_to_host : bool, default=None
        If True, allows to fallback computation to host device
        in case particular estimator does not support the selected one.
        Global default: False.
    allow_sklearn_after_onedal : bool, default=None
        If True, allows to fallback computation to sklearn after onedal
        backend in case of runtime error on onedal backend computations.
        Global default: True.
    **new_config
        All keyword arguments, including the ones above, are passed to
        :func:`set_config` on entry.

    Notes
    -----
    All settings, not just those presently modified, will be returned to
    their previous values when the context manager is exited.

    See Also
    --------
    set_config : Set global scikit-learn configuration.
    get_config : Retrieve current values of the global configuration.
    """
    # Snapshot first so the complete previous state can be reinstated.
    saved_config = get_config()
    set_config(**new_config)

    try:
        yield
    finally:
        set_config(**saved_config)
@@ -0,0 +1,126 @@
1
+ # ==============================================================================
2
+ # Copyright 2021 Intel Corporation
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+ # ==============================================================================
16
+
17
+ from functools import wraps
18
+
19
+ from onedal._device_offload import _copy_to_usm, _get_global_queue, _transfer_to_host
20
+ from onedal.utils._array_api import _asarray
21
+ from onedal.utils._dpep_helpers import dpnp_available
22
+
23
+ if dpnp_available:
24
+ import dpnp
25
+ from onedal.utils._array_api import _convert_to_dpnp
26
+
27
+ from ._config import get_config
28
+
29
+
30
def _get_backend(obj, queue, method_name, *data):
    """Choose the backend that should execute ``method_name`` for ``obj``.

    Parameters
    ----------
    obj : object
        Estimator exposing ``_onedal_cpu_supported`` and
        ``_onedal_gpu_supported``; each is called with ``method_name`` and
        ``*data`` and must return an object with a ``get_status()`` method.
    queue : object or None
        ``None`` or an object whose ``sycl_device`` has ``is_cpu`` and
        ``is_gpu`` attributes. ``None`` is treated as a CPU device.
    method_name : str
        Name of the estimator method being dispatched.
    *data
        Arguments forwarded to the support checks.

    Returns
    -------
    tuple
        ``(backend, queue, patching_status)`` where ``backend`` is
        ``"onedal"`` or ``"sklearn"``. The returned queue is ``None``
        whenever the computation falls back to scikit-learn or to the host.

    Raises
    ------
    RuntimeError
        If the queue's device is neither a CPU nor a GPU.
    """
    on_cpu = queue is None or queue.sycl_device.is_cpu
    on_gpu = queue is not None and queue.sycl_device.is_gpu

    if on_cpu:
        status = obj._onedal_cpu_supported(method_name, *data)
        if status.get_status():
            return "onedal", queue, status
        return "sklearn", None, status

    host_fallback_allowed = get_config()["allow_fallback_to_host"]

    if not on_gpu:
        raise RuntimeError("Device support is not implemented")

    status = obj._onedal_gpu_supported(method_name, *data)
    if status.get_status():
        return "onedal", queue, status
    if not host_fallback_allowed:
        return "sklearn", None, status

    # GPU path is unsupported but host fallback is permitted: retry on CPU.
    status = obj._onedal_cpu_supported(method_name, *data)
    if status.get_status():
        return "onedal", None, status
    return "sklearn", None, status
58
+
59
+
60
def dispatch(obj, method_name, branches, *args, **kwargs):
    """Run ``method_name`` of ``obj`` on the backend picked by ``_get_backend``.

    Parameters
    ----------
    obj : object
        Estimator instance; passed as the first argument to the branch.
    method_name : str
        Name of the method being dispatched (used for the support checks
        and for error reporting).
    branches : mapping
        Maps the backend names ``"onedal"`` and ``"sklearn"`` to callables.
    *args, **kwargs
        Call arguments. Host copies produced by ``_transfer_to_host`` are
        used for the support check and, in most cases, for the call itself.

    Returns
    -------
    object
        Whatever the selected branch returns.

    Raises
    ------
    RuntimeError
        If ``_get_backend`` reports a backend other than ``"onedal"`` or
        ``"sklearn"``.
    """
    queue = _get_global_queue()
    usm_in_args, queue, hostargs = _transfer_to_host(queue, *args)
    usm_in_kwargs, queue, hostvalues = _transfer_to_host(queue, *kwargs.values())
    hostkwargs = dict(zip(kwargs, hostvalues))

    backend, queue, patching_status = _get_backend(obj, queue, method_name, *hostargs)
    has_usm_data = usm_in_args or usm_in_kwargs

    if backend == "onedal":
        # Host args are only used before the onedal backend call.
        # Offloading to the device happens when the onedal backend is called.
        patching_status.write_log(queue=queue, transferred_to_host=False)
        return branches[backend](obj, *hostargs, **hostkwargs, queue=queue)

    if backend != "sklearn":
        raise RuntimeError(
            f"Undefined backend {backend} in " f"{obj.__class__.__name__}.{method_name}"
        )

    # USM ndarrays are excluded from the Array API fallback. Currently
    # DPNP.ndarray is not compliant with the Array API standard, and the DPCTL
    # usm_ndarray is compliant except for the linalg module, so there is no
    # guarantee that stock scikit-learn works with such inputs. The condition
    # will be revisited once DPNP.ndarray and DPCTL usm_ndarray are enabled
    # for conformance testing and supported in the fallback cases.
    use_raw_inputs = (
        get_config().get("array_api_dispatch", False)
        and obj._get_tags().get("array_api_support", False)
        and not has_usm_data
    )
    if use_raw_inputs:
        # `array_api_dispatch` is enabled and stock scikit-learn supports the
        # Array API for this estimator: fall back with the raw inputs.
        patching_status.write_log(transferred_to_host=False)
        return branches[backend](obj, *args, **kwargs)

    patching_status.write_log()
    return branches[backend](obj, *hostargs, **hostkwargs)
97
+
98
+
99
def wrap_output_data(func):
    """
    Converts and moves the output arrays of the decorated function
    to match the input array type and device.

    The first positional argument (or, when there is none, the first keyword
    value) decides the conversion:

    * If it exposes ``__sycl_usm_array_interface__``, the result is copied to
      USM memory via ``_copy_to_usm`` and, for ``dpnp.ndarray`` inputs,
      converted with ``_convert_to_dpnp``.
    * Otherwise, unless the ``transform_output`` configuration value is set,
      an input that reports an array namespace through
      ``__array_namespace__`` gets the result converted with ``_asarray``
      onto the input's ``device``.

    A call without any arguments returns the result unchanged.
    """

    @wraps(func)
    def wrapper(self, *args, **kwargs):
        result = func(self, *args, **kwargs)

        data = (*args, *kwargs.values())
        if not data:
            return result
        reference = data[0]

        usm_iface = getattr(reference, "__sycl_usm_array_interface__", None)
        if usm_iface is not None:
            result = _copy_to_usm(usm_iface["syclobj"], result)
            if dpnp_available and isinstance(reference, dpnp.ndarray):
                result = _convert_to_dpnp(result)
            return result

        if get_config().get("transform_output"):
            return result

        namespace = getattr(reference, "__array_namespace__", lambda: None)()
        if namespace:
            result = _asarray(result, namespace, device=reference.device)
        return result

    return wrapper
sklearnex/_utils.py ADDED
@@ -0,0 +1,132 @@
1
+ # ===============================================================================
2
+ # Copyright 2021 Intel Corporation
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+ # ===============================================================================
16
+
17
+ import logging
18
+ import os
19
+ import sys
20
+ import warnings
21
+ from abc import ABC
22
+
23
+ from daal4py.sklearn._utils import (
24
+ PatchingConditionsChain as daal4py_PatchingConditionsChain,
25
+ )
26
+ from daal4py.sklearn._utils import daal_check_version
27
+
28
+
29
class PatchingConditionsChain(daal4py_PatchingConditionsChain):
    """daal4py conditions chain extended with sklearnex-specific logging.

    The attributes ``patching_is_enabled``, ``logger``, ``scope_name`` and
    ``messages`` are read here but not defined here; presumably they are
    provided by the daal4py base class (not visible in this file).
    """

    def get_status(self):
        """Return ``self.patching_is_enabled``."""
        return self.patching_is_enabled

    def write_log(self, queue=None, transferred_to_host=True):
        """Log which backend is used for the current scope.

        Parameters
        ----------
        queue : object or None, default=None
            Forwarded to ``get_patch_message`` for the accelerated case.
        transferred_to_host : bool, default=True
            Forwarded to ``get_patch_message``.
        """
        if self.patching_is_enabled:
            accelerated = get_patch_message(
                "onedal", queue=queue, transferred_to_host=transferred_to_host
            )
            self.logger.info(f"{self.scope_name}: {accelerated}")
            return

        self.logger.debug(
            f"{self.scope_name}: debugging for the patch is enabled to track"
            " the usage of Intel® oneAPI Data Analytics Library (oneDAL)"
        )
        # One debug record per reason the accelerated path was rejected.
        for message in self.messages:
            self.logger.debug(
                f"{self.scope_name}: patching failed with cause - {message}"
            )
        fallback = get_patch_message("sklearn", transferred_to_host=transferred_to_host)
        self.logger.info(f"{self.scope_name}: {fallback}")
50
+
51
+
52
def set_sklearn_ex_verbose():
    """Configure the ``sklearnex`` logger from ``SKLEARNEX_VERBOSE``.

    A stream handler using the format ``"%(levelname)s:%(name)s: %(message)s"``
    is attached to the ``sklearnex`` logger. The handler is attached only
    once: repeated calls reuse it instead of stacking additional handlers,
    which would otherwise make every record appear several times.

    If the environment variable ``SKLEARNEX_VERBOSE`` is set, its value is
    applied as the logger level. An unrecognised value does not raise; a
    warning listing the accepted level names is emitted instead.
    """
    log_level = os.environ.get("SKLEARNEX_VERBOSE")

    logger = logging.getLogger("sklearnex")

    # Tag our handler so that a later call can recognise it and avoid adding
    # a duplicate (each duplicate would emit every record once more).
    already_attached = any(
        getattr(handler, "_sklearnex_verbose_handler", False)
        for handler in logger.handlers
    )
    if not already_attached:
        logging_channel = logging.StreamHandler()
        logging_channel._sklearnex_verbose_handler = True
        logging_channel.setFormatter(
            logging.Formatter("%(levelname)s:%(name)s: %(message)s")
        )
        logger.addHandler(logging_channel)

    if log_level is None:
        return

    try:
        logger.setLevel(log_level)
    except (TypeError, ValueError):
        # setLevel rejects unknown level names; report instead of failing.
        warnings.warn(
            'Unknown level "{}" for logging.\n'
            'Please, use one of "CRITICAL", "ERROR", '
            '"WARNING", "INFO", "DEBUG".'.format(log_level)
        )
70
+
71
+
72
def get_patch_message(s, queue=None, transferred_to_host=True):
    """Build the log message describing which backend handles a call.

    Parameters
    ----------
    s : str
        One of ``"onedal"``, ``"sklearn"`` or ``"sklearn_after_onedal"``.
    queue : object or None, default=None
        Only consulted for ``"onedal"``. ``None`` means CPU; otherwise
        ``queue.sycl_device.is_gpu`` / ``is_cpu`` select the device name.
    transferred_to_host : bool, default=True
        If truthy, a sentence about the data having been transferred to the
        host is appended.

    Returns
    -------
    str
        The assembled message.

    Raises
    ------
    RuntimeError
        If ``queue`` is given and its device is neither GPU nor CPU.
    ValueError
        If ``s`` is not one of the accepted values.
    """
    if s == "onedal":
        if queue is None:
            device_name = "CPU"
        elif queue.sycl_device.is_gpu:
            device_name = "GPU"
        elif queue.sycl_device.is_cpu:
            device_name = "CPU"
        else:
            raise RuntimeError("Unsupported device")
        message = "running accelerated version on " + device_name
    elif s == "sklearn":
        message = "fallback to original Scikit-learn"
    elif s == "sklearn_after_onedal":
        message = "failed to run accelerated version, fallback to original Scikit-learn"
    else:
        raise ValueError(
            f"Invalid input - expected one of 'onedal','sklearn',"
            f" 'sklearn_after_onedal', got {s}"
        )

    if not transferred_to_host:
        return message
    return (
        message
        + ". All input data transferred to host for further backend computations."
    )
98
+
99
+
100
def get_sklearnex_version(rule):
    """Return the result of ``daal_check_version(rule)``.

    This is a thin alias; the accepted form of ``rule`` is whatever
    ``daal4py.sklearn._utils.daal_check_version`` accepts (not visible here).
    """
    version_ok = daal_check_version(rule)
    return version_ok
102
+
103
+
104
def register_hyperparameters(hyperparameters_map):
    """Decorator for hyperparameters support in estimator class.

    Adds `get_hyperparameters` method to class.

    Parameters
    ----------
    hyperparameters_map : mapping
        Lookup table indexed by operation name; ``get_hyperparameters(op)``
        returns ``hyperparameters_map[op]``.

    Returns
    -------
    callable
        Class decorator that attaches the method and returns the same class.
    """

    def wrap_class(estimator_class):
        def get_hyperparameters(self, op):
            # The instance is not consulted: the table is shared by the class.
            return hyperparameters_map[op]

        setattr(estimator_class, "get_hyperparameters", get_hyperparameters)
        return estimator_class

    return wrap_class
117
+
118
+
119
+ # This abstract class is meant to generate a clickable doc link for classes
120
+ # in sklearnex that are not part of base scikit-learn. It should be inherited
121
+ # before inheriting from a scikit-learn estimator, otherwise will get overridden
122
+ # by the estimator's original.
123
class IntelEstimator(ABC):
    """Mixin supplying documentation-link properties for sklearnex-only classes."""

    @property
    def _doc_link_module(self) -> str:
        """Name of the root module used for documentation links."""
        return "sklearnex"

    @property
    def _doc_link_template(self) -> str:
        """URL of this class in the scikit-learn-intelex documentation.

        The anchor is built from the class's module with its last component
        removed (``pkg.sub.file`` becomes ``pkg.sub``) followed by the class
        name. A module name without any dot is used as-is, so classes
        defined in a top-level module (for example ``__main__``) no longer
        raise ``ValueError`` here.
        """
        module_name = self.__class__.__module__
        module_path, separator, _ = module_name.rpartition(".")
        if not separator:
            # No dot to split on: keep the whole module name.
            module_path = module_name
        class_name = self.__class__.__name__
        return f"https://intel.github.io/scikit-learn-intelex/latest/non-scikit-algorithms.html#{module_path}.{class_name}"
@@ -0,0 +1,20 @@
1
+ # ==============================================================================
2
+ # Copyright 2023 Intel Corporation
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+ # ==============================================================================
16
+
17
+ from .basic_statistics import BasicStatistics
18
+ from .incremental_basic_statistics import IncrementalBasicStatistics
19
+
20
+ __all__ = ["BasicStatistics", "IncrementalBasicStatistics"]
@@ -0,0 +1,230 @@
1
+ # ==============================================================================
2
+ # Copyright 2023 Intel Corporation
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+ # ==============================================================================
16
+
17
+ import warnings
18
+
19
+ import numpy as np
20
+ from sklearn.base import BaseEstimator
21
+ from sklearn.utils import check_array
22
+ from sklearn.utils.validation import _check_sample_weight
23
+
24
+ from daal4py.sklearn._n_jobs_support import control_n_jobs
25
+ from daal4py.sklearn._utils import sklearn_check_version
26
+ from onedal.basic_statistics import BasicStatistics as onedal_BasicStatistics
27
+
28
+ from .._device_offload import dispatch
29
+ from .._utils import IntelEstimator, PatchingConditionsChain
30
+
31
+ if sklearn_check_version("1.6"):
32
+ from sklearn.utils.validation import validate_data
33
+ else:
34
+ validate_data = BaseEstimator._validate_data
35
+
36
+ if sklearn_check_version("1.2"):
37
+ from sklearn.utils._param_validation import StrOptions
38
+
39
+
40
@control_n_jobs(decorated_methods=["fit"])
class BasicStatistics(IntelEstimator, BaseEstimator):
    """
    Estimator for basic statistics.
    Allows to compute basic statistics for provided data.

    Parameters
    ----------
    result_options: string or list, default='all'
        Used to set statistics to calculate. Possible values are ``'min'``, ``'max'``, ``'sum'``, ``'mean'``, ``'variance'``,
        ``'variation'``, ``'sum_squares'``, ``'sum_squares_centered'``, ``'standard_deviation'``, ``'second_order_raw_moment'``
        or a list containing any of these values. If set to ``'all'`` then all possible statistics will be
        calculated.

    Attributes
    ----------
        min_ : ndarray of shape (n_features,)
            Minimum of each feature over all samples.
        max_ : ndarray of shape (n_features,)
            Maximum of each feature over all samples.
        sum_ : ndarray of shape (n_features,)
            Sum of each feature over all samples.
        mean_ : ndarray of shape (n_features,)
            Mean of each feature over all samples.
        variance_ : ndarray of shape (n_features,)
            Variance of each feature over all samples.
        variation_ : ndarray of shape (n_features,)
            Variation of each feature over all samples.
        sum_squares_ : ndarray of shape (n_features,)
            Sum of squares for each feature over all samples.
        standard_deviation_ : ndarray of shape (n_features,)
            Standard deviation of each feature over all samples.
        sum_squares_centered_ : ndarray of shape (n_features,)
            Centered sum of squares for each feature over all samples.
        second_order_raw_moment_ : ndarray of shape (n_features,)
            Second order moment of each feature over all samples.

    Note
    ----
    Attribute exists only if corresponding result option has been provided.

    Note
    ----
    Names of attributes without the trailing underscore are
    supported currently but deprecated in 2025.1 and will be removed in 2026.0

    Note
    ----
    Some results can exhibit small variations due to
    floating point error accumulation and multithreading.

    Examples
    --------
    >>> import numpy as np
    >>> from sklearnex.basic_statistics import BasicStatistics
    >>> bs = BasicStatistics(result_options=['sum', 'min', 'max'])
    >>> X = np.array([[1, 2], [3, 4]])
    >>> bs.fit(X)
    >>> bs.sum_
    np.array([4., 6.])
    >>> bs.min_
    np.array([1., 2.])
    """

    def __init__(self, result_options="all"):
        self.result_options = result_options

    # Backend estimator factory; wrapped in ``staticmethod`` so that accessing
    # it through an instance does not bind ``self`` as the first argument.
    _onedal_basic_statistics = staticmethod(onedal_BasicStatistics)

    if sklearn_check_version("1.2"):
        # ``StrOptions`` is only imported for scikit-learn >= 1.2, hence the
        # version guard around the constraints declaration.
        _parameter_constraints: dict = {
            "result_options": [
                StrOptions(
                    {
                        "all",
                        "min",
                        "max",
                        "sum",
                        "mean",
                        "variance",
                        "variation",
                        "sum_squares",
                        "standard_deviation",
                        "sum_squares_centered",
                        "second_order_raw_moment",
                    }
                ),
                list,
            ],
        }

    def _save_attributes(self):
        """Copy the requested results from the backend estimator onto ``self``.

        Each requested option ``name`` is read from ``self._onedal_estimator``
        and stored on this instance as ``name_`` (trailing underscore).
        """
        assert hasattr(self, "_onedal_estimator")

        if self.result_options == "all":
            result_options = onedal_BasicStatistics.get_all_result_options()
        else:
            result_options = self.result_options

        if isinstance(result_options, str):
            setattr(
                self,
                result_options + "_",
                getattr(self._onedal_estimator, result_options),
            )
        elif isinstance(result_options, list):
            for option in result_options:
                setattr(self, option + "_", getattr(self._onedal_estimator, option))

    def __getattr__(self, attr):
        """Resolve deprecated result names that lack the trailing underscore.

        Invoked by Python only after normal attribute lookup has failed. If
        ``attr`` is one of the requested result options, a deprecation warning
        is emitted and the lookup is redirected to ``attr + "_"``.

        Raises
        ------
        AttributeError
            If the (possibly redirected) name is not stored on the instance.
        """
        # Read ``result_options`` straight from the instance dict: going
        # through ``self.result_options`` would re-enter ``__getattr__`` without
        # bound when the attribute has not been set yet (e.g. an instance
        # created via ``__new__`` without ``__init__``), ending in
        # ``RecursionError`` instead of the expected ``AttributeError``.
        try:
            configured_options = self.__dict__["result_options"]
        except KeyError:
            raise AttributeError(
                f"'{self.__class__.__name__}' object has no attribute '{attr}'"
            ) from None

        if configured_options == "all":
            result_options = onedal_BasicStatistics.get_all_result_options()
        else:
            result_options = configured_options
        is_deprecated_attr = (
            isinstance(result_options, str) and (attr == result_options)
        ) or (isinstance(result_options, list) and (attr in result_options))
        if is_deprecated_attr:
            warnings.warn(
                "Result attributes without a trailing underscore were deprecated in version 2025.1 and will be removed in 2026.0"
            )
            attr += "_"
        if attr in self.__dict__:
            return self.__dict__[attr]

        raise AttributeError(
            f"'{self.__class__.__name__}' object has no attribute '{attr}'"
        )

    def _onedal_supported(self, method_name, *data):
        """Return the patching-conditions chain for ``method_name``.

        No conditions are added to the chain here; it is returned as created.
        """
        patching_status = PatchingConditionsChain(
            f"sklearnex.basic_statistics.{self.__class__.__name__}.{method_name}"
        )
        return patching_status

    # The same check is used for both CPU and GPU dispatch.
    _onedal_cpu_supported = _onedal_supported
    _onedal_gpu_supported = _onedal_supported

    def _onedal_fit(self, X, sample_weight=None, queue=None):
        """Validate the inputs, run the backend fit and store the results.

        Parameters
        ----------
        X : array-like
            Input data; validated and converted to float64/float32.
        sample_weight : array-like, default=None
            Optional weights, validated against ``X`` when provided.
        queue : object, default=None
            Passed through unchanged to the backend estimator's ``fit``.
        """
        if sklearn_check_version("1.2"):
            self._validate_params()

        if sklearn_check_version("1.0"):
            X = validate_data(self, X, dtype=[np.float64, np.float32], ensure_2d=False)
        else:
            X = check_array(X, dtype=[np.float64, np.float32])

        if sample_weight is not None:
            sample_weight = _check_sample_weight(sample_weight, X)

        onedal_params = {
            "result_options": self.result_options,
        }

        # The backend estimator is created once and reused on later fits.
        # NOTE(review): a ``result_options`` change made after the first fit is
        # therefore not forwarded to the existing backend object - confirm
        # whether that is intended.
        if not hasattr(self, "_onedal_estimator"):
            self._onedal_estimator = self._onedal_basic_statistics(**onedal_params)
        self._onedal_estimator.fit(X, sample_weight, queue)
        self._save_attributes()
        # ``ensure_2d=False`` above lets 1-D input through; it counts as a
        # single feature.
        self.n_features_in_ = X.shape[1] if len(X.shape) > 1 else 1

    def fit(self, X, y=None, *, sample_weight=None):
        """Calculate statistics of X.

        Parameters
        ----------
        X : array-like of shape (n_samples, n_features)
            Data for compute, where ``n_samples`` is the number of samples and
            ``n_features`` is the number of features.

        y : Ignored
            Not used, present for API consistency by convention.

        sample_weight : array-like of shape (n_samples,), default=None
            Weights for compute weighted statistics, where ``n_samples`` is the number of samples.

        Returns
        -------
        self : object
            Returns the instance itself.
        """
        dispatch(
            self,
            "fit",
            {
                "onedal": self.__class__._onedal_fit,
                "sklearn": None,
            },
            X,
            sample_weight,
        )
        return self