maxframe 1.3.0__cp310-cp310-macosx_10_9_universal2.whl → 2.0.0b1__cp310-cp310-macosx_10_9_universal2.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of maxframe might be problematic. Click here for more details.

Files changed (643)
  1. maxframe/_utils.cpython-310-darwin.so +0 -0
  2. maxframe/_utils.pyi +21 -0
  3. maxframe/_utils.pyx +4 -3
  4. maxframe/codegen/__init__.py +27 -0
  5. maxframe/{codegen.py → codegen/core.py} +49 -43
  6. maxframe/codegen/spe/__init__.py +16 -0
  7. maxframe/codegen/spe/core.py +307 -0
  8. maxframe/codegen/spe/dataframe/__init__.py +37 -0
  9. maxframe/codegen/spe/dataframe/accessors/__init__.py +15 -0
  10. maxframe/codegen/spe/dataframe/accessors/base.py +53 -0
  11. maxframe/codegen/spe/dataframe/accessors/dict_.py +194 -0
  12. maxframe/codegen/spe/dataframe/accessors/list_.py +80 -0
  13. maxframe/codegen/spe/dataframe/arithmetic.py +84 -0
  14. maxframe/codegen/spe/dataframe/datasource.py +181 -0
  15. maxframe/codegen/spe/dataframe/datastore.py +204 -0
  16. maxframe/codegen/spe/dataframe/extensions.py +63 -0
  17. maxframe/codegen/spe/dataframe/fetch.py +26 -0
  18. maxframe/codegen/spe/dataframe/groupby.py +224 -0
  19. maxframe/codegen/spe/dataframe/indexing.py +238 -0
  20. maxframe/codegen/spe/dataframe/merge.py +73 -0
  21. maxframe/codegen/spe/dataframe/misc.py +286 -0
  22. maxframe/codegen/spe/dataframe/missing.py +64 -0
  23. maxframe/codegen/spe/dataframe/reduction.py +160 -0
  24. maxframe/codegen/spe/dataframe/sort.py +83 -0
  25. maxframe/codegen/spe/dataframe/statistics.py +46 -0
  26. maxframe/codegen/spe/dataframe/tests/__init__.py +13 -0
  27. maxframe/codegen/spe/dataframe/tests/accessors/__init__.py +13 -0
  28. maxframe/codegen/spe/dataframe/tests/accessors/test_base.py +33 -0
  29. maxframe/codegen/spe/dataframe/tests/accessors/test_dict.py +310 -0
  30. maxframe/codegen/spe/dataframe/tests/accessors/test_list.py +137 -0
  31. maxframe/codegen/spe/dataframe/tests/indexing/__init__.py +13 -0
  32. maxframe/codegen/spe/dataframe/tests/indexing/conftest.py +58 -0
  33. maxframe/codegen/spe/dataframe/tests/indexing/test_getitem.py +124 -0
  34. maxframe/codegen/spe/dataframe/tests/indexing/test_iloc.py +76 -0
  35. maxframe/codegen/spe/dataframe/tests/indexing/test_indexing.py +39 -0
  36. maxframe/codegen/spe/dataframe/tests/indexing/test_rename.py +51 -0
  37. maxframe/codegen/spe/dataframe/tests/indexing/test_reset_index.py +88 -0
  38. maxframe/codegen/spe/dataframe/tests/indexing/test_sample.py +45 -0
  39. maxframe/codegen/spe/dataframe/tests/indexing/test_set_axis.py +45 -0
  40. maxframe/codegen/spe/dataframe/tests/indexing/test_set_index.py +41 -0
  41. maxframe/codegen/spe/dataframe/tests/indexing/test_setitem.py +46 -0
  42. maxframe/codegen/spe/dataframe/tests/misc/__init__.py +13 -0
  43. maxframe/codegen/spe/dataframe/tests/misc/test_apply.py +133 -0
  44. maxframe/codegen/spe/dataframe/tests/misc/test_drop_duplicates.py +92 -0
  45. maxframe/codegen/spe/dataframe/tests/misc/test_misc.py +234 -0
  46. maxframe/codegen/spe/dataframe/tests/missing/__init__.py +13 -0
  47. maxframe/codegen/spe/dataframe/tests/missing/test_checkna.py +94 -0
  48. maxframe/codegen/spe/dataframe/tests/missing/test_dropna.py +50 -0
  49. maxframe/codegen/spe/dataframe/tests/missing/test_fillna.py +94 -0
  50. maxframe/codegen/spe/dataframe/tests/missing/test_replace.py +45 -0
  51. maxframe/codegen/spe/dataframe/tests/test_arithmetic.py +73 -0
  52. maxframe/codegen/spe/dataframe/tests/test_datasource.py +184 -0
  53. maxframe/codegen/spe/dataframe/tests/test_datastore.py +200 -0
  54. maxframe/codegen/spe/dataframe/tests/test_extensions.py +88 -0
  55. maxframe/codegen/spe/dataframe/tests/test_groupby.py +225 -0
  56. maxframe/codegen/spe/dataframe/tests/test_merge.py +400 -0
  57. maxframe/codegen/spe/dataframe/tests/test_reduction.py +104 -0
  58. maxframe/codegen/spe/dataframe/tests/test_sort.py +159 -0
  59. maxframe/codegen/spe/dataframe/tests/test_statistics.py +70 -0
  60. maxframe/codegen/spe/dataframe/tests/test_tseries.py +29 -0
  61. maxframe/codegen/spe/dataframe/tests/test_value_counts.py +60 -0
  62. maxframe/codegen/spe/dataframe/tests/test_window.py +69 -0
  63. maxframe/codegen/spe/dataframe/tseries.py +46 -0
  64. maxframe/codegen/spe/dataframe/udf.py +62 -0
  65. maxframe/codegen/spe/dataframe/value_counts.py +31 -0
  66. maxframe/codegen/spe/dataframe/window.py +65 -0
  67. maxframe/codegen/spe/learn/__init__.py +15 -0
  68. maxframe/codegen/spe/learn/contrib/__init__.py +15 -0
  69. maxframe/codegen/spe/learn/contrib/lightgbm.py +160 -0
  70. maxframe/codegen/spe/learn/contrib/models.py +41 -0
  71. maxframe/codegen/spe/learn/contrib/pytorch.py +49 -0
  72. maxframe/codegen/spe/learn/contrib/tests/__init__.py +13 -0
  73. maxframe/codegen/spe/learn/contrib/tests/test_lightgbm.py +123 -0
  74. maxframe/codegen/spe/learn/contrib/tests/test_models.py +41 -0
  75. maxframe/codegen/spe/learn/contrib/tests/test_pytorch.py +53 -0
  76. maxframe/codegen/spe/learn/contrib/tests/test_xgboost.py +98 -0
  77. maxframe/codegen/spe/learn/contrib/xgboost.py +152 -0
  78. maxframe/codegen/spe/learn/metrics/__init__.py +15 -0
  79. maxframe/codegen/spe/learn/metrics/_classification.py +120 -0
  80. maxframe/codegen/spe/learn/metrics/tests/__init__.py +13 -0
  81. maxframe/codegen/spe/learn/metrics/tests/test_classification.py +93 -0
  82. maxframe/codegen/spe/learn/model_selection/__init__.py +13 -0
  83. maxframe/codegen/spe/learn/model_selection/tests/__init__.py +13 -0
  84. maxframe/codegen/spe/learn/model_selection/tests/test_split.py +41 -0
  85. maxframe/codegen/spe/learn/preprocessing/__init__.py +15 -0
  86. maxframe/codegen/spe/learn/preprocessing/_data.py +37 -0
  87. maxframe/codegen/spe/learn/preprocessing/_label.py +47 -0
  88. maxframe/codegen/spe/learn/preprocessing/tests/__init__.py +13 -0
  89. maxframe/codegen/spe/learn/preprocessing/tests/test_data.py +31 -0
  90. maxframe/codegen/spe/learn/preprocessing/tests/test_label.py +43 -0
  91. maxframe/codegen/spe/learn/utils/__init__.py +15 -0
  92. maxframe/codegen/spe/learn/utils/checks.py +55 -0
  93. maxframe/codegen/spe/learn/utils/multiclass.py +60 -0
  94. maxframe/codegen/spe/learn/utils/shuffle.py +85 -0
  95. maxframe/codegen/spe/learn/utils/sparsefuncs.py +35 -0
  96. maxframe/codegen/spe/learn/utils/tests/__init__.py +13 -0
  97. maxframe/codegen/spe/learn/utils/tests/test_checks.py +48 -0
  98. maxframe/codegen/spe/learn/utils/tests/test_multiclass.py +52 -0
  99. maxframe/codegen/spe/learn/utils/tests/test_shuffle.py +50 -0
  100. maxframe/codegen/spe/learn/utils/tests/test_sparsefuncs.py +34 -0
  101. maxframe/codegen/spe/learn/utils/tests/test_validation.py +44 -0
  102. maxframe/codegen/spe/learn/utils/validation.py +35 -0
  103. maxframe/codegen/spe/objects.py +26 -0
  104. maxframe/codegen/spe/remote.py +29 -0
  105. maxframe/codegen/spe/tensor/__init__.py +28 -0
  106. maxframe/codegen/spe/tensor/arithmetic.py +95 -0
  107. maxframe/codegen/spe/tensor/core.py +41 -0
  108. maxframe/codegen/spe/tensor/datasource.py +165 -0
  109. maxframe/codegen/spe/tensor/extensions.py +35 -0
  110. maxframe/codegen/spe/tensor/fetch.py +26 -0
  111. maxframe/codegen/spe/tensor/indexing.py +63 -0
  112. maxframe/codegen/spe/tensor/linalg.py +63 -0
  113. maxframe/codegen/spe/tensor/merge.py +31 -0
  114. maxframe/codegen/spe/tensor/misc.py +121 -0
  115. maxframe/codegen/spe/tensor/random.py +29 -0
  116. maxframe/codegen/spe/tensor/reduction.py +39 -0
  117. maxframe/codegen/spe/tensor/reshape.py +26 -0
  118. maxframe/codegen/spe/tensor/sort.py +42 -0
  119. maxframe/codegen/spe/tensor/special.py +35 -0
  120. maxframe/codegen/spe/tensor/statistics.py +24 -0
  121. maxframe/codegen/spe/tensor/tests/__init__.py +13 -0
  122. maxframe/codegen/spe/tensor/tests/test_arithmetic.py +103 -0
  123. maxframe/codegen/spe/tensor/tests/test_datasource.py +99 -0
  124. maxframe/codegen/spe/tensor/tests/test_extensions.py +37 -0
  125. maxframe/codegen/spe/tensor/tests/test_indexing.py +44 -0
  126. maxframe/codegen/spe/tensor/tests/test_linalg.py +38 -0
  127. maxframe/codegen/spe/tensor/tests/test_merge.py +28 -0
  128. maxframe/codegen/spe/tensor/tests/test_misc.py +94 -0
  129. maxframe/codegen/spe/tensor/tests/test_random.py +55 -0
  130. maxframe/codegen/spe/tensor/tests/test_reduction.py +65 -0
  131. maxframe/codegen/spe/tensor/tests/test_reshape.py +39 -0
  132. maxframe/codegen/spe/tensor/tests/test_sort.py +49 -0
  133. maxframe/codegen/spe/tensor/tests/test_special.py +28 -0
  134. maxframe/codegen/spe/tensor/tests/test_statistics.py +29 -0
  135. maxframe/codegen/spe/tests/__init__.py +13 -0
  136. maxframe/codegen/spe/tests/test_remote.py +29 -0
  137. maxframe/codegen/spe/tests/test_spe_codegen.py +141 -0
  138. maxframe/codegen/spe/utils.py +54 -0
  139. maxframe/codegen/tests/__init__.py +13 -0
  140. maxframe/{tests → codegen/tests}/test_codegen.py +3 -5
  141. maxframe/config/__init__.py +1 -1
  142. maxframe/config/config.py +50 -23
  143. maxframe/config/tests/test_config.py +4 -12
  144. maxframe/config/validators.py +5 -0
  145. maxframe/conftest.py +38 -10
  146. maxframe/core/__init__.py +1 -0
  147. maxframe/core/context.py +110 -0
  148. maxframe/core/entity/__init__.py +1 -0
  149. maxframe/core/entity/core.py +0 -7
  150. maxframe/core/entity/objects.py +19 -5
  151. maxframe/core/entity/output_types.py +11 -0
  152. maxframe/core/entity/tests/test_objects.py +11 -12
  153. maxframe/core/entity/tileables.py +3 -1
  154. maxframe/core/entity/utils.py +15 -0
  155. maxframe/core/graph/__init__.py +6 -1
  156. maxframe/core/graph/builder/base.py +5 -1
  157. maxframe/core/graph/core.cpython-310-darwin.so +0 -0
  158. maxframe/core/graph/core.pyx +17 -6
  159. maxframe/core/graph/entity.py +18 -6
  160. maxframe/core/operator/__init__.py +8 -3
  161. maxframe/core/operator/base.py +35 -12
  162. maxframe/core/operator/core.py +37 -14
  163. maxframe/core/operator/fetch.py +5 -18
  164. maxframe/core/operator/objects.py +0 -20
  165. maxframe/core/operator/shuffle.py +6 -72
  166. maxframe/dataframe/__init__.py +1 -0
  167. maxframe/dataframe/accessors/datetime_/core.py +7 -4
  168. maxframe/dataframe/accessors/string_/core.py +9 -6
  169. maxframe/dataframe/arithmetic/core.py +31 -20
  170. maxframe/dataframe/arithmetic/tests/test_arithmetic.py +6 -0
  171. maxframe/dataframe/core.py +98 -91
  172. maxframe/dataframe/datasource/core.py +8 -1
  173. maxframe/dataframe/datasource/date_range.py +8 -0
  174. maxframe/dataframe/datasource/from_index.py +9 -5
  175. maxframe/dataframe/datasource/from_records.py +9 -2
  176. maxframe/dataframe/datasource/from_tensor.py +32 -21
  177. maxframe/dataframe/datasource/read_csv.py +8 -2
  178. maxframe/dataframe/datasource/read_odps_query.py +33 -3
  179. maxframe/dataframe/datasource/read_odps_table.py +20 -5
  180. maxframe/dataframe/datasource/read_parquet.py +8 -3
  181. maxframe/dataframe/datasource/tests/test_datasource.py +33 -0
  182. maxframe/dataframe/datastore/tests/test_to_odps.py +52 -1
  183. maxframe/dataframe/datastore/to_csv.py +7 -3
  184. maxframe/dataframe/datastore/to_odps.py +42 -6
  185. maxframe/dataframe/extensions/__init__.py +6 -1
  186. maxframe/dataframe/extensions/apply_chunk.py +96 -136
  187. maxframe/dataframe/extensions/flatjson.py +3 -2
  188. maxframe/dataframe/extensions/flatmap.py +15 -7
  189. maxframe/dataframe/fetch/core.py +12 -1
  190. maxframe/dataframe/groupby/__init__.py +7 -0
  191. maxframe/dataframe/groupby/aggregation.py +62 -9
  192. maxframe/dataframe/groupby/apply.py +50 -74
  193. maxframe/dataframe/groupby/apply_chunk.py +393 -0
  194. maxframe/dataframe/groupby/core.py +80 -17
  195. maxframe/dataframe/groupby/extensions.py +26 -0
  196. maxframe/dataframe/groupby/fill.py +9 -4
  197. maxframe/dataframe/groupby/sample.py +7 -7
  198. maxframe/dataframe/groupby/tests/test_groupby.py +3 -3
  199. maxframe/dataframe/groupby/transform.py +57 -54
  200. maxframe/dataframe/indexing/align.py +7 -6
  201. maxframe/dataframe/indexing/getitem.py +9 -8
  202. maxframe/dataframe/indexing/iloc.py +28 -23
  203. maxframe/dataframe/indexing/insert.py +7 -3
  204. maxframe/dataframe/indexing/loc.py +9 -8
  205. maxframe/dataframe/indexing/reindex.py +36 -30
  206. maxframe/dataframe/indexing/rename_axis.py +18 -10
  207. maxframe/dataframe/indexing/reset_index.py +0 -2
  208. maxframe/dataframe/indexing/sample.py +13 -9
  209. maxframe/dataframe/indexing/set_axis.py +9 -6
  210. maxframe/dataframe/indexing/setitem.py +8 -5
  211. maxframe/dataframe/indexing/where.py +12 -9
  212. maxframe/dataframe/merge/__init__.py +0 -1
  213. maxframe/dataframe/merge/concat.py +10 -31
  214. maxframe/dataframe/merge/merge.py +2 -24
  215. maxframe/dataframe/misc/__init__.py +6 -0
  216. maxframe/dataframe/misc/_duplicate.py +7 -3
  217. maxframe/dataframe/misc/apply.py +106 -139
  218. maxframe/dataframe/misc/astype.py +3 -2
  219. maxframe/dataframe/misc/case_when.py +11 -7
  220. maxframe/dataframe/misc/cut.py +11 -10
  221. maxframe/dataframe/misc/describe.py +7 -3
  222. maxframe/dataframe/misc/drop.py +13 -11
  223. maxframe/dataframe/misc/eval.py +0 -2
  224. maxframe/dataframe/misc/get_dummies.py +78 -49
  225. maxframe/dataframe/misc/isin.py +13 -10
  226. maxframe/dataframe/misc/map.py +21 -6
  227. maxframe/dataframe/misc/melt.py +8 -1
  228. maxframe/dataframe/misc/pivot.py +232 -0
  229. maxframe/dataframe/misc/pivot_table.py +52 -40
  230. maxframe/dataframe/misc/rechunk.py +59 -0
  231. maxframe/dataframe/misc/shift.py +7 -4
  232. maxframe/dataframe/misc/stack.py +5 -3
  233. maxframe/dataframe/misc/tests/test_misc.py +167 -1
  234. maxframe/dataframe/misc/transform.py +63 -65
  235. maxframe/dataframe/misc/value_counts.py +7 -4
  236. maxframe/dataframe/missing/dropna.py +16 -7
  237. maxframe/dataframe/missing/fillna.py +18 -10
  238. maxframe/dataframe/missing/replace.py +10 -6
  239. maxframe/dataframe/missing/tests/test_missing.py +2 -2
  240. maxframe/dataframe/operators.py +1 -27
  241. maxframe/dataframe/reduction/aggregation.py +128 -3
  242. maxframe/dataframe/reduction/core.py +20 -6
  243. maxframe/dataframe/reduction/median.py +1 -1
  244. maxframe/dataframe/reduction/tests/test_reduction.py +33 -0
  245. maxframe/dataframe/reduction/unique.py +53 -7
  246. maxframe/dataframe/statistics/corr.py +9 -6
  247. maxframe/dataframe/statistics/quantile.py +9 -6
  248. maxframe/dataframe/tseries/to_datetime.py +6 -4
  249. maxframe/dataframe/utils.py +219 -31
  250. maxframe/dataframe/window/rolling.py +7 -4
  251. maxframe/env.py +1 -0
  252. maxframe/errors.py +9 -0
  253. maxframe/extension.py +13 -2
  254. maxframe/io/objects/core.py +67 -51
  255. maxframe/io/objects/tensor.py +73 -17
  256. maxframe/io/objects/tests/test_object_io.py +8 -55
  257. maxframe/io/odpsio/arrow.py +15 -2
  258. maxframe/io/odpsio/schema.py +43 -13
  259. maxframe/io/odpsio/tableio.py +63 -11
  260. maxframe/io/odpsio/tests/test_arrow.py +1 -2
  261. maxframe/io/odpsio/tests/test_schema.py +114 -1
  262. maxframe/io/odpsio/tests/test_tableio.py +42 -0
  263. maxframe/io/odpsio/tests/test_volumeio.py +22 -48
  264. maxframe/learn/__init__.py +2 -2
  265. maxframe/learn/contrib/__init__.py +2 -2
  266. maxframe/learn/contrib/graph/connected_components.py +2 -1
  267. maxframe/learn/contrib/lightgbm/__init__.py +33 -0
  268. maxframe/learn/contrib/lightgbm/_predict.py +138 -0
  269. maxframe/learn/contrib/lightgbm/_train.py +163 -0
  270. maxframe/learn/contrib/lightgbm/callback.py +114 -0
  271. maxframe/learn/contrib/lightgbm/classifier.py +199 -0
  272. maxframe/learn/contrib/lightgbm/core.py +372 -0
  273. maxframe/learn/contrib/lightgbm/dataset.py +153 -0
  274. maxframe/learn/contrib/lightgbm/regressor.py +29 -0
  275. maxframe/learn/contrib/lightgbm/tests/__init__.py +13 -0
  276. maxframe/learn/contrib/lightgbm/tests/test_callback.py +58 -0
  277. maxframe/learn/contrib/llm/models/dashscope.py +34 -0
  278. maxframe/learn/contrib/llm/models/managed.py +15 -0
  279. maxframe/learn/contrib/llm/multi_modal.py +92 -0
  280. maxframe/learn/contrib/llm/text.py +21 -5
  281. maxframe/learn/contrib/models.py +38 -9
  282. maxframe/learn/contrib/utils.py +55 -0
  283. maxframe/learn/contrib/xgboost/callback.py +86 -0
  284. maxframe/learn/contrib/xgboost/classifier.py +26 -30
  285. maxframe/learn/contrib/xgboost/core.py +53 -42
  286. maxframe/learn/contrib/xgboost/dmatrix.py +19 -12
  287. maxframe/learn/contrib/xgboost/predict.py +13 -8
  288. maxframe/learn/contrib/xgboost/regressor.py +28 -27
  289. maxframe/learn/contrib/xgboost/tests/test_callback.py +41 -0
  290. maxframe/learn/contrib/xgboost/train.py +59 -16
  291. maxframe/learn/core.py +252 -0
  292. maxframe/learn/datasets/__init__.py +20 -0
  293. maxframe/learn/datasets/samples_generator.py +628 -0
  294. maxframe/learn/linear_model/__init__.py +15 -0
  295. maxframe/learn/linear_model/_base.py +163 -0
  296. maxframe/learn/linear_model/_lin_reg.py +175 -0
  297. maxframe/learn/metrics/__init__.py +25 -0
  298. maxframe/learn/metrics/_check_targets.py +95 -0
  299. maxframe/learn/metrics/_classification.py +1121 -0
  300. maxframe/learn/metrics/_regression.py +256 -0
  301. maxframe/learn/model_selection/__init__.py +15 -0
  302. maxframe/learn/model_selection/_split.py +451 -0
  303. maxframe/learn/model_selection/tests/__init__.py +13 -0
  304. maxframe/learn/model_selection/tests/test_split.py +156 -0
  305. maxframe/learn/preprocessing/__init__.py +16 -0
  306. maxframe/learn/preprocessing/_data/__init__.py +17 -0
  307. maxframe/learn/preprocessing/_data/min_max_scaler.py +390 -0
  308. maxframe/learn/preprocessing/_data/normalize.py +127 -0
  309. maxframe/learn/preprocessing/_data/standard_scaler.py +503 -0
  310. maxframe/learn/preprocessing/_data/utils.py +79 -0
  311. maxframe/learn/preprocessing/_label/__init__.py +16 -0
  312. maxframe/learn/preprocessing/_label/_label_binarizer.py +599 -0
  313. maxframe/learn/preprocessing/_label/_label_encoder.py +174 -0
  314. maxframe/learn/utils/__init__.py +4 -0
  315. maxframe/learn/utils/_encode.py +314 -0
  316. maxframe/learn/utils/checks.py +161 -0
  317. maxframe/learn/utils/core.py +33 -0
  318. maxframe/learn/utils/extmath.py +176 -0
  319. maxframe/learn/utils/multiclass.py +292 -0
  320. maxframe/learn/utils/shuffle.py +114 -0
  321. maxframe/learn/utils/sparsefuncs.py +87 -0
  322. maxframe/learn/utils/validation.py +775 -0
  323. maxframe/lib/__init__.py +0 -2
  324. maxframe/lib/compat.py +145 -0
  325. maxframe/lib/filesystem/_oss_lib/glob.py +1 -1
  326. maxframe/lib/mmh3.cpython-310-darwin.so +0 -0
  327. maxframe/lib/sparse/__init__.py +10 -15
  328. maxframe/lib/sparse/array.py +45 -33
  329. maxframe/lib/sparse/core.py +0 -2
  330. maxframe/lib/sparse/linalg.py +31 -0
  331. maxframe/lib/sparse/matrix.py +5 -2
  332. maxframe/lib/sparse/tests/__init__.py +0 -2
  333. maxframe/lib/sparse/tests/test_sparse.py +53 -53
  334. maxframe/lib/sparse/vector.py +0 -2
  335. maxframe/mixin.py +59 -2
  336. maxframe/opcodes.py +13 -5
  337. maxframe/protocol.py +67 -14
  338. maxframe/remote/core.py +16 -14
  339. maxframe/remote/run_script.py +6 -3
  340. maxframe/serialization/__init__.py +2 -0
  341. maxframe/serialization/core.cpython-310-darwin.so +0 -0
  342. maxframe/serialization/core.pxd +3 -0
  343. maxframe/serialization/core.pyi +3 -1
  344. maxframe/serialization/core.pyx +82 -4
  345. maxframe/serialization/pandas.py +5 -1
  346. maxframe/serialization/serializables/core.py +6 -5
  347. maxframe/serialization/serializables/field.py +2 -2
  348. maxframe/serialization/serializables/tests/test_field_type.py +3 -5
  349. maxframe/serialization/tests/test_serial.py +27 -0
  350. maxframe/session.py +4 -71
  351. maxframe/sperunner.py +165 -0
  352. maxframe/tensor/__init__.py +35 -2
  353. maxframe/tensor/arithmetic/__init__.py +2 -4
  354. maxframe/tensor/arithmetic/abs.py +0 -2
  355. maxframe/tensor/arithmetic/absolute.py +0 -2
  356. maxframe/tensor/arithmetic/add.py +34 -4
  357. maxframe/tensor/arithmetic/angle.py +0 -2
  358. maxframe/tensor/arithmetic/arccos.py +1 -4
  359. maxframe/tensor/arithmetic/arccosh.py +1 -3
  360. maxframe/tensor/arithmetic/arcsin.py +0 -2
  361. maxframe/tensor/arithmetic/arcsinh.py +0 -2
  362. maxframe/tensor/arithmetic/arctan.py +0 -2
  363. maxframe/tensor/arithmetic/arctan2.py +0 -2
  364. maxframe/tensor/arithmetic/arctanh.py +0 -2
  365. maxframe/tensor/arithmetic/around.py +0 -2
  366. maxframe/tensor/arithmetic/bitand.py +0 -2
  367. maxframe/tensor/arithmetic/bitor.py +1 -3
  368. maxframe/tensor/arithmetic/bitxor.py +1 -3
  369. maxframe/tensor/arithmetic/cbrt.py +0 -2
  370. maxframe/tensor/arithmetic/ceil.py +0 -2
  371. maxframe/tensor/arithmetic/clip.py +13 -13
  372. maxframe/tensor/arithmetic/conj.py +0 -2
  373. maxframe/tensor/arithmetic/copysign.py +0 -2
  374. maxframe/tensor/arithmetic/core.py +47 -39
  375. maxframe/tensor/arithmetic/cos.py +1 -3
  376. maxframe/tensor/arithmetic/cosh.py +0 -2
  377. maxframe/tensor/arithmetic/deg2rad.py +0 -2
  378. maxframe/tensor/arithmetic/degrees.py +0 -2
  379. maxframe/tensor/arithmetic/divide.py +0 -2
  380. maxframe/tensor/arithmetic/equal.py +0 -2
  381. maxframe/tensor/arithmetic/exp.py +1 -3
  382. maxframe/tensor/arithmetic/exp2.py +0 -2
  383. maxframe/tensor/arithmetic/expm1.py +0 -2
  384. maxframe/tensor/arithmetic/fabs.py +0 -2
  385. maxframe/tensor/arithmetic/fix.py +0 -2
  386. maxframe/tensor/arithmetic/float_power.py +0 -2
  387. maxframe/tensor/arithmetic/floor.py +0 -2
  388. maxframe/tensor/arithmetic/floordiv.py +0 -2
  389. maxframe/tensor/arithmetic/fmax.py +0 -2
  390. maxframe/tensor/arithmetic/fmin.py +0 -2
  391. maxframe/tensor/arithmetic/fmod.py +0 -2
  392. maxframe/tensor/arithmetic/frexp.py +6 -2
  393. maxframe/tensor/arithmetic/greater.py +0 -2
  394. maxframe/tensor/arithmetic/greater_equal.py +0 -2
  395. maxframe/tensor/arithmetic/hypot.py +0 -2
  396. maxframe/tensor/arithmetic/i0.py +1 -3
  397. maxframe/tensor/arithmetic/imag.py +0 -2
  398. maxframe/tensor/arithmetic/invert.py +1 -3
  399. maxframe/tensor/arithmetic/isclose.py +0 -2
  400. maxframe/tensor/arithmetic/iscomplex.py +0 -2
  401. maxframe/tensor/arithmetic/isfinite.py +1 -3
  402. maxframe/tensor/arithmetic/isinf.py +0 -2
  403. maxframe/tensor/arithmetic/isnan.py +0 -2
  404. maxframe/tensor/arithmetic/isreal.py +0 -2
  405. maxframe/tensor/arithmetic/ldexp.py +0 -2
  406. maxframe/tensor/arithmetic/less.py +0 -2
  407. maxframe/tensor/arithmetic/less_equal.py +0 -2
  408. maxframe/tensor/arithmetic/log.py +1 -3
  409. maxframe/tensor/arithmetic/log10.py +1 -3
  410. maxframe/tensor/arithmetic/log1p.py +1 -3
  411. maxframe/tensor/arithmetic/log2.py +1 -3
  412. maxframe/tensor/arithmetic/logaddexp.py +0 -2
  413. maxframe/tensor/arithmetic/logaddexp2.py +0 -2
  414. maxframe/tensor/arithmetic/logical_and.py +0 -2
  415. maxframe/tensor/arithmetic/logical_not.py +1 -3
  416. maxframe/tensor/arithmetic/logical_or.py +0 -2
  417. maxframe/tensor/arithmetic/logical_xor.py +0 -2
  418. maxframe/tensor/arithmetic/lshift.py +0 -2
  419. maxframe/tensor/arithmetic/maximum.py +0 -2
  420. maxframe/tensor/arithmetic/minimum.py +0 -2
  421. maxframe/tensor/arithmetic/mod.py +0 -2
  422. maxframe/tensor/arithmetic/modf.py +6 -2
  423. maxframe/tensor/arithmetic/multiply.py +37 -4
  424. maxframe/tensor/arithmetic/nan_to_num.py +0 -2
  425. maxframe/tensor/arithmetic/negative.py +0 -2
  426. maxframe/tensor/arithmetic/nextafter.py +0 -2
  427. maxframe/tensor/arithmetic/not_equal.py +0 -2
  428. maxframe/tensor/arithmetic/positive.py +0 -2
  429. maxframe/tensor/arithmetic/power.py +0 -2
  430. maxframe/tensor/arithmetic/rad2deg.py +0 -2
  431. maxframe/tensor/arithmetic/radians.py +0 -2
  432. maxframe/tensor/arithmetic/real.py +0 -2
  433. maxframe/tensor/arithmetic/reciprocal.py +5 -3
  434. maxframe/tensor/arithmetic/rint.py +1 -3
  435. maxframe/tensor/arithmetic/rshift.py +0 -2
  436. maxframe/tensor/arithmetic/setimag.py +0 -2
  437. maxframe/tensor/arithmetic/setreal.py +0 -2
  438. maxframe/tensor/arithmetic/sign.py +0 -2
  439. maxframe/tensor/arithmetic/signbit.py +0 -2
  440. maxframe/tensor/arithmetic/sin.py +0 -2
  441. maxframe/tensor/arithmetic/sinc.py +1 -3
  442. maxframe/tensor/arithmetic/sinh.py +0 -2
  443. maxframe/tensor/arithmetic/spacing.py +0 -2
  444. maxframe/tensor/arithmetic/sqrt.py +0 -2
  445. maxframe/tensor/arithmetic/square.py +0 -2
  446. maxframe/tensor/arithmetic/subtract.py +4 -2
  447. maxframe/tensor/arithmetic/tan.py +0 -2
  448. maxframe/tensor/arithmetic/tanh.py +0 -2
  449. maxframe/tensor/arithmetic/tests/__init__.py +0 -2
  450. maxframe/tensor/arithmetic/tests/test_arithmetic.py +43 -9
  451. maxframe/tensor/arithmetic/truediv.py +0 -2
  452. maxframe/tensor/arithmetic/trunc.py +0 -2
  453. maxframe/tensor/arithmetic/utils.py +32 -6
  454. maxframe/tensor/array_utils.py +3 -25
  455. maxframe/tensor/core.py +6 -6
  456. maxframe/tensor/datasource/__init__.py +10 -2
  457. maxframe/tensor/datasource/arange.py +0 -2
  458. maxframe/tensor/datasource/array.py +3 -22
  459. maxframe/tensor/datasource/core.py +15 -10
  460. maxframe/tensor/datasource/diag.py +140 -0
  461. maxframe/tensor/datasource/diagflat.py +69 -0
  462. maxframe/tensor/datasource/empty.py +0 -2
  463. maxframe/tensor/datasource/eye.py +95 -0
  464. maxframe/tensor/datasource/from_dataframe.py +0 -2
  465. maxframe/tensor/datasource/from_dense.py +0 -17
  466. maxframe/tensor/datasource/from_sparse.py +0 -2
  467. maxframe/tensor/datasource/full.py +0 -2
  468. maxframe/tensor/datasource/identity.py +54 -0
  469. maxframe/tensor/datasource/indices.py +115 -0
  470. maxframe/tensor/datasource/linspace.py +140 -0
  471. maxframe/tensor/datasource/meshgrid.py +135 -0
  472. maxframe/tensor/datasource/ones.py +8 -3
  473. maxframe/tensor/datasource/tests/test_datasource.py +32 -1
  474. maxframe/tensor/datasource/tri_array.py +107 -0
  475. maxframe/tensor/datasource/zeros.py +7 -3
  476. maxframe/tensor/extensions/__init__.py +31 -0
  477. maxframe/tensor/extensions/accessor.py +25 -0
  478. maxframe/tensor/extensions/apply_chunk.py +137 -0
  479. maxframe/tensor/indexing/__init__.py +1 -1
  480. maxframe/tensor/indexing/choose.py +8 -6
  481. maxframe/tensor/indexing/compress.py +0 -2
  482. maxframe/tensor/indexing/extract.py +0 -2
  483. maxframe/tensor/indexing/fill_diagonal.py +9 -6
  484. maxframe/tensor/indexing/flatnonzero.py +1 -3
  485. maxframe/tensor/indexing/getitem.py +10 -43
  486. maxframe/tensor/indexing/nonzero.py +2 -4
  487. maxframe/tensor/indexing/setitem.py +19 -9
  488. maxframe/tensor/indexing/slice.py +6 -3
  489. maxframe/tensor/indexing/take.py +0 -2
  490. maxframe/tensor/indexing/tests/__init__.py +0 -2
  491. maxframe/tensor/indexing/tests/test_indexing.py +0 -2
  492. maxframe/tensor/indexing/unravel_index.py +6 -6
  493. maxframe/tensor/lib/__init__.py +16 -0
  494. maxframe/tensor/lib/index_tricks.py +404 -0
  495. maxframe/tensor/linalg/__init__.py +36 -0
  496. maxframe/tensor/linalg/dot.py +145 -0
  497. maxframe/tensor/linalg/inner.py +36 -0
  498. maxframe/tensor/linalg/inv.py +83 -0
  499. maxframe/tensor/linalg/lu.py +115 -0
  500. maxframe/tensor/linalg/matmul.py +225 -0
  501. maxframe/tensor/linalg/qr.py +124 -0
  502. maxframe/tensor/linalg/solve_triangular.py +103 -0
  503. maxframe/tensor/linalg/svd.py +167 -0
  504. maxframe/tensor/linalg/tensordot.py +213 -0
  505. maxframe/tensor/linalg/vdot.py +73 -0
  506. maxframe/tensor/merge/__init__.py +4 -0
  507. maxframe/tensor/merge/append.py +74 -0
  508. maxframe/tensor/merge/column_stack.py +63 -0
  509. maxframe/tensor/merge/concatenate.py +3 -2
  510. maxframe/tensor/merge/dstack.py +71 -0
  511. maxframe/tensor/merge/hstack.py +70 -0
  512. maxframe/tensor/merge/stack.py +0 -2
  513. maxframe/tensor/merge/tests/test_merge.py +0 -2
  514. maxframe/tensor/misc/__init__.py +18 -5
  515. maxframe/tensor/misc/astype.py +10 -8
  516. maxframe/tensor/misc/broadcast_to.py +1 -1
  517. maxframe/tensor/misc/copy.py +64 -0
  518. maxframe/tensor/misc/diff.py +115 -0
  519. maxframe/tensor/misc/flatten.py +63 -0
  520. maxframe/tensor/misc/in1d.py +94 -0
  521. maxframe/tensor/misc/isin.py +130 -0
  522. maxframe/tensor/misc/ndim.py +53 -0
  523. maxframe/tensor/misc/ravel.py +0 -2
  524. maxframe/tensor/misc/repeat.py +129 -0
  525. maxframe/tensor/misc/searchsorted.py +147 -0
  526. maxframe/tensor/misc/setdiff1d.py +58 -0
  527. maxframe/tensor/misc/squeeze.py +117 -0
  528. maxframe/tensor/misc/swapaxes.py +113 -0
  529. maxframe/tensor/misc/tests/test_misc.py +0 -2
  530. maxframe/tensor/misc/transpose.py +8 -4
  531. maxframe/tensor/misc/trapezoid.py +123 -0
  532. maxframe/tensor/misc/unique.py +0 -1
  533. maxframe/tensor/misc/where.py +10 -8
  534. maxframe/tensor/operators.py +0 -34
  535. maxframe/tensor/random/__init__.py +3 -5
  536. maxframe/tensor/random/binomial.py +0 -2
  537. maxframe/tensor/random/bytes.py +0 -2
  538. maxframe/tensor/random/chisquare.py +0 -2
  539. maxframe/tensor/random/choice.py +9 -8
  540. maxframe/tensor/random/core.py +20 -5
  541. maxframe/tensor/random/dirichlet.py +0 -2
  542. maxframe/tensor/random/exponential.py +0 -2
  543. maxframe/tensor/random/f.py +2 -4
  544. maxframe/tensor/random/gamma.py +0 -2
  545. maxframe/tensor/random/geometric.py +0 -2
  546. maxframe/tensor/random/gumbel.py +0 -2
  547. maxframe/tensor/random/hypergeometric.py +0 -2
  548. maxframe/tensor/random/laplace.py +2 -4
  549. maxframe/tensor/random/logistic.py +0 -2
  550. maxframe/tensor/random/lognormal.py +0 -2
  551. maxframe/tensor/random/logseries.py +0 -2
  552. maxframe/tensor/random/multinomial.py +0 -2
  553. maxframe/tensor/random/multivariate_normal.py +0 -2
  554. maxframe/tensor/random/negative_binomial.py +0 -2
  555. maxframe/tensor/random/noncentral_chisquare.py +0 -2
  556. maxframe/tensor/random/noncentral_f.py +1 -3
  557. maxframe/tensor/random/normal.py +0 -2
  558. maxframe/tensor/random/pareto.py +0 -2
  559. maxframe/tensor/random/permutation.py +6 -3
  560. maxframe/tensor/random/poisson.py +0 -2
  561. maxframe/tensor/random/power.py +0 -2
  562. maxframe/tensor/random/rand.py +0 -2
  563. maxframe/tensor/random/randint.py +0 -2
  564. maxframe/tensor/random/randn.py +0 -2
  565. maxframe/tensor/random/random_integers.py +0 -2
  566. maxframe/tensor/random/random_sample.py +0 -2
  567. maxframe/tensor/random/rayleigh.py +0 -2
  568. maxframe/tensor/random/standard_cauchy.py +0 -2
  569. maxframe/tensor/random/standard_exponential.py +0 -2
  570. maxframe/tensor/random/standard_gamma.py +0 -2
  571. maxframe/tensor/random/standard_normal.py +0 -2
  572. maxframe/tensor/random/standard_t.py +0 -2
  573. maxframe/tensor/random/tests/__init__.py +0 -2
  574. maxframe/tensor/random/tests/test_random.py +0 -2
  575. maxframe/tensor/random/triangular.py +0 -2
  576. maxframe/tensor/random/uniform.py +0 -2
  577. maxframe/tensor/random/vonmises.py +0 -2
  578. maxframe/tensor/random/wald.py +0 -2
  579. maxframe/tensor/random/weibull.py +0 -2
  580. maxframe/tensor/random/zipf.py +0 -2
  581. maxframe/tensor/reduction/__init__.py +0 -2
  582. maxframe/tensor/reduction/all.py +0 -2
  583. maxframe/tensor/reduction/allclose.py +0 -2
  584. maxframe/tensor/reduction/any.py +0 -2
  585. maxframe/tensor/reduction/argmax.py +1 -3
  586. maxframe/tensor/reduction/argmin.py +1 -3
  587. maxframe/tensor/reduction/array_equal.py +0 -2
  588. maxframe/tensor/reduction/core.py +0 -2
  589. maxframe/tensor/reduction/count_nonzero.py +0 -2
  590. maxframe/tensor/reduction/cumprod.py +0 -2
  591. maxframe/tensor/reduction/cumsum.py +0 -2
  592. maxframe/tensor/reduction/max.py +0 -2
  593. maxframe/tensor/reduction/mean.py +0 -2
  594. maxframe/tensor/reduction/min.py +0 -2
  595. maxframe/tensor/reduction/nanargmax.py +0 -2
  596. maxframe/tensor/reduction/nanargmin.py +0 -2
  597. maxframe/tensor/reduction/nancumprod.py +0 -2
  598. maxframe/tensor/reduction/nancumsum.py +0 -2
  599. maxframe/tensor/reduction/nanmax.py +0 -2
  600. maxframe/tensor/reduction/nanmean.py +0 -2
  601. maxframe/tensor/reduction/nanmin.py +0 -2
  602. maxframe/tensor/reduction/nanprod.py +0 -2
  603. maxframe/tensor/reduction/nanstd.py +0 -2
  604. maxframe/tensor/reduction/nansum.py +0 -2
  605. maxframe/tensor/reduction/nanvar.py +0 -2
  606. maxframe/tensor/reduction/prod.py +0 -2
  607. maxframe/tensor/reduction/std.py +0 -2
  608. maxframe/tensor/reduction/sum.py +0 -2
  609. maxframe/tensor/reduction/tests/test_reduction.py +1 -4
  610. maxframe/tensor/reduction/var.py +0 -2
  611. maxframe/tensor/reshape/__init__.py +0 -2
  612. maxframe/tensor/reshape/reshape.py +6 -5
  613. maxframe/tensor/reshape/tests/__init__.py +0 -2
  614. maxframe/tensor/reshape/tests/test_reshape.py +0 -2
  615. maxframe/tensor/sort/__init__.py +16 -0
  616. maxframe/tensor/sort/argsort.py +150 -0
  617. maxframe/tensor/sort/sort.py +295 -0
  618. maxframe/tensor/special/__init__.py +37 -0
  619. maxframe/tensor/special/core.py +38 -0
  620. maxframe/tensor/special/misc.py +142 -0
  621. maxframe/tensor/special/statistical.py +56 -0
  622. maxframe/tensor/statistics/__init__.py +5 -0
  623. maxframe/tensor/statistics/average.py +143 -0
  624. maxframe/tensor/statistics/bincount.py +133 -0
  625. maxframe/tensor/statistics/quantile.py +10 -8
  626. maxframe/tensor/ufunc/__init__.py +0 -2
  627. maxframe/tensor/ufunc/ufunc.py +0 -2
  628. maxframe/tensor/utils.py +21 -3
  629. maxframe/tests/test_protocol.py +3 -3
  630. maxframe/tests/test_utils.py +210 -1
  631. maxframe/tests/utils.py +67 -1
  632. maxframe/udf.py +76 -6
  633. maxframe/utils.py +418 -17
  634. {maxframe-1.3.0.dist-info → maxframe-2.0.0b1.dist-info}/METADATA +5 -1
  635. maxframe-2.0.0b1.dist-info/RECORD +939 -0
  636. {maxframe-1.3.0.dist-info → maxframe-2.0.0b1.dist-info}/WHEEL +1 -1
  637. maxframe_client/clients/framedriver.py +19 -3
  638. maxframe_client/fetcher.py +113 -6
  639. maxframe_client/session/odps.py +173 -38
  640. maxframe_client/session/task.py +3 -1
  641. maxframe_client/tests/test_session.py +41 -5
  642. maxframe-1.3.0.dist-info/RECORD +0 -705
  643. {maxframe-1.3.0.dist-info → maxframe-2.0.0b1.dist-info}/top_level.txt +0 -0
@@ -0,0 +1,400 @@
1
+ # Copyright 1999-2025 Alibaba Group Holding Ltd.
2
+ #
3
+ # Licensed under the Apache License, Version 2.0 (the "License");
4
+ # you may not use this file except in compliance with the License.
5
+ # You may obtain a copy of the License at
6
+ #
7
+ # http://www.apache.org/licenses/LICENSE-2.0
8
+ #
9
+ # Unless required by applicable law or agreed to in writing, software
10
+ # distributed under the License is distributed on an "AS IS" BASIS,
11
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12
+ # See the License for the specific language governing permissions and
13
+ # limitations under the License.
14
+
15
+ import pandas as pd
16
+ import pytest
17
+
18
+ from ..... import dataframe as md
19
+ from ...core import SPECodeContext
20
+ from ..merge import DataFrameConcatAdapter, DataFrameMergeAdapter
21
+
22
+
23
+ @pytest.fixture
24
+ def df1():
25
+ return md.DataFrame(
26
+ [
27
+ [1, 10, 100, 1000],
28
+ [2, 20, 200, 2000],
29
+ [3, 30, 300, 3000],
30
+ [7, 70, 700, 7000],
31
+ ],
32
+ index=md.Index([1, 2, 3, 7], name="test_idx"),
33
+ columns=list("ABCD"),
34
+ )
35
+
36
+
37
+ @pytest.fixture
38
+ def df2():
39
+ return md.DataFrame(
40
+ [
41
+ [1, 10, 101, 1001],
42
+ [2, 20, 202, 2002],
43
+ [3, 30, 303, 3003],
44
+ [8, 80, 808, 8008],
45
+ ],
46
+ index=pd.MultiIndex.from_arrays(
47
+ [[1, 2, 3, 8], [1, 2, 3, 8], [1, 2, 3, 8]],
48
+ names=("idx_1", "idx_2", "idx_4"),
49
+ ),
50
+ columns=list("ABCE"),
51
+ )
52
+
53
+
54
+ @pytest.fixture
55
+ def df3():
56
+ return md.DataFrame(
57
+ [
58
+ [1, 10, 101],
59
+ [9, 90, 909],
60
+ [2, 20, 202],
61
+ ],
62
+ index=pd.MultiIndex.from_arrays(
63
+ [[1, 9, 2], [1, 9, 2], [1, 9, 2]], names=("idx_3", "idx_4", "idx_5")
64
+ ),
65
+ columns=list("ZCE"),
66
+ )
67
+
68
+
69
+ @pytest.fixture
70
+ def df4():
71
+ return md.DataFrame(
72
+ [
73
+ [1, 10, 100, 1000],
74
+ [2, 20, 200, 2000],
75
+ [3, 30, 300, 3000],
76
+ [4, 400, 4000, 40000],
77
+ ],
78
+ index=[1, 2, 3, 4],
79
+ columns=list("ABCD"),
80
+ )
81
+
82
+
83
+ @pytest.fixture
84
+ def df5():
85
+ return md.DataFrame(
86
+ [
87
+ [1, 10, 100, 1000],
88
+ [2, 20, 200, 2000],
89
+ [3, 30, 300, 3000],
90
+ [4, 4000, 40000, 400000],
91
+ ],
92
+ index=[1, 2, 3, 4],
93
+ columns=list("ABCD"),
94
+ )
95
+
96
+
97
+ @pytest.fixture
98
+ def df6():
99
+ # Same index with df2
100
+ return md.DataFrame(
101
+ [
102
+ [1, 10, 101, 1001],
103
+ [2, 20, 202, 2002],
104
+ [3, 30, 303, 3003],
105
+ [8, 810, 8108, 81008],
106
+ ],
107
+ index=pd.MultiIndex.from_arrays(
108
+ [[1, 2, 3, 8], [1, 2, 3, 8], [1, 2, 3, 8]],
109
+ names=("idx_1", "idx_2", "idx_4"),
110
+ ),
111
+ columns=list("ABCF"),
112
+ )
113
+
114
+
115
+ @pytest.fixture
116
+ def s1():
117
+ return md.Series([5, 2, 3, 1], index=[5, 2, 3, 1], name="A")
118
+
119
+
120
+ @pytest.fixture
121
+ def s2():
122
+ return md.Series([1, 2, 3, 4], index=[1, 2, 3, 4], name="B")
123
+
124
+
125
+ @pytest.fixture
126
+ def s3():
127
+ return md.Series(
128
+ [1, 2, 3, 6],
129
+ index=pd.MultiIndex.from_arrays(
130
+ [[1, 2, 3, 6], [1, 2, 3, 6], [1, 2, 3, 6]],
131
+ names=("idx_1", "idx_2", "idx_3"),
132
+ ),
133
+ name="A",
134
+ )
135
+
136
+
137
+ def test_series_merge_series_using_index(s1, s2):
138
+ merged = md.merge(s1, s2, left_index=True, right_index=True)
139
+ context = SPECodeContext()
140
+ adapter = DataFrameMergeAdapter()
141
+ results = adapter.generate_code(merged.op, context)
142
+ assert "pd" in context.imports["pandas"]
143
+ expected_results = [
144
+ "var_2 = pd.merge(var_0, var_1, how='inner', left_index=True, right_index=True,"
145
+ " sort=False, suffixes=('_x', '_y'), indicator=False, validate=None, copy=True)"
146
+ ]
147
+ assert results == expected_results
148
+
149
+
150
+ def test_series_merge_series_on_index_and_columns(s1, s3):
151
+ merged = md.merge(
152
+ s1,
153
+ s3,
154
+ suffixes=("_left", "_right"),
155
+ how="left",
156
+ left_on="A",
157
+ right_on="idx_2",
158
+ indicator=True,
159
+ )
160
+ context = SPECodeContext()
161
+ adapter = DataFrameMergeAdapter()
162
+ results = adapter.generate_code(merged.op, context)
163
+ expected_results = [
164
+ "var_2 = pd.merge(var_0, var_1, how='left', left_on='A', right_on='idx_2',"
165
+ " sort=False, suffixes=('_left', '_right'), indicator=True, validate=None,"
166
+ " copy=True)"
167
+ ]
168
+ assert results == expected_results
169
+
170
+
171
+ def test_series_merge_series_on_columns(s1, s3):
172
+ merged = md.merge(s1, s3, how="right", on="A", sort=True, copy=False)
173
+ context = SPECodeContext()
174
+ adapter = DataFrameMergeAdapter()
175
+ results = adapter.generate_code(merged.op, context)
176
+ expected_results = [
177
+ "var_2 = pd.merge(var_0, var_1, how='right', on='A',"
178
+ " sort=True, suffixes=('_x', '_y'), indicator=False, validate=None, copy=False)"
179
+ ]
180
+ assert results == expected_results
181
+
182
+
183
+ def test_series_merge_dataframe_using_index(s1, df1):
184
+ merged = md.merge(
185
+ s1, df1, how="outer", left_index=True, right_index=True, validate="m:m"
186
+ )
187
+ context = SPECodeContext()
188
+ adapter = DataFrameMergeAdapter()
189
+ results = adapter.generate_code(merged.op, context)
190
+ expected_results = [
191
+ "var_2 = pd.merge(var_0, var_1, how='outer', left_index=True, right_index=True,"
192
+ " sort=False, suffixes=('_x', '_y'), indicator=False, validate='m:m', copy=True)"
193
+ ]
194
+ assert results == expected_results
195
+
196
+
197
+ def test_series_merge_dataframe_on_index_and_columns(s1, df2):
198
+ merged = md.merge(
199
+ s1,
200
+ df2,
201
+ suffixes=("_left", "_right"),
202
+ how="outer",
203
+ left_on="A",
204
+ right_on="idx_2",
205
+ sort=True,
206
+ )
207
+ context = SPECodeContext()
208
+ adapter = DataFrameMergeAdapter()
209
+ results = adapter.generate_code(merged.op, context)
210
+ expected_results = [
211
+ "var_2 = pd.merge(var_0, var_1, how='outer', left_on='A', right_on='idx_2',"
212
+ " sort=True, suffixes=('_left', '_right'), indicator=False, validate=None,"
213
+ " copy=True)"
214
+ ]
215
+ assert results == expected_results
216
+
217
+
218
+ def test_series_merge_dataframe_on_columns(s1, df2):
219
+ merged = md.merge(s1, df2, how="cross")
220
+ context = SPECodeContext()
221
+ adapter = DataFrameMergeAdapter()
222
+ results = adapter.generate_code(merged.op, context)
223
+ expected_results = [
224
+ "var_2 = pd.merge(var_0, var_1, how='cross',"
225
+ " sort=False, suffixes=('_x', '_y'), indicator=False, validate=None, copy=True)"
226
+ ]
227
+ assert results == expected_results
228
+
229
+
230
+ def test_dataframe_merge_dataframe_using_index(df1, df2):
231
+ merged = md.merge(df1, df2, how="inner", left_index=True, right_on="idx_4")
232
+ context = SPECodeContext()
233
+ adapter = DataFrameMergeAdapter()
234
+ results = adapter.generate_code(merged.op, context)
235
+ expected_results = [
236
+ "var_2 = pd.merge(var_0, var_1, how='inner', left_index=True, right_on='idx_4',"
237
+ " sort=False, suffixes=('_x', '_y'), indicator=False, validate=None, copy=True)"
238
+ ]
239
+ assert results == expected_results
240
+
241
+
242
+ def test_dataframe_merge_dataframe_on_index_and_columns(df1, df2):
243
+ merged = md.merge(
244
+ df1,
245
+ df2,
246
+ suffixes=("_left", "_right"),
247
+ how="outer",
248
+ left_on=["A", "B"],
249
+ right_on=["idx_1", "idx_4"],
250
+ sort=True,
251
+ )
252
+ context = SPECodeContext()
253
+ adapter = DataFrameMergeAdapter()
254
+ results = adapter.generate_code(merged.op, context)
255
+ expected_results = [
256
+ "var_2 = pd.merge(var_0, var_1, how='outer', left_on=['A', 'B'],"
257
+ " right_on=['idx_1', 'idx_4'], sort=True, suffixes=('_left', '_right'),"
258
+ " indicator=False, validate=None, copy=True)"
259
+ ]
260
+ assert results == expected_results
261
+
262
+
263
+ def test_dataframe_merge_dataframe_on_columns(df1, df2):
264
+ merged = md.merge(df1, df2, how="outer", on=["A", "B"], sort=True)
265
+ context = SPECodeContext()
266
+ adapter = DataFrameMergeAdapter()
267
+ results = adapter.generate_code(merged.op, context)
268
+ expected_results = [
269
+ "var_2 = pd.merge(var_0, var_1, how='outer', on=['A', 'B'],"
270
+ " sort=True, suffixes=('_x', '_y'), indicator=False, validate=None, copy=True)"
271
+ ]
272
+ assert results == expected_results
273
+
274
+
275
+ def test_join(df1, df2):
276
+ joined = df1.join(df2, how="right", on=["A", "B", "C"], lsuffix="_l", rsuffix="_r")
277
+ context = SPECodeContext()
278
+ adapter = DataFrameMergeAdapter()
279
+ results = adapter.generate_code(joined.op, context)
280
+ expected_results = [
281
+ "var_2 = pd.merge(var_0, var_1, how='right', left_on=['A', 'B', 'C'],"
282
+ " right_index=True, sort=False, suffixes=('_l', '_r'), indicator=False,"
283
+ " validate=None, copy=True)"
284
+ ]
285
+ assert results == expected_results
286
+
287
+
288
+ def test_concat_single(df2):
289
+ adapter = DataFrameConcatAdapter()
290
+ df = md.concat([df2], axis="index")
291
+ context = SPECodeContext()
292
+ results = adapter.generate_code(df.op, context)
293
+
294
+ expected_results = [
295
+ "var_0 = pd.concat(axis=0, join='outer', ignore_index=False, keys=None,"
296
+ " levels=None, names=None, verify_integrity=False, sort=False, objs=[var_1],"
297
+ " copy=True)"
298
+ ]
299
+ assert results == expected_results
300
+
301
+ expected_results = [
302
+ "var_0 = pd.concat(axis=1, join='outer', ignore_index=False, keys=None,"
303
+ " levels=None, names=None, verify_integrity=False, sort=False, objs=[var_1],"
304
+ " copy=True)"
305
+ ]
306
+ df = md.concat([df2], axis="columns")
307
+ context = SPECodeContext()
308
+ results = adapter.generate_code(df.op, context)
309
+ assert results == expected_results
310
+
311
+
312
+ def test_concat_indexes_from_series(s1, s2):
313
+ adapter = DataFrameConcatAdapter()
314
+ df = md.concat([s1, s2], names=["l1", "l2"], axis="index", ignore_index=True)
315
+ context = SPECodeContext()
316
+ results = adapter.generate_code(df.op, context)
317
+ expected_results = [
318
+ "var_0 = pd.concat(axis=0, join='outer', ignore_index=True, keys=None,"
319
+ " levels=None, names=['l1', 'l2'], verify_integrity=False, sort=False,"
320
+ " objs=[var_1, var_2], copy=True)"
321
+ ]
322
+ assert results == expected_results
323
+
324
+
325
+ def test_concat_indexes_from_series_and_dataframes(s1, s2, df1):
326
+ adapter = DataFrameConcatAdapter()
327
+ df = md.concat([s1, s2, df1], axis=0, copy=False)
328
+ context = SPECodeContext()
329
+ results = adapter.generate_code(df.op, context)
330
+ expected_results = [
331
+ "var_0 = pd.concat(axis=0, join='outer', ignore_index=False, keys=None,"
332
+ " levels=None, names=None, verify_integrity=False, sort=False,"
333
+ " objs=[var_1, var_2, var_3], copy=False)"
334
+ ]
335
+ assert results == expected_results
336
+
337
+
338
+ def test_concat_indexes_from_inner_join_dataframes(df2, df3):
339
+ adapter = DataFrameConcatAdapter()
340
+ df = md.concat([df2, df3], join="inner")
341
+ context = SPECodeContext()
342
+ results = adapter.generate_code(df.op, context)
343
+ expected_results = [
344
+ "var_0 = pd.concat(axis=0, join='inner', ignore_index=False, keys=None,"
345
+ " levels=None, names=None, verify_integrity=False, sort=False,"
346
+ " objs=[var_1, var_2], copy=True)"
347
+ ]
348
+ assert results == expected_results
349
+
350
+
351
+ def test_concat_indexes_from_outer_join_dataframes(df2, df3):
352
+ adapter = DataFrameConcatAdapter()
353
+ df = md.concat([df2, df3], join="outer")
354
+ context = SPECodeContext()
355
+ results = adapter.generate_code(df.op, context)
356
+ expected_results = [
357
+ "var_0 = pd.concat(axis=0, join='outer', ignore_index=False, keys=None,"
358
+ " levels=None, names=None, verify_integrity=False, sort=False,"
359
+ " objs=[var_1, var_2], copy=True)"
360
+ ]
361
+ assert results == expected_results
362
+
363
+
364
+ def test_concat_columns_from_series(s1, s2):
365
+ adapter = DataFrameConcatAdapter()
366
+ df = md.concat([s1, s2], axis="columns", ignore_index=True)
367
+ context = SPECodeContext()
368
+ results = adapter.generate_code(df.op, context)
369
+ expected_results = [
370
+ "var_0 = pd.concat(axis=1, join='outer', ignore_index=True, keys=None,"
371
+ " levels=None, names=None, verify_integrity=False, sort=False, "
372
+ "objs=[var_1, var_2], copy=True)"
373
+ ]
374
+ assert results == expected_results
375
+
376
+
377
+ def test_concat_columns_from_series_and_dataframes(s2, df4, df5):
378
+ adapter = DataFrameConcatAdapter()
379
+ df = md.concat([s2, df4, df5], axis=1)
380
+ context = SPECodeContext()
381
+ results = adapter.generate_code(df.op, context)
382
+ expected_results = [
383
+ "var_0 = pd.concat(axis=1, join='outer', ignore_index=False, keys=None,"
384
+ " levels=None, names=None, verify_integrity=False, sort=False,"
385
+ " objs=[var_1, var_2, var_3], copy=True)"
386
+ ]
387
+ assert results == expected_results
388
+
389
+
390
+ def test_concat_columns_from_dataframes(df2, df6):
391
+ adapter = DataFrameConcatAdapter()
392
+ df = md.concat([df2, df6], axis=1)
393
+ context = SPECodeContext()
394
+ results = adapter.generate_code(df.op, context)
395
+ expected_results = [
396
+ "var_0 = pd.concat(axis=1, join='outer', ignore_index=False, keys=None,"
397
+ " levels=None, names=None, verify_integrity=False, sort=False,"
398
+ " objs=[var_1, var_2], copy=True)"
399
+ ]
400
+ assert results == expected_results
@@ -0,0 +1,104 @@
1
+ # Copyright 1999-2025 Alibaba Group Holding Ltd.
2
+ #
3
+ # Licensed under the Apache License, Version 2.0 (the "License");
4
+ # you may not use this file except in compliance with the License.
5
+ # You may obtain a copy of the License at
6
+ #
7
+ # http://www.apache.org/licenses/LICENSE-2.0
8
+ #
9
+ # Unless required by applicable law or agreed to in writing, software
10
+ # distributed under the License is distributed on an "AS IS" BASIS,
11
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12
+ # See the License for the specific language governing permissions and
13
+ # limitations under the License.
14
+
15
+ import pytest
16
+
17
+ from ..... import dataframe as md
18
+ from ...core import SPECodeContext
19
+ from ..reduction import (
20
+ DataFrameAggregateAdapter,
21
+ DataFrameKurtosisAdapter,
22
+ DataFrameNuniqueAdapter,
23
+ DataFrameReductionAdapter,
24
+ DataFrameUniqueAdapter,
25
+ DataFrameVarAdapter,
26
+ )
27
+
28
+
29
+ @pytest.fixture
30
+ def df1():
31
+ return md.DataFrame(
32
+ [[1, 10], [2, 20], [3, 30], [4, 40]], index=list("abcd"), columns=list("AB")
33
+ )
34
+
35
+
36
+ @pytest.fixture
37
+ def s1():
38
+ return md.Series([1, 2, 3, 4])
39
+
40
+
41
+ def test_sum(df1):
42
+ df = df1.sum(skipna=False)
43
+ results = DataFrameReductionAdapter().generate_code(df.op, SPECodeContext())
44
+ expected_results = ["var_1 = var_0.sum(axis=0, skipna=False, min_count=0)"]
45
+ assert results == expected_results
46
+
47
+
48
+ def test_kurtosis(df1):
49
+ df = df1.kurt(bias=False, fisher=True)
50
+ results = DataFrameKurtosisAdapter().generate_code(df.op, SPECodeContext())
51
+ expected_results = [
52
+ "var_1 = var_0.kurt(axis=0, skipna=True, bias=False, fisher=True)"
53
+ ]
54
+ assert results == expected_results
55
+
56
+
57
+ def test_dataframe_nunique(df1):
58
+ df = df1.nunique()
59
+ results = DataFrameNuniqueAdapter().generate_code(df.op, SPECodeContext())
60
+ expected_results = ["var_1 = var_0.nunique(axis=0, dropna=True)"]
61
+ assert results == expected_results
62
+
63
+
64
+ def test_series_nunique(s1):
65
+ s = s1.nunique()
66
+ results = DataFrameNuniqueAdapter().generate_code(s.op, SPECodeContext())
67
+ expected_results = ["var_1 = var_0.nunique(dropna=True)"]
68
+ assert results == expected_results
69
+
70
+
71
+ def test_var(df1):
72
+ df = df1.var(ddof=2)
73
+ results = DataFrameVarAdapter().generate_code(df.op, SPECodeContext())
74
+ expected_results = ["var_1 = var_0.var(axis=0, skipna=True, ddof=2)"]
75
+ assert results == expected_results
76
+
77
+
78
+ def test_unique(s1):
79
+ df = md.unique(s1)
80
+ context = SPECodeContext()
81
+ results = DataFrameUniqueAdapter().generate_code(df.op, context)
82
+ assert "pd" in context.imports["pandas"]
83
+ expected_results = ["var_1 = pd.unique(var_0)"]
84
+ assert results == expected_results
85
+
86
+
87
+ def test_median(df1):
88
+ df = df1.median(skipna=False)
89
+ results = DataFrameReductionAdapter().generate_code(df.op, SPECodeContext())
90
+ expected_results = ["var_1 = var_0.median(axis=0, skipna=False)"]
91
+ assert results == expected_results
92
+
93
+ df = df1.median(axis=1, numeric_only=True)
94
+ results = DataFrameReductionAdapter().generate_code(df.op, SPECodeContext())
95
+ expected_results = ["var_1 = var_0.median(axis=1, skipna=True, numeric_only=True)"]
96
+ assert results == expected_results
97
+
98
+
99
+ def test_aggregate(df1):
100
+ df = df1.agg(["sum", "mean"])
101
+ context = SPECodeContext()
102
+ results = DataFrameAggregateAdapter().generate_code(df.op, context)
103
+ expected_results = ["var_1 = var_0.agg(['sum', 'mean'], axis=0)"]
104
+ assert results == expected_results
@@ -0,0 +1,159 @@
1
+ # Copyright 1999-2025 Alibaba Group Holding Ltd.
2
+ #
3
+ # Licensed under the Apache License, Version 2.0 (the "License");
4
+ # you may not use this file except in compliance with the License.
5
+ # You may obtain a copy of the License at
6
+ #
7
+ # http://www.apache.org/licenses/LICENSE-2.0
8
+ #
9
+ # Unless required by applicable law or agreed to in writing, software
10
+ # distributed under the License is distributed on an "AS IS" BASIS,
11
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12
+ # See the License for the specific language governing permissions and
13
+ # limitations under the License.
14
+
15
+ import numpy as np
16
+ import pandas as pd
17
+ import pytest
18
+
19
+ from ..... import dataframe as md
20
+ from ....core import EngineAcceptance
21
+ from ...core import SPECodeContext
22
+ from ..sort import DataFrameSortIndexAdapter, DataFrameSortValuesAdapter
23
+
24
+
25
+ @pytest.fixture
26
+ def multi_index():
27
+ arrays = [
28
+ ["a1", "a2", "a3"],
29
+ ["b1", "b2", "b3"],
30
+ ["c1", "c2", "c3"],
31
+ ["d1", "d2", "d3"],
32
+ ["e1", "e2", "e3"],
33
+ ]
34
+ return pd.MultiIndex.from_arrays(
35
+ arrays, names=("idx_a", "idx_b", "idx_c", "idx_d", "idx_e")
36
+ )
37
+
38
+
39
+ @pytest.fixture
40
+ def df1():
41
+ return md.DataFrame(
42
+ np.random.randn(6, 4),
43
+ index=md.Index(["1", "2", "3", "4", "5", "6"], name="test_idx"),
44
+ columns=list("ABCD"),
45
+ )
46
+
47
+
48
+ @pytest.fixture
49
+ def df2(multi_index):
50
+ return md.DataFrame(
51
+ np.random.randn(3, 4),
52
+ index=multi_index,
53
+ columns=list("ABCD"),
54
+ )
55
+
56
+
57
+ @pytest.fixture
58
+ def s1():
59
+ return md.Series([1, 2, 3], index=list("abc"))
60
+
61
+
62
+ @pytest.fixture
63
+ def s2(multi_index):
64
+ return md.Series([1, 2, 3], index=multi_index)
65
+
66
+
67
+ def test_series_sort_values(s1):
68
+ s = s1.sort_values(na_position="last", ascending=False, inplace=False)
69
+ adapter = DataFrameSortValuesAdapter()
70
+ context = SPECodeContext()
71
+ assert adapter.accepts(s.op) == EngineAcceptance.ACCEPT
72
+ results = adapter.generate_code(s.op, context)
73
+ expected_results = [
74
+ "var_1 = var_0.sort_values(axis=0, ascending=False, inplace=False,"
75
+ " na_position='last', ignore_index=False)"
76
+ ]
77
+ assert results == expected_results
78
+
79
+
80
+ def test_dataframe_sort_by_values_single_column(df1):
81
+ s = df1.sort_values(by="A", na_position="first", ascending=True)
82
+ adapter = DataFrameSortValuesAdapter()
83
+ context = SPECodeContext()
84
+ assert adapter.accepts(s.op) == EngineAcceptance.ACCEPT
85
+ results = adapter.generate_code(s.op, context)
86
+ expected_results = [
87
+ "var_1 = var_0.sort_values(axis=0, ascending=True, inplace=False,"
88
+ " na_position='first', ignore_index=False, by=['A'])"
89
+ ]
90
+ assert results == expected_results
91
+
92
+
93
+ def test_dataframe_sort_by_values_multi_columns(df1):
94
+ df1.sort_values(by=["A", "B"], inplace=True)
95
+ adapter = DataFrameSortValuesAdapter()
96
+ context = SPECodeContext()
97
+ assert adapter.accepts(df1.op) == EngineAcceptance.ACCEPT
98
+ results = adapter.generate_code(df1.op, context)
99
+ expected_results = [
100
+ "var_1 = var_0.sort_values(axis=0, ascending=True, inplace=True,"
101
+ " na_position='last', ignore_index=False, by=['A', 'B'])"
102
+ ]
103
+ assert results == expected_results
104
+
105
+
106
+ def test_series_sort_index_by_single(s2):
107
+ s = s2.sort_index(
108
+ level=1, na_position="first", sort_remaining=False, ignore_index=True
109
+ )
110
+ adapter = DataFrameSortIndexAdapter()
111
+ context = SPECodeContext()
112
+ assert adapter.accepts(s.op) == EngineAcceptance.ACCEPT
113
+ results = adapter.generate_code(s.op, context)
114
+ expected_results = [
115
+ "var_1 = var_0.sort_index(axis=0, ascending=True, inplace=False,"
116
+ " na_position='first', ignore_index=True, level=[1], sort_remaining=False)"
117
+ ]
118
+ assert results == expected_results
119
+
120
+
121
+ def test_series_sort_index_by_multiple(s2):
122
+ s = s2.sort_index(level=[1, "idx_d"])
123
+ adapter = DataFrameSortIndexAdapter()
124
+ context = SPECodeContext()
125
+ assert adapter.accepts(s.op) == EngineAcceptance.ACCEPT
126
+ results = adapter.generate_code(s.op, context)
127
+ expected_results = [
128
+ "var_1 = var_0.sort_index(axis=0, ascending=True, inplace=False,"
129
+ " na_position='last', ignore_index=False, level=[1, 'idx_d'],"
130
+ " sort_remaining=True)"
131
+ ]
132
+ assert results == expected_results
133
+
134
+
135
+ def test_dataframe_sort_index_by_single(df2):
136
+ s = df2.sort_index(level="idx_b", na_position="first")
137
+ adapter = DataFrameSortIndexAdapter()
138
+ context = SPECodeContext()
139
+ assert adapter.accepts(s.op) == EngineAcceptance.ACCEPT
140
+ results = adapter.generate_code(s.op, context)
141
+ expected_results = [
142
+ "var_1 = var_0.sort_index(axis=0, ascending=True, inplace=False,"
143
+ " na_position='first', ignore_index=False, level=['idx_b'],"
144
+ " sort_remaining=True)"
145
+ ]
146
+ assert results == expected_results
147
+
148
+
149
+ def test_dataframe_sort_index_by_all(df2):
150
+ s = df2.sort_index()
151
+ adapter = DataFrameSortIndexAdapter()
152
+ context = SPECodeContext()
153
+ assert adapter.accepts(s.op) == EngineAcceptance.ACCEPT
154
+ results = adapter.generate_code(s.op, context)
155
+ expected_results = [
156
+ "var_1 = var_0.sort_index(axis=0, ascending=True, inplace=False,"
157
+ " na_position='last', ignore_index=False, level=None, sort_remaining=True)"
158
+ ]
159
+ assert results == expected_results