PyPI - maxframe - Versions diffs - 2.0.0b2__cp38-cp38-win_amd64.whl → 2.2.0__cp38-cp38-win_amd64.whl - Mend

maxframe 2.0.0b2__cp38-cp38-win_amd64.whl → 2.2.0__cp38-cp38-win_amd64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of maxframe might be problematic. Click here for more details.

Files changed (391)

maxframe/__init__.py +1 -0
maxframe/_utils.cp38-win_amd64.pyd +0 -0
maxframe/_utils.pyx +14 -1
maxframe/codegen/core.py +6 -6
maxframe/codegen/spe/core.py +1 -1
maxframe/codegen/spe/dataframe/__init__.py +1 -0
maxframe/codegen/spe/dataframe/accessors/base.py +18 -0
maxframe/codegen/spe/dataframe/accessors/dict_.py +25 -130
maxframe/codegen/spe/dataframe/accessors/list_.py +12 -48
maxframe/codegen/spe/dataframe/accessors/struct_.py +28 -0
maxframe/codegen/spe/dataframe/arithmetic.py +7 -2
maxframe/codegen/spe/dataframe/groupby.py +88 -0
maxframe/codegen/spe/dataframe/indexing.py +99 -4
maxframe/codegen/spe/dataframe/merge.py +34 -1
maxframe/codegen/spe/dataframe/misc.py +9 -33
maxframe/codegen/spe/dataframe/reduction.py +14 -9
maxframe/codegen/spe/dataframe/reshape.py +46 -0
maxframe/codegen/spe/dataframe/sort.py +30 -17
maxframe/codegen/spe/dataframe/tests/accessors/test_dict.py +9 -15
maxframe/codegen/spe/dataframe/tests/accessors/test_list.py +4 -7
maxframe/codegen/spe/dataframe/tests/accessors/test_struct.py +75 -0
maxframe/codegen/spe/dataframe/tests/indexing/test_iloc.py +20 -1
maxframe/codegen/spe/dataframe/tests/indexing/test_loc.py +35 -0
maxframe/codegen/spe/dataframe/tests/misc/test_misc.py +0 -32
maxframe/codegen/spe/dataframe/tests/test_groupby.py +81 -18
maxframe/codegen/spe/dataframe/tests/test_merge.py +27 -1
maxframe/codegen/spe/dataframe/tests/test_reshape.py +79 -0
maxframe/codegen/spe/dataframe/tests/test_sort.py +20 -0
maxframe/codegen/spe/learn/contrib/tests/test_xgboost.py +2 -1
maxframe/codegen/spe/learn/metrics/__init__.py +1 -1
maxframe/codegen/spe/learn/metrics/_ranking.py +76 -0
maxframe/codegen/spe/learn/metrics/pairwise.py +51 -0
maxframe/codegen/spe/learn/metrics/tests/test_pairwise.py +36 -0
maxframe/codegen/spe/learn/metrics/tests/test_ranking.py +59 -0
maxframe/codegen/spe/tensor/__init__.py +3 -0
maxframe/codegen/spe/tensor/fft.py +74 -0
maxframe/codegen/spe/tensor/linalg.py +29 -2
maxframe/codegen/spe/tensor/misc.py +79 -25
maxframe/codegen/spe/tensor/spatial.py +45 -0
maxframe/codegen/spe/tensor/statistics.py +44 -0
maxframe/codegen/spe/tensor/tests/test_fft.py +64 -0
maxframe/codegen/spe/tensor/tests/test_linalg.py +15 -1
maxframe/codegen/spe/tensor/tests/test_misc.py +52 -2
maxframe/codegen/spe/tensor/tests/test_spatial.py +33 -0
maxframe/codegen/spe/tensor/tests/test_statistics.py +15 -1
maxframe/codegen/spe/tests/test_spe_codegen.py +6 -12
maxframe/codegen/spe/utils.py +2 -0
maxframe/config/config.py +70 -9
maxframe/config/tests/test_validators.py +13 -1
maxframe/config/validators.py +49 -0
maxframe/conftest.py +44 -17
maxframe/core/accessor.py +2 -2
maxframe/core/entity/core.py +5 -0
maxframe/core/entity/tileables.py +1 -1
maxframe/core/graph/core.cp38-win_amd64.pyd +0 -0
maxframe/core/graph/entity.py +1 -2
maxframe/core/operator/base.py +9 -2
maxframe/core/operator/core.py +10 -2
maxframe/core/operator/utils.py +13 -0
maxframe/dataframe/__init__.py +10 -3
maxframe/dataframe/accessors/__init__.py +1 -1
maxframe/dataframe/accessors/compat.py +45 -0
maxframe/dataframe/accessors/datetime_/__init__.py +4 -1
maxframe/dataframe/accessors/dict_/contains.py +7 -16
maxframe/dataframe/accessors/dict_/core.py +48 -0
maxframe/dataframe/accessors/dict_/getitem.py +17 -21
maxframe/dataframe/accessors/dict_/length.py +7 -16
maxframe/dataframe/accessors/dict_/remove.py +6 -18
maxframe/dataframe/accessors/dict_/setitem.py +8 -18
maxframe/dataframe/accessors/dict_/tests/test_dict_accessor.py +62 -22
maxframe/dataframe/accessors/list_/__init__.py +2 -2
maxframe/dataframe/accessors/list_/core.py +48 -0
maxframe/dataframe/accessors/list_/getitem.py +12 -19
maxframe/dataframe/accessors/list_/length.py +7 -16
maxframe/dataframe/accessors/list_/tests/test_list_accessor.py +11 -9
maxframe/dataframe/accessors/string_/__init__.py +4 -1
maxframe/dataframe/accessors/struct_/__init__.py +37 -0
maxframe/dataframe/accessors/struct_/accessor.py +39 -0
maxframe/dataframe/accessors/struct_/core.py +43 -0
maxframe/dataframe/accessors/struct_/dtypes.py +53 -0
maxframe/dataframe/accessors/struct_/field.py +123 -0
maxframe/dataframe/accessors/struct_/tests/__init__.py +13 -0
maxframe/dataframe/accessors/struct_/tests/test_struct_accessor.py +91 -0
maxframe/dataframe/arithmetic/__init__.py +14 -4
maxframe/dataframe/arithmetic/between.py +106 -0
maxframe/dataframe/arithmetic/dot.py +237 -0
maxframe/dataframe/arithmetic/{around.py → round.py} +11 -7
maxframe/dataframe/core.py +63 -118
maxframe/dataframe/datasource/__init__.py +18 -0
maxframe/dataframe/datasource/from_dict.py +124 -0
maxframe/dataframe/datasource/from_index.py +1 -1
maxframe/dataframe/datasource/from_records.py +77 -0
maxframe/dataframe/datasource/from_tensor.py +109 -41
maxframe/dataframe/datasource/read_csv.py +2 -3
maxframe/dataframe/datasource/tests/test_datasource.py +37 -0
maxframe/dataframe/datastore/__init__.py +5 -1
maxframe/dataframe/datastore/to_csv.py +29 -41
maxframe/dataframe/datastore/to_odps.py +30 -4
maxframe/dataframe/extensions/__init__.py +20 -4
maxframe/dataframe/extensions/apply_chunk.py +32 -6
maxframe/dataframe/extensions/cartesian_chunk.py +153 -0
maxframe/dataframe/extensions/collect_kv.py +126 -0
maxframe/dataframe/extensions/extract_kv.py +177 -0
maxframe/dataframe/extensions/map_reduce.py +263 -0
maxframe/dataframe/extensions/rebalance.py +62 -0
maxframe/dataframe/extensions/tests/test_apply_chunk.py +9 -2
maxframe/dataframe/extensions/tests/test_extensions.py +54 -0
maxframe/dataframe/extensions/tests/test_map_reduce.py +135 -0
maxframe/dataframe/groupby/__init__.py +12 -1
maxframe/dataframe/groupby/aggregation.py +78 -45
maxframe/dataframe/groupby/apply.py +1 -1
maxframe/dataframe/groupby/apply_chunk.py +18 -2
maxframe/dataframe/groupby/core.py +96 -12
maxframe/dataframe/groupby/cum.py +4 -25
maxframe/dataframe/groupby/expanding.py +264 -0
maxframe/dataframe/groupby/fill.py +1 -1
maxframe/dataframe/groupby/getitem.py +12 -5
maxframe/dataframe/groupby/head.py +11 -1
maxframe/dataframe/groupby/rank.py +136 -0
maxframe/dataframe/groupby/rolling.py +206 -0
maxframe/dataframe/groupby/shift.py +114 -0
maxframe/dataframe/groupby/tests/test_groupby.py +0 -5
maxframe/dataframe/indexing/__init__.py +20 -1
maxframe/dataframe/indexing/droplevel.py +195 -0
maxframe/dataframe/indexing/filter.py +169 -0
maxframe/dataframe/indexing/get_level_values.py +76 -0
maxframe/dataframe/indexing/iat.py +45 -0
maxframe/dataframe/indexing/iloc.py +152 -12
maxframe/dataframe/indexing/insert.py +1 -1
maxframe/dataframe/indexing/loc.py +287 -7
maxframe/dataframe/indexing/reindex.py +14 -5
maxframe/dataframe/indexing/rename.py +6 -0
maxframe/dataframe/indexing/rename_axis.py +2 -2
maxframe/dataframe/indexing/reorder_levels.py +143 -0
maxframe/dataframe/indexing/reset_index.py +33 -6
maxframe/dataframe/indexing/sample.py +8 -0
maxframe/dataframe/indexing/setitem.py +3 -3
maxframe/dataframe/indexing/swaplevel.py +185 -0
maxframe/dataframe/indexing/take.py +99 -0
maxframe/dataframe/indexing/truncate.py +140 -0
maxframe/dataframe/indexing/where.py +0 -11
maxframe/dataframe/indexing/xs.py +148 -0
maxframe/dataframe/merge/__init__.py +12 -1
maxframe/dataframe/merge/append.py +97 -98
maxframe/dataframe/merge/combine_first.py +120 -0
maxframe/dataframe/merge/compare.py +387 -0
maxframe/dataframe/merge/concat.py +183 -0
maxframe/dataframe/merge/update.py +271 -0
maxframe/dataframe/misc/__init__.py +16 -10
maxframe/dataframe/misc/_duplicate.py +10 -4
maxframe/dataframe/misc/apply.py +1 -1
maxframe/dataframe/misc/check_unique.py +51 -0
maxframe/dataframe/misc/clip.py +145 -0
maxframe/dataframe/misc/describe.py +175 -9
maxframe/dataframe/misc/drop_duplicates.py +2 -2
maxframe/dataframe/misc/duplicated.py +2 -2
maxframe/dataframe/misc/get_dummies.py +5 -1
maxframe/dataframe/misc/isin.py +2 -2
maxframe/dataframe/misc/map.py +94 -0
maxframe/dataframe/misc/tests/test_misc.py +13 -2
maxframe/dataframe/misc/to_numeric.py +3 -0
maxframe/dataframe/misc/transform.py +12 -5
maxframe/dataframe/misc/transpose.py +13 -1
maxframe/dataframe/misc/valid_index.py +115 -0
maxframe/dataframe/misc/value_counts.py +38 -4
maxframe/dataframe/missing/checkna.py +13 -6
maxframe/dataframe/missing/dropna.py +5 -0
maxframe/dataframe/missing/fillna.py +1 -1
maxframe/dataframe/missing/replace.py +7 -4
maxframe/dataframe/reduction/__init__.py +29 -15
maxframe/dataframe/reduction/aggregation.py +38 -9
maxframe/dataframe/reduction/all.py +2 -2
maxframe/dataframe/reduction/any.py +2 -2
maxframe/dataframe/reduction/argmax.py +100 -0
maxframe/dataframe/reduction/argmin.py +100 -0
maxframe/dataframe/reduction/core.py +65 -18
maxframe/dataframe/reduction/count.py +13 -9
maxframe/dataframe/reduction/cov.py +166 -0
maxframe/dataframe/reduction/cummax.py +2 -2
maxframe/dataframe/reduction/cummin.py +2 -2
maxframe/dataframe/reduction/cumprod.py +2 -2
maxframe/dataframe/reduction/cumsum.py +2 -2
maxframe/dataframe/reduction/custom_reduction.py +2 -2
maxframe/dataframe/reduction/idxmax.py +185 -0
maxframe/dataframe/reduction/idxmin.py +185 -0
maxframe/dataframe/reduction/kurtosis.py +37 -30
maxframe/dataframe/reduction/max.py +2 -2
maxframe/dataframe/reduction/mean.py +9 -7
maxframe/dataframe/reduction/median.py +2 -2
maxframe/dataframe/reduction/min.py +2 -2
maxframe/dataframe/reduction/nunique.py +9 -8
maxframe/dataframe/reduction/prod.py +18 -13
maxframe/dataframe/reduction/reduction_size.py +2 -2
maxframe/dataframe/reduction/sem.py +13 -9
maxframe/dataframe/reduction/skew.py +31 -27
maxframe/dataframe/reduction/str_concat.py +10 -7
maxframe/dataframe/reduction/sum.py +18 -14
maxframe/dataframe/reduction/unique.py +20 -3
maxframe/dataframe/reduction/var.py +16 -12
maxframe/dataframe/reshape/__init__.py +38 -0
maxframe/dataframe/{misc → reshape}/pivot.py +1 -0
maxframe/dataframe/{misc → reshape}/pivot_table.py +1 -0
maxframe/dataframe/reshape/unstack.py +114 -0
maxframe/dataframe/sort/__init__.py +8 -0
maxframe/dataframe/sort/argsort.py +62 -0
maxframe/dataframe/sort/core.py +1 -0
maxframe/dataframe/sort/nlargest.py +238 -0
maxframe/dataframe/sort/nsmallest.py +228 -0
maxframe/dataframe/statistics/__init__.py +3 -3
maxframe/dataframe/statistics/corr.py +1 -0
maxframe/dataframe/statistics/quantile.py +2 -2
maxframe/dataframe/tests/test_typing.py +104 -0
maxframe/dataframe/tests/test_utils.py +66 -2
maxframe/dataframe/typing_.py +185 -0
maxframe/dataframe/utils.py +95 -26
maxframe/dataframe/window/aggregation.py +8 -4
maxframe/dataframe/window/core.py +14 -1
maxframe/dataframe/window/ewm.py +1 -3
maxframe/dataframe/window/expanding.py +37 -35
maxframe/dataframe/window/rolling.py +49 -39
maxframe/dataframe/window/tests/test_expanding.py +1 -7
maxframe/dataframe/window/tests/test_rolling.py +1 -1
maxframe/env.py +7 -4
maxframe/errors.py +2 -2
maxframe/io/odpsio/schema.py +9 -3
maxframe/io/odpsio/tableio.py +7 -2
maxframe/io/odpsio/tests/test_schema.py +198 -83
maxframe/learn/__init__.py +10 -2
maxframe/learn/cluster/__init__.py +15 -0
maxframe/learn/cluster/_kmeans.py +782 -0
maxframe/learn/contrib/llm/core.py +2 -0
maxframe/learn/contrib/xgboost/core.py +86 -1
maxframe/learn/contrib/xgboost/train.py +5 -2
maxframe/learn/core.py +66 -0
maxframe/learn/linear_model/_base.py +58 -1
maxframe/learn/linear_model/_lin_reg.py +1 -1
maxframe/learn/metrics/__init__.py +6 -0
maxframe/learn/metrics/_classification.py +145 -0
maxframe/learn/metrics/_ranking.py +477 -0
maxframe/learn/metrics/_scorer.py +60 -0
maxframe/learn/metrics/pairwise/__init__.py +21 -0
maxframe/learn/metrics/pairwise/core.py +77 -0
maxframe/learn/metrics/pairwise/cosine.py +115 -0
maxframe/learn/metrics/pairwise/euclidean.py +176 -0
maxframe/learn/metrics/pairwise/haversine.py +96 -0
maxframe/learn/metrics/pairwise/manhattan.py +80 -0
maxframe/learn/metrics/pairwise/pairwise.py +127 -0
maxframe/learn/metrics/pairwise/pairwise_distances_topk.py +121 -0
maxframe/learn/metrics/pairwise/rbf_kernel.py +51 -0
maxframe/learn/metrics/tests/__init__.py +13 -0
maxframe/learn/metrics/tests/test_scorer.py +26 -0
maxframe/learn/utils/__init__.py +1 -1
maxframe/learn/utils/checks.py +1 -2
maxframe/learn/utils/core.py +59 -0
maxframe/learn/utils/extmath.py +37 -0
maxframe/learn/utils/odpsio.py +193 -0
maxframe/learn/utils/validation.py +2 -2
maxframe/lib/compat.py +40 -0
maxframe/lib/dtypes_extension/__init__.py +16 -1
maxframe/lib/dtypes_extension/_fake_arrow_dtype.py +604 -0
maxframe/lib/dtypes_extension/blob.py +304 -0
maxframe/lib/dtypes_extension/dtypes.py +40 -0
maxframe/lib/dtypes_extension/tests/test_blob.py +88 -0
maxframe/lib/dtypes_extension/tests/test_dtypes.py +16 -1
maxframe/lib/dtypes_extension/tests/test_fake_arrow_dtype.py +75 -0
maxframe/lib/filesystem/_oss_lib/common.py +122 -50
maxframe/lib/filesystem/_oss_lib/glob.py +1 -1
maxframe/lib/filesystem/_oss_lib/handle.py +21 -25
maxframe/lib/filesystem/base.py +1 -1
maxframe/lib/filesystem/core.py +1 -1
maxframe/lib/filesystem/oss.py +115 -46
maxframe/lib/filesystem/tests/test_oss.py +74 -36
maxframe/lib/mmh3.cp38-win_amd64.pyd +0 -0
maxframe/lib/wrapped_pickle.py +10 -0
maxframe/opcodes.py +33 -15
maxframe/protocol.py +12 -0
maxframe/serialization/__init__.py +11 -2
maxframe/serialization/arrow.py +38 -13
maxframe/serialization/blob.py +32 -0
maxframe/serialization/core.cp38-win_amd64.pyd +0 -0
maxframe/serialization/core.pyx +39 -1
maxframe/serialization/exception.py +2 -4
maxframe/serialization/numpy.py +11 -0
maxframe/serialization/pandas.py +46 -9
maxframe/serialization/serializables/core.py +2 -2
maxframe/serialization/tests/test_serial.py +29 -2
maxframe/tensor/__init__.py +38 -8
maxframe/tensor/arithmetic/__init__.py +19 -10
maxframe/tensor/arithmetic/iscomplexobj.py +53 -0
maxframe/tensor/arithmetic/tests/test_arithmetic.py +6 -0
maxframe/tensor/core.py +3 -2
maxframe/tensor/datasource/tests/test_datasource.py +2 -1
maxframe/tensor/extensions/__init__.py +2 -0
maxframe/tensor/extensions/apply_chunk.py +3 -3
maxframe/tensor/extensions/rebalance.py +65 -0
maxframe/tensor/fft/__init__.py +32 -0
maxframe/tensor/fft/core.py +168 -0
maxframe/tensor/fft/fft.py +112 -0
maxframe/tensor/fft/fft2.py +118 -0
maxframe/tensor/fft/fftfreq.py +80 -0
maxframe/tensor/fft/fftn.py +123 -0
maxframe/tensor/fft/fftshift.py +79 -0
maxframe/tensor/fft/hfft.py +112 -0
maxframe/tensor/fft/ifft.py +114 -0
maxframe/tensor/fft/ifft2.py +115 -0
maxframe/tensor/fft/ifftn.py +123 -0
maxframe/tensor/fft/ifftshift.py +73 -0
maxframe/tensor/fft/ihfft.py +93 -0
maxframe/tensor/fft/irfft.py +118 -0
maxframe/tensor/fft/irfft2.py +62 -0
maxframe/tensor/fft/irfftn.py +114 -0
maxframe/tensor/fft/rfft.py +116 -0
maxframe/tensor/fft/rfft2.py +63 -0
maxframe/tensor/fft/rfftfreq.py +87 -0
maxframe/tensor/fft/rfftn.py +113 -0
maxframe/tensor/indexing/fill_diagonal.py +1 -7
maxframe/tensor/linalg/__init__.py +7 -0
maxframe/tensor/linalg/_einsumfunc.py +1025 -0
maxframe/tensor/linalg/cholesky.py +117 -0
maxframe/tensor/linalg/einsum.py +339 -0
maxframe/tensor/linalg/lstsq.py +100 -0
maxframe/tensor/linalg/matrix_norm.py +75 -0
maxframe/tensor/linalg/norm.py +249 -0
maxframe/tensor/linalg/solve.py +72 -0
maxframe/tensor/linalg/solve_triangular.py +2 -2
maxframe/tensor/linalg/vector_norm.py +113 -0
maxframe/tensor/misc/__init__.py +24 -1
maxframe/tensor/misc/argwhere.py +72 -0
maxframe/tensor/misc/array_split.py +46 -0
maxframe/tensor/misc/broadcast_arrays.py +57 -0
maxframe/tensor/misc/copyto.py +130 -0
maxframe/tensor/misc/delete.py +104 -0
maxframe/tensor/misc/dsplit.py +68 -0
maxframe/tensor/misc/ediff1d.py +74 -0
maxframe/tensor/misc/expand_dims.py +85 -0
maxframe/tensor/misc/flip.py +90 -0
maxframe/tensor/misc/fliplr.py +64 -0
maxframe/tensor/misc/flipud.py +68 -0
maxframe/tensor/misc/hsplit.py +85 -0
maxframe/tensor/misc/insert.py +139 -0
maxframe/tensor/misc/moveaxis.py +83 -0
maxframe/tensor/misc/result_type.py +88 -0
maxframe/tensor/misc/roll.py +124 -0
maxframe/tensor/misc/rollaxis.py +77 -0
maxframe/tensor/misc/shape.py +89 -0
maxframe/tensor/misc/split.py +190 -0
maxframe/tensor/misc/tile.py +109 -0
maxframe/tensor/misc/vsplit.py +74 -0
maxframe/tensor/reduction/array_equal.py +2 -1
maxframe/tensor/sort/__init__.py +2 -0
maxframe/tensor/sort/argpartition.py +98 -0
maxframe/tensor/sort/partition.py +228 -0
maxframe/tensor/spatial/__init__.py +15 -0
maxframe/tensor/spatial/distance/__init__.py +17 -0
maxframe/tensor/spatial/distance/cdist.py +421 -0
maxframe/tensor/spatial/distance/pdist.py +398 -0
maxframe/tensor/spatial/distance/squareform.py +153 -0
maxframe/tensor/special/__init__.py +159 -21
maxframe/tensor/special/airy.py +55 -0
maxframe/tensor/special/bessel.py +199 -0
maxframe/tensor/special/core.py +65 -4
maxframe/tensor/special/ellip_func_integrals.py +155 -0
maxframe/tensor/special/ellip_harm.py +55 -0
maxframe/tensor/special/err_fresnel.py +223 -0
maxframe/tensor/special/gamma_funcs.py +303 -0
maxframe/tensor/special/hypergeometric_funcs.py +69 -0
maxframe/tensor/special/info_theory.py +189 -0
maxframe/tensor/special/misc.py +21 -0
maxframe/tensor/statistics/__init__.py +6 -0
maxframe/tensor/statistics/corrcoef.py +77 -0
maxframe/tensor/statistics/cov.py +222 -0
maxframe/tensor/statistics/digitize.py +126 -0
maxframe/tensor/statistics/histogram.py +520 -0
maxframe/tensor/statistics/median.py +85 -0
maxframe/tensor/statistics/ptp.py +89 -0
maxframe/tensor/utils.py +3 -3
maxframe/tests/test_utils.py +43 -1
maxframe/tests/utils.py +0 -2
maxframe/typing_.py +2 -0
maxframe/udf.py +27 -2
maxframe/utils.py +193 -19
{maxframe-2.0.0b2.dist-info → maxframe-2.2.0.dist-info}/METADATA +3 -2
{maxframe-2.0.0b2.dist-info → maxframe-2.2.0.dist-info}/RECORD +391 -236
maxframe_client/fetcher.py +35 -4
maxframe_client/session/odps.py +7 -2
maxframe_client/tests/test_fetcher.py +76 -3
maxframe_client/tests/test_session.py +4 -1
/maxframe/dataframe/{misc → reshape}/melt.py +0 -0
/maxframe/dataframe/{misc → reshape}/stack.py +0 -0
{maxframe-2.0.0b2.dist-info → maxframe-2.2.0.dist-info}/WHEEL +0 -0
{maxframe-2.0.0b2.dist-info → maxframe-2.2.0.dist-info}/top_level.txt +0 -0

maxframe/dataframe/reduction/core.py CHANGED Viewed

@@ -26,7 +26,9 @@ from ...serialization.serializables import (
     AnyField,
     BoolField,
     DataTypeField,
+    DictField,
     Int32Field,
+    Serializable,
     StringField,
 )
 from ...typing_ import TileableType
@@ -48,8 +50,12 @@ _level_reduction_keep_object = pd_release_version[:2] < (1, 3)
 # results in object.
 _reduce_bool_as_object = pd_release_version[:2] != (1, 2)
+_idx_reduction_without_numeric_only = pd_release_version[:2] < (1, 5)
+class DataFrameReduction(DataFrameOperator):
+    _legacy_name = "DataFrameReductionOperator"  # since v2.2.0
-class DataFrameReductionOperator(DataFrameOperator):
     axis = AnyField("axis", default=None)
     skipna = BoolField("skipna", default=True)
     level = AnyField("level", default=None)
@@ -59,8 +65,13 @@ class DataFrameReductionOperator(DataFrameOperator):
     method = StringField("method", default=None)
     dtype = DataTypeField("dtype", default=None)
+    combine_size = Int32Field("combine_size", default=None)
+    use_inf_as_na = BoolField("use_inf_as_na", default=None)
     def __init__(self, gpu=None, sparse=None, output_types=None, **kw):
+        kw["use_inf_as_na"] = kw.pop(
+            "use_inf_as_na", pd.get_option("mode.use_inf_as_na")
+        )
         super().__init__(gpu=gpu, sparse=sparse, _output_types=output_types, **kw)
     @property
@@ -78,23 +89,28 @@ class DataFrameReductionOperator(DataFrameOperator):
         return {k: v for k, v in args.items() if v is not None}
-class DataFrameCumReductionOperator(DataFrameOperator):
+# Keep for import compatibility
+DataFrameReductionOperator = DataFrameReduction
+class DataFrameCumReduction(DataFrameOperator):
+    _legacy_name = "DataFrameCumReductionOperator"  # since v2.2.0
     axis = AnyField("axis", default=None)
     skipna = BoolField("skipna", default=None)
     dtype = DataTypeField("dtype", default=None)
+    use_inf_as_na = BoolField("use_inf_as_na", default=None)
     def __init__(self, gpu=None, sparse=None, output_types=None, **kw):
+        kw["use_inf_as_na"] = kw.pop(
+            "use_inf_as_na", pd.get_option("mode.use_inf_as_na")
+        )
         super().__init__(gpu=gpu, sparse=sparse, _output_types=output_types, **kw)
-def _default_agg_fun(value, func_name=None, **kw):
-    if value.ndim == 1:
-        kw.pop("bool_only", None)
-        kw.pop("numeric_only", None)
-        return getattr(value, func_name)(**kw)
-    else:
-        return getattr(value, func_name)(**kw)
+# Keep for import compatibility
+DataFrameCumReductionOperator = DataFrameCumReduction
 @functools.lru_cache(100)
@@ -117,6 +133,8 @@ def _get_series_reduction_dtype(
         reduced = test_series.size
     elif func_name == "str_concat":
         reduced = pd.Series([test_series.str.cat()])
+    elif func_name in ("idxmin", "idxmax", "argmin", "argmax"):
+        reduced = getattr(test_series, func_name)(axis=axis, skipna=skipna)
     else:
         reduced = getattr(test_series, func_name)(
             axis=axis, skipna=skipna, numeric_only=numeric_only
@@ -135,6 +153,8 @@ def _get_df_reduction_dtype(
         reduced = getattr(test_df, func_name)(axis=axis)
     elif func_name in ("all", "any"):
         reduced = getattr(test_df, func_name)(axis=axis, bool_only=bool_only)
+    elif _idx_reduction_without_numeric_only and func_name in ("idxmin", "idxmax"):
+        reduced = getattr(test_df, func_name)(axis=axis, skipna=skipna)
     elif func_name == "str_concat":
         reduced = test_df.apply(lambda s: s.str.cat(), axis=axis)
     else:
@@ -146,6 +166,27 @@ def _get_df_reduction_dtype(
     return reduced.dtype
+class ReductionCallable(Serializable):
+    """
+    Serializable callable that applies a named reduction method to a value.
+    Calling an instance looks up ``func_name`` on the given value and invokes
+    it with the stored keyword arguments. For one-dimensional values the
+    ``bool_only`` and ``numeric_only`` arguments are dropped before the call.
+    """
+    # name of the method to look up on the value, e.g. "sum"
+    func_name = StringField("func_name")
+    # keyword arguments forwarded to the method; may be None when not given
+    kwargs = DictField("kwargs", default=None)
+    # NOTE(review): this is a plain method, so ``obj.__name__`` yields a bound
+    # method rather than the string -- confirm whether a property was intended.
+    def __name__(self):
+        return self.func_name
+    def __call__(self, value):
+        # ``kwargs`` defaults to None; fall back to an empty dict instead of
+        # failing on ``None.copy()``. A copy is taken so that popping keys
+        # below never mutates the stored field.
+        kw = dict(self.kwargs or {})
+        if value.ndim == 1:
+            kw.pop("bool_only", None)
+            kw.pop("numeric_only", None)
+        return getattr(value, self.func_name)(**kw)
+    def __maxframe_tokenize__(self):
+        # make sure compiled functions are correctly cached
+        return type(self), self.func_name, self.kwargs
 class DataFrameReductionMixin(DataFrameOperatorMixin):
     @classmethod
     def get_reduction_callable(cls, op):
@@ -154,9 +195,7 @@ class DataFrameReductionMixin(DataFrameOperatorMixin):
             skipna=op.skipna, numeric_only=op.numeric_only, bool_only=op.bool_only
         )
         kw = {k: v for k, v in kw.items() if v is not None}
-        fun = functools.partial(_default_agg_fun, func_name=func_name, **kw)
-        fun.__name__ = func_name
-        return fun
+        return ReductionCallable(func_name=func_name, kwargs=kw)
     def _call_groupby_level(self, df, level):
         return df.groupby(level=level).agg(
@@ -426,6 +465,8 @@ _func_name_converts = dict(
     true_divide="truediv",
     floor_divide="floordiv",
     power="pow",
+    subtract="sub",
+    multiply="mul",
 )
 _func_compile_cache = dict()  # type: Dict[str, ReductionSteps]
@@ -442,8 +483,8 @@ _idl_primitive_types = (
 IN_VAR_IDL_OP = "in_var"
 OUT_VAR_IDL_OP = "out_var"
-MASK_VAR_OP = "mask"
-WHERE_VAR_OP = "where"
+MASK_VAR_IDL_OP = "mask"
+WHERE_VAR_IDL_OP = "where"
 LET_VAR_OP = "let"
 UNARY_IDL_OP_PREFIX = "unary:"
 BINARY_IDL_OP_PREFIX = "bin:"
@@ -471,7 +512,7 @@ class ReductionCompiler:
     def _check_function_valid(cls, func):
         if isinstance(func, functools.partial):
             return cls._check_function_valid(func.func)
-        elif isinstance(func, CustomReduction):
+        elif isinstance(func, (CustomReduction, ReductionCallable)):
             return
         func_code = func.__code__
@@ -569,6 +610,7 @@ class ReductionCompiler:
         from ..datasource.dataframe import DataFrameDataSource
         from ..datasource.series import SeriesDataSource
         from ..indexing.where import DataFrameWhere
+        from .custom_reduction import DataFrameCustomReduction
         func_token = tokenize(func, self._axis, func_name, ndim)
         if func_token in _func_compile_cache:
@@ -639,6 +681,9 @@ class ReductionCompiler:
             else:
                 map_func_name, agg_func_name = step_func_name, step_func_name
+            if isinstance(t.op, DataFrameCustomReduction):
+                custom_reduction = custom_reduction or t.op.custom_reduction
             # build agg description
             agg_funcs.append(
                 ReductionAggStep(
@@ -705,7 +750,7 @@ class ReductionCompiler:
         input_op_types = (
             DataFrameDataSource,
             SeriesDataSource,
-            DataFrameReductionOperator,
+            DataFrameReduction,
         )
         def _gen_expr_str(t):
@@ -776,9 +821,11 @@ class ReductionCompiler:
                     cond = _interpret_var(t.op.condition)
                     x = _interpret_var(t.op.x)
                     y = _interpret_var(t.op.y)
-                    statements = [[WHERE_VAR_OP, var_name, [cond, x, y], {}]]
+                    statements = [[WHERE_VAR_IDL_OP, var_name, [cond, x, y], {}]]
                 elif isinstance(t.op, DataFrameWhere):
-                    func_name = MASK_VAR_OP if t.op.replace_true else WHERE_VAR_OP
+                    func_name = (
+                        MASK_VAR_IDL_OP if t.op.replace_true else WHERE_VAR_IDL_OP
+                    )
                     inp = _interpret_var(t.op.input)
                     cond = _interpret_var(t.op.cond)
                     other = _interpret_var(t.op.other)

maxframe/dataframe/reduction/count.py CHANGED Viewed

@@ -14,10 +14,18 @@
 from ... import opcodes
 from ...core import OutputType
-from .core import DataFrameReductionMixin, DataFrameReductionOperator
+from .core import DataFrameReduction, DataFrameReductionMixin, ReductionCallable
-class DataFrameCount(DataFrameReductionOperator, DataFrameReductionMixin):
+class CountReductionCallable(ReductionCallable):
+    """
+    Reduction callable for ``count``.
+    One-dimensional values are counted without extra arguments; any other
+    value receives the stored ``skipna`` and ``numeric_only`` arguments.
+    """
+    def __call__(self, value):
+        # both keys are read up front, so a missing key fails for any input
+        skipna = self.kwargs["skipna"]
+        numeric_only = self.kwargs["numeric_only"]
+        if value.ndim != 1:
+            return value.count(skipna=skipna, numeric_only=numeric_only)
+        return value.count()
+class DataFrameCount(DataFrameReduction, DataFrameReductionMixin):
     _op_type_ = opcodes.COUNT
     _func_name = "count"
@@ -28,13 +36,9 @@ class DataFrameCount(DataFrameReductionOperator, DataFrameReductionMixin):
     @classmethod
     def get_reduction_callable(cls, op):
         skipna, numeric_only = op.skipna, op.numeric_only
-        def count(value):
-            if value.ndim == 1:
-                return value.count()
-            return value.count(skipna=skipna, numeric_only=numeric_only)
-        return count
+        return CountReductionCallable(
+            func_name="count", kwargs={"skipna": skipna, "numeric_only": numeric_only}
+        )
 def count_series(series, level=None, **kw):

maxframe/dataframe/reduction/cov.py ADDED Viewed

@@ -0,0 +1,166 @@
+# Copyright 1999-2025 Alibaba Group Holding Ltd.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+def cov_dataframe(df, min_periods=None, ddof=1, numeric_only=True):
+    """
+    Compute pairwise covariance of columns, excluding NA/null values.
+    Compute the pairwise covariance among the series of a DataFrame.
+    The returned data frame is the `covariance matrix
+    <https://en.wikipedia.org/wiki/Covariance_matrix>`__ of the columns
+    of the DataFrame.
+    Both NA and null values are automatically excluded from the
+    calculation. (See the note below about bias from missing values.)
+    A threshold can be set for the minimum number of
+    observations for each value created. Comparisons with observations
+    below this threshold will be returned as ``NaN``.
+    This method is generally used for the analysis of time series data to
+    understand the relationship between different measures
+    across time.
+    Parameters
+    ----------
+    min_periods : int, optional
+        Minimum number of observations required per pair of columns
+        to have a valid result.
+    ddof : int, default 1
+        Delta degrees of freedom.  The divisor used in calculations
+        is ``N - ddof``, where ``N`` represents the number of elements.
+        This argument is applicable only when no ``nan`` is in the dataframe.
+    numeric_only : bool, default True
+        Include only `float`, `int` or `boolean` data. Only ``True`` is
+        currently supported.
+    Returns
+    -------
+    DataFrame
+        The covariance matrix of the series of the DataFrame.
+    Raises
+    ------
+    NotImplementedError
+        If ``numeric_only`` is falsy.
+    See Also
+    --------
+    Series.cov : Compute covariance with another Series.
+    core.window.ewm.ExponentialMovingWindow.cov : Exponential weighted sample
+        covariance.
+    core.window.expanding.Expanding.cov : Expanding sample covariance.
+    core.window.rolling.Rolling.cov : Rolling sample covariance.
+    Notes
+    -----
+    Returns the covariance matrix of the DataFrame's time series.
+    The covariance is normalized by N-ddof.
+    For DataFrames that have Series that are missing data (assuming that
+    data is `missing at random
+    <https://en.wikipedia.org/wiki/Missing_data#Missing_at_random>`__)
+    the returned covariance matrix will be an unbiased estimate
+    of the variance and covariance between the member Series.
+    However, for many applications this estimate may not be acceptable
+    because the estimate covariance matrix is not guaranteed to be positive
+    semi-definite. This could lead to estimate correlations having
+    absolute values which are greater than one, and/or a non-invertible
+    covariance matrix. See `Estimation of covariance matrices
+    <https://en.wikipedia.org/w/index.php?title=Estimation_of_covariance_
+    matrices>`__ for more details.
+    Examples
+    --------
+    >>> import maxframe.tensor as mt
+    >>> import maxframe.dataframe as md
+    >>> df = md.DataFrame([(1, 2), (0, 3), (2, 0), (1, 1)],
+    ...                   columns=['dogs', 'cats'])
+    >>> df.cov().execute()
+              dogs      cats
+    dogs  0.666667 -1.000000
+    cats -1.000000  1.666667
+    >>> mt.random.seed(42)
+    >>> df = md.DataFrame(mt.random.randn(1000, 5),
+    ...                   columns=['a', 'b', 'c', 'd', 'e'])
+    >>> df.cov().execute()
+              a         b         c         d         e
+    a  0.998438 -0.020161  0.059277 -0.008943  0.014144
+    b -0.020161  1.059352 -0.008543 -0.024738  0.009826
+    c  0.059277 -0.008543  1.010670 -0.001486 -0.000271
+    d -0.008943 -0.024738 -0.001486  0.921297 -0.013692
+    e  0.014144  0.009826 -0.000271 -0.013692  0.977795
+    **Minimum number of periods**
+    This method also supports an optional ``min_periods`` keyword
+    that specifies the required minimum number of non-NA observations for
+    each column pair in order to have a valid result:
+    >>> mt.random.seed(42)
+    >>> df = md.DataFrame(mt.random.randn(20, 3),
+    ...                   columns=['a', 'b', 'c'])
+    >>> df.loc[df.index[:5], 'a'] = mt.nan
+    >>> df.loc[df.index[5:10], 'b'] = mt.nan
+    >>> df.cov(min_periods=12).execute()
+              a         b         c
+    a  0.316741       NaN -0.150812
+    b       NaN  1.248003  0.191417
+    c -0.150812  0.191417  0.895202
+    """
+    # Reject the unsupported option before importing the operator; the
+    # message names the value that is actually unsupported (False).
+    if not numeric_only:
+        raise NotImplementedError("numeric_only==False not supported")
+    from ..statistics.corr import DataFrameCorr
+    # covariance reuses the correlation operator, selected by method="cov"
+    op = DataFrameCorr(method="cov", min_periods=min_periods, ddof=ddof)
+    return op(df)
+def cov_series(series, other, min_periods=None, ddof=1):
+    """
+    Compute covariance with Series, excluding missing values.
+    The two `Series` objects are not required to be the same length and
+    will be aligned internally before the covariance is calculated.
+    Parameters
+    ----------
+    other : Series
+        Series with which to compute the covariance.
+    min_periods : int, optional
+        Minimum number of observations needed to have a valid result.
+    ddof : int, default 1
+        Delta degrees of freedom.  The divisor used in calculations
+        is ``N - ddof``, where ``N`` represents the number of elements.
+    Returns
+    -------
+    float
+        Covariance between Series and other normalized by ``N - ddof``
+        (``N - 1``, the unbiased estimator, with the default ``ddof``).
+    See Also
+    --------
+    DataFrame.cov : Compute pairwise covariance of columns.
+    Examples
+    --------
+    >>> import maxframe.dataframe as md
+    >>> s1 = md.Series([0.90010907, 0.13484424, 0.62036035])
+    >>> s2 = md.Series([0.12528585, 0.26962463, 0.51111198])
+    >>> s1.cov(s2).execute()
+    -0.01685762652715874
+    """
+    from ..statistics.corr import DataFrameCorr
+    # covariance reuses the correlation operator, selected by method="cov",
+    # with the second series passed as ``other``
+    op = DataFrameCorr(other=other, method="cov", min_periods=min_periods, ddof=ddof)
+    return op(series)

maxframe/dataframe/reduction/cummax.py CHANGED Viewed

@@ -13,10 +13,10 @@
 # limitations under the License.
 from ... import opcodes
-from .core import DataFrameCumReductionMixin, DataFrameCumReductionOperator
+from .core import DataFrameCumReduction, DataFrameCumReductionMixin
-class DataFrameCummax(DataFrameCumReductionOperator, DataFrameCumReductionMixin):
+class DataFrameCummax(DataFrameCumReduction, DataFrameCumReductionMixin):
     _op_type_ = opcodes.CUMMAX
     _func_name = "cummax"

maxframe/dataframe/reduction/cummin.py CHANGED Viewed

@@ -13,10 +13,10 @@
 # limitations under the License.
 from ... import opcodes
-from .core import DataFrameCumReductionMixin, DataFrameCumReductionOperator
+from .core import DataFrameCumReduction, DataFrameCumReductionMixin
-class DataFrameCummin(DataFrameCumReductionOperator, DataFrameCumReductionMixin):
+class DataFrameCummin(DataFrameCumReduction, DataFrameCumReductionMixin):
     _op_type_ = opcodes.CUMMIN
     _func_name = "cummin"

maxframe/dataframe/reduction/cumprod.py CHANGED Viewed

@@ -13,10 +13,10 @@
 # limitations under the License.
 from ... import opcodes
-from .core import DataFrameCumReductionMixin, DataFrameCumReductionOperator
+from .core import DataFrameCumReduction, DataFrameCumReductionMixin
-class DataFrameCumprod(DataFrameCumReductionOperator, DataFrameCumReductionMixin):
+class DataFrameCumprod(DataFrameCumReduction, DataFrameCumReductionMixin):
     _op_type_ = opcodes.CUMPROD
     _func_name = "cumprod"

maxframe/dataframe/reduction/cumsum.py CHANGED Viewed

@@ -13,10 +13,10 @@
 # limitations under the License.
 from ... import opcodes
-from .core import DataFrameCumReductionMixin, DataFrameCumReductionOperator
+from .core import DataFrameCumReduction, DataFrameCumReductionMixin
-class DataFrameCumsum(DataFrameCumReductionOperator, DataFrameCumReductionMixin):
+class DataFrameCumsum(DataFrameCumReduction, DataFrameCumReductionMixin):
     _op_type_ = opcodes.CUMSUM
     _func_name = "cumsum"

maxframe/dataframe/reduction/custom_reduction.py CHANGED Viewed

@@ -15,10 +15,10 @@
 from ... import opcodes
 from ...core import OutputType
 from ...serialization.serializables import AnyField
-from .core import DataFrameReductionMixin, DataFrameReductionOperator
+from .core import DataFrameReduction, DataFrameReductionMixin
-class DataFrameCustomReduction(DataFrameReductionOperator, DataFrameReductionMixin):
+class DataFrameCustomReduction(DataFrameReduction, DataFrameReductionMixin):
     _op_type_ = opcodes.CUSTOM_REDUCTION
     _func_name = "custom_reduction"

maxframe/dataframe/reduction/idxmax.py ADDED Viewed

@@ -0,0 +1,185 @@
+# Copyright 1999-2025 Alibaba Group Holding Ltd.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+from ... import opcodes
+from ...core import OutputType
+from ..utils import validate_axis
+from .core import DataFrameReduction, DataFrameReductionMixin, ReductionCallable
+class DataFrameIdxMax(DataFrameReduction, DataFrameReductionMixin):
+    _op_type_ = opcodes.IDXMAX
+    _func_name = "idxmax"
+    @property
+    def is_atomic(self):
+        return True
+    def get_reduction_args(self, axis=None):
+        args = dict(skipna=self.skipna)
+        if self.inputs and self.inputs[0].ndim > 1:
+            args["axis"] = axis
+        return {k: v for k, v in args.items() if v is not None}
+    @classmethod
+    def get_reduction_callable(cls, op):
+        func_name = getattr(op, "_func_name")
+        kw = dict(skipna=op.skipna)
+        kw = {k: v for k, v in kw.items() if v is not None}
+        return ReductionCallable(func_name=func_name, kwargs=kw)
+def idxmax_dataframe(df, axis=0, skipna=True):
+    """
+    Return index of first occurrence of maximum over requested axis.
+    NA/null values are excluded.
+    Parameters
+    ----------
+    axis : {0 or 'index', 1 or 'columns'}, default 0
+        The axis to use. 0 or 'index' for row-wise, 1 or 'columns' for column-wise.
+    skipna : bool, default True
+        Exclude NA/null values. If an entire row/column is NA, the result
+        will be NA.
+    Returns
+    -------
+    Series
+        Indexes of maxima along the specified axis.
+    Raises
+    ------
+    ValueError
+        * If the row/column is empty
+    See Also
+    --------
+    Series.idxmax : Return index of the maximum element.
+    Notes
+    -----
+    This method is the DataFrame version of ``ndarray.argmax``.
+    Examples
+    --------
+    Consider a dataset containing food consumption in Argentina.
+    >>> import maxframe.dataframe as md
+    >>> df = md.DataFrame({'consumption': [10.51, 103.11, 55.48],
+    ...                    'co2_emissions': [37.2, 19.66, 1712]},
+    ...                    index=['Pork', 'Wheat Products', 'Beef'])
+    >>> df.execute()
+                    consumption  co2_emissions
+    Pork                  10.51         37.20
+    Wheat Products       103.11         19.66
+    Beef                  55.48       1712.00
+    By default, it returns the index for the maximum value in each column.
+    >>> df.idxmax().execute()
+    consumption     Wheat Products
+    co2_emissions             Beef
+    dtype: object
+    To return the index for the maximum value in each row, use ``axis="columns"``.
+    >>> df.idxmax(axis="columns").execute()
+    Pork              co2_emissions
+    Wheat Products     consumption
+    Beef              co2_emissions
+    dtype: object
+    """
+    axis = validate_axis(axis, df)
+    op = DataFrameIdxMax(
+        axis=axis,
+        skipna=skipna,
+        output_types=[OutputType.series],
+    )
+    return op(df)
+def idxmax_series(series, axis=0, skipna=True):
+    """
+    Return the row label of the maximum value.
+    If multiple values equal the maximum, the first row label with that
+    value is returned.
+    Parameters
+    ----------
+    axis : int, default 0
+        For compatibility with DataFrame.idxmax. Redundant for application
+        on Series.
+    skipna : bool, default True
+        Exclude NA/null values. If the entire Series is NA, the result
+        will be NA.
+    *args, **kwargs
+        Additional arguments and keywords have no effect but might be
+        accepted for compatibility with NumPy.
+    Returns
+    -------
+    Index
+        Label of the maximum value.
+    Raises
+    ------
+    ValueError
+        If the Series is empty.
+    See Also
+    --------
+    numpy.argmax : Return indices of the maximum values
+        along the given axis.
+    DataFrame.idxmax : Return index of first occurrence of maximum
+        over requested axis.
+    Series.idxmin : Return index *label* of the first occurrence
+        of minimum of values.
+    Notes
+    -----
+    This method is the Series version of ``ndarray.argmax``. This method
+    returns the label of the maximum, while ``ndarray.argmax`` returns
+    the position. To get the position, use ``series.values.argmax()``.
+    Examples
+    --------
+    >>> import maxframe.dataframe as md
+    >>> s = md.Series(data=[1, None, 4, 3, 4],
+    ...               index=['A', 'B', 'C', 'D', 'E'])
+    >>> s.execute()
+    A    1.0
+    B    NaN
+    C    4.0
+    D    3.0
+    E    4.0
+    dtype: float64
+    >>> s.idxmax().execute()
+    'C'
+    If `skipna` is False and there is an NA value in the data,
+    the function returns ``nan``.
+    >>> s.idxmax(skipna=False).execute()
+    nan
+    """
+    validate_axis(axis, series)
+    op = DataFrameIdxMax(
+        dropna=skipna,
+        output_types=[OutputType.scalar],
+    )
+    return op(series)