PyPI - maxframe - Versions diffs - 2.0.0b2__cp311-cp311-win32.whl → 2.2.0__cp311-cp311-win32.whl - Mend

maxframe 2.0.0b2__cp311-cp311-win32.whl → 2.2.0__cp311-cp311-win32.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of maxframe might be problematic. Click here for more details.

Files changed (391) hide show

maxframe/__init__.py +1 -0
maxframe/_utils.cp311-win32.pyd +0 -0
maxframe/_utils.pyx +14 -1
maxframe/codegen/core.py +6 -6
maxframe/codegen/spe/core.py +1 -1
maxframe/codegen/spe/dataframe/__init__.py +1 -0
maxframe/codegen/spe/dataframe/accessors/base.py +18 -0
maxframe/codegen/spe/dataframe/accessors/dict_.py +25 -130
maxframe/codegen/spe/dataframe/accessors/list_.py +12 -48
maxframe/codegen/spe/dataframe/accessors/struct_.py +28 -0
maxframe/codegen/spe/dataframe/arithmetic.py +7 -2
maxframe/codegen/spe/dataframe/groupby.py +88 -0
maxframe/codegen/spe/dataframe/indexing.py +99 -4
maxframe/codegen/spe/dataframe/merge.py +34 -1
maxframe/codegen/spe/dataframe/misc.py +9 -33
maxframe/codegen/spe/dataframe/reduction.py +14 -9
maxframe/codegen/spe/dataframe/reshape.py +46 -0
maxframe/codegen/spe/dataframe/sort.py +30 -17
maxframe/codegen/spe/dataframe/tests/accessors/test_dict.py +9 -15
maxframe/codegen/spe/dataframe/tests/accessors/test_list.py +4 -7
maxframe/codegen/spe/dataframe/tests/accessors/test_struct.py +75 -0
maxframe/codegen/spe/dataframe/tests/indexing/test_iloc.py +20 -1
maxframe/codegen/spe/dataframe/tests/indexing/test_loc.py +35 -0
maxframe/codegen/spe/dataframe/tests/misc/test_misc.py +0 -32
maxframe/codegen/spe/dataframe/tests/test_groupby.py +81 -18
maxframe/codegen/spe/dataframe/tests/test_merge.py +27 -1
maxframe/codegen/spe/dataframe/tests/test_reshape.py +79 -0
maxframe/codegen/spe/dataframe/tests/test_sort.py +20 -0
maxframe/codegen/spe/learn/contrib/tests/test_xgboost.py +2 -1
maxframe/codegen/spe/learn/metrics/__init__.py +1 -1
maxframe/codegen/spe/learn/metrics/_ranking.py +76 -0
maxframe/codegen/spe/learn/metrics/pairwise.py +51 -0
maxframe/codegen/spe/learn/metrics/tests/test_pairwise.py +36 -0
maxframe/codegen/spe/learn/metrics/tests/test_ranking.py +59 -0
maxframe/codegen/spe/tensor/__init__.py +3 -0
maxframe/codegen/spe/tensor/fft.py +74 -0
maxframe/codegen/spe/tensor/linalg.py +29 -2
maxframe/codegen/spe/tensor/misc.py +79 -25
maxframe/codegen/spe/tensor/spatial.py +45 -0
maxframe/codegen/spe/tensor/statistics.py +44 -0
maxframe/codegen/spe/tensor/tests/test_fft.py +64 -0
maxframe/codegen/spe/tensor/tests/test_linalg.py +15 -1
maxframe/codegen/spe/tensor/tests/test_misc.py +52 -2
maxframe/codegen/spe/tensor/tests/test_spatial.py +33 -0
maxframe/codegen/spe/tensor/tests/test_statistics.py +15 -1
maxframe/codegen/spe/tests/test_spe_codegen.py +6 -12
maxframe/codegen/spe/utils.py +2 -0
maxframe/config/config.py +70 -9
maxframe/config/tests/test_validators.py +13 -1
maxframe/config/validators.py +49 -0
maxframe/conftest.py +44 -17
maxframe/core/accessor.py +2 -2
maxframe/core/entity/core.py +5 -0
maxframe/core/entity/tileables.py +1 -1
maxframe/core/graph/core.cp311-win32.pyd +0 -0
maxframe/core/graph/entity.py +1 -2
maxframe/core/operator/base.py +9 -2
maxframe/core/operator/core.py +10 -2
maxframe/core/operator/utils.py +13 -0
maxframe/dataframe/__init__.py +10 -3
maxframe/dataframe/accessors/__init__.py +1 -1
maxframe/dataframe/accessors/compat.py +45 -0
maxframe/dataframe/accessors/datetime_/__init__.py +4 -1
maxframe/dataframe/accessors/dict_/contains.py +7 -16
maxframe/dataframe/accessors/dict_/core.py +48 -0
maxframe/dataframe/accessors/dict_/getitem.py +17 -21
maxframe/dataframe/accessors/dict_/length.py +7 -16
maxframe/dataframe/accessors/dict_/remove.py +6 -18
maxframe/dataframe/accessors/dict_/setitem.py +8 -18
maxframe/dataframe/accessors/dict_/tests/test_dict_accessor.py +62 -22
maxframe/dataframe/accessors/list_/__init__.py +2 -2
maxframe/dataframe/accessors/list_/core.py +48 -0
maxframe/dataframe/accessors/list_/getitem.py +12 -19
maxframe/dataframe/accessors/list_/length.py +7 -16
maxframe/dataframe/accessors/list_/tests/test_list_accessor.py +11 -9
maxframe/dataframe/accessors/string_/__init__.py +4 -1
maxframe/dataframe/accessors/struct_/__init__.py +37 -0
maxframe/dataframe/accessors/struct_/accessor.py +39 -0
maxframe/dataframe/accessors/struct_/core.py +43 -0
maxframe/dataframe/accessors/struct_/dtypes.py +53 -0
maxframe/dataframe/accessors/struct_/field.py +123 -0
maxframe/dataframe/accessors/struct_/tests/__init__.py +13 -0
maxframe/dataframe/accessors/struct_/tests/test_struct_accessor.py +91 -0
maxframe/dataframe/arithmetic/__init__.py +14 -4
maxframe/dataframe/arithmetic/between.py +106 -0
maxframe/dataframe/arithmetic/dot.py +237 -0
maxframe/dataframe/arithmetic/{around.py → round.py} +11 -7
maxframe/dataframe/core.py +63 -118
maxframe/dataframe/datasource/__init__.py +18 -0
maxframe/dataframe/datasource/from_dict.py +124 -0
maxframe/dataframe/datasource/from_index.py +1 -1
maxframe/dataframe/datasource/from_records.py +77 -0
maxframe/dataframe/datasource/from_tensor.py +109 -41
maxframe/dataframe/datasource/read_csv.py +2 -3
maxframe/dataframe/datasource/tests/test_datasource.py +37 -0
maxframe/dataframe/datastore/__init__.py +5 -1
maxframe/dataframe/datastore/to_csv.py +29 -41
maxframe/dataframe/datastore/to_odps.py +30 -4
maxframe/dataframe/extensions/__init__.py +20 -4
maxframe/dataframe/extensions/apply_chunk.py +32 -6
maxframe/dataframe/extensions/cartesian_chunk.py +153 -0
maxframe/dataframe/extensions/collect_kv.py +126 -0
maxframe/dataframe/extensions/extract_kv.py +177 -0
maxframe/dataframe/extensions/map_reduce.py +263 -0
maxframe/dataframe/extensions/rebalance.py +62 -0
maxframe/dataframe/extensions/tests/test_apply_chunk.py +9 -2
maxframe/dataframe/extensions/tests/test_extensions.py +54 -0
maxframe/dataframe/extensions/tests/test_map_reduce.py +135 -0
maxframe/dataframe/groupby/__init__.py +12 -1
maxframe/dataframe/groupby/aggregation.py +78 -45
maxframe/dataframe/groupby/apply.py +1 -1
maxframe/dataframe/groupby/apply_chunk.py +18 -2
maxframe/dataframe/groupby/core.py +96 -12
maxframe/dataframe/groupby/cum.py +4 -25
maxframe/dataframe/groupby/expanding.py +264 -0
maxframe/dataframe/groupby/fill.py +1 -1
maxframe/dataframe/groupby/getitem.py +12 -5
maxframe/dataframe/groupby/head.py +11 -1
maxframe/dataframe/groupby/rank.py +136 -0
maxframe/dataframe/groupby/rolling.py +206 -0
maxframe/dataframe/groupby/shift.py +114 -0
maxframe/dataframe/groupby/tests/test_groupby.py +0 -5
maxframe/dataframe/indexing/__init__.py +20 -1
maxframe/dataframe/indexing/droplevel.py +195 -0
maxframe/dataframe/indexing/filter.py +169 -0
maxframe/dataframe/indexing/get_level_values.py +76 -0
maxframe/dataframe/indexing/iat.py +45 -0
maxframe/dataframe/indexing/iloc.py +152 -12
maxframe/dataframe/indexing/insert.py +1 -1
maxframe/dataframe/indexing/loc.py +287 -7
maxframe/dataframe/indexing/reindex.py +14 -5
maxframe/dataframe/indexing/rename.py +6 -0
maxframe/dataframe/indexing/rename_axis.py +2 -2
maxframe/dataframe/indexing/reorder_levels.py +143 -0
maxframe/dataframe/indexing/reset_index.py +33 -6
maxframe/dataframe/indexing/sample.py +8 -0
maxframe/dataframe/indexing/setitem.py +3 -3
maxframe/dataframe/indexing/swaplevel.py +185 -0
maxframe/dataframe/indexing/take.py +99 -0
maxframe/dataframe/indexing/truncate.py +140 -0
maxframe/dataframe/indexing/where.py +0 -11
maxframe/dataframe/indexing/xs.py +148 -0
maxframe/dataframe/merge/__init__.py +12 -1
maxframe/dataframe/merge/append.py +97 -98
maxframe/dataframe/merge/combine_first.py +120 -0
maxframe/dataframe/merge/compare.py +387 -0
maxframe/dataframe/merge/concat.py +183 -0
maxframe/dataframe/merge/update.py +271 -0
maxframe/dataframe/misc/__init__.py +16 -10
maxframe/dataframe/misc/_duplicate.py +10 -4
maxframe/dataframe/misc/apply.py +1 -1
maxframe/dataframe/misc/check_unique.py +51 -0
maxframe/dataframe/misc/clip.py +145 -0
maxframe/dataframe/misc/describe.py +175 -9
maxframe/dataframe/misc/drop_duplicates.py +2 -2
maxframe/dataframe/misc/duplicated.py +2 -2
maxframe/dataframe/misc/get_dummies.py +5 -1
maxframe/dataframe/misc/isin.py +2 -2
maxframe/dataframe/misc/map.py +94 -0
maxframe/dataframe/misc/tests/test_misc.py +13 -2
maxframe/dataframe/misc/to_numeric.py +3 -0
maxframe/dataframe/misc/transform.py +12 -5
maxframe/dataframe/misc/transpose.py +13 -1
maxframe/dataframe/misc/valid_index.py +115 -0
maxframe/dataframe/misc/value_counts.py +38 -4
maxframe/dataframe/missing/checkna.py +13 -6
maxframe/dataframe/missing/dropna.py +5 -0
maxframe/dataframe/missing/fillna.py +1 -1
maxframe/dataframe/missing/replace.py +7 -4
maxframe/dataframe/reduction/__init__.py +29 -15
maxframe/dataframe/reduction/aggregation.py +38 -9
maxframe/dataframe/reduction/all.py +2 -2
maxframe/dataframe/reduction/any.py +2 -2
maxframe/dataframe/reduction/argmax.py +100 -0
maxframe/dataframe/reduction/argmin.py +100 -0
maxframe/dataframe/reduction/core.py +65 -18
maxframe/dataframe/reduction/count.py +13 -9
maxframe/dataframe/reduction/cov.py +166 -0
maxframe/dataframe/reduction/cummax.py +2 -2
maxframe/dataframe/reduction/cummin.py +2 -2
maxframe/dataframe/reduction/cumprod.py +2 -2
maxframe/dataframe/reduction/cumsum.py +2 -2
maxframe/dataframe/reduction/custom_reduction.py +2 -2
maxframe/dataframe/reduction/idxmax.py +185 -0
maxframe/dataframe/reduction/idxmin.py +185 -0
maxframe/dataframe/reduction/kurtosis.py +37 -30
maxframe/dataframe/reduction/max.py +2 -2
maxframe/dataframe/reduction/mean.py +9 -7
maxframe/dataframe/reduction/median.py +2 -2
maxframe/dataframe/reduction/min.py +2 -2
maxframe/dataframe/reduction/nunique.py +9 -8
maxframe/dataframe/reduction/prod.py +18 -13
maxframe/dataframe/reduction/reduction_size.py +2 -2
maxframe/dataframe/reduction/sem.py +13 -9
maxframe/dataframe/reduction/skew.py +31 -27
maxframe/dataframe/reduction/str_concat.py +10 -7
maxframe/dataframe/reduction/sum.py +18 -14
maxframe/dataframe/reduction/unique.py +20 -3
maxframe/dataframe/reduction/var.py +16 -12
maxframe/dataframe/reshape/__init__.py +38 -0
maxframe/dataframe/{misc → reshape}/pivot.py +1 -0
maxframe/dataframe/{misc → reshape}/pivot_table.py +1 -0
maxframe/dataframe/reshape/unstack.py +114 -0
maxframe/dataframe/sort/__init__.py +8 -0
maxframe/dataframe/sort/argsort.py +62 -0
maxframe/dataframe/sort/core.py +1 -0
maxframe/dataframe/sort/nlargest.py +238 -0
maxframe/dataframe/sort/nsmallest.py +228 -0
maxframe/dataframe/statistics/__init__.py +3 -3
maxframe/dataframe/statistics/corr.py +1 -0
maxframe/dataframe/statistics/quantile.py +2 -2
maxframe/dataframe/tests/test_typing.py +104 -0
maxframe/dataframe/tests/test_utils.py +66 -2
maxframe/dataframe/typing_.py +185 -0
maxframe/dataframe/utils.py +95 -26
maxframe/dataframe/window/aggregation.py +8 -4
maxframe/dataframe/window/core.py +14 -1
maxframe/dataframe/window/ewm.py +1 -3
maxframe/dataframe/window/expanding.py +37 -35
maxframe/dataframe/window/rolling.py +49 -39
maxframe/dataframe/window/tests/test_expanding.py +1 -7
maxframe/dataframe/window/tests/test_rolling.py +1 -1
maxframe/env.py +7 -4
maxframe/errors.py +2 -2
maxframe/io/odpsio/schema.py +9 -3
maxframe/io/odpsio/tableio.py +7 -2
maxframe/io/odpsio/tests/test_schema.py +198 -83
maxframe/learn/__init__.py +10 -2
maxframe/learn/cluster/__init__.py +15 -0
maxframe/learn/cluster/_kmeans.py +782 -0
maxframe/learn/contrib/llm/core.py +2 -0
maxframe/learn/contrib/xgboost/core.py +86 -1
maxframe/learn/contrib/xgboost/train.py +5 -2
maxframe/learn/core.py +66 -0
maxframe/learn/linear_model/_base.py +58 -1
maxframe/learn/linear_model/_lin_reg.py +1 -1
maxframe/learn/metrics/__init__.py +6 -0
maxframe/learn/metrics/_classification.py +145 -0
maxframe/learn/metrics/_ranking.py +477 -0
maxframe/learn/metrics/_scorer.py +60 -0
maxframe/learn/metrics/pairwise/__init__.py +21 -0
maxframe/learn/metrics/pairwise/core.py +77 -0
maxframe/learn/metrics/pairwise/cosine.py +115 -0
maxframe/learn/metrics/pairwise/euclidean.py +176 -0
maxframe/learn/metrics/pairwise/haversine.py +96 -0
maxframe/learn/metrics/pairwise/manhattan.py +80 -0
maxframe/learn/metrics/pairwise/pairwise.py +127 -0
maxframe/learn/metrics/pairwise/pairwise_distances_topk.py +121 -0
maxframe/learn/metrics/pairwise/rbf_kernel.py +51 -0
maxframe/learn/metrics/tests/__init__.py +13 -0
maxframe/learn/metrics/tests/test_scorer.py +26 -0
maxframe/learn/utils/__init__.py +1 -1
maxframe/learn/utils/checks.py +1 -2
maxframe/learn/utils/core.py +59 -0
maxframe/learn/utils/extmath.py +37 -0
maxframe/learn/utils/odpsio.py +193 -0
maxframe/learn/utils/validation.py +2 -2
maxframe/lib/compat.py +40 -0
maxframe/lib/dtypes_extension/__init__.py +16 -1
maxframe/lib/dtypes_extension/_fake_arrow_dtype.py +604 -0
maxframe/lib/dtypes_extension/blob.py +304 -0
maxframe/lib/dtypes_extension/dtypes.py +40 -0
maxframe/lib/dtypes_extension/tests/test_blob.py +88 -0
maxframe/lib/dtypes_extension/tests/test_dtypes.py +16 -1
maxframe/lib/dtypes_extension/tests/test_fake_arrow_dtype.py +75 -0
maxframe/lib/filesystem/_oss_lib/common.py +122 -50
maxframe/lib/filesystem/_oss_lib/glob.py +1 -1
maxframe/lib/filesystem/_oss_lib/handle.py +21 -25
maxframe/lib/filesystem/base.py +1 -1
maxframe/lib/filesystem/core.py +1 -1
maxframe/lib/filesystem/oss.py +115 -46
maxframe/lib/filesystem/tests/test_oss.py +74 -36
maxframe/lib/mmh3.cp311-win32.pyd +0 -0
maxframe/lib/wrapped_pickle.py +10 -0
maxframe/opcodes.py +33 -15
maxframe/protocol.py +12 -0
maxframe/serialization/__init__.py +11 -2
maxframe/serialization/arrow.py +38 -13
maxframe/serialization/blob.py +32 -0
maxframe/serialization/core.cp311-win32.pyd +0 -0
maxframe/serialization/core.pyx +39 -1
maxframe/serialization/exception.py +2 -4
maxframe/serialization/numpy.py +11 -0
maxframe/serialization/pandas.py +46 -9
maxframe/serialization/serializables/core.py +2 -2
maxframe/serialization/tests/test_serial.py +29 -2
maxframe/tensor/__init__.py +38 -8
maxframe/tensor/arithmetic/__init__.py +19 -10
maxframe/tensor/arithmetic/iscomplexobj.py +53 -0
maxframe/tensor/arithmetic/tests/test_arithmetic.py +6 -0
maxframe/tensor/core.py +3 -2
maxframe/tensor/datasource/tests/test_datasource.py +2 -1
maxframe/tensor/extensions/__init__.py +2 -0
maxframe/tensor/extensions/apply_chunk.py +3 -3
maxframe/tensor/extensions/rebalance.py +65 -0
maxframe/tensor/fft/__init__.py +32 -0
maxframe/tensor/fft/core.py +168 -0
maxframe/tensor/fft/fft.py +112 -0
maxframe/tensor/fft/fft2.py +118 -0
maxframe/tensor/fft/fftfreq.py +80 -0
maxframe/tensor/fft/fftn.py +123 -0
maxframe/tensor/fft/fftshift.py +79 -0
maxframe/tensor/fft/hfft.py +112 -0
maxframe/tensor/fft/ifft.py +114 -0
maxframe/tensor/fft/ifft2.py +115 -0
maxframe/tensor/fft/ifftn.py +123 -0
maxframe/tensor/fft/ifftshift.py +73 -0
maxframe/tensor/fft/ihfft.py +93 -0
maxframe/tensor/fft/irfft.py +118 -0
maxframe/tensor/fft/irfft2.py +62 -0
maxframe/tensor/fft/irfftn.py +114 -0
maxframe/tensor/fft/rfft.py +116 -0
maxframe/tensor/fft/rfft2.py +63 -0
maxframe/tensor/fft/rfftfreq.py +87 -0
maxframe/tensor/fft/rfftn.py +113 -0
maxframe/tensor/indexing/fill_diagonal.py +1 -7
maxframe/tensor/linalg/__init__.py +7 -0
maxframe/tensor/linalg/_einsumfunc.py +1025 -0
maxframe/tensor/linalg/cholesky.py +117 -0
maxframe/tensor/linalg/einsum.py +339 -0
maxframe/tensor/linalg/lstsq.py +100 -0
maxframe/tensor/linalg/matrix_norm.py +75 -0
maxframe/tensor/linalg/norm.py +249 -0
maxframe/tensor/linalg/solve.py +72 -0
maxframe/tensor/linalg/solve_triangular.py +2 -2
maxframe/tensor/linalg/vector_norm.py +113 -0
maxframe/tensor/misc/__init__.py +24 -1
maxframe/tensor/misc/argwhere.py +72 -0
maxframe/tensor/misc/array_split.py +46 -0
maxframe/tensor/misc/broadcast_arrays.py +57 -0
maxframe/tensor/misc/copyto.py +130 -0
maxframe/tensor/misc/delete.py +104 -0
maxframe/tensor/misc/dsplit.py +68 -0
maxframe/tensor/misc/ediff1d.py +74 -0
maxframe/tensor/misc/expand_dims.py +85 -0
maxframe/tensor/misc/flip.py +90 -0
maxframe/tensor/misc/fliplr.py +64 -0
maxframe/tensor/misc/flipud.py +68 -0
maxframe/tensor/misc/hsplit.py +85 -0
maxframe/tensor/misc/insert.py +139 -0
maxframe/tensor/misc/moveaxis.py +83 -0
maxframe/tensor/misc/result_type.py +88 -0
maxframe/tensor/misc/roll.py +124 -0
maxframe/tensor/misc/rollaxis.py +77 -0
maxframe/tensor/misc/shape.py +89 -0
maxframe/tensor/misc/split.py +190 -0
maxframe/tensor/misc/tile.py +109 -0
maxframe/tensor/misc/vsplit.py +74 -0
maxframe/tensor/reduction/array_equal.py +2 -1
maxframe/tensor/sort/__init__.py +2 -0
maxframe/tensor/sort/argpartition.py +98 -0
maxframe/tensor/sort/partition.py +228 -0
maxframe/tensor/spatial/__init__.py +15 -0
maxframe/tensor/spatial/distance/__init__.py +17 -0
maxframe/tensor/spatial/distance/cdist.py +421 -0
maxframe/tensor/spatial/distance/pdist.py +398 -0
maxframe/tensor/spatial/distance/squareform.py +153 -0
maxframe/tensor/special/__init__.py +159 -21
maxframe/tensor/special/airy.py +55 -0
maxframe/tensor/special/bessel.py +199 -0
maxframe/tensor/special/core.py +65 -4
maxframe/tensor/special/ellip_func_integrals.py +155 -0
maxframe/tensor/special/ellip_harm.py +55 -0
maxframe/tensor/special/err_fresnel.py +223 -0
maxframe/tensor/special/gamma_funcs.py +303 -0
maxframe/tensor/special/hypergeometric_funcs.py +69 -0
maxframe/tensor/special/info_theory.py +189 -0
maxframe/tensor/special/misc.py +21 -0
maxframe/tensor/statistics/__init__.py +6 -0
maxframe/tensor/statistics/corrcoef.py +77 -0
maxframe/tensor/statistics/cov.py +222 -0
maxframe/tensor/statistics/digitize.py +126 -0
maxframe/tensor/statistics/histogram.py +520 -0
maxframe/tensor/statistics/median.py +85 -0
maxframe/tensor/statistics/ptp.py +89 -0
maxframe/tensor/utils.py +3 -3
maxframe/tests/test_utils.py +43 -1
maxframe/tests/utils.py +0 -2
maxframe/typing_.py +2 -0
maxframe/udf.py +27 -2
maxframe/utils.py +193 -19
{maxframe-2.0.0b2.dist-info → maxframe-2.2.0.dist-info}/METADATA +3 -2
{maxframe-2.0.0b2.dist-info → maxframe-2.2.0.dist-info}/RECORD +391 -236
maxframe_client/fetcher.py +35 -4
maxframe_client/session/odps.py +7 -2
maxframe_client/tests/test_fetcher.py +76 -3
maxframe_client/tests/test_session.py +4 -1
/maxframe/dataframe/{misc → reshape}/melt.py +0 -0
/maxframe/dataframe/{misc → reshape}/stack.py +0 -0
{maxframe-2.0.0b2.dist-info → maxframe-2.2.0.dist-info}/WHEEL +0 -0
{maxframe-2.0.0b2.dist-info → maxframe-2.2.0.dist-info}/top_level.txt +0 -0

maxframe/dataframe/arithmetic/dot.py ADDED Viewed

@@ -0,0 +1,237 @@
+# Copyright 1999-2025 Alibaba Group Holding Ltd.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+from typing import List
+import numpy as np
+import pandas as pd
+from ... import opcodes
+from ...core import EntityData
+from ...serialization.serializables import AnyField, KeyField
+from ...tensor import tensor as astensor
+from ...tensor.core import TENSOR_TYPE
+from ..core import DATAFRAME_TYPE, SERIES_TYPE
+from ..operators import DataFrameOperator, DataFrameOperatorMixin
+from ..utils import parse_index
+class DataFrameDot(DataFrameOperator, DataFrameOperatorMixin):
+    _op_type_ = opcodes.DOT
+    lhs = KeyField("lhs")
+    rhs = AnyField("rhs")
+    def __init__(self, output_types=None, **kw):
+        super().__init__(_output_types=output_types, **kw)
+    @classmethod
+    def _set_inputs(cls, op: "DataFrameDot", inputs: List[EntityData]):
+        super()._set_inputs(op, inputs)
+        op.lhs, op.rhs = op._inputs[:2]
+    def __call__(self, lhs, rhs):
+        lhs = self._process_input(lhs)
+        rhs = self._process_input(rhs)
+        if not isinstance(rhs, (DATAFRAME_TYPE, SERIES_TYPE)):
+            rhs = astensor(rhs)
+            test_rhs = rhs
+        else:
+            test_rhs = rhs.to_tensor()
+        test_ret = lhs.to_tensor().dot(test_rhs)
+        if test_ret.ndim == 0:
+            if isinstance(lhs, SERIES_TYPE) and isinstance(rhs, TENSOR_TYPE):
+                # return tensor
+                return test_ret
+            return self.new_scalar([lhs, rhs], dtype=test_ret.dtype)
+        elif test_ret.ndim == 1:
+            if lhs.ndim == 1:
+                if hasattr(rhs, "columns_value"):
+                    index_value = rhs.columns_value
+                else:
+                    # tensor
+                    length = -1 if np.isnan(rhs.shape[1]) else rhs.shape[1]
+                    pd_index = pd.RangeIndex(length)
+                    index_value = parse_index(pd_index, store_data=True)
+            else:
+                assert rhs.ndim == 1
+                index_value = lhs.index_value
+            return self.new_series(
+                [lhs, rhs],
+                shape=test_ret.shape,
+                dtype=test_ret.dtype,
+                index_value=index_value,
+            )
+        else:
+            if isinstance(rhs, TENSOR_TYPE):
+                dtypes = pd.Series(
+                    np.repeat(test_ret.dtype, test_ret.shape[1]),
+                    index=pd.RangeIndex(test_ret.shape[1]),
+                )
+                columns_value = parse_index(dtypes.index, store_data=True)
+            else:
+                dtypes = pd.Series(
+                    np.repeat(test_ret.dtype, test_ret.shape[1]),
+                    index=rhs.columns_value.to_pandas(),
+                )
+                columns_value = rhs.columns_value
+            return self.new_dataframe(
+                [lhs, rhs],
+                shape=test_ret.shape,
+                index_value=lhs.index_value,
+                columns_value=columns_value,
+                dtypes=dtypes,
+            )
+def dot(df_or_series, other):
+    op = DataFrameDot(lhs=df_or_series, rhs=other)
+    return op(df_or_series, other)
+def rdot(df_or_series, other):
+    op = DataFrameDot(lhs=other, rhs=df_or_series)
+    return op(other, df_or_series)
+dot.__frame_doc__ = """
+Compute the matrix multiplication between the DataFrame and other.
+This method computes the matrix product between the DataFrame and the
+values of an other Series, DataFrame or a numpy array.
+It can also be called using ``self @ other`` in Python >= 3.5.
+Parameters
+----------
+other : Series, DataFrame or array-like
+    The other object to compute the matrix product with.
+Returns
+-------
+Series or DataFrame
+    If other is a Series, return the matrix product between self and
+    other as a Series. If other is a DataFrame or a numpy.array, return
+    the matrix product of self and other in a DataFrame of a np.array.
+See Also
+--------
+Series.dot: Similar method for Series.
+Notes
+-----
+The dimensions of DataFrame and other must be compatible in order to
+compute the matrix multiplication. In addition, the column names of
+DataFrame and the index of other must contain the same values, as they
+will be aligned prior to the multiplication.
+The dot method for Series computes the inner product, instead of the
+matrix product here.
+Examples
+--------
+Here we multiply a DataFrame with a Series.
+>>> import maxframe.tensor as mt
+>>> import maxframe.dataframe as md
+>>> df = md.DataFrame([[0, 1, -2, -1], [1, 1, 1, 1]])
+>>> s = md.Series([1, 1, 2, 1])
+>>> df.dot(s).execute()
+0    -4
+1     5
+dtype: int64
+Here we multiply a DataFrame with another DataFrame.
+>>> other = md.DataFrame([[0, 1], [1, 2], [-1, -1], [2, 0]])
+>>> df.dot(other).execute()
+    0   1
+0   1   4
+1   2   2
+Note that the dot method give the same result as @
+>>> (df @ other).execute()
+    0   1
+0   1   4
+1   2   2
+The dot method works also if other is an np.array.
+>>> arr = mt.array([[0, 1], [1, 2], [-1, -1], [2, 0]])
+>>> df.dot(arr).execute()
+    0   1
+0   1   4
+1   2   2
+Note how shuffling of the objects does not change the result.
+>>> s2 = s.reindex([1, 0, 2, 3])
+>>> df.dot(s2).execute()
+0    -4
+1     5
+dtype: int64
+"""
+dot.__series_doc__ = """
+Compute the dot product between the Series and the columns of other.
+This method computes the dot product between the Series and another
+one, or the Series and each columns of a DataFrame, or the Series and
+each columns of an array.
+It can also be called using `self @ other` in Python >= 3.5.
+Parameters
+----------
+other : Series, DataFrame or array-like
+    The other object to compute the dot product with its columns.
+Returns
+-------
+scalar, Series or numpy.ndarray
+    Return the dot product of the Series and other if other is a
+    Series, the Series of the dot product of Series and each rows of
+    other if other is a DataFrame or a numpy.ndarray between the Series
+    and each columns of the numpy array.
+See Also
+--------
+DataFrame.dot: Compute the matrix product with the DataFrame.
+Series.mul: Multiplication of series and other, element-wise.
+Notes
+-----
+The Series and other has to share the same index if other is a Series
+or a DataFrame.
+Examples
+--------
+>>> import maxframe.tensor as mt
+>>> import maxframe.dataframe as md
+>>> s = md.Series([0, 1, 2, 3])
+>>> other = md.Series([-1, 2, -3, 4])
+>>> s.dot(other).execute()
+8
+>>> (s @ other).execute()
+8
+>>> df = md.DataFrame([[0, 1], [-2, 3], [4, -5], [6, 7]])
+>>> s.dot(df).execute()
+0    24
+1    14
+dtype: int64
+>>> arr = mt.array([[0, 1], [-2, 3], [4, -5], [6, 7]])
+>>> s.dot(arr).execute()
+array([24, 14])
+"""

maxframe/dataframe/arithmetic/{around.py → round.py} RENAMED Viewed

@@ -18,9 +18,10 @@ from ...utils import classproperty
 from .core import DataFrameUnaryUfunc
-class DataFrameAround(DataFrameUnaryUfunc):
+class DataFrameRound(DataFrameUnaryUfunc):
     _op_type_ = opcodes.AROUND
-    _func_name = "around"
+    _func_name = "round"
+    _legacy_name = "DataFrameAround"  # since v2.3.0
     decimals = Int32Field("decimals", default=None)
@@ -34,17 +35,20 @@ class DataFrameAround(DataFrameUnaryUfunc):
         return TensorAround
-def around(df, decimals=0, *args, **kwargs):
+def round(df, decimals=0, *args, **kwargs):
     if len(args) > 0:
         raise TypeError(
             f"round() takes 0 positional arguments but {len(args)} was given"
         )
-    op = DataFrameAround(decimals=decimals, **kwargs)
+    op = DataFrameRound(decimals=decimals, **kwargs)
     return op(df)
-# FIXME Series input of decimals not supported yet
-around.__frame_doc__ = """
+# keep for import compatibility
+DataFrameAround = DataFrameRound
+round.__frame_doc__ = """
 Round a DataFrame to a variable number of decimal places.
 Parameters
@@ -108,7 +112,7 @@ places as value
 2   0.7   0.0
 3   0.2   0.0
 """
-around.__series_doc__ = """
+round.__series_doc__ = """
 Round each value in a Series to the given number of decimals.
 Parameters

maxframe/dataframe/core.py CHANGED Viewed

@@ -56,8 +56,11 @@ from ..utils import (
     ceildiv,
     estimate_pandas_size,
     on_serialize_numpy_type,
+    pd_release_version,
+    prevent_called_from_pandas,
     tokenize,
 )
+from .typing_ import DataFrameType, IndexType, SeriesType
 from .utils import (
     ReprSeries,
     apply_if_callable,
@@ -66,6 +69,8 @@ from .utils import (
     parse_index,
 )
+_df_with_iteritems = pd_release_version[:2] < (2, 0)
 class IndexValue(Serializable):
     """
@@ -478,9 +483,17 @@ _lazy_chunk_meta_properties = (
 )
+def _calc_cum_nsplit(nsplit: Tuple[int]) -> List[int]:
+    return [0] + np.cumsum(nsplit).tolist()
+def calc_cum_nsplits(nsplits: Tuple[Tuple[int]]) -> List[List[int]]:
+    return tuple(_calc_cum_nsplit(nsplit) for nsplit in nsplits)
 @functools.lru_cache(maxsize=128)
 def _get_cum_nsplit(nsplit: Tuple[int]) -> List[int]:
-    return [0] + np.cumsum(nsplit).tolist()
+    return _calc_cum_nsplit(nsplit)
 def _calc_axis_slice(nsplit: Tuple[int], index: int) -> slice:
@@ -684,6 +697,10 @@ class IndexData(HasShapeTileableData, _ToPandasMixin):
     def names(self):
         return getattr(self, "_names", None) or [self.name]
+    @property
+    def nlevels(self) -> int:
+        return len(self.names)
     @property
     def index_value(self) -> IndexValue:
         return self._index_value
@@ -818,6 +835,9 @@ class Index(HasShapeTileable, _ToPandasMixin):
     def __len__(self):
         return len(self._data)
+    def __class_getitem__(cls, item):
+        return IndexType.from_getitem_args(item)
     def __maxframe_tensor__(self, dtype=None, order="K"):
         return self._data.__maxframe_tensor__(dtype=dtype, order=order)
@@ -1049,12 +1069,6 @@ class BaseSeriesData(HasShapeTileableData, _ToPandasMixin):
         return from_series(self, dtype=dtype)
-    @staticmethod
-    def from_tensor(in_tensor, index=None, name=None):
-        from .datasource.from_tensor import series_from_tensor
-        return series_from_tensor(in_tensor, index=index, name=name)
 class SeriesData(_BatchedFetcher, BaseSeriesData):
     type_name = "Series"
@@ -1065,8 +1079,9 @@ class SeriesData(_BatchedFetcher, BaseSeriesData):
         return tensor.astype(dtype=dtype, order=order, copy=False)
     def iteritems(self, batch_size=10000, session=None):
+        method_name = "iteritems" if _df_with_iteritems else "items"
         for batch_data in self.iterbatch(batch_size=batch_size, session=session):
-            yield from getattr(batch_data, "iteritems")()
+            yield from getattr(batch_data, method_name)()
     items = iteritems
@@ -1082,12 +1097,39 @@ class SeriesData(_BatchedFetcher, BaseSeriesData):
         name = name or self.name or 0
         return dataframe_from_tensor(self, columns=[name])
+    @property
+    def hasnans(self):
+        """
+        Return True if there are any NaNs.
+        Returns
+        -------
+        bool
+        Examples
+        --------
+        >>> import maxframe.dataframe as md
+        >>> s = md.Series([1, 2, 3, None])
+        >>> s.execute()
+        0    1.0
+        1    2.0
+        2    3.0
+        3    NaN
+        dtype: float64
+        >>> s.hasnans.execute()
+        True
+        """
+        return self.isna().any()
 class Series(HasShapeTileable, _ToPandasMixin):
     __slots__ = ("_cache",)
     _allow_data_type_ = (SeriesData,)
     type_name = "Series"
+    def __class_getitem__(cls, item):
+        return SeriesType.from_getitem_args(item)
     def to_tensor(self, dtype=None):
         return self._data.to_tensor(dtype=dtype)
@@ -1185,6 +1227,11 @@ class Series(HasShapeTileable, _ToPandasMixin):
         else:
             return super()._view()
+    def __iter__(self):
+        # prevent being called by pandas to make sure `__eq__` works
+        prevent_called_from_pandas()
+        return (tp[1] for tp in self.items())
     def __len__(self):
         return len(self._data)
@@ -1297,98 +1344,6 @@ class Series(HasShapeTileable, _ToPandasMixin):
         """
         return self._data.to_frame(name=name)
-    def between(self, left, right, inclusive="both"):
-        """
-        Return boolean Series equivalent to left <= series <= right.
-        This function returns a boolean vector containing `True` wherever the
-        corresponding Series element is between the boundary values `left` and
-        `right`. NA values are treated as `False`.
-        Parameters
-        ----------
-        left : scalar or list-like
-            Left boundary.
-        right : scalar or list-like
-            Right boundary.
-        inclusive : {"both", "neither", "left", "right"}
-            Include boundaries. Whether to set each bound as closed or open.
-        Returns
-        -------
-        Series
-            Series representing whether each element is between left and
-            right (inclusive).
-        See Also
-        --------
-        Series.gt : Greater than of series and other.
-        Series.lt : Less than of series and other.
-        Notes
-        -----
-        This function is equivalent to ``(left <= ser) & (ser <= right)``
-        Examples
-        --------
-        >>> import maxframe.dataframe as md
-        >>> s = md.Series([2, 0, 4, 8, np.nan])
-        Boundary values are included by default:
-        >>> s.between(1, 4).execute()
-        0     True
-        1    False
-        2     True
-        3    False
-        4    False
-        dtype: bool
-        With `inclusive` set to ``"neither"`` boundary values are excluded:
-        >>> s.between(1, 4, inclusive="neither").execute()
-        0     True
-        1    False
-        2    False
-        3    False
-        4    False
-        dtype: bool
-        `left` and `right` can be any scalar value:
-        >>> s = md.Series(['Alice', 'Bob', 'Carol', 'Eve'])
-        >>> s.between('Anna', 'Daniel').execute()
-        0    False
-        1     True
-        2     True
-        3    False
-        dtype: bool
-        """
-        if isinstance(inclusive, bool):  # pragma: no cover
-            # for pandas < 1.3.0
-            if inclusive:
-                inclusive = "both"
-            else:
-                inclusive = "neither"
-        if inclusive == "both":
-            lmask = self >= left
-            rmask = self <= right
-        elif inclusive == "left":
-            lmask = self >= left
-            rmask = self < right
-        elif inclusive == "right":
-            lmask = self > left
-            rmask = self <= right
-        elif inclusive == "neither":
-            lmask = self > left
-            rmask = self < right
-        else:
-            raise ValueError(
-                "Inclusive has to be either string of 'both',"
-                "'left', 'right', or 'neither'."
-            )
-        return lmask & rmask
     # def median(
     #     self, axis=None, skipna=True, out=None, overwrite_input=False, keepdims=False
     # ):
@@ -1589,18 +1544,6 @@ class BaseDataFrameData(HasShapeTileableData, _ToPandasMixin):
         return from_dataframe(self, dtype=dtype)
-    @staticmethod
-    def from_tensor(in_tensor, index=None, columns=None):
-        from .datasource.from_tensor import dataframe_from_tensor
-        return dataframe_from_tensor(in_tensor, index=index, columns=columns)
-    @staticmethod
-    def from_records(records, **kw):
-        from .datasource.from_records import from_records
-        return from_records(records, **kw)
     @property
     def index(self):
         from .datasource.index import from_tileable
@@ -1747,12 +1690,6 @@ class DataFrame(HasShapeTileable, _ToPandasMixin):
     def to_tensor(self):
         return self._data.to_tensor()
-    def from_tensor(self, in_tensor, index=None, columns=None):
-        return self._data.from_tensor(in_tensor, index=index, columns=columns)
-    def from_records(self, records, **kw):
-        return self._data.from_records(records, **kw)
     def __maxframe_tensor__(self, dtype=None, order="K"):
         return self._data.__maxframe_tensor__(dtype=dtype, order=order)
@@ -1772,6 +1709,14 @@ class DataFrame(HasShapeTileable, _ToPandasMixin):
             + [k for k in self.dtypes.index if isinstance(k, str) and k.isidentifier()]
         )
+    def __iter__(self):
+        # prevent being called by pandas to make sure `__eq__` works
+        prevent_called_from_pandas()
+        return iter(self.dtypes.index)
+    def __class_getitem__(cls, item):
+        return DataFrameType.from_getitem_args(item)
     @property
     def T(self):
         return self.transpose()

maxframe/dataframe/datasource/__init__.py CHANGED Viewed

@@ -13,3 +13,21 @@
 # limitations under the License.
 from .core import PandasDataSourceOperator
+from .from_dict import dataframe_from_dict
+from .from_records import from_records
+from .from_tensor import dataframe_from_tensor, series_from_tensor
+def _install():
+    from ..core import DATAFRAME_TYPE, SERIES_TYPE
+    for t in DATAFRAME_TYPE:
+        t.from_dict = staticmethod(dataframe_from_dict)
+        t.from_records = staticmethod(from_records)
+        t.from_tensor = staticmethod(dataframe_from_tensor)
+    for t in SERIES_TYPE:
+        t.from_tensor = staticmethod(series_from_tensor)
+_install()
+del _install

maxframe/dataframe/datasource/from_dict.py ADDED Viewed

@@ -0,0 +1,124 @@
+# Copyright 1999-2025 Alibaba Group Holding Ltd.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+from ...core import ENTITY_TYPE
+from ...utils import find_objects, no_default
+from ..utils import validate_axis
+def dataframe_from_dict(data, orient="columns", dtype=None, columns=None):
+    """
+    Construct DataFrame from dict of array-like or dicts.
+    Creates DataFrame object from dictionary by columns or by index
+    allowing dtype specification.
+    Parameters
+    ----------
+    data : dict
+        Of the form {field : array-like} or {field : dict}.
+    orient : {'columns', 'index', 'tight'}, default 'columns'
+        The "orientation" of the data. If the keys of the passed dict
+        should be the columns of the resulting DataFrame, pass 'columns'
+        (default). Otherwise if the keys should be rows, pass 'index'.
+        If 'tight', assume a dict with keys ['index', 'columns', 'data',
+        'index_names', 'column_names'].
+    dtype : dtype, default None
+        Data type to force after DataFrame construction, otherwise infer.
+    columns : list, default None
+        Column labels to use when ``orient='index'``. Raises a ValueError
+        if used with ``orient='columns'`` or ``orient='tight'``.
+    Returns
+    -------
+    DataFrame
+    See Also
+    --------
+    DataFrame.from_records : DataFrame from structured ndarray, sequence
+        of tuples or dicts, or DataFrame.
+    DataFrame : DataFrame object creation using constructor.
+    DataFrame.to_dict : Convert the DataFrame to a dictionary.
+    Examples
+    --------
+    By default the keys of the dict become the DataFrame columns:
+    >>> import maxframe.dataframe as md
+    >>> data = {'col_1': [3, 2, 1, 0], 'col_2': ['a', 'b', 'c', 'd']}
+    >>> md.DataFrame.from_dict(data).execute()
+       col_1 col_2
+    0      3     a
+    1      2     b
+    2      1     c
+    3      0     d
+    Specify ``orient='index'`` to create the DataFrame using dictionary
+    keys as rows:
+    >>> data = {'row_1': [3, 2, 1, 0], 'row_2': ['a', 'b', 'c', 'd']}
+    >>> md.DataFrame.from_dict(data, orient='index').execute()
+           0  1  2  3
+    row_1  3  2  1  0
+    row_2  a  b  c  d
+    When using the 'index' orientation, the column names can be
+    specified manually:
+    >>> md.DataFrame.from_dict(data, orient='index',
+    ...                        columns=['A', 'B', 'C', 'D']).execute()
+           A  B  C  D
+    row_1  3  2  1  0
+    row_2  a  b  c  d
+    Specify ``orient='tight'`` to create the DataFrame using a 'tight'
+    format:
+    >>> data = {'index': [('a', 'b'), ('a', 'c')],
+    ...         'columns': [('x', 1), ('y', 2)],
+    ...         'data': [[1, 3], [2, 4]],
+    ...         'index_names': ['n1', 'n2'],
+    ...         'column_names': ['z1', 'z2']}
+    >>> md.DataFrame.from_dict(data, orient='tight').execute()
+    z1     x  y
+    z2     1  2
+    n1 n2
+    a  b   1  3
+       c   2  4
+    """
+    from ..initializer import DataFrame as DataFrameInit
+    from .from_tensor import dataframe_from_1d_tileables
+    if orient != "tight" and not find_objects(data, ENTITY_TYPE):
+        res = DataFrameInit(data)
+    elif orient == "tight":
+        # init directly
+        init_kw = {
+            "index": data.get("index"),
+            "columns": data.get("columns"),
+        }
+        df = DataFrameInit(data["data"], **init_kw)
+        rename_kw = {
+            "index": data.get("index_names", no_default),
+            "columns": data.get("column_names", no_default),
+        }
+        res = df.rename_axis(**rename_kw)
+    else:
+        axis = validate_axis(orient)
+        res = dataframe_from_1d_tileables(data, columns=columns, axis=axis)
+    if dtype is not None:
+        res = res.astype(dtype)
+    return res

maxframe 2.0.0b2__cp311-cp311-win32.whl → 2.2.0__cp311-cp311-win32.whl

Potentially problematic release.

maxframe 2.0.0b2__cp311-cp311-win32.whl → 2.2.0__cp311-cp311-win32.whl