PyPI - maxframe - Versions diffs - 2.0.0b2__cp37-cp37m-win32.whl → 2.3.0rc1__cp37-cp37m-win32.whl - Mend

maxframe 2.0.0b2__cp37-cp37m-win32.whl → 2.3.0rc1__cp37-cp37m-win32.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of maxframe might be problematic. Click here for more details.

Files changed (443) hide show

maxframe/__init__.py +1 -0
maxframe/_utils.cp37-win32.pyd +0 -0
maxframe/_utils.pyx +14 -1
maxframe/codegen/core.py +9 -8
maxframe/codegen/spe/core.py +1 -1
maxframe/codegen/spe/dataframe/__init__.py +1 -0
maxframe/codegen/spe/dataframe/accessors/base.py +18 -0
maxframe/codegen/spe/dataframe/accessors/dict_.py +25 -130
maxframe/codegen/spe/dataframe/accessors/list_.py +12 -48
maxframe/codegen/spe/dataframe/accessors/struct_.py +28 -0
maxframe/codegen/spe/dataframe/arithmetic.py +7 -2
maxframe/codegen/spe/dataframe/groupby.py +88 -0
maxframe/codegen/spe/dataframe/indexing.py +99 -4
maxframe/codegen/spe/dataframe/merge.py +38 -1
maxframe/codegen/spe/dataframe/misc.py +11 -33
maxframe/codegen/spe/dataframe/reduction.py +32 -9
maxframe/codegen/spe/dataframe/reshape.py +46 -0
maxframe/codegen/spe/dataframe/sort.py +39 -18
maxframe/codegen/spe/dataframe/tests/accessors/test_dict.py +9 -15
maxframe/codegen/spe/dataframe/tests/accessors/test_list.py +4 -7
maxframe/codegen/spe/dataframe/tests/accessors/test_struct.py +75 -0
maxframe/codegen/spe/dataframe/tests/indexing/test_iloc.py +20 -1
maxframe/codegen/spe/dataframe/tests/indexing/test_loc.py +35 -0
maxframe/codegen/spe/dataframe/tests/misc/test_misc.py +0 -32
maxframe/codegen/spe/dataframe/tests/test_groupby.py +81 -18
maxframe/codegen/spe/dataframe/tests/test_merge.py +27 -1
maxframe/codegen/spe/dataframe/tests/test_reduction.py +13 -0
maxframe/codegen/spe/dataframe/tests/test_reshape.py +79 -0
maxframe/codegen/spe/dataframe/tests/test_sort.py +20 -0
maxframe/codegen/spe/dataframe/tseries.py +9 -0
maxframe/codegen/spe/learn/contrib/lightgbm.py +4 -3
maxframe/codegen/spe/learn/contrib/tests/test_xgboost.py +2 -1
maxframe/codegen/spe/learn/metrics/__init__.py +1 -1
maxframe/codegen/spe/learn/metrics/_ranking.py +76 -0
maxframe/codegen/spe/learn/metrics/pairwise.py +51 -0
maxframe/codegen/spe/learn/metrics/tests/test_pairwise.py +36 -0
maxframe/codegen/spe/learn/metrics/tests/test_ranking.py +59 -0
maxframe/codegen/spe/tensor/__init__.py +3 -0
maxframe/codegen/spe/tensor/datasource.py +1 -0
maxframe/codegen/spe/tensor/fft.py +74 -0
maxframe/codegen/spe/tensor/linalg.py +29 -2
maxframe/codegen/spe/tensor/misc.py +79 -25
maxframe/codegen/spe/tensor/spatial.py +45 -0
maxframe/codegen/spe/tensor/statistics.py +44 -0
maxframe/codegen/spe/tensor/tests/test_fft.py +64 -0
maxframe/codegen/spe/tensor/tests/test_linalg.py +15 -1
maxframe/codegen/spe/tensor/tests/test_misc.py +52 -2
maxframe/codegen/spe/tensor/tests/test_spatial.py +33 -0
maxframe/codegen/spe/tensor/tests/test_statistics.py +15 -1
maxframe/codegen/spe/tests/test_spe_codegen.py +6 -12
maxframe/codegen/spe/utils.py +2 -0
maxframe/config/config.py +73 -9
maxframe/config/tests/test_validators.py +13 -1
maxframe/config/validators.py +49 -0
maxframe/conftest.py +54 -17
maxframe/core/accessor.py +2 -2
maxframe/core/base.py +2 -1
maxframe/core/entity/core.py +5 -0
maxframe/core/entity/tileables.py +3 -1
maxframe/core/graph/core.cp37-win32.pyd +0 -0
maxframe/core/graph/entity.py +8 -3
maxframe/core/mode.py +6 -1
maxframe/core/operator/base.py +9 -2
maxframe/core/operator/core.py +10 -2
maxframe/core/operator/utils.py +13 -0
maxframe/dataframe/__init__.py +12 -5
maxframe/dataframe/accessors/__init__.py +1 -1
maxframe/dataframe/accessors/compat.py +45 -0
maxframe/dataframe/accessors/datetime_/__init__.py +4 -1
maxframe/dataframe/accessors/dict_/contains.py +7 -16
maxframe/dataframe/accessors/dict_/core.py +48 -0
maxframe/dataframe/accessors/dict_/getitem.py +17 -21
maxframe/dataframe/accessors/dict_/length.py +7 -16
maxframe/dataframe/accessors/dict_/remove.py +6 -18
maxframe/dataframe/accessors/dict_/setitem.py +8 -18
maxframe/dataframe/accessors/dict_/tests/test_dict_accessor.py +62 -22
maxframe/dataframe/accessors/list_/__init__.py +2 -2
maxframe/dataframe/accessors/list_/core.py +48 -0
maxframe/dataframe/accessors/list_/getitem.py +12 -19
maxframe/dataframe/accessors/list_/length.py +7 -16
maxframe/dataframe/accessors/list_/tests/test_list_accessor.py +11 -9
maxframe/dataframe/accessors/string_/__init__.py +4 -1
maxframe/dataframe/accessors/struct_/__init__.py +37 -0
maxframe/dataframe/accessors/struct_/accessor.py +39 -0
maxframe/dataframe/accessors/struct_/core.py +43 -0
maxframe/dataframe/accessors/struct_/dtypes.py +53 -0
maxframe/dataframe/accessors/struct_/field.py +123 -0
maxframe/dataframe/accessors/struct_/tests/__init__.py +13 -0
maxframe/dataframe/accessors/struct_/tests/test_struct_accessor.py +91 -0
maxframe/dataframe/arithmetic/__init__.py +18 -4
maxframe/dataframe/arithmetic/between.py +106 -0
maxframe/dataframe/arithmetic/dot.py +237 -0
maxframe/dataframe/arithmetic/maximum.py +33 -0
maxframe/dataframe/arithmetic/minimum.py +33 -0
maxframe/dataframe/arithmetic/{around.py → round.py} +11 -7
maxframe/dataframe/core.py +161 -224
maxframe/dataframe/datasource/__init__.py +18 -0
maxframe/dataframe/datasource/core.py +6 -0
maxframe/dataframe/datasource/direct.py +57 -0
maxframe/dataframe/datasource/from_dict.py +124 -0
maxframe/dataframe/datasource/from_index.py +1 -1
maxframe/dataframe/datasource/from_records.py +77 -0
maxframe/dataframe/datasource/from_tensor.py +109 -41
maxframe/dataframe/datasource/read_csv.py +21 -14
maxframe/dataframe/datasource/read_odps_query.py +29 -6
maxframe/dataframe/datasource/read_odps_table.py +32 -10
maxframe/dataframe/datasource/read_parquet.py +38 -39
maxframe/dataframe/datasource/tests/test_datasource.py +37 -0
maxframe/dataframe/datastore/__init__.py +11 -1
maxframe/dataframe/datastore/direct.py +268 -0
maxframe/dataframe/datastore/to_csv.py +29 -41
maxframe/dataframe/datastore/to_odps.py +36 -4
maxframe/dataframe/extensions/__init__.py +20 -4
maxframe/dataframe/extensions/apply_chunk.py +32 -6
maxframe/dataframe/extensions/cartesian_chunk.py +153 -0
maxframe/dataframe/extensions/collect_kv.py +126 -0
maxframe/dataframe/extensions/extract_kv.py +177 -0
maxframe/dataframe/extensions/flatjson.py +2 -1
maxframe/dataframe/extensions/map_reduce.py +263 -0
maxframe/dataframe/extensions/rebalance.py +62 -0
maxframe/dataframe/extensions/tests/test_apply_chunk.py +9 -2
maxframe/dataframe/extensions/tests/test_extensions.py +54 -0
maxframe/dataframe/extensions/tests/test_map_reduce.py +135 -0
maxframe/dataframe/groupby/__init__.py +17 -2
maxframe/dataframe/groupby/aggregation.py +86 -49
maxframe/dataframe/groupby/apply.py +1 -1
maxframe/dataframe/groupby/apply_chunk.py +19 -5
maxframe/dataframe/groupby/core.py +116 -16
maxframe/dataframe/groupby/cum.py +4 -25
maxframe/dataframe/groupby/expanding.py +264 -0
maxframe/dataframe/groupby/fill.py +1 -1
maxframe/dataframe/groupby/getitem.py +12 -5
maxframe/dataframe/groupby/head.py +11 -1
maxframe/dataframe/groupby/rank.py +136 -0
maxframe/dataframe/groupby/rolling.py +206 -0
maxframe/dataframe/groupby/shift.py +114 -0
maxframe/dataframe/groupby/tests/test_groupby.py +0 -5
maxframe/dataframe/indexing/__init__.py +22 -2
maxframe/dataframe/indexing/droplevel.py +195 -0
maxframe/dataframe/indexing/filter.py +169 -0
maxframe/dataframe/indexing/get_level_values.py +76 -0
maxframe/dataframe/indexing/iat.py +45 -0
maxframe/dataframe/indexing/iloc.py +152 -12
maxframe/dataframe/indexing/insert.py +46 -18
maxframe/dataframe/indexing/loc.py +287 -7
maxframe/dataframe/indexing/reindex.py +14 -5
maxframe/dataframe/indexing/rename.py +6 -0
maxframe/dataframe/indexing/rename_axis.py +2 -2
maxframe/dataframe/indexing/reorder_levels.py +143 -0
maxframe/dataframe/indexing/reset_index.py +33 -6
maxframe/dataframe/indexing/sample.py +8 -0
maxframe/dataframe/indexing/setitem.py +3 -3
maxframe/dataframe/indexing/swaplevel.py +185 -0
maxframe/dataframe/indexing/take.py +99 -0
maxframe/dataframe/indexing/truncate.py +140 -0
maxframe/dataframe/indexing/where.py +0 -11
maxframe/dataframe/indexing/xs.py +148 -0
maxframe/dataframe/merge/__init__.py +15 -1
maxframe/dataframe/merge/append.py +97 -98
maxframe/dataframe/merge/combine.py +244 -0
maxframe/dataframe/merge/combine_first.py +120 -0
maxframe/dataframe/merge/compare.py +387 -0
maxframe/dataframe/merge/concat.py +183 -0
maxframe/dataframe/merge/update.py +271 -0
maxframe/dataframe/misc/__init__.py +28 -11
maxframe/dataframe/misc/_duplicate.py +10 -4
maxframe/dataframe/misc/apply.py +1 -1
maxframe/dataframe/misc/check_unique.py +82 -0
maxframe/dataframe/misc/clip.py +145 -0
maxframe/dataframe/misc/describe.py +175 -9
maxframe/dataframe/misc/drop.py +31 -0
maxframe/dataframe/misc/drop_duplicates.py +2 -2
maxframe/dataframe/misc/duplicated.py +2 -2
maxframe/dataframe/misc/get_dummies.py +5 -1
maxframe/dataframe/misc/infer_dtypes.py +251 -0
maxframe/dataframe/misc/isin.py +2 -2
maxframe/dataframe/misc/map.py +125 -18
maxframe/dataframe/misc/repeat.py +159 -0
maxframe/dataframe/misc/tests/test_misc.py +48 -3
maxframe/dataframe/misc/to_numeric.py +3 -0
maxframe/dataframe/misc/transform.py +12 -5
maxframe/dataframe/misc/transpose.py +13 -1
maxframe/dataframe/misc/valid_index.py +115 -0
maxframe/dataframe/misc/value_counts.py +38 -4
maxframe/dataframe/missing/checkna.py +14 -6
maxframe/dataframe/missing/dropna.py +5 -0
maxframe/dataframe/missing/fillna.py +1 -1
maxframe/dataframe/missing/replace.py +7 -4
maxframe/dataframe/reduction/__init__.py +35 -16
maxframe/dataframe/reduction/aggregation.py +43 -14
maxframe/dataframe/reduction/all.py +2 -2
maxframe/dataframe/reduction/any.py +2 -2
maxframe/dataframe/reduction/argmax.py +103 -0
maxframe/dataframe/reduction/argmin.py +103 -0
maxframe/dataframe/reduction/core.py +80 -24
maxframe/dataframe/reduction/count.py +13 -9
maxframe/dataframe/reduction/cov.py +166 -0
maxframe/dataframe/reduction/cummax.py +2 -2
maxframe/dataframe/reduction/cummin.py +2 -2
maxframe/dataframe/reduction/cumprod.py +2 -2
maxframe/dataframe/reduction/cumsum.py +2 -2
maxframe/dataframe/reduction/custom_reduction.py +2 -2
maxframe/dataframe/reduction/idxmax.py +185 -0
maxframe/dataframe/reduction/idxmin.py +185 -0
maxframe/dataframe/reduction/kurtosis.py +37 -30
maxframe/dataframe/reduction/max.py +2 -2
maxframe/dataframe/reduction/mean.py +9 -7
maxframe/dataframe/reduction/median.py +2 -2
maxframe/dataframe/reduction/min.py +2 -2
maxframe/dataframe/reduction/mode.py +144 -0
maxframe/dataframe/reduction/nunique.py +19 -11
maxframe/dataframe/reduction/prod.py +18 -13
maxframe/dataframe/reduction/reduction_size.py +2 -2
maxframe/dataframe/reduction/sem.py +13 -9
maxframe/dataframe/reduction/skew.py +31 -27
maxframe/dataframe/reduction/str_concat.py +10 -7
maxframe/dataframe/reduction/sum.py +18 -14
maxframe/dataframe/reduction/tests/test_reduction.py +12 -0
maxframe/dataframe/reduction/unique.py +20 -3
maxframe/dataframe/reduction/var.py +16 -12
maxframe/dataframe/reshape/__init__.py +38 -0
maxframe/dataframe/{misc → reshape}/pivot.py +1 -0
maxframe/dataframe/{misc → reshape}/pivot_table.py +1 -0
maxframe/dataframe/reshape/unstack.py +114 -0
maxframe/dataframe/sort/__init__.py +16 -1
maxframe/dataframe/sort/argsort.py +68 -0
maxframe/dataframe/sort/core.py +2 -1
maxframe/dataframe/sort/nlargest.py +238 -0
maxframe/dataframe/sort/nsmallest.py +228 -0
maxframe/dataframe/sort/rank.py +147 -0
maxframe/dataframe/statistics/__init__.py +3 -3
maxframe/dataframe/statistics/corr.py +1 -0
maxframe/dataframe/statistics/quantile.py +2 -2
maxframe/dataframe/tests/test_typing.py +104 -0
maxframe/dataframe/tests/test_utils.py +66 -2
maxframe/dataframe/tseries/__init__.py +19 -0
maxframe/dataframe/tseries/at_time.py +61 -0
maxframe/dataframe/tseries/between_time.py +122 -0
maxframe/dataframe/typing_.py +185 -0
maxframe/dataframe/utils.py +125 -52
maxframe/dataframe/window/aggregation.py +8 -4
maxframe/dataframe/window/core.py +14 -1
maxframe/dataframe/window/ewm.py +1 -3
maxframe/dataframe/window/expanding.py +37 -35
maxframe/dataframe/window/rolling.py +49 -39
maxframe/dataframe/window/tests/test_expanding.py +1 -7
maxframe/dataframe/window/tests/test_rolling.py +1 -1
maxframe/env.py +7 -4
maxframe/errors.py +2 -2
maxframe/io/odpsio/schema.py +9 -3
maxframe/io/odpsio/tableio.py +7 -2
maxframe/io/odpsio/tests/test_schema.py +198 -83
maxframe/learn/__init__.py +10 -2
maxframe/learn/cluster/__init__.py +15 -0
maxframe/learn/cluster/_kmeans.py +782 -0
maxframe/learn/contrib/llm/core.py +18 -7
maxframe/learn/contrib/llm/deploy/__init__.py +13 -0
maxframe/learn/contrib/llm/deploy/config.py +221 -0
maxframe/learn/contrib/llm/deploy/core.py +247 -0
maxframe/learn/contrib/llm/deploy/framework.py +35 -0
maxframe/learn/contrib/llm/deploy/loader.py +360 -0
maxframe/learn/contrib/llm/deploy/tests/__init__.py +13 -0
maxframe/learn/contrib/llm/deploy/tests/test_register_models.py +359 -0
maxframe/learn/contrib/llm/models/__init__.py +1 -0
maxframe/learn/contrib/llm/models/dashscope.py +12 -6
maxframe/learn/contrib/llm/models/managed.py +76 -11
maxframe/learn/contrib/llm/models/openai.py +72 -0
maxframe/learn/contrib/llm/tests/__init__.py +13 -0
maxframe/learn/contrib/llm/tests/test_core.py +34 -0
maxframe/learn/contrib/llm/tests/test_openai.py +187 -0
maxframe/learn/contrib/llm/tests/test_text_gen.py +155 -0
maxframe/learn/contrib/llm/text.py +348 -42
maxframe/learn/contrib/models.py +4 -1
maxframe/learn/contrib/xgboost/classifier.py +2 -0
maxframe/learn/contrib/xgboost/core.py +113 -4
maxframe/learn/contrib/xgboost/predict.py +4 -2
maxframe/learn/contrib/xgboost/regressor.py +5 -0
maxframe/learn/contrib/xgboost/train.py +7 -2
maxframe/learn/core.py +66 -0
maxframe/learn/linear_model/_base.py +58 -1
maxframe/learn/linear_model/_lin_reg.py +1 -1
maxframe/learn/metrics/__init__.py +6 -0
maxframe/learn/metrics/_classification.py +145 -0
maxframe/learn/metrics/_ranking.py +477 -0
maxframe/learn/metrics/_scorer.py +60 -0
maxframe/learn/metrics/pairwise/__init__.py +21 -0
maxframe/learn/metrics/pairwise/core.py +77 -0
maxframe/learn/metrics/pairwise/cosine.py +115 -0
maxframe/learn/metrics/pairwise/euclidean.py +176 -0
maxframe/learn/metrics/pairwise/haversine.py +96 -0
maxframe/learn/metrics/pairwise/manhattan.py +80 -0
maxframe/learn/metrics/pairwise/pairwise.py +127 -0
maxframe/learn/metrics/pairwise/pairwise_distances_topk.py +121 -0
maxframe/learn/metrics/pairwise/rbf_kernel.py +51 -0
maxframe/learn/metrics/tests/__init__.py +13 -0
maxframe/learn/metrics/tests/test_scorer.py +26 -0
maxframe/learn/preprocessing/_data/min_max_scaler.py +34 -23
maxframe/learn/preprocessing/_data/standard_scaler.py +34 -25
maxframe/learn/utils/__init__.py +2 -1
maxframe/learn/utils/checks.py +1 -2
maxframe/learn/utils/core.py +59 -0
maxframe/learn/utils/extmath.py +79 -9
maxframe/learn/utils/odpsio.py +262 -0
maxframe/learn/utils/validation.py +2 -2
maxframe/lib/compat.py +40 -0
maxframe/lib/dtypes_extension/__init__.py +16 -1
maxframe/lib/dtypes_extension/_fake_arrow_dtype.py +604 -0
maxframe/lib/dtypes_extension/blob.py +304 -0
maxframe/lib/dtypes_extension/dtypes.py +40 -0
maxframe/lib/dtypes_extension/tests/test_blob.py +88 -0
maxframe/lib/dtypes_extension/tests/test_dtypes.py +16 -1
maxframe/lib/dtypes_extension/tests/test_fake_arrow_dtype.py +75 -0
maxframe/lib/filesystem/_oss_lib/common.py +124 -50
maxframe/lib/filesystem/_oss_lib/glob.py +1 -1
maxframe/lib/filesystem/_oss_lib/handle.py +21 -25
maxframe/lib/filesystem/base.py +1 -1
maxframe/lib/filesystem/core.py +1 -1
maxframe/lib/filesystem/oss.py +115 -46
maxframe/lib/filesystem/tests/test_oss.py +74 -36
maxframe/lib/mmh3.cp37-win32.pyd +0 -0
maxframe/lib/wrapped_pickle.py +10 -0
maxframe/opcodes.py +41 -15
maxframe/protocol.py +12 -0
maxframe/remote/core.py +4 -0
maxframe/serialization/__init__.py +11 -2
maxframe/serialization/arrow.py +38 -13
maxframe/serialization/blob.py +32 -0
maxframe/serialization/core.cp37-win32.pyd +0 -0
maxframe/serialization/core.pyx +39 -1
maxframe/serialization/exception.py +2 -4
maxframe/serialization/numpy.py +11 -0
maxframe/serialization/pandas.py +46 -9
maxframe/serialization/serializables/core.py +2 -2
maxframe/serialization/tests/test_serial.py +31 -4
maxframe/tensor/__init__.py +38 -8
maxframe/tensor/arithmetic/__init__.py +19 -10
maxframe/tensor/arithmetic/core.py +2 -2
maxframe/tensor/arithmetic/iscomplexobj.py +53 -0
maxframe/tensor/arithmetic/tests/test_arithmetic.py +6 -9
maxframe/tensor/core.py +6 -2
maxframe/tensor/datasource/tests/test_datasource.py +2 -1
maxframe/tensor/extensions/__init__.py +2 -0
maxframe/tensor/extensions/apply_chunk.py +3 -3
maxframe/tensor/extensions/rebalance.py +65 -0
maxframe/tensor/fft/__init__.py +32 -0
maxframe/tensor/fft/core.py +168 -0
maxframe/tensor/fft/fft.py +112 -0
maxframe/tensor/fft/fft2.py +118 -0
maxframe/tensor/fft/fftfreq.py +80 -0
maxframe/tensor/fft/fftn.py +123 -0
maxframe/tensor/fft/fftshift.py +79 -0
maxframe/tensor/fft/hfft.py +112 -0
maxframe/tensor/fft/ifft.py +114 -0
maxframe/tensor/fft/ifft2.py +115 -0
maxframe/tensor/fft/ifftn.py +123 -0
maxframe/tensor/fft/ifftshift.py +73 -0
maxframe/tensor/fft/ihfft.py +93 -0
maxframe/tensor/fft/irfft.py +118 -0
maxframe/tensor/fft/irfft2.py +62 -0
maxframe/tensor/fft/irfftn.py +114 -0
maxframe/tensor/fft/rfft.py +116 -0
maxframe/tensor/fft/rfft2.py +63 -0
maxframe/tensor/fft/rfftfreq.py +87 -0
maxframe/tensor/fft/rfftn.py +113 -0
maxframe/tensor/indexing/fill_diagonal.py +1 -7
maxframe/tensor/linalg/__init__.py +7 -0
maxframe/tensor/linalg/_einsumfunc.py +1025 -0
maxframe/tensor/linalg/cholesky.py +117 -0
maxframe/tensor/linalg/einsum.py +339 -0
maxframe/tensor/linalg/lstsq.py +100 -0
maxframe/tensor/linalg/matrix_norm.py +75 -0
maxframe/tensor/linalg/norm.py +249 -0
maxframe/tensor/linalg/solve.py +72 -0
maxframe/tensor/linalg/solve_triangular.py +2 -2
maxframe/tensor/linalg/vector_norm.py +113 -0
maxframe/tensor/misc/__init__.py +24 -1
maxframe/tensor/misc/argwhere.py +72 -0
maxframe/tensor/misc/array_split.py +46 -0
maxframe/tensor/misc/broadcast_arrays.py +57 -0
maxframe/tensor/misc/copyto.py +130 -0
maxframe/tensor/misc/delete.py +104 -0
maxframe/tensor/misc/dsplit.py +68 -0
maxframe/tensor/misc/ediff1d.py +74 -0
maxframe/tensor/misc/expand_dims.py +85 -0
maxframe/tensor/misc/flip.py +90 -0
maxframe/tensor/misc/fliplr.py +64 -0
maxframe/tensor/misc/flipud.py +68 -0
maxframe/tensor/misc/hsplit.py +85 -0
maxframe/tensor/misc/insert.py +139 -0
maxframe/tensor/misc/moveaxis.py +83 -0
maxframe/tensor/misc/result_type.py +88 -0
maxframe/tensor/misc/roll.py +124 -0
maxframe/tensor/misc/rollaxis.py +77 -0
maxframe/tensor/misc/shape.py +89 -0
maxframe/tensor/misc/split.py +190 -0
maxframe/tensor/misc/tile.py +109 -0
maxframe/tensor/misc/vsplit.py +74 -0
maxframe/tensor/reduction/array_equal.py +2 -1
maxframe/tensor/sort/__init__.py +2 -0
maxframe/tensor/sort/argpartition.py +98 -0
maxframe/tensor/sort/partition.py +228 -0
maxframe/tensor/spatial/__init__.py +15 -0
maxframe/tensor/spatial/distance/__init__.py +17 -0
maxframe/tensor/spatial/distance/cdist.py +421 -0
maxframe/tensor/spatial/distance/pdist.py +398 -0
maxframe/tensor/spatial/distance/squareform.py +153 -0
maxframe/tensor/special/__init__.py +159 -21
maxframe/tensor/special/airy.py +55 -0
maxframe/tensor/special/bessel.py +199 -0
maxframe/tensor/special/core.py +65 -4
maxframe/tensor/special/ellip_func_integrals.py +155 -0
maxframe/tensor/special/ellip_harm.py +55 -0
maxframe/tensor/special/err_fresnel.py +223 -0
maxframe/tensor/special/gamma_funcs.py +303 -0
maxframe/tensor/special/hypergeometric_funcs.py +69 -0
maxframe/tensor/special/info_theory.py +189 -0
maxframe/tensor/special/misc.py +21 -0
maxframe/tensor/statistics/__init__.py +6 -0
maxframe/tensor/statistics/corrcoef.py +77 -0
maxframe/tensor/statistics/cov.py +222 -0
maxframe/tensor/statistics/digitize.py +126 -0
maxframe/tensor/statistics/histogram.py +520 -0
maxframe/tensor/statistics/median.py +85 -0
maxframe/tensor/statistics/ptp.py +89 -0
maxframe/tensor/utils.py +3 -3
maxframe/tests/test_udf.py +61 -0
maxframe/tests/test_utils.py +51 -6
maxframe/tests/utils.py +0 -2
maxframe/typing_.py +2 -0
maxframe/udf.py +130 -9
maxframe/utils.py +254 -27
{maxframe-2.0.0b2.dist-info → maxframe-2.3.0rc1.dist-info}/METADATA +3 -3
{maxframe-2.0.0b2.dist-info → maxframe-2.3.0rc1.dist-info}/RECORD +442 -264
maxframe_client/fetcher.py +35 -4
maxframe_client/session/odps.py +7 -2
maxframe_client/session/task.py +8 -1
maxframe_client/tests/test_fetcher.py +76 -3
maxframe_client/tests/test_session.py +28 -1
maxframe/dataframe/arrays.py +0 -864
/maxframe/dataframe/{misc → reshape}/melt.py +0 -0
/maxframe/dataframe/{misc → reshape}/stack.py +0 -0
{maxframe-2.0.0b2.dist-info → maxframe-2.3.0rc1.dist-info}/WHEEL +0 -0
{maxframe-2.0.0b2.dist-info → maxframe-2.3.0rc1.dist-info}/top_level.txt +0 -0

maxframe/dataframe/indexing/filter.py ADDED Viewed

@@ -0,0 +1,169 @@
+# Copyright 1999-2025 Alibaba Group Holding Ltd.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+import re
+import numpy as np
+import pandas as pd
+from ... import opcodes
+from ...core import get_output_types
+from ...serialization.serializables import Int32Field, ListField, StringField
+from ..operators import DataFrameOperator, DataFrameOperatorMixin
+from ..utils import parse_index
+class DataFrameFilter(DataFrameOperatorMixin, DataFrameOperator):
+    """
+    Operator that subsets a DataFrame or Series by the labels of one axis.
+    The criteria are checked in the order ``items``, ``like``, ``regex`` and
+    the first one that is not None is applied; when all are None every label
+    is kept.
+    """
+    _op_type_ = opcodes.DATAFRAME_FILTER
+    # Labels to keep by exact match.
+    items = ListField("items", default=None)
+    # Substring that must occur in ``str(label)``.
+    like = StringField("like", default=None)
+    # Pattern that must match somewhere in ``str(label)`` (``re.search``).
+    regex = StringField("regex", default=None)
+    # 0 filters the index; any other value filters the columns.
+    axis = Int32Field("axis", default=None)
+    def __call__(self, df_or_series):
+        """
+        Build the filtered output tileable for ``df_or_series``.
+        Raises
+        ------
+        ValueError
+            If the column axis is requested for an object without ``columns``.
+        """
+        self._output_types = get_output_types(df_or_series)
+        if self.axis == 0:
+            # Filter by index labels
+            labels = df_or_series.index_value.to_pandas()
+        else:
+            # Filter by column labels (DataFrame only)
+            if not hasattr(df_or_series, "columns"):
+                raise ValueError("axis=1 (columns) not valid for Series")
+            labels = df_or_series.columns_value.to_pandas()
+        filtered_labels = self._apply_filter_criteria(labels)
+        out_params = self._calculate_output_metadata(df_or_series, filtered_labels)
+        return self.new_tileable([df_or_series], **out_params)
+    def _apply_filter_criteria(self, labels):
+        """Return the list of ``labels`` that satisfy the active criterion."""
+        if self.items is not None:
+            # Exact match filter; the result follows the order of ``labels``.
+            # NOTE(review): pandas' ``filter(items=...)`` appears to order the
+            # result by ``items`` instead - confirm the executor agrees with
+            # the order produced here.
+            wanted = self.items
+            return [label for label in labels if label in wanted]
+        if self.like is not None:
+            # Substring match filter
+            fragment = self.like
+            return [label for label in labels if fragment in str(label)]
+        if self.regex is not None:
+            # Regex match filter; compile once, outside the loop
+            pattern = re.compile(self.regex)
+            return [label for label in labels if pattern.search(str(label))]
+        return list(labels)
+    def _calculate_output_metadata(self, input_tileable, filtered_labels):
+        """
+        Derive the output params from the input's params and the kept labels.
+        Parameters
+        ----------
+        input_tileable
+            Object being filtered; its ``shape`` and ``params`` are the
+            starting point for the output metadata.
+        filtered_labels : list
+            Labels of the filtered axis that survive the filter.
+        Returns
+        -------
+        dict
+            Keyword arguments for ``new_tileable``.
+        """
+        input_shape = input_tileable.shape
+        # Work on a copy so the input's own params are never mutated.
+        out_params = dict(input_tileable.params)
+        if self.axis == 0:
+            # A match count of zero is reported as an unknown length (nan).
+            # NOTE(review): presumably because index labels may not be known
+            # when the graph is built - confirm.
+            out_params["shape"] = (len(filtered_labels) or np.nan,) + input_shape[1:]
+            out_params["index_value"] = parse_index(
+                pd.Index(filtered_labels), input_tileable.index_value
+            )
+        else:
+            # Narrow ``dtypes`` together with ``columns_value``; otherwise the
+            # output would keep the dtypes of columns that were filtered out.
+            filtered_dtypes = input_tileable.dtypes[filtered_labels]
+            out_params["shape"] = (input_shape[0], len(filtered_labels))
+            out_params["dtypes"] = filtered_dtypes
+            out_params["columns_value"] = parse_index(
+                filtered_dtypes.index, store_data=True
+            )
+        return out_params
+def filter_dataframe(df_or_series, items=None, like=None, regex=None, axis=None):
+    """
+    Subset the dataframe rows or columns according to the specified index labels.
+    Note that this routine does not filter a dataframe on its
+    contents. The filter is applied to the labels of the index.
+    Parameters
+    ----------
+    items : list-like
+        Keep labels from axis which are in items.
+    like : str
+        Keep labels from axis for which "like in label == True".
+    regex : str (regular expression)
+        Keep labels from axis for which re.search(regex, label) == True.
+    axis : {0 or 'index', 1 or 'columns', None}, default None
+        The axis to filter on, expressed either as an index (int)
+        or axis name (str). By default this is the info axis, 'columns' for
+        DataFrame. For `Series` this parameter is unused and defaults to `None`.
+    Returns
+    -------
+    same type as input object
+    Raises
+    ------
+    TypeError
+        If none, or more than one, of ``items``, ``like`` and ``regex`` is given.
+    ValueError
+        If ``axis`` is a string other than 'index' or 'columns'.
+    See Also
+    --------
+    DataFrame.loc : Access a group of rows and columns
+        by label(s) or a boolean array.
+    Notes
+    -----
+    The ``items``, ``like``, and ``regex`` parameters are
+    enforced to be mutually exclusive.
+    ``axis`` defaults to the info axis that is used when indexing
+    with ``[]``.
+    Examples
+    --------
+    >>> import maxframe.tensor as mt
+    >>> import maxframe.dataframe as md
+    >>> df = md.DataFrame(mt.array(([1, 2, 3], [4, 5, 6])),
+    ...                   index=['mouse', 'rabbit'],
+    ...                   columns=['one', 'two', 'three'])
+    >>> df.execute()
+            one  two  three
+    mouse     1    2      3
+    rabbit    4    5      6
+    >>> # select columns by name
+    >>> df.filter(items=['one', 'three']).execute()
+             one  three
+    mouse     1      3
+    rabbit    4      6
+    >>> # select columns by regular expression
+    >>> df.filter(regex='e$', axis=1).execute()
+             one  three
+    mouse     1      3
+    rabbit    4      6
+    >>> # select rows containing 'bbi'
+    >>> df.filter(like='bbi', axis=0).execute()
+             one  two  three
+    rabbit    4    5      6
+    """
+    param_count = sum(x is not None for x in [items, like, regex])
+    if param_count == 0:
+        raise TypeError("Must pass either `items`, `like`, or `regex`")
+    if param_count > 1:
+        raise TypeError(
+            "keyword arguments `items`, `like`, `regex` are mutually exclusive"
+        )
+    if axis is None:
+        # Default to the info axis: columns for a DataFrame, index for a Series
+        axis = 1 if hasattr(df_or_series, "columns") else 0
+    elif isinstance(axis, str):
+        # The operator stores the axis as an int and compares it with 0, so
+        # the documented axis names have to be translated before it is built.
+        axis_by_name = {"index": 0, "columns": 1}
+        if axis not in axis_by_name:
+            raise ValueError(
+                f"No axis named {axis} for object type {type(df_or_series).__name__}"
+            )
+        axis = axis_by_name[axis]
+    op = DataFrameFilter(items=items, like=like, regex=regex, axis=axis)
+    return op(df_or_series)

maxframe/dataframe/indexing/get_level_values.py ADDED Viewed

@@ -0,0 +1,76 @@
+# Copyright 1999-2025 Alibaba Group Holding Ltd.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+from ... import opcodes
+from ...serialization.serializables import AnyField
+from ..operators import DataFrameOperator, DataFrameOperatorMixin
+from ..utils import parse_index
+class IndexGetLevelValues(DataFrameOperator, DataFrameOperatorMixin):
+    """Operator that extracts one level of an index as a new index."""
+    _op_type_ = opcodes.GET_LEVEL_VALUES
+    # Level selector forwarded to pandas' ``Index.get_level_values``.
+    level = AnyField("level")
+    def __init__(self, output_types=None, **kw):
+        super().__init__(_output_types=output_types, **kw)
+    def __call__(self, index):
+        """
+        Build the output index holding the values of ``self.level``.
+        The dtype and names of the result are taken from calling
+        ``get_level_values`` on the pandas index recovered from the input's
+        ``index_value``; the length is copied from the input.
+        """
+        level_values = index.index_value.to_pandas().get_level_values(self.level)
+        out_params = dict(
+            shape=(index.shape[0],),
+            dtype=level_values.dtype,
+            index_value=parse_index(level_values, store_data=False),
+            names=level_values.names,
+        )
+        return self.new_index([index], **out_params)
+def get_level_values(index, level):
+    """
+    Return the label values of the requested level as an index.
+    The returned index has the same length as the input index.
+    Parameters
+    ----------
+    level : int or str
+        Either the integer position of the level in the MultiIndex,
+        or the name of the level.
+    Returns
+    -------
+    values : Index
+        The selected level of this MultiIndex, converted to
+        a single :class:`Index` (or subclass thereof).
+    Examples
+    --------
+    Create a MultiIndex:
+    >>> import maxframe.dataframe as md
+    >>> import pandas as pd
+    >>> mi = md.Index(pd.MultiIndex.from_arrays((list('abc'), list('def')), names=['level_1', 'level_2']))
+    Get level values by supplying level as either integer or name:
+    >>> mi.get_level_values(0).execute()
+    Index(['a', 'b', 'c'], dtype='object', name='level_1')
+    >>> mi.get_level_values('level_2').execute()
+    Index(['d', 'e', 'f'], dtype='object', name='level_2')
+    """
+    return IndexGetLevelValues(level=level)(index)

maxframe/dataframe/indexing/iat.py CHANGED Viewed

@@ -34,4 +34,49 @@ class DataFrameIat:
 def iat(a):
+    """
+    Access a single value for a row/column pair by integer position.
+    Similar to ``iloc``, in that both provide integer-based lookups. Use
+    ``iat`` if you only need to get or set a single value in a DataFrame
+    or Series.
+    Parameters
+    ----------
+    a : DataFrame or Series
+        Object to index; it is passed to ``DataFrameIat`` unchanged.
+    Returns
+    -------
+    DataFrameIat
+        Indexer object wrapping ``a``.
+    Raises
+    ------
+    IndexError
+        When integer position is out of bounds.
+    See Also
+    --------
+    DataFrame.at : Access a single value for a row/column label pair.
+    DataFrame.loc : Access a group of rows and columns by label(s).
+    DataFrame.iloc : Access a group of rows and columns by integer position(s).
+    Examples
+    --------
+    >>> import maxframe.dataframe as md
+    >>> df = md.DataFrame([[0, 2, 3], [0, 4, 1], [10, 20, 30]],
+    ...                   columns=['A', 'B', 'C'])
+    >>> df.execute()
+        A   B   C
+    0   0   2   3
+    1   0   4   1
+    2  10  20  30
+    Get value at specified row/column pair
+    >>> df.iat[1, 2].execute()
+    1
+    Set value at specified row/column pair
+    >>> df.iat[1, 2] = 10
+    >>> df.iat[1, 2].execute()
+    10
+    Get value within a series
+    >>> df.loc[0].iat[1].execute()
+    2
+    """
     return DataFrameIat(a)

maxframe/dataframe/indexing/iloc.py CHANGED Viewed

@@ -27,7 +27,7 @@ from ...serialization.serializables import AnyField, KeyField, ListField
 from ...tensor import asarray
 from ...tensor.indexing.core import calc_shape
 from ..operators import DATAFRAME_TYPE, DataFrameOperator, DataFrameOperatorMixin
-from ..utils import indexing_index_value
+from ..utils import indexing_index_value, validate_axis
 _ILOC_ERROR_MSG = (
     "Location based indexing can only have [integer, "
@@ -36,13 +36,16 @@ _ILOC_ERROR_MSG = (
 )
-def process_iloc_indexes(inp, indexes):
+def process_iloc_indexes(inp, indexes, axis=0):
     ndim = inp.ndim
     if not isinstance(indexes, tuple):
         indexes = (indexes,)
     if len(indexes) < ndim:
-        indexes += (slice(None),) * (ndim - len(indexes))
+        if not axis:
+            indexes += (slice(None),) * (ndim - len(indexes))
+        else:
+            indexes = (slice(None),) * (ndim - len(indexes)) + indexes
     if len(indexes) > ndim:
         raise IndexingError("Too many indexers")
@@ -105,32 +108,35 @@ def process_iloc_indexes(inp, indexes):
 class DataFrameIloc:
-    def __init__(self, obj):
+    def __init__(self, obj, axis=None):
         self._obj = obj
+        self._axis = axis
     def __getitem__(self, indexes):
+        indexes = process_iloc_indexes(self._obj, indexes, axis=self._axis)
         if isinstance(self._obj, DATAFRAME_TYPE):
-            op = DataFrameIlocGetItem(indexes=process_iloc_indexes(self._obj, indexes))
+            op = DataFrameIlocGetItem(indexes=indexes)
         else:
-            op = SeriesIlocGetItem(indexes=process_iloc_indexes(self._obj, indexes))
+            op = SeriesIlocGetItem(indexes=indexes)
         return op(self._obj)
     def __setitem__(self, indexes, value):
         if not np.isscalar(value):
             raise NotImplementedError("Only scalar value is supported to set by iloc")
+        indexes = process_iloc_indexes(self._obj, indexes, axis=self._axis)
         if isinstance(self._obj, DATAFRAME_TYPE):
-            op = DataFrameIlocSetItem(
-                indexes=process_iloc_indexes(self._obj, indexes), value=value
-            )
+            op = DataFrameIlocSetItem(indexes=indexes, value=value)
         else:
-            op = SeriesIlocSetItem(
-                indexes=process_iloc_indexes(self._obj, indexes), value=value
-            )
+            op = SeriesIlocSetItem(indexes=indexes, value=value)
         ret = op(self._obj)
         self._obj.data = ret.data
+    def __call__(self, axis):
+        axis = validate_axis(axis, self._obj)
+        return DataFrameIloc(self._obj, axis)
 class HeadTailOptimizedOperatorMixin(DataFrameOperatorMixin):
     __slots__ = ()
@@ -420,6 +426,140 @@ def index_setitem(_idx, *_):
 def iloc(a):
+    """
+    Purely integer-location based indexing for selection by position.
+    ``.iloc[]`` is primarily integer position based (from ``0`` to
+    ``length-1`` of the axis), but may also be used with a boolean
+    array.
+    Allowed inputs are:
+    - An integer, e.g. ``5``.
+    - A list or array of integers, e.g. ``[4, 3, 0]``.
+    - A slice object with ints, e.g. ``1:7``.
+    - A boolean array.
+    - A ``callable`` function with one argument (the calling Series or
+      DataFrame) and that returns valid output for indexing (one of the above).
+      This is useful in method chains, when you don't have a reference to the
+      calling object, but would like to base your selection on some value.
+    ``.iloc`` will raise ``IndexError`` if a requested indexer is
+    out-of-bounds, except *slice* indexers which allow out-of-bounds
+    indexing (this conforms with python/numpy *slice* semantics).
+    See more at :ref:`Selection by Position <indexing.integer>`.
+    See Also
+    --------
+    DataFrame.iat : Fast integer location scalar accessor.
+    DataFrame.loc : Purely label-location based indexer for selection by label.
+    Series.iloc : Purely integer-location based indexing for
+                   selection by position.
+    Examples
+    --------
+    >>> import maxframe.dataframe as md
+    >>> mydict = [{'a': 1, 'b': 2, 'c': 3, 'd': 4},
+    ...           {'a': 100, 'b': 200, 'c': 300, 'd': 400},
+    ...           {'a': 1000, 'b': 2000, 'c': 3000, 'd': 4000 }]
+    >>> df = md.DataFrame(mydict)
+    >>> df.execute()
+          a     b     c     d
+    0     1     2     3     4
+    1   100   200   300   400
+    2  1000  2000  3000  4000
+    **Indexing just the rows**
+    With a scalar integer.
+    >>> type(df.iloc[0].execute())
+    <class 'pandas.core.series.Series'>
+    >>> df.iloc[0].execute()
+    a    1
+    b    2
+    c    3
+    d    4
+    Name: 0, dtype: int64
+    With a list of integers.
+    >>> df.iloc[[0]].execute()
+       a  b  c  d
+    0  1  2  3  4
+    >>> type(df.iloc[[0]].execute())
+    <class 'pandas.core.frame.DataFrame'>
+    >>> df.iloc[[0, 1]].execute()
+         a    b    c    d
+    0    1    2    3    4
+    1  100  200  300  400
+    With a `slice` object.
+    >>> df.iloc[:3].execute()
+          a     b     c     d
+    0     1     2     3     4
+    1   100   200   300   400
+    2  1000  2000  3000  4000
+    With a boolean mask the same length as the index.
+    >>> df.iloc[[True, False, True]].execute()
+          a     b     c     d
+    0     1     2     3     4
+    2  1000  2000  3000  4000
+    With a callable, useful in method chains. The `x` passed
+    to the ``lambda`` is the DataFrame being sliced. This selects
+    the rows whose index label is even.
+    >>> df.iloc[lambda x: x.index % 2 == 0].execute()
+          a     b     c     d
+    0     1     2     3     4
+    2  1000  2000  3000  4000
+    **Indexing both axes**
+    You can mix the indexer types for the index and columns. Use ``:`` to
+    select the entire axis.
+    With scalar integers.
+    >>> df.iloc[0, 1].execute()
+    2
+    With lists of integers.
+    >>> df.iloc[[0, 2], [1, 3]].execute()
+          b     d
+    0     2     4
+    2  2000  4000
+    With `slice` objects.
+    >>> df.iloc[1:3, 0:3].execute()
+          a     b     c
+    1   100   200   300
+    2  1000  2000  3000
+    With a boolean array whose length matches the columns.
+    >>> df.iloc[:, [True, False, True, False]].execute()
+          a     c
+    0     1     3
+    1   100   300
+    2  1000  3000
+    With a callable function that expects the Series or DataFrame.
+    >>> df.iloc[:, lambda df: [0, 2]].execute()
+          a     c
+    0     1     3
+    1   100   300
+    2  1000  3000
+    """
     return DataFrameIloc(a)

maxframe/dataframe/indexing/insert.py CHANGED Viewed

@@ -17,10 +17,10 @@ from typing import List
 import pandas as pd
 from ... import opcodes
-from ...core import EntityData
+from ...core import EntityData, get_output_types
 from ...serialization.serializables import AnyField, BoolField, Int64Field
 from ...tensor.core import TENSOR_TYPE
-from ..core import SERIES_TYPE
+from ..core import INDEX_TYPE, SERIES_TYPE
 from ..operators import DataFrameOperator, DataFrameOperatorMixin
 from ..utils import build_empty_df, parse_index
@@ -29,17 +29,18 @@ class DataFrameInsert(DataFrameOperator, DataFrameOperatorMixin):
     _op_type_ = opcodes.INSERT
     loc = Int64Field("loc")
-    column = AnyField("column")
-    value = AnyField("value")
-    allow_duplicates = BoolField("allow_duplicates")
+    column = AnyField("column", default=None)
+    value = AnyField("value", default=None)
+    allow_duplicates = BoolField("allow_duplicates", default=False)
     @classmethod
     def _set_inputs(cls, op: "DataFrameInsert", inputs: List[EntityData]):
         super()._set_inputs(op, inputs)
         if len(inputs) > 1:
-            op._value = op._inputs[-1]
+            op.value = op._inputs[-1]
     def __call__(self, df):
+        self._output_types = get_output_types(df)
         inputs = [df]
         if isinstance(self.value, (SERIES_TYPE, TENSOR_TYPE)):
             value_dtype = self.value.dtype
@@ -47,19 +48,27 @@ class DataFrameInsert(DataFrameOperator, DataFrameOperatorMixin):
         else:
             value_dtype = pd.Series(self.value).dtype
-        empty_df = build_empty_df(df.dtypes)
-        empty_df.insert(
-            loc=self.loc,
-            column=self.column,
-            allow_duplicates=self.allow_duplicates,
-            value=pd.Series([], dtype=value_dtype),
-        )
         params = df.params
-        params["columns_value"] = parse_index(empty_df.columns, store_data=True)
-        params["dtypes"] = empty_df.dtypes
-        params["shape"] = (df.shape[0], df.shape[1] + 1)
-        return self.new_dataframe(inputs, **params)
+        if df.ndim == 2:
+            empty_obj = build_empty_df(df.dtypes)
+            empty_obj.insert(
+                loc=self.loc,
+                column=self.column,
+                allow_duplicates=self.allow_duplicates,
+                value=pd.Series([], dtype=value_dtype),
+            )
+            params["columns_value"] = parse_index(empty_obj.columns, store_data=True)
+            params["dtypes"] = empty_obj.dtypes
+            params["shape"] = (df.shape[0], df.shape[1] + 1)
+        else:
+            assert isinstance(df, INDEX_TYPE)
+            params["index_value"] = parse_index(
+                df.index_value, type(self), df, self.loc, self.value
+            )
+            params["shape"] = (df.shape[0] + 1,)
+        return self.new_tileable(inputs, **params)
 def df_insert(df, loc, column, value, allow_duplicates=False):
@@ -88,3 +97,22 @@ def df_insert(df, loc, column, value, allow_duplicates=False):
     )
     out_df = op(df)
     df.data = out_df.data
+def index_insert(idx, loc, value):
+    """
+    Make new Index inserting new item at location.
+    Follows Python numpy.insert semantics for negative values.
+    Parameters
+    ----------
+    loc : int
+    value : object
+    Returns
+    -------
+    new_index : Index
+    """
+    op = DataFrameInsert(loc=loc, value=value)
+    return op(idx)

maxframe 2.0.0b2__cp37-cp37m-win32.whl → 2.3.0rc1__cp37-cp37m-win32.whl

Potentially problematic release.

maxframe 2.0.0b2__cp37-cp37m-win32.whl → 2.3.0rc1__cp37-cp37m-win32.whl