maxframe 0.1.0b5__cp310-cp310-macosx_11_0_arm64.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of maxframe might be problematic. Click here for more details.
- maxframe/__init__.py +32 -0
- maxframe/_utils.cpython-310-darwin.so +0 -0
- maxframe/_utils.pxd +33 -0
- maxframe/_utils.pyx +547 -0
- maxframe/codegen.py +528 -0
- maxframe/config/__init__.py +15 -0
- maxframe/config/config.py +443 -0
- maxframe/config/tests/__init__.py +13 -0
- maxframe/config/tests/test_config.py +103 -0
- maxframe/config/tests/test_validators.py +34 -0
- maxframe/config/validators.py +57 -0
- maxframe/conftest.py +139 -0
- maxframe/core/__init__.py +65 -0
- maxframe/core/base.py +156 -0
- maxframe/core/entity/__init__.py +44 -0
- maxframe/core/entity/chunks.py +68 -0
- maxframe/core/entity/core.py +152 -0
- maxframe/core/entity/executable.py +337 -0
- maxframe/core/entity/fuse.py +73 -0
- maxframe/core/entity/objects.py +100 -0
- maxframe/core/entity/output_types.py +90 -0
- maxframe/core/entity/tileables.py +438 -0
- maxframe/core/entity/utils.py +24 -0
- maxframe/core/graph/__init__.py +17 -0
- maxframe/core/graph/builder/__init__.py +16 -0
- maxframe/core/graph/builder/base.py +86 -0
- maxframe/core/graph/builder/chunk.py +430 -0
- maxframe/core/graph/builder/tileable.py +34 -0
- maxframe/core/graph/builder/utils.py +41 -0
- maxframe/core/graph/core.cpython-310-darwin.so +0 -0
- maxframe/core/graph/core.pyx +467 -0
- maxframe/core/graph/entity.py +171 -0
- maxframe/core/graph/tests/__init__.py +13 -0
- maxframe/core/graph/tests/test_graph.py +205 -0
- maxframe/core/mode.py +96 -0
- maxframe/core/operator/__init__.py +34 -0
- maxframe/core/operator/base.py +450 -0
- maxframe/core/operator/core.py +276 -0
- maxframe/core/operator/fetch.py +53 -0
- maxframe/core/operator/fuse.py +29 -0
- maxframe/core/operator/objects.py +72 -0
- maxframe/core/operator/shuffle.py +111 -0
- maxframe/core/operator/tests/__init__.py +13 -0
- maxframe/core/operator/tests/test_core.py +64 -0
- maxframe/core/tests/__init__.py +13 -0
- maxframe/core/tests/test_mode.py +75 -0
- maxframe/dataframe/__init__.py +81 -0
- maxframe/dataframe/arithmetic/__init__.py +359 -0
- maxframe/dataframe/arithmetic/abs.py +33 -0
- maxframe/dataframe/arithmetic/add.py +60 -0
- maxframe/dataframe/arithmetic/arccos.py +28 -0
- maxframe/dataframe/arithmetic/arccosh.py +28 -0
- maxframe/dataframe/arithmetic/arcsin.py +28 -0
- maxframe/dataframe/arithmetic/arcsinh.py +28 -0
- maxframe/dataframe/arithmetic/arctan.py +28 -0
- maxframe/dataframe/arithmetic/arctanh.py +28 -0
- maxframe/dataframe/arithmetic/around.py +152 -0
- maxframe/dataframe/arithmetic/bitwise_and.py +46 -0
- maxframe/dataframe/arithmetic/bitwise_or.py +50 -0
- maxframe/dataframe/arithmetic/bitwise_xor.py +46 -0
- maxframe/dataframe/arithmetic/ceil.py +28 -0
- maxframe/dataframe/arithmetic/core.py +342 -0
- maxframe/dataframe/arithmetic/cos.py +28 -0
- maxframe/dataframe/arithmetic/cosh.py +28 -0
- maxframe/dataframe/arithmetic/degrees.py +28 -0
- maxframe/dataframe/arithmetic/docstring.py +442 -0
- maxframe/dataframe/arithmetic/equal.py +56 -0
- maxframe/dataframe/arithmetic/exp.py +28 -0
- maxframe/dataframe/arithmetic/exp2.py +28 -0
- maxframe/dataframe/arithmetic/expm1.py +28 -0
- maxframe/dataframe/arithmetic/floor.py +28 -0
- maxframe/dataframe/arithmetic/floordiv.py +64 -0
- maxframe/dataframe/arithmetic/greater.py +57 -0
- maxframe/dataframe/arithmetic/greater_equal.py +57 -0
- maxframe/dataframe/arithmetic/invert.py +33 -0
- maxframe/dataframe/arithmetic/is_ufuncs.py +62 -0
- maxframe/dataframe/arithmetic/less.py +57 -0
- maxframe/dataframe/arithmetic/less_equal.py +57 -0
- maxframe/dataframe/arithmetic/log.py +28 -0
- maxframe/dataframe/arithmetic/log10.py +28 -0
- maxframe/dataframe/arithmetic/log2.py +28 -0
- maxframe/dataframe/arithmetic/mod.py +60 -0
- maxframe/dataframe/arithmetic/multiply.py +60 -0
- maxframe/dataframe/arithmetic/negative.py +33 -0
- maxframe/dataframe/arithmetic/not_equal.py +56 -0
- maxframe/dataframe/arithmetic/power.py +68 -0
- maxframe/dataframe/arithmetic/radians.py +28 -0
- maxframe/dataframe/arithmetic/sin.py +28 -0
- maxframe/dataframe/arithmetic/sinh.py +28 -0
- maxframe/dataframe/arithmetic/sqrt.py +28 -0
- maxframe/dataframe/arithmetic/subtract.py +64 -0
- maxframe/dataframe/arithmetic/tan.py +28 -0
- maxframe/dataframe/arithmetic/tanh.py +28 -0
- maxframe/dataframe/arithmetic/tests/__init__.py +13 -0
- maxframe/dataframe/arithmetic/tests/test_arithmetic.py +695 -0
- maxframe/dataframe/arithmetic/truediv.py +64 -0
- maxframe/dataframe/arithmetic/trunc.py +28 -0
- maxframe/dataframe/arrays.py +864 -0
- maxframe/dataframe/core.py +2417 -0
- maxframe/dataframe/datasource/__init__.py +15 -0
- maxframe/dataframe/datasource/core.py +81 -0
- maxframe/dataframe/datasource/dataframe.py +59 -0
- maxframe/dataframe/datasource/date_range.py +504 -0
- maxframe/dataframe/datasource/from_index.py +54 -0
- maxframe/dataframe/datasource/from_records.py +107 -0
- maxframe/dataframe/datasource/from_tensor.py +419 -0
- maxframe/dataframe/datasource/index.py +117 -0
- maxframe/dataframe/datasource/read_csv.py +528 -0
- maxframe/dataframe/datasource/read_odps_query.py +299 -0
- maxframe/dataframe/datasource/read_odps_table.py +253 -0
- maxframe/dataframe/datasource/read_parquet.py +421 -0
- maxframe/dataframe/datasource/series.py +55 -0
- maxframe/dataframe/datasource/tests/__init__.py +13 -0
- maxframe/dataframe/datasource/tests/test_datasource.py +401 -0
- maxframe/dataframe/datastore/__init__.py +26 -0
- maxframe/dataframe/datastore/core.py +19 -0
- maxframe/dataframe/datastore/to_csv.py +227 -0
- maxframe/dataframe/datastore/to_odps.py +162 -0
- maxframe/dataframe/extensions/__init__.py +41 -0
- maxframe/dataframe/extensions/accessor.py +50 -0
- maxframe/dataframe/extensions/reshuffle.py +83 -0
- maxframe/dataframe/extensions/tests/__init__.py +13 -0
- maxframe/dataframe/extensions/tests/test_extensions.py +38 -0
- maxframe/dataframe/fetch/__init__.py +15 -0
- maxframe/dataframe/fetch/core.py +86 -0
- maxframe/dataframe/groupby/__init__.py +82 -0
- maxframe/dataframe/groupby/aggregation.py +350 -0
- maxframe/dataframe/groupby/apply.py +251 -0
- maxframe/dataframe/groupby/core.py +179 -0
- maxframe/dataframe/groupby/cum.py +124 -0
- maxframe/dataframe/groupby/fill.py +141 -0
- maxframe/dataframe/groupby/getitem.py +92 -0
- maxframe/dataframe/groupby/head.py +105 -0
- maxframe/dataframe/groupby/sample.py +214 -0
- maxframe/dataframe/groupby/tests/__init__.py +13 -0
- maxframe/dataframe/groupby/tests/test_groupby.py +374 -0
- maxframe/dataframe/groupby/transform.py +255 -0
- maxframe/dataframe/indexing/__init__.py +84 -0
- maxframe/dataframe/indexing/add_prefix_suffix.py +110 -0
- maxframe/dataframe/indexing/align.py +349 -0
- maxframe/dataframe/indexing/at.py +83 -0
- maxframe/dataframe/indexing/getitem.py +204 -0
- maxframe/dataframe/indexing/iat.py +37 -0
- maxframe/dataframe/indexing/iloc.py +566 -0
- maxframe/dataframe/indexing/insert.py +86 -0
- maxframe/dataframe/indexing/loc.py +411 -0
- maxframe/dataframe/indexing/reindex.py +526 -0
- maxframe/dataframe/indexing/rename.py +462 -0
- maxframe/dataframe/indexing/rename_axis.py +209 -0
- maxframe/dataframe/indexing/reset_index.py +402 -0
- maxframe/dataframe/indexing/sample.py +221 -0
- maxframe/dataframe/indexing/set_axis.py +194 -0
- maxframe/dataframe/indexing/set_index.py +61 -0
- maxframe/dataframe/indexing/setitem.py +130 -0
- maxframe/dataframe/indexing/tests/__init__.py +13 -0
- maxframe/dataframe/indexing/tests/test_indexing.py +488 -0
- maxframe/dataframe/indexing/where.py +308 -0
- maxframe/dataframe/initializer.py +288 -0
- maxframe/dataframe/merge/__init__.py +32 -0
- maxframe/dataframe/merge/append.py +121 -0
- maxframe/dataframe/merge/concat.py +325 -0
- maxframe/dataframe/merge/merge.py +593 -0
- maxframe/dataframe/merge/tests/__init__.py +13 -0
- maxframe/dataframe/merge/tests/test_merge.py +215 -0
- maxframe/dataframe/misc/__init__.py +134 -0
- maxframe/dataframe/misc/_duplicate.py +46 -0
- maxframe/dataframe/misc/accessor.py +276 -0
- maxframe/dataframe/misc/apply.py +692 -0
- maxframe/dataframe/misc/astype.py +236 -0
- maxframe/dataframe/misc/case_when.py +141 -0
- maxframe/dataframe/misc/check_monotonic.py +84 -0
- maxframe/dataframe/misc/cut.py +383 -0
- maxframe/dataframe/misc/datetimes.py +79 -0
- maxframe/dataframe/misc/describe.py +108 -0
- maxframe/dataframe/misc/diff.py +210 -0
- maxframe/dataframe/misc/drop.py +440 -0
- maxframe/dataframe/misc/drop_duplicates.py +248 -0
- maxframe/dataframe/misc/duplicated.py +292 -0
- maxframe/dataframe/misc/eval.py +728 -0
- maxframe/dataframe/misc/explode.py +171 -0
- maxframe/dataframe/misc/get_dummies.py +208 -0
- maxframe/dataframe/misc/isin.py +217 -0
- maxframe/dataframe/misc/map.py +236 -0
- maxframe/dataframe/misc/melt.py +162 -0
- maxframe/dataframe/misc/memory_usage.py +248 -0
- maxframe/dataframe/misc/pct_change.py +150 -0
- maxframe/dataframe/misc/pivot_table.py +262 -0
- maxframe/dataframe/misc/qcut.py +104 -0
- maxframe/dataframe/misc/select_dtypes.py +104 -0
- maxframe/dataframe/misc/shift.py +256 -0
- maxframe/dataframe/misc/stack.py +238 -0
- maxframe/dataframe/misc/string_.py +221 -0
- maxframe/dataframe/misc/tests/__init__.py +13 -0
- maxframe/dataframe/misc/tests/test_misc.py +468 -0
- maxframe/dataframe/misc/to_numeric.py +178 -0
- maxframe/dataframe/misc/transform.py +361 -0
- maxframe/dataframe/misc/transpose.py +136 -0
- maxframe/dataframe/misc/value_counts.py +182 -0
- maxframe/dataframe/missing/__init__.py +53 -0
- maxframe/dataframe/missing/checkna.py +223 -0
- maxframe/dataframe/missing/dropna.py +280 -0
- maxframe/dataframe/missing/fillna.py +275 -0
- maxframe/dataframe/missing/replace.py +439 -0
- maxframe/dataframe/missing/tests/__init__.py +13 -0
- maxframe/dataframe/missing/tests/test_missing.py +89 -0
- maxframe/dataframe/operators.py +273 -0
- maxframe/dataframe/plotting/__init__.py +40 -0
- maxframe/dataframe/plotting/core.py +78 -0
- maxframe/dataframe/plotting/tests/__init__.py +13 -0
- maxframe/dataframe/plotting/tests/test_plotting.py +136 -0
- maxframe/dataframe/reduction/__init__.py +107 -0
- maxframe/dataframe/reduction/aggregation.py +344 -0
- maxframe/dataframe/reduction/all.py +78 -0
- maxframe/dataframe/reduction/any.py +78 -0
- maxframe/dataframe/reduction/core.py +837 -0
- maxframe/dataframe/reduction/count.py +59 -0
- maxframe/dataframe/reduction/cummax.py +30 -0
- maxframe/dataframe/reduction/cummin.py +30 -0
- maxframe/dataframe/reduction/cumprod.py +30 -0
- maxframe/dataframe/reduction/cumsum.py +30 -0
- maxframe/dataframe/reduction/custom_reduction.py +42 -0
- maxframe/dataframe/reduction/kurtosis.py +104 -0
- maxframe/dataframe/reduction/max.py +65 -0
- maxframe/dataframe/reduction/mean.py +61 -0
- maxframe/dataframe/reduction/min.py +65 -0
- maxframe/dataframe/reduction/nunique.py +141 -0
- maxframe/dataframe/reduction/prod.py +76 -0
- maxframe/dataframe/reduction/reduction_size.py +36 -0
- maxframe/dataframe/reduction/sem.py +69 -0
- maxframe/dataframe/reduction/skew.py +89 -0
- maxframe/dataframe/reduction/std.py +53 -0
- maxframe/dataframe/reduction/str_concat.py +48 -0
- maxframe/dataframe/reduction/sum.py +77 -0
- maxframe/dataframe/reduction/tests/__init__.py +13 -0
- maxframe/dataframe/reduction/tests/test_reduction.py +486 -0
- maxframe/dataframe/reduction/unique.py +90 -0
- maxframe/dataframe/reduction/var.py +72 -0
- maxframe/dataframe/sort/__init__.py +34 -0
- maxframe/dataframe/sort/core.py +36 -0
- maxframe/dataframe/sort/sort_index.py +153 -0
- maxframe/dataframe/sort/sort_values.py +311 -0
- maxframe/dataframe/sort/tests/__init__.py +13 -0
- maxframe/dataframe/sort/tests/test_sort.py +81 -0
- maxframe/dataframe/statistics/__init__.py +33 -0
- maxframe/dataframe/statistics/corr.py +280 -0
- maxframe/dataframe/statistics/quantile.py +341 -0
- maxframe/dataframe/statistics/tests/__init__.py +13 -0
- maxframe/dataframe/statistics/tests/test_statistics.py +82 -0
- maxframe/dataframe/tests/__init__.py +13 -0
- maxframe/dataframe/tests/test_initializer.py +29 -0
- maxframe/dataframe/tseries/__init__.py +13 -0
- maxframe/dataframe/tseries/tests/__init__.py +13 -0
- maxframe/dataframe/tseries/tests/test_tseries.py +30 -0
- maxframe/dataframe/tseries/to_datetime.py +297 -0
- maxframe/dataframe/ufunc/__init__.py +27 -0
- maxframe/dataframe/ufunc/tensor.py +54 -0
- maxframe/dataframe/ufunc/ufunc.py +52 -0
- maxframe/dataframe/utils.py +1267 -0
- maxframe/dataframe/window/__init__.py +29 -0
- maxframe/dataframe/window/aggregation.py +96 -0
- maxframe/dataframe/window/core.py +69 -0
- maxframe/dataframe/window/ewm.py +249 -0
- maxframe/dataframe/window/expanding.py +147 -0
- maxframe/dataframe/window/rolling.py +376 -0
- maxframe/dataframe/window/tests/__init__.py +13 -0
- maxframe/dataframe/window/tests/test_ewm.py +70 -0
- maxframe/dataframe/window/tests/test_expanding.py +66 -0
- maxframe/dataframe/window/tests/test_rolling.py +57 -0
- maxframe/env.py +33 -0
- maxframe/errors.py +21 -0
- maxframe/extension.py +81 -0
- maxframe/learn/__init__.py +17 -0
- maxframe/learn/contrib/__init__.py +17 -0
- maxframe/learn/contrib/pytorch/__init__.py +16 -0
- maxframe/learn/contrib/pytorch/run_function.py +110 -0
- maxframe/learn/contrib/pytorch/run_script.py +102 -0
- maxframe/learn/contrib/pytorch/tests/__init__.py +13 -0
- maxframe/learn/contrib/pytorch/tests/test_pytorch.py +42 -0
- maxframe/learn/contrib/utils.py +52 -0
- maxframe/learn/contrib/xgboost/__init__.py +26 -0
- maxframe/learn/contrib/xgboost/classifier.py +86 -0
- maxframe/learn/contrib/xgboost/core.py +156 -0
- maxframe/learn/contrib/xgboost/dmatrix.py +150 -0
- maxframe/learn/contrib/xgboost/predict.py +138 -0
- maxframe/learn/contrib/xgboost/regressor.py +78 -0
- maxframe/learn/contrib/xgboost/tests/__init__.py +13 -0
- maxframe/learn/contrib/xgboost/tests/test_core.py +43 -0
- maxframe/learn/contrib/xgboost/train.py +121 -0
- maxframe/learn/utils/__init__.py +15 -0
- maxframe/learn/utils/core.py +29 -0
- maxframe/lib/__init__.py +15 -0
- maxframe/lib/aio/__init__.py +27 -0
- maxframe/lib/aio/_runners.py +162 -0
- maxframe/lib/aio/_threads.py +35 -0
- maxframe/lib/aio/base.py +82 -0
- maxframe/lib/aio/file.py +85 -0
- maxframe/lib/aio/isolation.py +100 -0
- maxframe/lib/aio/lru.py +242 -0
- maxframe/lib/aio/parallelism.py +37 -0
- maxframe/lib/aio/tests/__init__.py +13 -0
- maxframe/lib/aio/tests/test_aio_file.py +55 -0
- maxframe/lib/compression.py +55 -0
- maxframe/lib/cython/__init__.py +13 -0
- maxframe/lib/cython/libcpp.pxd +30 -0
- maxframe/lib/filesystem/__init__.py +21 -0
- maxframe/lib/filesystem/_glob.py +173 -0
- maxframe/lib/filesystem/_oss_lib/__init__.py +13 -0
- maxframe/lib/filesystem/_oss_lib/common.py +198 -0
- maxframe/lib/filesystem/_oss_lib/glob.py +147 -0
- maxframe/lib/filesystem/_oss_lib/handle.py +156 -0
- maxframe/lib/filesystem/arrow.py +236 -0
- maxframe/lib/filesystem/base.py +263 -0
- maxframe/lib/filesystem/core.py +95 -0
- maxframe/lib/filesystem/fsmap.py +164 -0
- maxframe/lib/filesystem/hdfs.py +31 -0
- maxframe/lib/filesystem/local.py +112 -0
- maxframe/lib/filesystem/oss.py +157 -0
- maxframe/lib/filesystem/tests/__init__.py +13 -0
- maxframe/lib/filesystem/tests/test_filesystem.py +223 -0
- maxframe/lib/filesystem/tests/test_oss.py +182 -0
- maxframe/lib/functools_compat.py +81 -0
- maxframe/lib/mmh3.cpython-310-darwin.so +0 -0
- maxframe/lib/mmh3_src/MurmurHash3.cpp +339 -0
- maxframe/lib/mmh3_src/MurmurHash3.h +43 -0
- maxframe/lib/mmh3_src/mmh3module.cpp +387 -0
- maxframe/lib/sparse/__init__.py +861 -0
- maxframe/lib/sparse/array.py +1604 -0
- maxframe/lib/sparse/core.py +92 -0
- maxframe/lib/sparse/matrix.py +241 -0
- maxframe/lib/sparse/tests/__init__.py +15 -0
- maxframe/lib/sparse/tests/test_sparse.py +476 -0
- maxframe/lib/sparse/vector.py +150 -0
- maxframe/lib/tblib/LICENSE +20 -0
- maxframe/lib/tblib/__init__.py +327 -0
- maxframe/lib/tblib/cpython.py +83 -0
- maxframe/lib/tblib/decorators.py +44 -0
- maxframe/lib/tblib/pickling_support.py +90 -0
- maxframe/lib/tests/__init__.py +13 -0
- maxframe/lib/tests/test_wrapped_pickle.py +51 -0
- maxframe/lib/version.py +620 -0
- maxframe/lib/wrapped_pickle.py +139 -0
- maxframe/mixin.py +100 -0
- maxframe/odpsio/__init__.py +21 -0
- maxframe/odpsio/arrow.py +91 -0
- maxframe/odpsio/schema.py +364 -0
- maxframe/odpsio/tableio.py +322 -0
- maxframe/odpsio/tests/__init__.py +13 -0
- maxframe/odpsio/tests/test_arrow.py +88 -0
- maxframe/odpsio/tests/test_schema.py +297 -0
- maxframe/odpsio/tests/test_tableio.py +136 -0
- maxframe/odpsio/tests/test_volumeio.py +90 -0
- maxframe/odpsio/volumeio.py +95 -0
- maxframe/opcodes.py +590 -0
- maxframe/protocol.py +415 -0
- maxframe/remote/__init__.py +18 -0
- maxframe/remote/core.py +210 -0
- maxframe/remote/run_script.py +121 -0
- maxframe/serialization/__init__.py +26 -0
- maxframe/serialization/arrow.py +95 -0
- maxframe/serialization/core.cpython-310-darwin.so +0 -0
- maxframe/serialization/core.pxd +44 -0
- maxframe/serialization/core.pyi +61 -0
- maxframe/serialization/core.pyx +1094 -0
- maxframe/serialization/exception.py +86 -0
- maxframe/serialization/maxframe_objects.py +39 -0
- maxframe/serialization/numpy.py +91 -0
- maxframe/serialization/pandas.py +202 -0
- maxframe/serialization/scipy.py +71 -0
- maxframe/serialization/serializables/__init__.py +55 -0
- maxframe/serialization/serializables/core.py +262 -0
- maxframe/serialization/serializables/field.py +624 -0
- maxframe/serialization/serializables/field_type.py +589 -0
- maxframe/serialization/serializables/tests/__init__.py +13 -0
- maxframe/serialization/serializables/tests/test_field_type.py +121 -0
- maxframe/serialization/serializables/tests/test_serializable.py +250 -0
- maxframe/serialization/tests/__init__.py +13 -0
- maxframe/serialization/tests/test_serial.py +412 -0
- maxframe/session.py +1310 -0
- maxframe/tensor/__init__.py +183 -0
- maxframe/tensor/arithmetic/__init__.py +315 -0
- maxframe/tensor/arithmetic/abs.py +68 -0
- maxframe/tensor/arithmetic/absolute.py +68 -0
- maxframe/tensor/arithmetic/add.py +82 -0
- maxframe/tensor/arithmetic/angle.py +72 -0
- maxframe/tensor/arithmetic/arccos.py +104 -0
- maxframe/tensor/arithmetic/arccosh.py +91 -0
- maxframe/tensor/arithmetic/arcsin.py +94 -0
- maxframe/tensor/arithmetic/arcsinh.py +86 -0
- maxframe/tensor/arithmetic/arctan.py +106 -0
- maxframe/tensor/arithmetic/arctan2.py +128 -0
- maxframe/tensor/arithmetic/arctanh.py +86 -0
- maxframe/tensor/arithmetic/around.py +114 -0
- maxframe/tensor/arithmetic/bitand.py +95 -0
- maxframe/tensor/arithmetic/bitor.py +102 -0
- maxframe/tensor/arithmetic/bitxor.py +95 -0
- maxframe/tensor/arithmetic/cbrt.py +66 -0
- maxframe/tensor/arithmetic/ceil.py +71 -0
- maxframe/tensor/arithmetic/clip.py +165 -0
- maxframe/tensor/arithmetic/conj.py +74 -0
- maxframe/tensor/arithmetic/copysign.py +78 -0
- maxframe/tensor/arithmetic/core.py +544 -0
- maxframe/tensor/arithmetic/cos.py +85 -0
- maxframe/tensor/arithmetic/cosh.py +72 -0
- maxframe/tensor/arithmetic/deg2rad.py +72 -0
- maxframe/tensor/arithmetic/degrees.py +77 -0
- maxframe/tensor/arithmetic/divide.py +114 -0
- maxframe/tensor/arithmetic/equal.py +76 -0
- maxframe/tensor/arithmetic/exp.py +106 -0
- maxframe/tensor/arithmetic/exp2.py +67 -0
- maxframe/tensor/arithmetic/expm1.py +79 -0
- maxframe/tensor/arithmetic/fabs.py +74 -0
- maxframe/tensor/arithmetic/fix.py +69 -0
- maxframe/tensor/arithmetic/float_power.py +103 -0
- maxframe/tensor/arithmetic/floor.py +77 -0
- maxframe/tensor/arithmetic/floordiv.py +94 -0
- maxframe/tensor/arithmetic/fmax.py +105 -0
- maxframe/tensor/arithmetic/fmin.py +106 -0
- maxframe/tensor/arithmetic/fmod.py +99 -0
- maxframe/tensor/arithmetic/frexp.py +92 -0
- maxframe/tensor/arithmetic/greater.py +77 -0
- maxframe/tensor/arithmetic/greater_equal.py +69 -0
- maxframe/tensor/arithmetic/hypot.py +77 -0
- maxframe/tensor/arithmetic/i0.py +89 -0
- maxframe/tensor/arithmetic/imag.py +67 -0
- maxframe/tensor/arithmetic/invert.py +110 -0
- maxframe/tensor/arithmetic/isclose.py +115 -0
- maxframe/tensor/arithmetic/iscomplex.py +64 -0
- maxframe/tensor/arithmetic/isfinite.py +106 -0
- maxframe/tensor/arithmetic/isinf.py +103 -0
- maxframe/tensor/arithmetic/isnan.py +82 -0
- maxframe/tensor/arithmetic/isreal.py +63 -0
- maxframe/tensor/arithmetic/ldexp.py +99 -0
- maxframe/tensor/arithmetic/less.py +69 -0
- maxframe/tensor/arithmetic/less_equal.py +69 -0
- maxframe/tensor/arithmetic/log.py +92 -0
- maxframe/tensor/arithmetic/log10.py +85 -0
- maxframe/tensor/arithmetic/log1p.py +95 -0
- maxframe/tensor/arithmetic/log2.py +85 -0
- maxframe/tensor/arithmetic/logaddexp.py +80 -0
- maxframe/tensor/arithmetic/logaddexp2.py +78 -0
- maxframe/tensor/arithmetic/logical_and.py +81 -0
- maxframe/tensor/arithmetic/logical_not.py +74 -0
- maxframe/tensor/arithmetic/logical_or.py +82 -0
- maxframe/tensor/arithmetic/logical_xor.py +88 -0
- maxframe/tensor/arithmetic/lshift.py +82 -0
- maxframe/tensor/arithmetic/maximum.py +108 -0
- maxframe/tensor/arithmetic/minimum.py +108 -0
- maxframe/tensor/arithmetic/mod.py +104 -0
- maxframe/tensor/arithmetic/modf.py +83 -0
- maxframe/tensor/arithmetic/multiply.py +81 -0
- maxframe/tensor/arithmetic/nan_to_num.py +99 -0
- maxframe/tensor/arithmetic/negative.py +65 -0
- maxframe/tensor/arithmetic/nextafter.py +68 -0
- maxframe/tensor/arithmetic/not_equal.py +72 -0
- maxframe/tensor/arithmetic/positive.py +47 -0
- maxframe/tensor/arithmetic/power.py +106 -0
- maxframe/tensor/arithmetic/rad2deg.py +71 -0
- maxframe/tensor/arithmetic/radians.py +77 -0
- maxframe/tensor/arithmetic/real.py +70 -0
- maxframe/tensor/arithmetic/reciprocal.py +76 -0
- maxframe/tensor/arithmetic/rint.py +68 -0
- maxframe/tensor/arithmetic/rshift.py +81 -0
- maxframe/tensor/arithmetic/setimag.py +29 -0
- maxframe/tensor/arithmetic/setreal.py +29 -0
- maxframe/tensor/arithmetic/sign.py +81 -0
- maxframe/tensor/arithmetic/signbit.py +65 -0
- maxframe/tensor/arithmetic/sin.py +98 -0
- maxframe/tensor/arithmetic/sinc.py +102 -0
- maxframe/tensor/arithmetic/sinh.py +93 -0
- maxframe/tensor/arithmetic/spacing.py +72 -0
- maxframe/tensor/arithmetic/sqrt.py +81 -0
- maxframe/tensor/arithmetic/square.py +69 -0
- maxframe/tensor/arithmetic/subtract.py +81 -0
- maxframe/tensor/arithmetic/tan.py +88 -0
- maxframe/tensor/arithmetic/tanh.py +92 -0
- maxframe/tensor/arithmetic/tests/__init__.py +15 -0
- maxframe/tensor/arithmetic/tests/test_arithmetic.py +414 -0
- maxframe/tensor/arithmetic/truediv.py +104 -0
- maxframe/tensor/arithmetic/trunc.py +72 -0
- maxframe/tensor/arithmetic/utils.py +65 -0
- maxframe/tensor/array_utils.py +186 -0
- maxframe/tensor/base/__init__.py +34 -0
- maxframe/tensor/base/astype.py +119 -0
- maxframe/tensor/base/atleast_1d.py +74 -0
- maxframe/tensor/base/broadcast_to.py +89 -0
- maxframe/tensor/base/ravel.py +92 -0
- maxframe/tensor/base/tests/__init__.py +13 -0
- maxframe/tensor/base/tests/test_base.py +114 -0
- maxframe/tensor/base/transpose.py +125 -0
- maxframe/tensor/base/unique.py +205 -0
- maxframe/tensor/base/where.py +127 -0
- maxframe/tensor/core.py +724 -0
- maxframe/tensor/datasource/__init__.py +32 -0
- maxframe/tensor/datasource/arange.py +156 -0
- maxframe/tensor/datasource/array.py +415 -0
- maxframe/tensor/datasource/core.py +109 -0
- maxframe/tensor/datasource/empty.py +169 -0
- maxframe/tensor/datasource/from_dataframe.py +70 -0
- maxframe/tensor/datasource/from_dense.py +54 -0
- maxframe/tensor/datasource/from_sparse.py +47 -0
- maxframe/tensor/datasource/full.py +186 -0
- maxframe/tensor/datasource/ones.py +173 -0
- maxframe/tensor/datasource/scalar.py +40 -0
- maxframe/tensor/datasource/tests/__init__.py +13 -0
- maxframe/tensor/datasource/tests/test_datasource.py +278 -0
- maxframe/tensor/datasource/zeros.py +188 -0
- maxframe/tensor/fetch/__init__.py +15 -0
- maxframe/tensor/fetch/core.py +54 -0
- maxframe/tensor/indexing/__init__.py +47 -0
- maxframe/tensor/indexing/choose.py +196 -0
- maxframe/tensor/indexing/compress.py +124 -0
- maxframe/tensor/indexing/core.py +190 -0
- maxframe/tensor/indexing/extract.py +71 -0
- maxframe/tensor/indexing/fill_diagonal.py +183 -0
- maxframe/tensor/indexing/flatnonzero.py +60 -0
- maxframe/tensor/indexing/getitem.py +175 -0
- maxframe/tensor/indexing/nonzero.py +120 -0
- maxframe/tensor/indexing/setitem.py +132 -0
- maxframe/tensor/indexing/slice.py +29 -0
- maxframe/tensor/indexing/take.py +130 -0
- maxframe/tensor/indexing/tests/__init__.py +15 -0
- maxframe/tensor/indexing/tests/test_indexing.py +234 -0
- maxframe/tensor/indexing/unravel_index.py +103 -0
- maxframe/tensor/merge/__init__.py +15 -0
- maxframe/tensor/merge/stack.py +132 -0
- maxframe/tensor/merge/tests/__init__.py +13 -0
- maxframe/tensor/merge/tests/test_merge.py +52 -0
- maxframe/tensor/operators.py +123 -0
- maxframe/tensor/random/__init__.py +168 -0
- maxframe/tensor/random/beta.py +87 -0
- maxframe/tensor/random/binomial.py +137 -0
- maxframe/tensor/random/bytes.py +39 -0
- maxframe/tensor/random/chisquare.py +110 -0
- maxframe/tensor/random/choice.py +186 -0
- maxframe/tensor/random/core.py +234 -0
- maxframe/tensor/random/dirichlet.py +123 -0
- maxframe/tensor/random/exponential.py +94 -0
- maxframe/tensor/random/f.py +135 -0
- maxframe/tensor/random/gamma.py +128 -0
- maxframe/tensor/random/geometric.py +93 -0
- maxframe/tensor/random/gumbel.py +167 -0
- maxframe/tensor/random/hypergeometric.py +148 -0
- maxframe/tensor/random/laplace.py +133 -0
- maxframe/tensor/random/logistic.py +129 -0
- maxframe/tensor/random/lognormal.py +159 -0
- maxframe/tensor/random/logseries.py +122 -0
- maxframe/tensor/random/multinomial.py +133 -0
- maxframe/tensor/random/multivariate_normal.py +192 -0
- maxframe/tensor/random/negative_binomial.py +125 -0
- maxframe/tensor/random/noncentral_chisquare.py +132 -0
- maxframe/tensor/random/noncentral_f.py +126 -0
- maxframe/tensor/random/normal.py +143 -0
- maxframe/tensor/random/pareto.py +140 -0
- maxframe/tensor/random/permutation.py +104 -0
- maxframe/tensor/random/poisson.py +111 -0
- maxframe/tensor/random/power.py +142 -0
- maxframe/tensor/random/rand.py +82 -0
- maxframe/tensor/random/randint.py +121 -0
- maxframe/tensor/random/randn.py +96 -0
- maxframe/tensor/random/random_integers.py +123 -0
- maxframe/tensor/random/random_sample.py +86 -0
- maxframe/tensor/random/rayleigh.py +110 -0
- maxframe/tensor/random/shuffle.py +61 -0
- maxframe/tensor/random/standard_cauchy.py +105 -0
- maxframe/tensor/random/standard_exponential.py +72 -0
- maxframe/tensor/random/standard_gamma.py +120 -0
- maxframe/tensor/random/standard_normal.py +74 -0
- maxframe/tensor/random/standard_t.py +135 -0
- maxframe/tensor/random/tests/__init__.py +15 -0
- maxframe/tensor/random/tests/test_random.py +167 -0
- maxframe/tensor/random/triangular.py +119 -0
- maxframe/tensor/random/uniform.py +131 -0
- maxframe/tensor/random/vonmises.py +131 -0
- maxframe/tensor/random/wald.py +114 -0
- maxframe/tensor/random/weibull.py +140 -0
- maxframe/tensor/random/zipf.py +122 -0
- maxframe/tensor/rechunk/__init__.py +26 -0
- maxframe/tensor/rechunk/rechunk.py +43 -0
- maxframe/tensor/reduction/__init__.py +66 -0
- maxframe/tensor/reduction/all.py +103 -0
- maxframe/tensor/reduction/allclose.py +88 -0
- maxframe/tensor/reduction/any.py +105 -0
- maxframe/tensor/reduction/argmax.py +103 -0
- maxframe/tensor/reduction/argmin.py +103 -0
- maxframe/tensor/reduction/array_equal.py +64 -0
- maxframe/tensor/reduction/core.py +168 -0
- maxframe/tensor/reduction/count_nonzero.py +81 -0
- maxframe/tensor/reduction/cumprod.py +97 -0
- maxframe/tensor/reduction/cumsum.py +101 -0
- maxframe/tensor/reduction/max.py +120 -0
- maxframe/tensor/reduction/mean.py +123 -0
- maxframe/tensor/reduction/min.py +120 -0
- maxframe/tensor/reduction/nanargmax.py +82 -0
- maxframe/tensor/reduction/nanargmin.py +76 -0
- maxframe/tensor/reduction/nancumprod.py +91 -0
- maxframe/tensor/reduction/nancumsum.py +94 -0
- maxframe/tensor/reduction/nanmax.py +111 -0
- maxframe/tensor/reduction/nanmean.py +106 -0
- maxframe/tensor/reduction/nanmin.py +111 -0
- maxframe/tensor/reduction/nanprod.py +94 -0
- maxframe/tensor/reduction/nanstd.py +126 -0
- maxframe/tensor/reduction/nansum.py +115 -0
- maxframe/tensor/reduction/nanvar.py +149 -0
- maxframe/tensor/reduction/prod.py +130 -0
- maxframe/tensor/reduction/std.py +134 -0
- maxframe/tensor/reduction/sum.py +125 -0
- maxframe/tensor/reduction/tests/__init__.py +13 -0
- maxframe/tensor/reduction/tests/test_reduction.py +181 -0
- maxframe/tensor/reduction/var.py +176 -0
- maxframe/tensor/reshape/__init__.py +17 -0
- maxframe/tensor/reshape/reshape.py +188 -0
- maxframe/tensor/reshape/tests/__init__.py +15 -0
- maxframe/tensor/reshape/tests/test_reshape.py +37 -0
- maxframe/tensor/statistics/__init__.py +13 -0
- maxframe/tensor/statistics/percentile.py +175 -0
- maxframe/tensor/statistics/quantile.py +288 -0
- maxframe/tensor/ufunc/__init__.py +26 -0
- maxframe/tensor/ufunc/ufunc.py +200 -0
- maxframe/tensor/utils.py +718 -0
- maxframe/tests/__init__.py +13 -0
- maxframe/tests/test_codegen.py +69 -0
- maxframe/tests/test_protocol.py +144 -0
- maxframe/tests/test_utils.py +376 -0
- maxframe/tests/utils.py +164 -0
- maxframe/typing_.py +37 -0
- maxframe/udf.py +134 -0
- maxframe/utils.py +1114 -0
- maxframe-0.1.0b5.dist-info/METADATA +104 -0
- maxframe-0.1.0b5.dist-info/RECORD +647 -0
- maxframe-0.1.0b5.dist-info/WHEEL +5 -0
- maxframe-0.1.0b5.dist-info/top_level.txt +3 -0
- maxframe_client/__init__.py +17 -0
- maxframe_client/clients/__init__.py +13 -0
- maxframe_client/clients/framedriver.py +118 -0
- maxframe_client/clients/spe.py +104 -0
- maxframe_client/conftest.py +15 -0
- maxframe_client/fetcher.py +264 -0
- maxframe_client/session/__init__.py +22 -0
- maxframe_client/session/consts.py +36 -0
- maxframe_client/session/graph.py +119 -0
- maxframe_client/session/odps.py +482 -0
- maxframe_client/session/task.py +280 -0
- maxframe_client/session/tests/__init__.py +13 -0
- maxframe_client/session/tests/test_task.py +85 -0
- maxframe_client/tests/__init__.py +13 -0
- maxframe_client/tests/test_fetcher.py +89 -0
- maxframe_client/tests/test_session.py +255 -0
|
@@ -0,0 +1,439 @@
|
|
|
1
|
+
# Copyright 1999-2024 Alibaba Group Holding Ltd.
|
|
2
|
+
#
|
|
3
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
4
|
+
# you may not use this file except in compliance with the License.
|
|
5
|
+
# You may obtain a copy of the License at
|
|
6
|
+
#
|
|
7
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
8
|
+
#
|
|
9
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
10
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
11
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
12
|
+
# See the License for the specific language governing permissions and
|
|
13
|
+
# limitations under the License.
|
|
14
|
+
|
|
15
|
+
from ... import opcodes
|
|
16
|
+
from ...serialization.serializables import AnyField, Int32Field
|
|
17
|
+
from ...utils import no_default
|
|
18
|
+
from ..operators import SERIES_TYPE, DataFrameOperator, DataFrameOperatorMixin
|
|
19
|
+
from ..utils import build_df, build_series
|
|
20
|
+
|
|
21
|
+
|
|
22
|
+
class DataFrameReplace(DataFrameOperator, DataFrameOperatorMixin):
    """Operator registered under ``opcodes.REPLACE`` for DataFrame/Series input.

    ``to_replace`` and ``value`` may each be a plain value or a
    ``SERIES_TYPE`` instance; when they are ``SERIES_TYPE`` instances they
    are also registered as additional inputs of the operator.
    """

    _op_type_ = opcodes.REPLACE

    # Serializable fields holding the arguments of the replace call.
    to_replace = AnyField("to_replace", default=None)
    value = AnyField("value", default=None)
    limit = Int32Field("limit", default=None)
    regex = AnyField("regex", default=None)
    method = AnyField("method", default=no_default)

    def _set_inputs(self, inputs):
        """Rebind ``to_replace`` / ``value`` to the entries of ``inputs``.

        The first input is the object being processed and is skipped; the
        remaining inputs are consumed in order, first for ``to_replace`` and
        then for ``value``, but only for those currently holding a
        ``SERIES_TYPE`` instance.
        """
        super()._set_inputs(inputs)
        remaining = iter(inputs)
        next(remaining)  # skip the leading DataFrame/Series input
        for field_name in ("to_replace", "value"):
            if isinstance(getattr(self, field_name), SERIES_TYPE):
                setattr(self, field_name, next(remaining))

    def __call__(self, df_or_series):
        """Build the output DataFrame/Series for ``df_or_series``.

        The output dtypes are taken from calling ``replace`` on mock objects
        produced by ``build_df`` / ``build_series``; shape, index value and
        columns value / name are copied from the input.
        """
        is_frame = df_or_series.ndim == 2
        op_inputs = [df_or_series]

        if is_frame:
            mock_obj = build_df(df_or_series)
        else:
            mock_obj = build_series(df_or_series)

        # Series-typed operands become extra inputs and are mocked as well;
        # anything else is passed to the mock call untouched.
        mock_operands = []
        for operand in (self.to_replace, self.value):
            if isinstance(operand, SERIES_TYPE):
                mock_operands.append(build_series(operand))
                op_inputs.append(operand)
            else:
                mock_operands.append(operand)
        mock_to_replace, mock_value = mock_operands

        mock_result = mock_obj.replace(
            mock_to_replace, mock_value, regex=self.regex, method=self.method
        )

        if not is_frame:
            return self.new_series(
                op_inputs,
                shape=df_or_series.shape,
                dtype=mock_result.dtype,
                index_value=df_or_series.index_value,
                name=df_or_series.name,
            )
        return self.new_dataframe(
            op_inputs,
            shape=df_or_series.shape,
            dtypes=mock_result.dtypes,
            index_value=df_or_series.index_value,
            columns_value=df_or_series.columns_value,
        )
|
|
80
|
+
|
|
81
|
+
|
|
82
|
+
_fun_doc = """
|
|
83
|
+
Replace values given in `to_replace` with `value`.
|
|
84
|
+
|
|
85
|
+
Values of the #obj_type# are replaced with other values dynamically.
|
|
86
|
+
This differs from updating with ``.loc`` or ``.iloc``, which require
|
|
87
|
+
you to specify a location to update with some value.
|
|
88
|
+
|
|
89
|
+
Parameters
|
|
90
|
+
----------
|
|
91
|
+
to_replace : str, regex, list, dict, Series, int, float, or None
|
|
92
|
+
How to find the values that will be replaced.
|
|
93
|
+
|
|
94
|
+
* numeric, str or regex:
|
|
95
|
+
|
|
96
|
+
- numeric: numeric values equal to `to_replace` will be
|
|
97
|
+
replaced with `value`
|
|
98
|
+
- str: string exactly matching `to_replace` will be replaced
|
|
99
|
+
with `value`
|
|
100
|
+
- regex: regexs matching `to_replace` will be replaced with
|
|
101
|
+
`value`
|
|
102
|
+
|
|
103
|
+
* list of str, regex, or numeric:
|
|
104
|
+
|
|
105
|
+
- First, if `to_replace` and `value` are both lists, they
|
|
106
|
+
**must** be the same length.
|
|
107
|
+
- Second, if ``regex=True`` then all of the strings in **both**
|
|
108
|
+
lists will be interpreted as regexs otherwise they will match
|
|
109
|
+
directly. This doesn't matter much for `value` since there
|
|
110
|
+
are only a few possible substitution regexes you can use.
|
|
111
|
+
- str, regex and numeric rules apply as above.
|
|
112
|
+
|
|
113
|
+
* dict:
|
|
114
|
+
|
|
115
|
+
- Dicts can be used to specify different replacement values
|
|
116
|
+
for different existing values. For example,
|
|
117
|
+
``{'a': 'b', 'y': 'z'}`` replaces the value 'a' with 'b' and
|
|
118
|
+
'y' with 'z'. To use a dict in this way the `value`
|
|
119
|
+
parameter should be `None`.
|
|
120
|
+
- For a DataFrame a dict can specify that different values
|
|
121
|
+
should be replaced in different columns. For example,
|
|
122
|
+
``{'a': 1, 'b': 'z'}`` looks for the value 1 in column 'a'
|
|
123
|
+
and the value 'z' in column 'b' and replaces these values
|
|
124
|
+
with whatever is specified in `value`. The `value` parameter
|
|
125
|
+
should not be ``None`` in this case. You can treat this as a
|
|
126
|
+
special case of passing two lists except that you are
|
|
127
|
+
specifying the column to search in.
|
|
128
|
+
- For a DataFrame nested dictionaries, e.g.,
|
|
129
|
+
``{'a': {'b': np.nan}}``, are read as follows: look in column
|
|
130
|
+
'a' for the value 'b' and replace it with NaN. The `value`
|
|
131
|
+
parameter should be ``None`` to use a nested dict in this
|
|
132
|
+
way. You can nest regular expressions as well. Note that
|
|
133
|
+
column names (the top-level dictionary keys in a nested
|
|
134
|
+
dictionary) **cannot** be regular expressions.
|
|
135
|
+
|
|
136
|
+
* None:
|
|
137
|
+
|
|
138
|
+
- This means that the `regex` argument must be a string,
|
|
139
|
+
compiled regular expression, or list, dict, ndarray or
|
|
140
|
+
Series of such elements. If `value` is also ``None`` then
|
|
141
|
+
this **must** be a nested dictionary or Series.
|
|
142
|
+
|
|
143
|
+
See the examples section for examples of each of these.
|
|
144
|
+
value : scalar, dict, list, str, regex, default None
|
|
145
|
+
Value to replace any values matching `to_replace` with.
|
|
146
|
+
For a DataFrame a dict of values can be used to specify which
|
|
147
|
+
value to use for each column (columns not in the dict will not be
|
|
148
|
+
filled). Regular expressions, strings and lists or dicts of such
|
|
149
|
+
objects are also allowed.
|
|
150
|
+
inplace : bool, default False
|
|
151
|
+
If True, in place. Note: this will modify any
|
|
152
|
+
other views on this object (e.g. a column from a DataFrame).
|
|
153
|
+
Returns the caller if this is True.
|
|
154
|
+
limit : int, default None
|
|
155
|
+
Maximum size gap to forward or backward fill.
|
|
156
|
+
regex : bool or same types as `to_replace`, default False
|
|
157
|
+
Whether to interpret `to_replace` and/or `value` as regular
|
|
158
|
+
expressions. If this is ``True`` then `to_replace` *must* be a
|
|
159
|
+
string. Alternatively, this could be a regular expression or a
|
|
160
|
+
list, dict, or array of regular expressions in which case
|
|
161
|
+
`to_replace` must be ``None``.
|
|
162
|
+
method : {'pad', 'ffill', 'bfill', `None`}
|
|
163
|
+
The method to use for replacement, when `to_replace` is a
|
|
164
|
+
scalar, list or tuple and `value` is ``None``.
|
|
165
|
+
|
|
166
|
+
Returns
|
|
167
|
+
-------
|
|
168
|
+
#obj_type#
|
|
169
|
+
Object after replacement.
|
|
170
|
+
|
|
171
|
+
Raises
|
|
172
|
+
------
|
|
173
|
+
AssertionError
|
|
174
|
+
* If `regex` is not a ``bool`` and `to_replace` is not
|
|
175
|
+
``None``.
|
|
176
|
+
TypeError
|
|
177
|
+
* If `to_replace` is a ``dict`` and `value` is not a ``list``,
|
|
178
|
+
``dict``, ``ndarray``, or ``Series``
|
|
179
|
+
* If `to_replace` is ``None`` and `regex` is not compilable
|
|
180
|
+
into a regular expression or is a list, dict, ndarray, or
|
|
181
|
+
Series.
|
|
182
|
+
* When replacing multiple ``bool`` or ``datetime64`` objects and
|
|
183
|
+
the arguments to `to_replace` does not match the type of the
|
|
184
|
+
value being replaced
|
|
185
|
+
ValueError
|
|
186
|
+
* If a ``list`` or an ``ndarray`` is passed to `to_replace` and
|
|
187
|
+
`value` but they are not the same length.
|
|
188
|
+
|
|
189
|
+
See Also
|
|
190
|
+
--------
|
|
191
|
+
#obj_type#.fillna : Fill NA values.
|
|
192
|
+
#obj_type#.where : Replace values based on boolean condition.
|
|
193
|
+
Series.str.replace : Simple string replacement.
|
|
194
|
+
|
|
195
|
+
Notes
|
|
196
|
+
-----
|
|
197
|
+
* Regex substitution is performed under the hood with ``re.sub``. The
|
|
198
|
+
rules for substitution for ``re.sub`` are the same.
|
|
199
|
+
* Regular expressions will only substitute on strings, meaning you
|
|
200
|
+
cannot provide, for example, a regular expression matching floating
|
|
201
|
+
point numbers and expect the columns in your frame that have a
|
|
202
|
+
numeric dtype to be matched. However, if those floating point
|
|
203
|
+
numbers *are* strings, then you can do this.
|
|
204
|
+
* This method has *a lot* of options. You are encouraged to experiment
|
|
205
|
+
and play with this method to gain intuition about how it works.
|
|
206
|
+
* When dict is used as the `to_replace` value, it is like
|
|
207
|
+
key(s) in the dict are the to_replace part and
|
|
208
|
+
value(s) in the dict are the value parameter.
|
|
209
|
+
|
|
210
|
+
Examples
|
|
211
|
+
--------
|
|
212
|
+
|
|
213
|
+
**Scalar `to_replace` and `value`**
|
|
214
|
+
|
|
215
|
+
>>> import maxframe.tensor as mt
|
|
216
|
+
>>> import maxframe.dataframe as md
|
|
217
|
+
>>> s = md.Series([0, 1, 2, 3, 4])
|
|
218
|
+
>>> s.replace(0, 5).execute()
|
|
219
|
+
0 5
|
|
220
|
+
1 1
|
|
221
|
+
2 2
|
|
222
|
+
3 3
|
|
223
|
+
4 4
|
|
224
|
+
dtype: int64
|
|
225
|
+
|
|
226
|
+
>>> df = md.DataFrame({'A': [0, 1, 2, 3, 4],
|
|
227
|
+
... 'B': [5, 6, 7, 8, 9],
|
|
228
|
+
... 'C': ['a', 'b', 'c', 'd', 'e']})
|
|
229
|
+
>>> df.replace(0, 5).execute()
|
|
230
|
+
A B C
|
|
231
|
+
0 5 5 a
|
|
232
|
+
1 1 6 b
|
|
233
|
+
2 2 7 c
|
|
234
|
+
3 3 8 d
|
|
235
|
+
4 4 9 e
|
|
236
|
+
|
|
237
|
+
**List-like `to_replace`**
|
|
238
|
+
|
|
239
|
+
>>> df.replace([0, 1, 2, 3], 4).execute()
|
|
240
|
+
A B C
|
|
241
|
+
0 4 5 a
|
|
242
|
+
1 4 6 b
|
|
243
|
+
2 4 7 c
|
|
244
|
+
3 4 8 d
|
|
245
|
+
4 4 9 e
|
|
246
|
+
|
|
247
|
+
>>> df.replace([0, 1, 2, 3], [4, 3, 2, 1]).execute()
|
|
248
|
+
A B C
|
|
249
|
+
0 4 5 a
|
|
250
|
+
1 3 6 b
|
|
251
|
+
2 2 7 c
|
|
252
|
+
3 1 8 d
|
|
253
|
+
4 4 9 e
|
|
254
|
+
|
|
255
|
+
>>> s.replace([1, 2], method='bfill').execute()
|
|
256
|
+
0 0
|
|
257
|
+
1 3
|
|
258
|
+
2 3
|
|
259
|
+
3 3
|
|
260
|
+
4 4
|
|
261
|
+
dtype: int64
|
|
262
|
+
|
|
263
|
+
**dict-like `to_replace`**
|
|
264
|
+
|
|
265
|
+
>>> df.replace({0: 10, 1: 100}).execute()
|
|
266
|
+
A B C
|
|
267
|
+
0 10 5 a
|
|
268
|
+
1 100 6 b
|
|
269
|
+
2 2 7 c
|
|
270
|
+
3 3 8 d
|
|
271
|
+
4 4 9 e
|
|
272
|
+
|
|
273
|
+
>>> df.replace({'A': 0, 'B': 5}, 100).execute()
|
|
274
|
+
A B C
|
|
275
|
+
0 100 100 a
|
|
276
|
+
1 1 6 b
|
|
277
|
+
2 2 7 c
|
|
278
|
+
3 3 8 d
|
|
279
|
+
4 4 9 e
|
|
280
|
+
|
|
281
|
+
>>> df.replace({'A': {0: 100, 4: 400}}).execute()
|
|
282
|
+
A B C
|
|
283
|
+
0 100 5 a
|
|
284
|
+
1 1 6 b
|
|
285
|
+
2 2 7 c
|
|
286
|
+
3 3 8 d
|
|
287
|
+
4 400 9 e
|
|
288
|
+
|
|
289
|
+
**Regular expression `to_replace`**
|
|
290
|
+
|
|
291
|
+
>>> df = md.DataFrame({'A': ['bat', 'foo', 'bait'],
|
|
292
|
+
... 'B': ['abc', 'bar', 'xyz']})
|
|
293
|
+
>>> df.replace(to_replace=r'^ba.$', value='new', regex=True).execute()
|
|
294
|
+
A B
|
|
295
|
+
0 new abc
|
|
296
|
+
1 foo new
|
|
297
|
+
2 bait xyz
|
|
298
|
+
|
|
299
|
+
>>> df.replace({'A': r'^ba.$'}, {'A': 'new'}, regex=True).execute()
|
|
300
|
+
A B
|
|
301
|
+
0 new abc
|
|
302
|
+
1 foo bar
|
|
303
|
+
2 bait xyz
|
|
304
|
+
|
|
305
|
+
>>> df.replace(regex=r'^ba.$', value='new').execute()
|
|
306
|
+
A B
|
|
307
|
+
0 new abc
|
|
308
|
+
1 foo new
|
|
309
|
+
2 bait xyz
|
|
310
|
+
|
|
311
|
+
>>> df.replace(regex={r'^ba.$': 'new', 'foo': 'xyz'}).execute()
|
|
312
|
+
A B
|
|
313
|
+
0 new abc
|
|
314
|
+
1 xyz new
|
|
315
|
+
2 bait xyz
|
|
316
|
+
|
|
317
|
+
>>> df.replace(regex=[r'^ba.$', 'foo'], value='new').execute()
|
|
318
|
+
A B
|
|
319
|
+
0 new abc
|
|
320
|
+
1 new new
|
|
321
|
+
2 bait xyz
|
|
322
|
+
|
|
323
|
+
Note that when replacing multiple ``bool`` or ``datetime64`` objects,
|
|
324
|
+
the data types in the `to_replace` parameter must match the data
|
|
325
|
+
type of the value being replaced:
|
|
326
|
+
|
|
327
|
+
>>> df = md.DataFrame({'A': [True, False, True],
|
|
328
|
+
... 'B': [False, True, False]})
|
|
329
|
+
>>> df.replace({'a string': 'new value', True: False}).execute()  # raises
|
|
330
|
+
Traceback (most recent call last):
|
|
331
|
+
...
|
|
332
|
+
TypeError: Cannot compare types 'ndarray(dtype=bool)' and 'str'
|
|
333
|
+
|
|
334
|
+
This raises a ``TypeError`` because one of the ``dict`` keys is not of
|
|
335
|
+
the correct type for replacement.
|
|
336
|
+
|
|
337
|
+
Compare the behavior of ``s.replace({'a': None})`` and
|
|
338
|
+
``s.replace('a', None)`` to understand the peculiarities
|
|
339
|
+
of the `to_replace` parameter:
|
|
340
|
+
|
|
341
|
+
>>> s = md.Series([10, 'a', 'a', 'b', 'a'])
|
|
342
|
+
|
|
343
|
+
When one uses a dict as the `to_replace` value, it is like the
|
|
344
|
+
value(s) in the dict are equal to the `value` parameter.
|
|
345
|
+
``s.replace({'a': None})`` is equivalent to
|
|
346
|
+
``s.replace(to_replace={'a': None}, value=None, method=None)``:
|
|
347
|
+
|
|
348
|
+
>>> s.replace({'a': None}).execute()
|
|
349
|
+
0 10
|
|
350
|
+
1 None
|
|
351
|
+
2 None
|
|
352
|
+
3 b
|
|
353
|
+
4 None
|
|
354
|
+
dtype: object
|
|
355
|
+
|
|
356
|
+
When ``value=None`` and `to_replace` is a scalar, list or
|
|
357
|
+
tuple, `replace` uses the method parameter (default 'pad') to do the
|
|
358
|
+
replacement. So this is why the 'a' values are being replaced by 10
|
|
359
|
+
in rows 1 and 2 and 'b' in row 4 in this case.
|
|
360
|
+
The command ``s.replace('a', None)`` is actually equivalent to
|
|
361
|
+
``s.replace(to_replace='a', value=None, method='pad')``:
|
|
362
|
+
|
|
363
|
+
>>> s.replace('a', None).execute()
|
|
364
|
+
0 10
|
|
365
|
+
1 10
|
|
366
|
+
2 10
|
|
367
|
+
3 b
|
|
368
|
+
4 b
|
|
369
|
+
dtype: object
|
|
370
|
+
"""
|
|
371
|
+
|
|
372
|
+
|
|
373
|
+
def _replace(
    df_or_series,
    to_replace=None,
    value=None,
    inplace=False,
    limit=None,
    regex=False,
    method=no_default,
):
    """Build a ``DataFrameReplace`` operator and apply it to ``df_or_series``.

    A non-bool ``regex`` is used as ``to_replace`` and ``regex`` is then set
    to ``True``.

    Returns the new object, or ``None`` when ``inplace`` is true, in which
    case ``df_or_series.data`` is rebound to the result's data.

    Raises ``NotImplementedError`` when ``limit`` is given, ``value`` is
    ``no_default`` and ``to_replace`` is not a dict.
    """
    limit_without_value = (
        limit is not None
        and value is no_default
        and not isinstance(to_replace, dict)
    )
    if limit_without_value:
        raise NotImplementedError("fill with limit not supported when value is None")

    if not isinstance(regex, bool):
        # The pattern(s) were passed through ``regex``.
        to_replace, regex = regex, True

    replace_op = DataFrameReplace(
        to_replace=to_replace, value=value, limit=limit, regex=regex, method=method
    )
    result = replace_op(df_or_series)
    if not inplace:
        return result
    df_or_series.data = result.data
|
|
396
|
+
|
|
397
|
+
|
|
398
|
+
def df_replace(
    df,
    to_replace=no_default,
    value=no_default,
    inplace=False,
    limit=None,
    regex=False,
    method=no_default,
):
    # DataFrame entry point: forwards every argument unchanged to _replace.
    # The user-facing docstring is attached at module level from _fun_doc.
    forwarded = {
        "to_replace": to_replace,
        "value": value,
        "inplace": inplace,
        "limit": limit,
        "regex": regex,
        "method": method,
    }
    return _replace(df, **forwarded)
|
|
416
|
+
|
|
417
|
+
|
|
418
|
+
def series_replace(
    series,
    to_replace=no_default,
    value=no_default,
    inplace=False,
    limit=None,
    regex=False,
    method=no_default,
):
    # Series entry point: forwards every argument unchanged to _replace.
    # The user-facing docstring is attached at module level from _fun_doc.
    forwarded = {
        "to_replace": to_replace,
        "value": value,
        "inplace": inplace,
        "limit": limit,
        "regex": regex,
        "method": method,
    }
    return _replace(series, **forwarded)
|
|
436
|
+
|
|
437
|
+
|
|
438
|
+
# Attach the shared docstring template to both entry points, substituting
# the "#obj_type#" placeholder with the matching object type name.
for _replace_func, _obj_type_name in (
    (df_replace, "DataFrame"),
    (series_replace, "Series"),
):
    _replace_func.__doc__ = _fun_doc.replace("#obj_type#", _obj_type_name)
del _replace_func, _obj_type_name
|
|
@@ -0,0 +1,13 @@
|
|
|
1
|
+
# Copyright 1999-2024 Alibaba Group Holding Ltd.
|
|
2
|
+
#
|
|
3
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
4
|
+
# you may not use this file except in compliance with the License.
|
|
5
|
+
# You may obtain a copy of the License at
|
|
6
|
+
#
|
|
7
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
8
|
+
#
|
|
9
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
10
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
11
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
12
|
+
# See the License for the specific language governing permissions and
|
|
13
|
+
# limitations under the License.
|
|
@@ -0,0 +1,89 @@
|
|
|
1
|
+
# Copyright 1999-2024 Alibaba Group Holding Ltd.
|
|
2
|
+
#
|
|
3
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
4
|
+
# you may not use this file except in compliance with the License.
|
|
5
|
+
# You may obtain a copy of the License at
|
|
6
|
+
#
|
|
7
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
8
|
+
#
|
|
9
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
10
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
11
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
12
|
+
# See the License for the specific language governing permissions and
|
|
13
|
+
# limitations under the License.
|
|
14
|
+
import random
|
|
15
|
+
|
|
16
|
+
import numpy as np
|
|
17
|
+
import pandas as pd
|
|
18
|
+
import pytest
|
|
19
|
+
|
|
20
|
+
from .... import dataframe as md
|
|
21
|
+
from ...core import MultiIndex
|
|
22
|
+
from .. import isna, isnull, notna, notnull
|
|
23
|
+
|
|
24
|
+
|
|
25
|
+
def test_fill_na():
    """Check that invalid or unsupported ``fillna``/``ffill`` calls raise."""
    raw_frame = pd.DataFrame(np.nan, index=range(0, 20), columns=list("ABCDEFGHIJ"))
    # Overwrite up to 20 randomly chosen cells of the all-NaN frame.
    for _ in range(20):
        cell_value = random.randint(0, 99)
        row_pos = random.randint(0, 19)
        col_pos = random.randint(0, 9)
        raw_frame.iloc[row_pos, col_pos] = cell_value

    raw_series = pd.Series(np.nan, index=range(20))
    for _ in range(3):
        cell_value = random.randint(0, 99)
        raw_series.iloc[random.randint(0, 19)] = cell_value

    frame = md.DataFrame(raw_frame)
    series = md.Series(raw_series)

    rejected_calls = [
        # when nothing supplied, raise
        (ValueError, lambda: frame.fillna()),
        # when both values and methods supplied, raises
        (ValueError, lambda: frame.fillna(value=1, method="ffill")),
        # when call on series, cannot supply DataFrames
        (ValueError, lambda: series.fillna(value=frame)),
        (ValueError, lambda: series.fillna(value=raw_frame)),
        (NotImplementedError, lambda: series.fillna(value=raw_series, downcast="infer")),
        (NotImplementedError, lambda: series.ffill(limit=1)),
    ]
    for expected_error, rejected_call in rejected_calls:
        with pytest.raises(expected_error):
            rejected_call()
|
|
51
|
+
|
|
52
|
+
|
|
53
|
+
@pytest.mark.parametrize("check_func", [isna, isnull, notna, notnull])
def test_isna(check_func):
    """Check that each null-check function raises on a ``MultiIndex``."""
    # multi index: construction stays inside the ``raises`` block
    with pytest.raises(NotImplementedError):
        check_func(MultiIndex())
|
|
59
|
+
|
|
60
|
+
|
|
61
|
+
def test_drop_na():
    """Check that ``dropna`` with ``axis=1`` raises ``NotImplementedError``."""
    # dataframe cases
    raw_frame = pd.DataFrame(np.nan, index=range(0, 20), columns=list("ABCDEFGHIJ"))
    for _ in range(30):
        cell_value = random.randint(0, 99)
        row_pos = random.randint(0, 19)
        col_pos = random.randint(0, 9)
        raw_frame.iloc[row_pos, col_pos] = cell_value

    # Fill one to five randomly chosen rows (possibly repeated) completely.
    full_row_count = random.randint(1, 5)
    for _ in range(full_row_count):
        row_pos = random.randint(0, 19)
        for col_pos in range(0, 10):
            raw_frame.iloc[row_pos, col_pos] = random.randint(0, 99)

    # not supporting drop with axis=1
    with pytest.raises(NotImplementedError):
        md.DataFrame(raw_frame).dropna(axis=1)
|
|
74
|
+
|
|
75
|
+
|
|
76
|
+
def test_replace():
    """Check that ``replace`` with a fill method and ``limit`` raises."""
    # dataframe cases
    raw_frame = pd.DataFrame(-1, index=range(0, 20), columns=list("ABCDEFGHIJ"))
    for _ in range(30):
        cell_value = random.randint(0, 99)
        row_pos = random.randint(0, 19)
        col_pos = random.randint(0, 9)
        raw_frame.iloc[row_pos, col_pos] = cell_value

    # Overwrite one to five randomly chosen rows (possibly repeated) completely.
    full_row_count = random.randint(1, 5)
    for _ in range(full_row_count):
        row_pos = random.randint(0, 19)
        for col_pos in range(0, 10):
            raw_frame.iloc[row_pos, col_pos] = random.randint(0, 99)

    # not supporting fill with limit
    chunked_frame = md.DataFrame(raw_frame, chunk_size=4)
    with pytest.raises(NotImplementedError):
        chunked_frame.replace(-1, method="ffill", limit=5)
|