PyPI - fugue - Versions diffs - 0.8.7.dev8__py3-none-any.whl → 0.9.0__py3-none-any.whl - Mend

fugue 0.8.7.dev8__py3-none-any.whl → 0.9.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (56)

fugue/collections/sql.py +1 -1
fugue/dataframe/utils.py +4 -18
fugue/test/__init__.py +11 -0
fugue/test/pandas_tester.py +24 -0
fugue/test/plugins.py +393 -0
{fugue-0.8.7.dev8.dist-info → fugue-0.9.0.dist-info}/METADATA +24 -15
{fugue-0.8.7.dev8.dist-info → fugue-0.9.0.dist-info}/RECORD +38 -47
{fugue-0.8.7.dev8.dist-info → fugue-0.9.0.dist-info}/WHEEL +1 -1
fugue-0.9.0.dist-info/entry_points.txt +12 -0
fugue_dask/_io.py +8 -5
fugue_dask/_utils.py +4 -4
fugue_dask/execution_engine.py +11 -0
fugue_dask/registry.py +2 -0
fugue_dask/tester.py +24 -0
fugue_duckdb/__init__.py +0 -5
fugue_duckdb/_io.py +1 -0
fugue_duckdb/registry.py +30 -2
fugue_duckdb/tester.py +49 -0
fugue_ibis/__init__.py +0 -3
fugue_ibis/dataframe.py +2 -2
fugue_ibis/execution_engine.py +14 -7
fugue_ray/_constants.py +3 -4
fugue_ray/_utils/dataframe.py +10 -21
fugue_ray/_utils/io.py +38 -9
fugue_ray/execution_engine.py +1 -2
fugue_ray/registry.py +1 -0
fugue_ray/tester.py +22 -0
fugue_spark/execution_engine.py +5 -5
fugue_spark/registry.py +13 -1
fugue_spark/tester.py +78 -0
fugue_test/__init__.py +82 -0
fugue_test/builtin_suite.py +26 -43
fugue_test/dataframe_suite.py +5 -14
fugue_test/execution_suite.py +170 -143
fugue_test/fixtures.py +61 -0
fugue_version/__init__.py +1 -1
fugue-0.8.7.dev8.dist-info/entry_points.txt +0 -17
fugue_dask/ibis_engine.py +0 -62
fugue_duckdb/ibis_engine.py +0 -56
fugue_ibis/execution/__init__.py +0 -0
fugue_ibis/execution/ibis_engine.py +0 -49
fugue_ibis/execution/pandas_backend.py +0 -54
fugue_ibis/extensions.py +0 -203
fugue_spark/ibis_engine.py +0 -45
fugue_test/ibis_suite.py +0 -92
fugue_test/plugins/__init__.py +0 -0
fugue_test/plugins/dask/__init__.py +0 -2
fugue_test/plugins/dask/fixtures.py +0 -12
fugue_test/plugins/duckdb/__init__.py +0 -2
fugue_test/plugins/duckdb/fixtures.py +0 -9
fugue_test/plugins/misc/__init__.py +0 -2
fugue_test/plugins/misc/fixtures.py +0 -18
fugue_test/plugins/ray/__init__.py +0 -2
fugue_test/plugins/ray/fixtures.py +0 -9
{fugue-0.8.7.dev8.dist-info → fugue-0.9.0.dist-info}/LICENSE +0 -0
{fugue-0.8.7.dev8.dist-info → fugue-0.9.0.dist-info}/top_level.txt +0 -0

fugue_test/execution_suite.py CHANGED

@@ -10,7 +10,6 @@ import copy
 import os
 import pickle
 from datetime import datetime
-from unittest import TestCase
 import pandas as pd
 import pytest
@@ -20,17 +19,15 @@ from triad.utils.io import isfile, makedirs, touch
 import fugue.api as fa
 import fugue.column.functions as ff
+import fugue.test as ft
 from fugue import (
     ArrayDataFrame,
     DataFrame,
     DataFrames,
-    ExecutionEngine,
     PandasDataFrame,
     PartitionSpec,
-    register_default_sql_engine,
 )
 from fugue.column import all_cols, col, lit
-from fugue.dataframe.utils import _df_eq as df_eq
 from fugue.execution.native_execution_engine import NativeExecutionEngine
@@ -40,25 +37,7 @@ class ExecutionEngineTests(object):
     should pass this test suite.
     """
-    class Tests(TestCase):
-        @classmethod
-        def setUpClass(cls):
-            register_default_sql_engine(lambda engine: engine.sql_engine)
-            cls._engine = cls.make_engine(cls)
-            fa.set_global_engine(cls._engine)
-        @property
-        def engine(self) -> ExecutionEngine:
-            return self._engine  # type: ignore
-        @classmethod
-        def tearDownClass(cls):
-            fa.clear_global_engine()
-            cls._engine.stop()
-        def make_engine(self) -> ExecutionEngine:  # pragma: no cover
-            raise NotImplementedError
+    class Tests(ft.FugueTestSuite):
         def test_init(self):
             print(self.engine)
             assert self.engine.log is not None
@@ -76,19 +55,19 @@ class ExecutionEngineTests(object):
             )
             # all engines should accept these types of inputs
             # should take fugue.DataFrame
-            df_eq(o, fa.as_fugue_engine_df(e, o), throw=True)
+            self.df_eq(o, fa.as_fugue_engine_df(e, o), throw=True)
             # should take array, shema
-            df_eq(
+            self.df_eq(
                 o,
                 fa.as_fugue_engine_df(e, [[1.1, 2.2], [3.3, 4.4]], "a:double,b:double"),
                 throw=True,
             )
             # should take pandas dataframe
             pdf = pd.DataFrame([[1.1, 2.2], [3.3, 4.4]], columns=["a", "b"])
-            df_eq(o, fa.as_fugue_engine_df(e, pdf), throw=True)
+            self.df_eq(o, fa.as_fugue_engine_df(e, pdf), throw=True)
             # should convert string to datetime in to_df
-            df_eq(
+            self.df_eq(
                 fa.as_fugue_engine_df(e, [["2020-01-01"]], "a:datetime"),
                 [[datetime(2020, 1, 1)]],
                 "a:datetime",
@@ -99,7 +78,7 @@ class ExecutionEngineTests(object):
             o = ArrayDataFrame([], "a:double,b:str")
             pdf = pd.DataFrame([[0.1, "a"]], columns=["a", "b"])
             pdf = pdf[pdf.a < 0]
-            df_eq(o, fa.as_fugue_engine_df(e, pdf), throw=True)
+            self.df_eq(o, fa.as_fugue_engine_df(e, pdf), throw=True)
         @pytest.mark.skipif(not HAS_QPD, reason="qpd not working")
         def test_filter(self):
@@ -108,11 +87,11 @@ class ExecutionEngineTests(object):
                 "a:double,b:int",
             )
             b = fa.filter(a, col("a").not_null())
-            df_eq(b, [[1, 2], [3, 4]], "a:double,b:int", throw=True)
+            self.df_eq(b, [[1, 2], [3, 4]], "a:double,b:int", throw=True)
             c = fa.filter(a, col("a").not_null() & (col("b") < 3))
-            df_eq(c, [[1, 2]], "a:double,b:int", throw=True)
+            self.df_eq(c, [[1, 2]], "a:double,b:int", throw=True)
             c = fa.filter(a, col("a") + col("b") == 3)
-            df_eq(c, [[1, 2]], "a:double,b:int", throw=True)
+            self.df_eq(c, [[1, 2]], "a:double,b:int", throw=True)
         @pytest.mark.skipif(not HAS_QPD, reason="qpd not working")
         def test_select(self):
@@ -122,7 +101,7 @@ class ExecutionEngineTests(object):
             # simple
             b = fa.select(a, col("b"), (col("b") + 1).alias("c").cast(str))
-            df_eq(
+            self.df_eq(
                 b,
                 [[2, "3"], [2, "3"], [1, "2"], [4, "5"], [4, "5"]],
                 "b:int,c:str",
@@ -133,7 +112,7 @@ class ExecutionEngineTests(object):
             b = fa.select(
                 a, col("b"), (col("b") + 1).alias("c").cast(str), distinct=True
             )
-            df_eq(
+            self.df_eq(
                 b,
                 [[2, "3"], [1, "2"], [4, "5"]],
                 "b:int,c:str",
@@ -142,11 +121,11 @@ class ExecutionEngineTests(object):
             # wildcard
             b = fa.select(a, all_cols(), where=col("a") + col("b") == 3)
-            df_eq(b, [[1, 2]], "a:double,b:int", throw=True)
+            self.df_eq(b, [[1, 2]], "a:double,b:int", throw=True)
             # aggregation
             b = fa.select(a, col("a"), ff.sum(col("b")).cast(float).alias("b"))
-            df_eq(b, [[1, 2], [3, 4], [None, 7]], "a:double,b:double", throw=True)
+            self.df_eq(b, [[1, 2], [3, 4], [None, 7]], "a:double,b:double", throw=True)
             # having
             # https://github.com/fugue-project/fugue/issues/222
@@ -157,7 +136,7 @@ class ExecutionEngineTests(object):
                 col_b.cast(float).alias("c"),
                 having=(col_b >= 7) | (col("a") == 1),
             )
-            df_eq(b, [[1, 2], [None, 7]], "a:double,c:double", throw=True)
+            self.df_eq(b, [[1, 2], [None, 7]], "a:double,c:double", throw=True)
             # literal + alias inference
             # https://github.com/fugue-project/fugue/issues/222
@@ -169,7 +148,7 @@ class ExecutionEngineTests(object):
                 col_b.cast(float).alias("c"),
                 having=(col_b >= 7) | (col("a") == 1),
             )
-            df_eq(
+            self.df_eq(
                 b, [[1, "1", 2], [None, "1", 7]], "a:double,o:str,c:double", throw=True
             )
@@ -180,7 +159,7 @@ class ExecutionEngineTests(object):
             )
             b = fa.assign(a, x=1, b=col("b").cast(str), c=(col("b") + 1).cast(int))
-            df_eq(
+            self.df_eq(
                 b,
                 [
                     [1, "2", 1, 3],
@@ -204,7 +183,7 @@ class ExecutionEngineTests(object):
                 b=ff.max(col("b")),
                 c=(ff.max(col("b")) * 2).cast("int32").alias("c"),
             )
-            df_eq(b, [[4, 8]], "b:int,c:int", throw=True)
+            self.df_eq(b, [[4, 8]], "b:int,c:int", throw=True)
             b = fa.aggregate(
                 a,
@@ -212,7 +191,7 @@ class ExecutionEngineTests(object):
                 b=ff.max(col("b")),
                 c=(ff.max(col("b")) * 2).cast("int32").alias("c"),
             )
-            df_eq(
+            self.df_eq(
                 b,
                 [[None, 4, 8], [1, 2, 4], [3, 4, 8]],
                 "a:double,b:int,c:int",
@@ -241,17 +220,17 @@ class ExecutionEngineTests(object):
             a = fa.as_fugue_engine_df(e, o)
             # no partition
             c = e.map_engine.map_dataframe(a, noop, a.schema, PartitionSpec())
-            df_eq(c, o, throw=True)
+            self.df_eq(c, o, throw=True)
             # with key partition
             c = e.map_engine.map_dataframe(
                 a, noop, a.schema, PartitionSpec(by=["a"], presort="b")
             )
-            df_eq(c, o, throw=True)
+            self.df_eq(c, o, throw=True)
             # select top
             c = e.map_engine.map_dataframe(
                 a, select_top, a.schema, PartitionSpec(by=["a"], presort="b")
             )
-            df_eq(c, [[None, 1], [1, 2], [3, 4]], "a:double,b:int", throw=True)
+            self.df_eq(c, [[None, 1], [1, 2], [3, 4]], "a:double,b:int", throw=True)
             # select top with another order
             c = e.map_engine.map_dataframe(
                 a,
@@ -259,7 +238,7 @@ class ExecutionEngineTests(object):
                 a.schema,
                 PartitionSpec(partition_by=["a"], presort="b DESC"),
             )
-            df_eq(
+            self.df_eq(
                 c,
                 [[None, 4], [1, 2], [3, 4]],
                 "a:double,b:int",
@@ -273,7 +252,7 @@ class ExecutionEngineTests(object):
                 PartitionSpec(partition_by=["a"], presort="b DESC", num_partitions=3),
                 on_init=on_init,
             )
-            df_eq(c, [[None, 4], [1, 2], [3, 4]], "a:double,b:int", throw=True)
+            self.df_eq(c, [[None, 4], [1, 2], [3, 4]], "a:double,b:int", throw=True)
         def test_map_with_special_values(self):
             def with_nat(cursor, data):
@@ -290,7 +269,7 @@ class ExecutionEngineTests(object):
             c = e.map_engine.map_dataframe(
                 o, select_top, o.schema, PartitionSpec(by=["a", "b"], presort="c")
             )
-            df_eq(
+            self.df_eq(
                 c,
                 [[1, None, 0], [None, None, 2]],
                 "a:double,b:double,c:int",
@@ -311,7 +290,7 @@ class ExecutionEngineTests(object):
             c = e.map_engine.map_dataframe(
                 o, select_top, o.schema, PartitionSpec(by=["a", "c"], presort="b DESC")
             )
-            df_eq(
+            self.df_eq(
                 c,
                 [[None, 4, None], [dt, 5, 1]],
                 "a:datetime,b:int,c:double",
@@ -320,7 +299,7 @@ class ExecutionEngineTests(object):
             d = e.map_engine.map_dataframe(
                 c, with_nat, "a:datetime,b:int,c:double,nat:datetime", PartitionSpec()
             )
-            df_eq(
+            self.df_eq(
                 d,
                 [[None, 4, None, None], [dt, 5, 1, None]],
                 "a:datetime,b:int,c:double,nat:datetime",
@@ -331,7 +310,7 @@ class ExecutionEngineTests(object):
             c = e.map_engine.map_dataframe(
                 o, select_top, o.schema, PartitionSpec(by=["a"])
             )
-            df_eq(c, o, check_order=True, throw=True)
+            self.df_eq(c, o, check_order=True, throw=True)
         def test_map_with_dict_col(self):
             e = self.engine
@@ -341,7 +320,7 @@ class ExecutionEngineTests(object):
             c = e.map_engine.map_dataframe(
                 o, select_top, o.schema, PartitionSpec(by=["a"])
             )
-            df_eq(c, o, no_pandas=True, check_order=True, throw=True)
+            self.df_eq(c, o, no_pandas=True, check_order=True, throw=True)
             # input has dict, output doesn't
             def mp2(cursor, data):
@@ -350,7 +329,7 @@ class ExecutionEngineTests(object):
             c = e.map_engine.map_dataframe(
                 o, mp2, "a:datetime", PartitionSpec(by=["a"])
             )
-            df_eq(
+            self.df_eq(
                 c,
                 PandasDataFrame([[dt]], "a:datetime"),
                 no_pandas=True,
@@ -365,7 +344,7 @@ class ExecutionEngineTests(object):
             c = e.map_engine.map_dataframe(
                 c, mp3, "a:datetime,b:{a:long}", PartitionSpec(by=["a"])
             )
-            df_eq(c, o, no_pandas=True, check_order=True, throw=True)
+            self.df_eq(c, o, no_pandas=True, check_order=True, throw=True)
         def test_map_with_binary(self):
             e = self.engine
@@ -381,7 +360,7 @@ class ExecutionEngineTests(object):
                 ],
                 "a:bytes",
             )
-            df_eq(expected, c, no_pandas=True, check_order=True, throw=True)
+            self.df_eq(expected, c, no_pandas=True, check_order=False, throw=True)
         def test_join_multiple(self):
             e = self.engine
@@ -389,7 +368,7 @@ class ExecutionEngineTests(object):
             b = fa.as_fugue_engine_df(e, [[1, 20], [3, 40]], "a:int,c:int")
             c = fa.as_fugue_engine_df(e, [[1, 200], [3, 400]], "a:int,d:int")
             d = fa.inner_join(a, b, c)
-            df_eq(
+            self.df_eq(
                 d,
                 [[1, 2, 20, 200], [3, 4, 40, 400]],
                 "a:int,b:int,c:int,d:int",
@@ -401,7 +380,7 @@ class ExecutionEngineTests(object):
             a = fa.as_fugue_engine_df(e, [[1, 2], [3, 4]], "a:int,b:int")
             b = fa.as_fugue_engine_df(e, [[6], [7]], "c:int")
             c = fa.join(a, b, how="Cross")
-            df_eq(
+            self.df_eq(
                 c,
                 [[1, 2, 6], [1, 2, 7], [3, 4, 6], [3, 4, 7]],
                 "a:int,b:int,c:int",
@@ -410,26 +389,26 @@ class ExecutionEngineTests(object):
             b = fa.as_fugue_engine_df(e, [], "c:int")
             c = fa.cross_join(a, b)
-            df_eq(c, [], "a:int,b:int,c:int", throw=True)
+            self.df_eq(c, [], "a:int,b:int,c:int", throw=True)
             a = fa.as_fugue_engine_df(e, [], "a:int,b:int")
             b = fa.as_fugue_engine_df(e, [], "c:int")
             c = fa.join(a, b, how="Cross")
-            df_eq(c, [], "a:int,b:int,c:int", throw=True)
+            self.df_eq(c, [], "a:int,b:int,c:int", throw=True)
         def test__join_inner(self):
             e = self.engine
             a = fa.as_fugue_engine_df(e, [[1, 2], [3, 4]], "a:int,b:int")
             b = fa.as_fugue_engine_df(e, [[6, 1], [2, 7]], "c:int,a:int")
             c = fa.join(a, b, how="INNER", on=["a"])
-            df_eq(c, [[1, 2, 6]], "a:int,b:int,c:int", throw=True)
+            self.df_eq(c, [[1, 2, 6]], "a:int,b:int,c:int", throw=True)
             c = fa.inner_join(b, a)
-            df_eq(c, [[6, 1, 2]], "c:int,a:int,b:int", throw=True)
+            self.df_eq(c, [[6, 1, 2]], "c:int,a:int,b:int", throw=True)
             a = fa.as_fugue_engine_df(e, [], "a:int,b:int")
             b = fa.as_fugue_engine_df(e, [], "c:int,a:int")
             c = fa.join(a, b, how="INNER", on=["a"])
-            df_eq(c, [], "a:int,b:int,c:int", throw=True)
+            self.df_eq(c, [], "a:int,b:int,c:int", throw=True)
         def test__join_outer(self):
             e = self.engine
@@ -437,34 +416,38 @@ class ExecutionEngineTests(object):
             a = fa.as_fugue_engine_df(e, [], "a:int,b:int")
             b = fa.as_fugue_engine_df(e, [], "c:str,a:int")
             c = fa.left_outer_join(a, b)
-            df_eq(c, [], "a:int,b:int,c:str", throw=True)
+            self.df_eq(c, [], "a:int,b:int,c:str", throw=True)
             a = fa.as_fugue_engine_df(e, [], "a:int,b:str")
             b = fa.as_fugue_engine_df(e, [], "c:int,a:int")
             c = fa.right_outer_join(a, b)
-            df_eq(c, [], "a:int,b:str,c:int", throw=True)
+            self.df_eq(c, [], "a:int,b:str,c:int", throw=True)
             a = fa.as_fugue_engine_df(e, [], "a:int,b:str")
             b = fa.as_fugue_engine_df(e, [], "c:str,a:int")
             c = fa.full_outer_join(a, b)
-            df_eq(c, [], "a:int,b:str,c:str", throw=True)
+            self.df_eq(c, [], "a:int,b:str,c:str", throw=True)
             a = fa.as_fugue_engine_df(e, [[1, "2"], [3, "4"]], "a:int,b:str")
             b = fa.as_fugue_engine_df(e, [["6", 1], ["2", 7]], "c:str,a:int")
             c = fa.join(a, b, how="left_OUTER", on=["a"])
-            df_eq(c, [[1, "2", "6"], [3, "4", None]], "a:int,b:str,c:str", throw=True)
+            self.df_eq(
+                c, [[1, "2", "6"], [3, "4", None]], "a:int,b:str,c:str", throw=True
+            )
             c = fa.join(b, a, how="left_outer", on=["a"])
-            df_eq(c, [["6", 1, "2"], ["2", 7, None]], "c:str,a:int,b:str", throw=True)
+            self.df_eq(
+                c, [["6", 1, "2"], ["2", 7, None]], "c:str,a:int,b:str", throw=True
+            )
             a = fa.as_fugue_engine_df(e, [[1, "2"], [3, "4"]], "a:int,b:str")
             b = fa.as_fugue_engine_df(e, [[6, 1], [2, 7]], "c:double,a:int")
             c = fa.join(a, b, how="left_OUTER", on=["a"])
-            df_eq(
+            self.df_eq(
                 c, [[1, "2", 6.0], [3, "4", None]], "a:int,b:str,c:double", throw=True
             )
             c = fa.join(b, a, how="left_outer", on=["a"])
             # assert c.as_pandas().values.tolist()[1][2] is None
-            df_eq(
+            self.df_eq(
                 c, [[6.0, 1, "2"], [2.0, 7, None]], "c:double,a:int,b:str", throw=True
             )
@@ -472,10 +455,12 @@ class ExecutionEngineTests(object):
             b = fa.as_fugue_engine_df(e, [["6", 1], ["2", 7]], "c:str,a:int")
             c = fa.join(a, b, how="right_outer", on=["a"])
             # assert c.as_pandas().values.tolist()[1][1] is None
-            df_eq(c, [[1, "2", "6"], [7, None, "2"]], "a:int,b:str,c:str", throw=True)
+            self.df_eq(
+                c, [[1, "2", "6"], [7, None, "2"]], "a:int,b:str,c:str", throw=True
+            )
             c = fa.join(a, b, how="full_outer", on=["a"])
-            df_eq(
+            self.df_eq(
                 c,
                 [[1, "2", "6"], [3, "4", None], [7, None, "2"]],
                 "a:int,b:str,c:str",
@@ -488,21 +473,23 @@ class ExecutionEngineTests(object):
             a = fa.as_fugue_engine_df(e, [[1, "2"], [3, "4"]], "a:int,b:str")
             b = fa.as_fugue_engine_df(e, [[6, 1], [2, 7]], "c:int,a:int")
             c = fa.join(a, b, how="left_OUTER", on=["a"])
-            df_eq(
+            self.df_eq(
                 c,
                 [[1, "2", 6], [3, "4", None]],
                 "a:int,b:str,c:int",
                 throw=True,
             )
             c = fa.join(b, a, how="left_outer", on=["a"])
-            df_eq(c, [[6, 1, "2"], [2, 7, None]], "c:int,a:int,b:str", throw=True)
+            self.df_eq(c, [[6, 1, "2"], [2, 7, None]], "c:int,a:int,b:str", throw=True)
             a = fa.as_fugue_engine_df(e, [[1, "2"], [3, "4"]], "a:int,b:str")
             b = fa.as_fugue_engine_df(e, [[True, 1], [False, 7]], "c:bool,a:int")
             c = fa.join(a, b, how="left_OUTER", on=["a"])
-            df_eq(c, [[1, "2", True], [3, "4", None]], "a:int,b:str,c:bool", throw=True)
+            self.df_eq(
+                c, [[1, "2", True], [3, "4", None]], "a:int,b:str,c:bool", throw=True
+            )
             c = fa.join(b, a, how="left_outer", on=["a"])
-            df_eq(
+            self.df_eq(
                 c, [[True, 1, "2"], [False, 7, None]], "c:bool,a:int,b:str", throw=True
             )
@@ -511,36 +498,36 @@ class ExecutionEngineTests(object):
             a = fa.as_fugue_engine_df(e, [[1, 2], [3, 4]], "a:int,b:int")
             b = fa.as_fugue_engine_df(e, [[6, 1], [2, 7]], "c:int,a:int")
             c = fa.join(a, b, how="semi", on=["a"])
-            df_eq(c, [[1, 2]], "a:int,b:int", throw=True)
+            self.df_eq(c, [[1, 2]], "a:int,b:int", throw=True)
             c = fa.semi_join(b, a)
-            df_eq(c, [[6, 1]], "c:int,a:int", throw=True)
+            self.df_eq(c, [[6, 1]], "c:int,a:int", throw=True)
             b = fa.as_fugue_engine_df(e, [], "c:int,a:int")
             c = fa.join(a, b, how="semi", on=["a"])
-            df_eq(c, [], "a:int,b:int", throw=True)
+            self.df_eq(c, [], "a:int,b:int", throw=True)
             a = fa.as_fugue_engine_df(e, [], "a:int,b:int")
             b = fa.as_fugue_engine_df(e, [], "c:int,a:int")
             c = fa.join(a, b, how="semi", on=["a"])
-            df_eq(c, [], "a:int,b:int", throw=True)
+            self.df_eq(c, [], "a:int,b:int", throw=True)
         def test__join_anti(self):
             e = self.engine
             a = fa.as_fugue_engine_df(e, [[1, 2], [3, 4]], "a:int,b:int")
             b = fa.as_fugue_engine_df(e, [[6, 1], [2, 7]], "c:int,a:int")
             c = fa.join(a, b, how="anti", on=["a"])
-            df_eq(c, [[3, 4]], "a:int,b:int", throw=True)
+            self.df_eq(c, [[3, 4]], "a:int,b:int", throw=True)
             c = fa.anti_join(b, a)
-            df_eq(c, [[2, 7]], "c:int,a:int", throw=True)
+            self.df_eq(c, [[2, 7]], "c:int,a:int", throw=True)
             b = fa.as_fugue_engine_df(e, [], "c:int,a:int")
             c = fa.join(a, b, how="anti", on=["a"])
-            df_eq(c, [[1, 2], [3, 4]], "a:int,b:int", throw=True)
+            self.df_eq(c, [[1, 2], [3, 4]], "a:int,b:int", throw=True)
             a = fa.as_fugue_engine_df(e, [], "a:int,b:int")
             b = fa.as_fugue_engine_df(e, [], "c:int,a:int")
             c = fa.join(a, b, how="anti", on=["a"])
-            df_eq(c, [], "a:int,b:int", throw=True)
+            self.df_eq(c, [], "a:int,b:int", throw=True)
         def test__join_with_null_keys(self):
             # SQL will not match null values
@@ -552,7 +539,7 @@ class ExecutionEngineTests(object):
                 e, [[1, 2, 33], [4, None, 63]], "a:double,b:double,d:int"
             )
             c = fa.join(a, b, how="INNER")
-            df_eq(c, [[1, 2, 3, 33]], "a:double,b:double,c:int,d:int", throw=True)
+            self.df_eq(c, [[1, 2, 3, 33]], "a:double,b:double,c:int,d:int", throw=True)
         def test_union(self):
             e = self.engine
@@ -563,21 +550,21 @@ class ExecutionEngineTests(object):
                 e, [[1, 2, 33], [4, None, 6]], "a:double,b:double,c:int"
             )
             c = fa.union(a, b)
-            df_eq(
+            self.df_eq(
                 c,
                 [[1, 2, 3], [4, None, 6], [1, 2, 33]],
                 "a:double,b:double,c:int",
                 throw=True,
             )
             c = fa.union(a, b, distinct=False)
-            df_eq(
+            self.df_eq(
                 c,
                 [[1, 2, 3], [4, None, 6], [1, 2, 33], [4, None, 6]],
                 "a:double,b:double,c:int",
                 throw=True,
             )
             d = fa.union(a, b, c, distinct=False)
-            df_eq(
+            self.df_eq(
                 d,
                 [
                     [1, 2, 3],
@@ -602,7 +589,7 @@ class ExecutionEngineTests(object):
                 e, [[1, 2, 33], [4, None, 6]], "a:double,b:double,c:int"
             )
             c = fa.subtract(a, b)
-            df_eq(
+            self.df_eq(
                 c,
                 [[1, 2, 3]],
                 "a:double,b:double,c:int",
@@ -611,7 +598,7 @@ class ExecutionEngineTests(object):
             x = fa.as_fugue_engine_df(e, [[1, 2, 33]], "a:double,b:double,c:int")
             y = fa.as_fugue_engine_df(e, [[4, None, 6]], "a:double,b:double,c:int")
             z = fa.subtract(a, x, y)
-            df_eq(
+            self.df_eq(
                 z,
                 [[1, 2, 3]],
                 "a:double,b:double,c:int",
@@ -619,7 +606,7 @@ class ExecutionEngineTests(object):
             )
             # TODO: EXCEPT ALL is not implemented (QPD issue)
             # c = fa.subtract(a, b, distinct=False)
-            # df_eq(
+            # self.df_eq(
             #     c,
             #     [[1, 2, 3], [1, 2, 3]],
             #     "a:double,b:double,c:int",
@@ -637,7 +624,7 @@ class ExecutionEngineTests(object):
                 "a:double,b:double,c:int",
             )
             c = fa.intersect(a, b)
-            df_eq(
+            self.df_eq(
                 c,
                 [[4, None, 6]],
                 "a:double,b:double,c:int",
@@ -654,7 +641,7 @@ class ExecutionEngineTests(object):
                 "a:double,b:double,c:int",
             )
             z = fa.intersect(a, x, y)
-            df_eq(
+            self.df_eq(
                 z,
                 [],
                 "a:double,b:double,c:int",
@@ -662,7 +649,7 @@ class ExecutionEngineTests(object):
             )
             # TODO: INTERSECT ALL is not implemented (QPD issue)
             # c = fa.intersect(a, b, distinct=False)
-            # df_eq(
+            # self.df_eq(
             #     c,
             #     [[4, None, 6], [4, None, 6]],
             #     "a:double,b:double,c:int",
@@ -675,7 +662,7 @@ class ExecutionEngineTests(object):
                 e, [[4, None, 6], [1, 2, 3], [4, None, 6]], "a:double,b:double,c:int"
             )
             c = fa.distinct(a)
-            df_eq(
+            self.df_eq(
                 c,
                 [[4, None, 6], [1, 2, 3]],
                 "a:double,b:double,c:int",
@@ -694,25 +681,25 @@ class ExecutionEngineTests(object):
             f = fa.dropna(a, how="any", thresh=2)
             g = fa.dropna(a, how="any", subset=["a", "c"])
             h = fa.dropna(a, how="any", thresh=1, subset=["a", "c"])
-            df_eq(
+            self.df_eq(
                 c,
                 [[1, 2, 3]],
                 "a:double,b:double,c:double",
                 throw=True,
             )
-            df_eq(
+            self.df_eq(
                 d,
                 [[4, None, 6], [1, 2, 3], [4, None, None]],
                 "a:double,b:double,c:double",
                 throw=True,
             )
-            df_eq(
+            self.df_eq(
                 f, [[4, None, 6], [1, 2, 3]], "a:double,b:double,c:double", throw=True
             )
-            df_eq(
+            self.df_eq(
                 g, [[4, None, 6], [1, 2, 3]], "a:double,b:double,c:double", throw=True
             )
-            df_eq(
+            self.df_eq(
                 h,
                 [[4, None, 6], [1, 2, 3], [4, None, None]],
                 "a:double,b:double,c:double",
@@ -730,25 +717,25 @@ class ExecutionEngineTests(object):
             d = fa.fillna(a, {"b": 99, "c": -99})
             f = fa.fillna(a, value=-99, subset=["c"])
             g = fa.fillna(a, {"b": 99, "c": -99}, subset=["c"])  # subset ignored
-            df_eq(
+            self.df_eq(
                 c,
                 [[4, 1, 6], [1, 2, 3], [4, 1, 1]],
                 "a:double,b:double,c:double",
                 throw=True,
             )
-            df_eq(
+            self.df_eq(
                 d,
                 [[4, 99, 6], [1, 2, 3], [4, 99, -99]],
                 "a:double,b:double,c:double",
                 throw=True,
             )
-            df_eq(
+            self.df_eq(
                 f,
                 [[4, None, 6], [1, 2, 3], [4, None, -99]],
                 "a:double,b:double,c:double",
                 throw=True,
             )
-            df_eq(g, d, throw=True)
+            self.df_eq(g, d, throw=True)
             raises(ValueError, lambda: fa.fillna(a, {"b": None, c: "99"}))
             raises(ValueError, lambda: fa.fillna(a, None))
             # raises(ValueError, lambda: fa.fillna(a, ["b"]))
@@ -767,9 +754,9 @@ class ExecutionEngineTests(object):
             h = fa.sample(a, frac=0.8, seed=1)
             h2 = fa.sample(a, frac=0.8, seed=1)
             i = fa.sample(a, frac=0.8, seed=2)
-            assert not df_eq(f, g, throw=False)
-            df_eq(h, h2, throw=True)
-            assert not df_eq(h, i, throw=False)
+            assert not self.df_eq(f, g, throw=False)
+            self.df_eq(h, h2, throw=True)
+            assert not self.df_eq(h, i, throw=False)
             assert abs(len(i.as_array()) - 80) < 10
         def test_take(self):
@@ -794,37 +781,37 @@ class ExecutionEngineTests(object):
             f = fa.take(a, n=1, presort=None, partition=ps2)
             g = fa.take(a, n=2, presort="a desc", na_position="last")
             h = fa.take(a, n=2, presort="a", na_position="first")
-            df_eq(
+            self.df_eq(
                 b,
                 [[None, 4, 2]],
                 "a:str,b:int,c:long",
                 throw=True,
             )
-            df_eq(
+            self.df_eq(
                 c,
                 [[None, 4, 2], [None, 2, 1]],
                 "a:str,b:int,c:long",
                 throw=True,
             )
-            df_eq(
+            self.df_eq(
                 d,
                 [["a", 3, 4], ["b", 2, 2], [None, 4, 2]],
                 "a:str,b:int,c:long",
                 throw=True,
             )
-            df_eq(
+            self.df_eq(
                 f,
                 [["a", 2, 3], ["a", 3, 4], ["b", 1, 2], [None, 2, 1]],
                 "a:str,b:int,c:long",
                 throw=True,
             )
-            df_eq(
+            self.df_eq(
                 g,
                 [["b", 1, 2], ["b", 2, 2]],
                 "a:str,b:int,c:long",
                 throw=True,
             )
-            df_eq(
+            self.df_eq(
                 h,
                 [
                     [None, 4, 2],
@@ -833,6 +820,46 @@ class ExecutionEngineTests(object):
                 "a:str,b:int,c:long",
                 throw=True,
             )
+            a = fa.as_fugue_engine_df(
+                e,
+                [
+                    ["a", 2, 3],
+                    [None, 4, 2],
+                    [None, 2, 1],
+                ],
+                "a:str,b:int,c:long",
+            )
+            i = fa.take(a, n=1, partition="a", presort=None)
+            case1 = self.df_eq(
+                i,
+                [
+                    ["a", 2, 3],
+                    [None, 4, 2],
+                ],
+                "a:str,b:int,c:long",
+                throw=False,
+            )
+            case2 = self.df_eq(
+                i,
+                [
+                    ["a", 2, 3],
+                    [None, 2, 1],
+                ],
+                "a:str,b:int,c:long",
+                throw=False,
+            )
+            assert case1 or case2
+            j = fa.take(a, n=2, partition="a", presort=None)
+            self.df_eq(
+                j,
+                [
+                    ["a", 2, 3],
+                    [None, 4, 2],
+                    [None, 2, 1],
+                ],
+                "a:str,b:int,c:long",
+                throw=True,
+            )
             raises(ValueError, lambda: fa.take(a, n=0.5, presort=None))
         def test_sample_n(self):
@@ -844,9 +871,9 @@ class ExecutionEngineTests(object):
             d = fa.sample(a, n=90, seed=1)
             d2 = fa.sample(a, n=90, seed=1)
             e = fa.sample(a, n=90, seed=2)
-            assert not df_eq(b, c, throw=False)
-            df_eq(d, d2, throw=True)
-            assert not df_eq(d, e, throw=False)
+            assert not self.df_eq(b, c, throw=False)
+            self.df_eq(d, d2, throw=True)
+            assert not self.df_eq(d, e, throw=False)
             assert abs(len(e.as_array()) - 90) < 2
         def test_comap(self):
@@ -902,11 +929,11 @@ class ExecutionEngineTests(object):
                 PartitionSpec(),
                 on_init=on_init,
             )
-            df_eq(res, [[1, "_02,_11"]], "a:int,v:str", throw=True)
+            self.df_eq(res, [[1, "_02,_11"]], "a:int,v:str", throw=True)
             # for outer joins, the NULL will be filled with empty dataframe
             res = e.comap(z2, comap, "a:int,v:str", PartitionSpec())
-            df_eq(
+            self.df_eq(
                 res,
                 [[1, "_02,_11"], [3, "_01,_10"]],
                 "a:int,v:str",
@@ -914,7 +941,7 @@ class ExecutionEngineTests(object):
             )
             res = e.comap(z3, comap, "a:int,v:str", PartitionSpec())
-            df_eq(
+            self.df_eq(
                 res,
                 [[1, "_01,_12"], [3, "_00,_11"]],
                 "a:int,v:str",
@@ -922,10 +949,10 @@ class ExecutionEngineTests(object):
             )
             res = e.comap(z4, comap, "v:str", PartitionSpec())
-            df_eq(res, [["_03,_12"]], "v:str", throw=True)
+            self.df_eq(res, [["_03,_12"]], "v:str", throw=True)
             res = e.comap(z5, comap, "a:int,v:str", PartitionSpec())
-            df_eq(
+            self.df_eq(
                 res,
                 [[1, "_02,_11"], [3, "_01,_10"], [7, "_00,_11"]],
                 "a:int,v:str",
@@ -963,7 +990,7 @@ class ExecutionEngineTests(object):
                 PartitionSpec(),
                 on_init=on_init,
             )
-            df_eq(res, [[1, "x2,y1"]], "a:int,v:str", throw=True)
+            self.df_eq(res, [[1, "x2,y1"]], "a:int,v:str", throw=True)
             res = e.comap(
                 z2,
@@ -972,7 +999,7 @@ class ExecutionEngineTests(object):
                 PartitionSpec(),
                 on_init=on_init,
             )
-            df_eq(res, [[1, "x2,y1,z1"]], "a:int,v:str", throw=True)
+            self.df_eq(res, [[1, "x2,y1,z1"]], "a:int,v:str", throw=True)
             res = e.comap(
                 z3,
@@ -981,10 +1008,10 @@ class ExecutionEngineTests(object):
                 PartitionSpec(),
                 on_init=on_init,
             )
-            df_eq(res, [[1, "z1"]], "a:int,v:str", throw=True)
+            self.df_eq(res, [[1, "z1"]], "a:int,v:str", throw=True)
         @pytest.fixture(autouse=True)
-        def init_tmpdir(self, tmpdir, tmp_mem_dir):
+        def init_tmpdir(self, tmpdir):
             self.tmpdir = tmpdir
         def test_save_single_and_load_parquet(self):
@@ -995,20 +1022,20 @@ class ExecutionEngineTests(object):
             fa.save(b, path, format_hint="parquet", force_single=True)
             assert isfile(path)
             c = fa.load(path, format_hint="parquet", columns=["a", "c"], as_fugue=True)
-            df_eq(c, [[1, 6], [7, 2]], "a:long,c:int", throw=True)
+            self.df_eq(c, [[1, 6], [7, 2]], "a:long,c:int", throw=True)
             # overwrite single with folder (if applicable)
             b = ArrayDataFrame([[60, 1], [20, 7]], "c:int,a:long")
             fa.save(b, path, format_hint="parquet", mode="overwrite")
             c = fa.load(path, format_hint="parquet", columns=["a", "c"], as_fugue=True)
-            df_eq(c, [[1, 60], [7, 20]], "a:long,c:int", throw=True)
+            self.df_eq(c, [[1, 60], [7, 20]], "a:long,c:int", throw=True)
         def test_save_and_load_parquet(self):
             b = ArrayDataFrame([[6, 1], [2, 7]], "c:int,a:long")
             path = os.path.join(self.tmpdir, "a", "b")
             fa.save(b, path, format_hint="parquet")
             c = fa.load(path, format_hint="parquet", columns=["a", "c"], as_fugue=True)
-            df_eq(c, [[1, 6], [7, 2]], "a:long,c:int", throw=True)
+            self.df_eq(c, [[1, 6], [7, 2]], "a:long,c:int", throw=True)
         def test_load_parquet_folder(self):
             native = NativeExecutionEngine()
@@ -1019,7 +1046,7 @@ class ExecutionEngineTests(object):
             fa.save(b, os.path.join(path, "b.parquet"), engine=native)
             touch(os.path.join(path, "_SUCCESS"))
             c = fa.load(path, format_hint="parquet", columns=["a", "c"], as_fugue=True)
-            df_eq(c, [[1, 6], [7, 2], [8, 4]], "a:long,c:int", throw=True)
+            self.df_eq(c, [[1, 6], [7, 2], [8, 4]], "a:long,c:int", throw=True)
         def test_load_parquet_files(self):
             native = NativeExecutionEngine()
@@ -1033,7 +1060,7 @@ class ExecutionEngineTests(object):
             c = fa.load(
                 [f1, f2], format_hint="parquet", columns=["a", "c"], as_fugue=True
             )
-            df_eq(c, [[1, 6], [7, 2], [8, 4]], "a:long,c:int", throw=True)
+            self.df_eq(c, [[1, 6], [7, 2], [8, 4]], "a:long,c:int", throw=True)
         def test_save_single_and_load_csv(self):
             b = ArrayDataFrame([[6.1, 1.1], [2.1, 7.1]], "c:double,a:double")
@@ -1045,12 +1072,12 @@ class ExecutionEngineTests(object):
             c = fa.load(
                 path, format_hint="csv", header=True, infer_schema=False, as_fugue=True
             )
-            df_eq(c, [["6.1", "1.1"], ["2.1", "7.1"]], "c:str,a:str", throw=True)
+            self.df_eq(c, [["6.1", "1.1"], ["2.1", "7.1"]], "c:str,a:str", throw=True)
             c = fa.load(
                 path, format_hint="csv", header=True, infer_schema=True, as_fugue=True
             )
-            df_eq(c, [[6.1, 1.1], [2.1, 7.1]], "c:double,a:double", throw=True)
+            self.df_eq(c, [[6.1, 1.1], [2.1, 7.1]], "c:double,a:double", throw=True)
             with raises(ValueError):
                 c = fa.load(
@@ -1070,7 +1097,7 @@ class ExecutionEngineTests(object):
                 columns=["a", "c"],
                 as_fugue=True,
             )
-            df_eq(c, [["1.1", "6.1"], ["7.1", "2.1"]], "a:str,c:str", throw=True)
+            self.df_eq(c, [["1.1", "6.1"], ["7.1", "2.1"]], "a:str,c:str", throw=True)
             c = fa.load(
                 path,
@@ -1080,7 +1107,7 @@ class ExecutionEngineTests(object):
                 columns="a:double,c:double",
                 as_fugue=True,
             )
-            df_eq(c, [[1.1, 6.1], [7.1, 2.1]], "a:double,c:double", throw=True)
+            self.df_eq(c, [[1.1, 6.1], [7.1, 2.1]], "a:double,c:double", throw=True)
             # overwrite single with folder (if applicable)
             b = ArrayDataFrame([[60.1, 1.1], [20.1, 7.1]], "c:double,a:double")
@@ -1093,7 +1120,7 @@ class ExecutionEngineTests(object):
                 columns=["a", "c"],
                 as_fugue=True,
             )
-            df_eq(c, [["1.1", "60.1"], ["7.1", "20.1"]], "a:str,c:str", throw=True)
+            self.df_eq(c, [["1.1", "60.1"], ["7.1", "20.1"]], "a:str,c:str", throw=True)
         def test_save_single_and_load_csv_no_header(self):
             b = ArrayDataFrame([[6.1, 1.1], [2.1, 7.1]], "c:double,a:double")
@@ -1109,7 +1136,7 @@ class ExecutionEngineTests(object):
                     format_hint="csv",
                     header=False,
                     infer_schema=False,
-                    as_fugue=True
+                    as_fugue=True,
                     # when header is False, must set columns
                 )
@@ -1121,7 +1148,7 @@ class ExecutionEngineTests(object):
                 columns=["c", "a"],
                 as_fugue=True,
             )
-            df_eq(c, [["6.1", "1.1"], ["2.1", "7.1"]], "c:str,a:str", throw=True)
+            self.df_eq(c, [["6.1", "1.1"], ["2.1", "7.1"]], "c:str,a:str", throw=True)
             c = fa.load(
                 path,
@@ -1131,7 +1158,7 @@ class ExecutionEngineTests(object):
                 columns=["c", "a"],
                 as_fugue=True,
             )
-            df_eq(c, [[6.1, 1.1], [2.1, 7.1]], "c:double,a:double", throw=True)
+            self.df_eq(c, [[6.1, 1.1], [2.1, 7.1]], "c:double,a:double", throw=True)
             with raises(ValueError):
                 c = fa.load(
@@ -1151,7 +1178,7 @@ class ExecutionEngineTests(object):
                 columns="c:double,a:str",
                 as_fugue=True,
             )
-            df_eq(c, [[6.1, "1.1"], [2.1, "7.1"]], "c:double,a:str", throw=True)
+            self.df_eq(c, [[6.1, "1.1"], [2.1, "7.1"]], "c:double,a:str", throw=True)
         def test_save_and_load_csv(self):
             b = ArrayDataFrame([[6.1, 1.1], [2.1, 7.1]], "c:double,a:double")
@@ -1165,7 +1192,7 @@ class ExecutionEngineTests(object):
                 columns=["a", "c"],
                 as_fugue=True,
             )
-            df_eq(c, [[1.1, 6.1], [7.1, 2.1]], "a:double,c:double", throw=True)
+            self.df_eq(c, [[1.1, 6.1], [7.1, 2.1]], "a:double,c:double", throw=True)
         def test_load_csv_folder(self):
             native = NativeExecutionEngine()
@@ -1195,7 +1222,7 @@ class ExecutionEngineTests(object):
                 columns=["a", "c"],
                 as_fugue=True,
             )
-            df_eq(
+            self.df_eq(
                 c, [[1.1, 6.1], [7.1, 2.1], [8.1, 4.1]], "a:double,c:double", throw=True
             )
@@ -1207,13 +1234,13 @@ class ExecutionEngineTests(object):
             fa.save(b, path, format_hint="json", force_single=True)
             assert isfile(path)
             c = fa.load(path, format_hint="json", columns=["a", "c"], as_fugue=True)
-            df_eq(c, [[1, 6], [7, 2]], "a:long,c:long", throw=True)
+            self.df_eq(c, [[1, 6], [7, 2]], "a:long,c:long", throw=True)
             # overwrite single with folder (if applicable)
             b = ArrayDataFrame([[60, 1], [20, 7]], "c:long,a:long")
             fa.save(b, path, format_hint="json", mode="overwrite")
             c = fa.load(path, format_hint="json", columns=["a", "c"], as_fugue=True)
-            df_eq(c, [[1, 60], [7, 20]], "a:long,c:long", throw=True)
+            self.df_eq(c, [[1, 60], [7, 20]], "a:long,c:long", throw=True)
         def test_save_and_load_json(self):
             e = self.engine
@@ -1225,7 +1252,7 @@ class ExecutionEngineTests(object):
                 format_hint="json",
             )
             c = fa.load(path, format_hint="json", columns=["a", "c"], as_fugue=True)
-            df_eq(
+            self.df_eq(
                 c, [[1, 6], [7, 2], [4, 3], [8, 4], [7, 6]], "a:long,c:long", throw=True
             )
@@ -1238,7 +1265,7 @@ class ExecutionEngineTests(object):
             fa.save(b, os.path.join(path, "b.json"), format_hint="json", engine=native)
             touch(os.path.join(path, "_SUCCESS"))
             c = fa.load(path, format_hint="json", columns=["a", "c"], as_fugue=True)
-            df_eq(c, [[1, 6], [7, 2], [8, 4], [4, 3]], "a:long,c:long", throw=True)
+            self.df_eq(c, [[1, 6], [7, 2], [8, 4], [4, 3]], "a:long,c:long", throw=True)
         def test_engine_api(self):
             # complementary tests not covered by the other tests
@@ -1251,7 +1278,7 @@ class ExecutionEngineTests(object):
                 assert fa.is_df(df3) and not isinstance(df3, DataFrame)
                 df4 = fa.union(df1, df2, as_fugue=True)
                 assert isinstance(df4, DataFrame)
-                df_eq(df4, fa.as_pandas(df3), throw=True)
+                self.df_eq(df4, fa.as_pandas(df3), throw=True)
 def select_top(cursor, data):

fugue 0.8.7.dev8__py3-none-any.whl → 0.9.0__py3-none-any.whl

fugue 0.8.7.dev8__py3-none-any.whl → 0.9.0__py3-none-any.whl