sqlframe 3.13.0__py3-none-any.whl → 3.13.2__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- sqlframe/_version.py +2 -2
- sqlframe/base/dataframe.py +23 -11
- sqlframe/bigquery/dataframe.py +5 -0
- sqlframe/duckdb/dataframe.py +6 -0
- sqlframe/snowflake/dataframe.py +1 -0
- {sqlframe-3.13.0.dist-info → sqlframe-3.13.2.dist-info}/METADATA +33 -36
- {sqlframe-3.13.0.dist-info → sqlframe-3.13.2.dist-info}/RECORD +10 -10
- {sqlframe-3.13.0.dist-info → sqlframe-3.13.2.dist-info}/WHEEL +1 -1
- {sqlframe-3.13.0.dist-info → sqlframe-3.13.2.dist-info}/LICENSE +0 -0
- {sqlframe-3.13.0.dist-info → sqlframe-3.13.2.dist-info}/top_level.txt +0 -0
sqlframe/_version.py
CHANGED
sqlframe/base/dataframe.py
CHANGED
|
@@ -202,6 +202,7 @@ class BaseDataFrame(t.Generic[SESSION, WRITER, NA, STAT, GROUP_DATA]):
|
|
|
202
202
|
_na: t.Type[NA]
|
|
203
203
|
_stat: t.Type[STAT]
|
|
204
204
|
_group_data: t.Type[GROUP_DATA]
|
|
205
|
+
_EXPLAIN_PREFIX = "EXPLAIN"
|
|
205
206
|
|
|
206
207
|
def __init__(
|
|
207
208
|
self,
|
|
@@ -806,6 +807,8 @@ class BaseDataFrame(t.Generic[SESSION, WRITER, NA, STAT, GROUP_DATA]):
|
|
|
806
807
|
)
|
|
807
808
|
else:
|
|
808
809
|
col = self._ensure_and_normalize_col(column)
|
|
810
|
+
if isinstance(col.expression, exp.Alias):
|
|
811
|
+
col.expression = col.expression.this
|
|
809
812
|
return self.copy(expression=self.expression.where(col.expression))
|
|
810
813
|
|
|
811
814
|
filter = where
|
|
@@ -1018,9 +1021,9 @@ class BaseDataFrame(t.Generic[SESSION, WRITER, NA, STAT, GROUP_DATA]):
|
|
|
1018
1021
|
elif not isinstance(ascending, list):
|
|
1019
1022
|
ascending = [ascending] * len(columns)
|
|
1020
1023
|
ascending = [bool(x) for i, x in enumerate(ascending)]
|
|
1021
|
-
assert len(columns) == len(
|
|
1022
|
-
ascending
|
|
1023
|
-
)
|
|
1024
|
+
assert len(columns) == len(ascending), (
|
|
1025
|
+
"The length of items in ascending must equal the number of columns provided"
|
|
1026
|
+
)
|
|
1024
1027
|
col_and_ascending = list(zip(columns, ascending))
|
|
1025
1028
|
order_by_columns = [
|
|
1026
1029
|
(
|
|
@@ -1142,6 +1145,18 @@ class BaseDataFrame(t.Generic[SESSION, WRITER, NA, STAT, GROUP_DATA]):
|
|
|
1142
1145
|
final_df = filtered_df.select(*all_columns)
|
|
1143
1146
|
return final_df
|
|
1144
1147
|
|
|
1148
|
+
def _get_explain_plan_rows(self) -> t.List[Row]:
|
|
1149
|
+
sql_queries = self.sql(
|
|
1150
|
+
pretty=False, optimize=False, as_list=True, dialect=self.session.execution_dialect
|
|
1151
|
+
)
|
|
1152
|
+
if len(sql_queries) > 1:
|
|
1153
|
+
raise ValueError("Cannot explain a DataFrame with multiple queries")
|
|
1154
|
+
sql_query = " ".join([self._EXPLAIN_PREFIX, sql_queries[0]])
|
|
1155
|
+
results = self.session._collect(sql_query)
|
|
1156
|
+
if len(results) != 1:
|
|
1157
|
+
raise ValueError("Got more than one result from explain query")
|
|
1158
|
+
return results
|
|
1159
|
+
|
|
1145
1160
|
def explain(
|
|
1146
1161
|
self, extended: t.Optional[t.Union[bool, str]] = None, mode: t.Optional[str] = None
|
|
1147
1162
|
) -> None:
|
|
@@ -1210,11 +1225,8 @@ class BaseDataFrame(t.Generic[SESSION, WRITER, NA, STAT, GROUP_DATA]):
|
|
|
1210
1225
|
...Statistics...
|
|
1211
1226
|
...
|
|
1212
1227
|
"""
|
|
1213
|
-
|
|
1214
|
-
|
|
1215
|
-
raise ValueError("Cannot explain a DataFrame with multiple queries")
|
|
1216
|
-
sql_query = "EXPLAIN " + sql_queries[0]
|
|
1217
|
-
self.session._execute(sql_query)
|
|
1228
|
+
results = self._get_explain_plan_rows()
|
|
1229
|
+
print(results[0][0])
|
|
1218
1230
|
|
|
1219
1231
|
@operation(Operation.FROM)
|
|
1220
1232
|
def fillna(
|
|
@@ -1282,9 +1294,9 @@ class BaseDataFrame(t.Generic[SESSION, WRITER, NA, STAT, GROUP_DATA]):
|
|
|
1282
1294
|
new_values = list(to_replace.values())
|
|
1283
1295
|
elif not old_values and isinstance(to_replace, list):
|
|
1284
1296
|
assert isinstance(value, list), "value must be a list since the replacements are a list"
|
|
1285
|
-
assert len(to_replace) == len(
|
|
1286
|
-
|
|
1287
|
-
)
|
|
1297
|
+
assert len(to_replace) == len(value), (
|
|
1298
|
+
"the replacements and values must be the same length"
|
|
1299
|
+
)
|
|
1288
1300
|
old_values = to_replace
|
|
1289
1301
|
new_values = value
|
|
1290
1302
|
else:
|
sqlframe/bigquery/dataframe.py
CHANGED
|
@@ -72,3 +72,8 @@ class BigQueryDataFrame(
|
|
|
72
72
|
sql = self.session._to_sql(self.expression)
|
|
73
73
|
query_job = self.session._client.query(sql, job_config=job_config)
|
|
74
74
|
return [field_to_column(field) for field in query_job.schema]
|
|
75
|
+
|
|
76
|
+
def explain(
|
|
77
|
+
self, extended: t.Optional[t.Union[bool, str]] = None, mode: t.Optional[str] = None
|
|
78
|
+
) -> None:
|
|
79
|
+
raise NotImplementedError("BigQuery does not support EXPLAIN")
|
sqlframe/duckdb/dataframe.py
CHANGED
|
@@ -46,6 +46,12 @@ class DuckDBDataFrame(
|
|
|
46
46
|
_stat = DuckDBDataFrameStatFunctions
|
|
47
47
|
_group_data = DuckDBGroupedData
|
|
48
48
|
|
|
49
|
+
def explain(
|
|
50
|
+
self, extended: t.Optional[t.Union[bool, str]] = None, mode: t.Optional[str] = None
|
|
51
|
+
) -> None:
|
|
52
|
+
results = self._get_explain_plan_rows()
|
|
53
|
+
print(results[0][1])
|
|
54
|
+
|
|
49
55
|
@t.overload
|
|
50
56
|
def toArrow(self) -> ArrowTable: ...
|
|
51
57
|
|
sqlframe/snowflake/dataframe.py
CHANGED
|
@@ -1,12 +1,11 @@
|
|
|
1
1
|
Metadata-Version: 2.1
|
|
2
2
|
Name: sqlframe
|
|
3
|
-
Version: 3.13.0
|
|
3
|
+
Version: 3.13.2
|
|
4
4
|
Summary: Turning PySpark Into a Universal DataFrame API
|
|
5
5
|
Home-page: https://github.com/eakmanrq/sqlframe
|
|
6
6
|
Author: Ryan Eakman
|
|
7
7
|
Author-email: eakmanrq@gmail.com
|
|
8
8
|
License: MIT
|
|
9
|
-
Platform: UNKNOWN
|
|
10
9
|
Classifier: Development Status :: 5 - Production/Stable
|
|
11
10
|
Classifier: Intended Audience :: Developers
|
|
12
11
|
Classifier: Intended Audience :: Science/Research
|
|
@@ -17,52 +16,52 @@ Classifier: Programming Language :: Python :: 3 :: Only
|
|
|
17
16
|
Requires-Python: >=3.9
|
|
18
17
|
Description-Content-Type: text/markdown
|
|
19
18
|
License-File: LICENSE
|
|
20
|
-
Requires-Dist: prettytable
|
|
21
|
-
Requires-Dist: sqlglot
|
|
19
|
+
Requires-Dist: prettytable <4
|
|
20
|
+
Requires-Dist: sqlglot <26.3,>=24.0.0
|
|
22
21
|
Requires-Dist: typing-extensions
|
|
23
22
|
Provides-Extra: bigquery
|
|
24
|
-
Requires-Dist: google-cloud-bigquery-storage
|
|
25
|
-
Requires-Dist: google-cloud-bigquery[pandas]
|
|
23
|
+
Requires-Dist: google-cloud-bigquery-storage <3,>=2 ; extra == 'bigquery'
|
|
24
|
+
Requires-Dist: google-cloud-bigquery[pandas] <4,>=3 ; extra == 'bigquery'
|
|
26
25
|
Provides-Extra: databricks
|
|
27
|
-
Requires-Dist: databricks-sql-connector
|
|
26
|
+
Requires-Dist: databricks-sql-connector <4,>=3.6 ; extra == 'databricks'
|
|
28
27
|
Provides-Extra: dev
|
|
29
|
-
Requires-Dist: duckdb
|
|
30
|
-
Requires-Dist: findspark
|
|
31
|
-
Requires-Dist: mypy
|
|
32
|
-
Requires-Dist: openai
|
|
33
|
-
Requires-Dist: pandas-stubs
|
|
34
|
-
Requires-Dist: pandas
|
|
35
|
-
Requires-Dist: pre-commit
|
|
36
|
-
Requires-Dist: psycopg
|
|
37
|
-
Requires-Dist: pyarrow
|
|
38
|
-
Requires-Dist: pyspark
|
|
28
|
+
Requires-Dist: duckdb <1.2,>=0.9 ; extra == 'dev'
|
|
29
|
+
Requires-Dist: findspark <3,>=2 ; extra == 'dev'
|
|
30
|
+
Requires-Dist: mypy <1.15,>=1.10.0 ; extra == 'dev'
|
|
31
|
+
Requires-Dist: openai <2,>=1.30 ; extra == 'dev'
|
|
32
|
+
Requires-Dist: pandas-stubs <3,>=2 ; extra == 'dev'
|
|
33
|
+
Requires-Dist: pandas <3,>=2 ; extra == 'dev'
|
|
34
|
+
Requires-Dist: pre-commit <5,>=3.7 ; extra == 'dev'
|
|
35
|
+
Requires-Dist: psycopg <4,>=3.1 ; extra == 'dev'
|
|
36
|
+
Requires-Dist: pyarrow <20,>=10 ; extra == 'dev'
|
|
37
|
+
Requires-Dist: pyspark <3.6,>=2 ; extra == 'dev'
|
|
39
38
|
Requires-Dist: pytest-forked ; extra == 'dev'
|
|
40
|
-
Requires-Dist: pytest-postgresql
|
|
41
|
-
Requires-Dist: pytest-xdist
|
|
42
|
-
Requires-Dist: pytest
|
|
43
|
-
Requires-Dist: ruff
|
|
44
|
-
Requires-Dist: types-psycopg2
|
|
39
|
+
Requires-Dist: pytest-postgresql <7,>=6 ; extra == 'dev'
|
|
40
|
+
Requires-Dist: pytest-xdist <3.7,>=3.6 ; extra == 'dev'
|
|
41
|
+
Requires-Dist: pytest <8.4,>=8.2.0 ; extra == 'dev'
|
|
42
|
+
Requires-Dist: ruff <0.10,>=0.4.4 ; extra == 'dev'
|
|
43
|
+
Requires-Dist: types-psycopg2 <3,>=2.9 ; extra == 'dev'
|
|
45
44
|
Provides-Extra: docs
|
|
46
|
-
Requires-Dist: mkdocs-include-markdown-plugin
|
|
47
|
-
Requires-Dist: mkdocs-material-extensions
|
|
48
|
-
Requires-Dist: mkdocs-material
|
|
49
|
-
Requires-Dist: mkdocs
|
|
45
|
+
Requires-Dist: mkdocs-include-markdown-plugin ==6.0.6 ; extra == 'docs'
|
|
46
|
+
Requires-Dist: mkdocs-material-extensions ==1.1.1 ; extra == 'docs'
|
|
47
|
+
Requires-Dist: mkdocs-material ==9.0.5 ; extra == 'docs'
|
|
48
|
+
Requires-Dist: mkdocs ==1.4.2 ; extra == 'docs'
|
|
50
49
|
Requires-Dist: pymdown-extensions ; extra == 'docs'
|
|
51
50
|
Provides-Extra: duckdb
|
|
52
|
-
Requires-Dist: duckdb
|
|
53
|
-
Requires-Dist: pandas
|
|
51
|
+
Requires-Dist: duckdb <1.2,>=0.9 ; extra == 'duckdb'
|
|
52
|
+
Requires-Dist: pandas <3,>=2 ; extra == 'duckdb'
|
|
54
53
|
Provides-Extra: openai
|
|
55
|
-
Requires-Dist: openai
|
|
54
|
+
Requires-Dist: openai <2,>=1.30 ; extra == 'openai'
|
|
56
55
|
Provides-Extra: pandas
|
|
57
|
-
Requires-Dist: pandas
|
|
56
|
+
Requires-Dist: pandas <3,>=2 ; extra == 'pandas'
|
|
58
57
|
Provides-Extra: postgres
|
|
59
|
-
Requires-Dist: psycopg2
|
|
58
|
+
Requires-Dist: psycopg2 <3,>=2.8 ; extra == 'postgres'
|
|
60
59
|
Provides-Extra: redshift
|
|
61
|
-
Requires-Dist: redshift-connector
|
|
60
|
+
Requires-Dist: redshift-connector <2.2.0,>=2.1.1 ; extra == 'redshift'
|
|
62
61
|
Provides-Extra: snowflake
|
|
63
|
-
Requires-Dist: snowflake-connector-python[secure-local-storage]
|
|
62
|
+
Requires-Dist: snowflake-connector-python[secure-local-storage] <3.13,>=3.10.0 ; extra == 'snowflake'
|
|
64
63
|
Provides-Extra: spark
|
|
65
|
-
Requires-Dist: pyspark
|
|
64
|
+
Requires-Dist: pyspark <3.6,>=2 ; extra == 'spark'
|
|
66
65
|
|
|
67
66
|
<div align="center">
|
|
68
67
|
<img src="https://sqlframe.readthedocs.io/en/stable/docs/images/sqlframe_logo.png" alt="SQLFrame Logo" width="400"/>
|
|
@@ -227,5 +226,3 @@ LIMIT 5
|
|
|
227
226
|
| 1975 | 868,985 | 10.92 |
|
|
228
227
|
+------+---------------------------+----------------+
|
|
229
228
|
```
|
|
230
|
-
|
|
231
|
-
|
|
@@ -1,10 +1,10 @@
|
|
|
1
1
|
sqlframe/__init__.py,sha256=wfqm98eLoLid9oV_FzzpG5loKC6LxOhj2lXpfN7SARo,3138
|
|
2
|
-
sqlframe/_version.py,sha256=
|
|
2
|
+
sqlframe/_version.py,sha256=efGc9qGpdvsN2KEWLmdYgdokJecNkK44Rg-Lf6L0IvM,413
|
|
3
3
|
sqlframe/base/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
4
4
|
sqlframe/base/_typing.py,sha256=b2clI5HI1zEZKB_3Msx3FeAJQyft44ubUifJwQRVXyQ,1298
|
|
5
5
|
sqlframe/base/catalog.py,sha256=SzFQalTWdhWzxUY-4ut1f9TfOECp_JmJEgNPfrRKCe0,38457
|
|
6
6
|
sqlframe/base/column.py,sha256=wRghgieYAA51aw4WuFQWOvl0TFOToZbBhBuIamEzxx4,18011
|
|
7
|
-
sqlframe/base/dataframe.py,sha256=
|
|
7
|
+
sqlframe/base/dataframe.py,sha256=bnF8SYIDhSFPYKchGakRG_oWqgZ-66jKZsdcqUSqCDE,74940
|
|
8
8
|
sqlframe/base/decorators.py,sha256=P56cgs8DANxGRIwVs5uOMnDy-BlXZZYMbf4fdnkpWPI,1889
|
|
9
9
|
sqlframe/base/exceptions.py,sha256=9Uwvqn2eAkDpqm4BrRgbL61qM-GMCbJEMAW8otxO46s,370
|
|
10
10
|
sqlframe/base/function_alternatives.py,sha256=8kDCh1cOXtdCcBPYBQ8byXxRAZvphS9N8GDs4txBzGg,52544
|
|
@@ -26,7 +26,7 @@ sqlframe/base/mixins/readwriter_mixins.py,sha256=ap8j_g7PoUGHaHKCPMnRPbXofOsUhUz
|
|
|
26
26
|
sqlframe/bigquery/__init__.py,sha256=kbaomhYAANPdxeDQhajv8IHfMg_ENKivtYK-rPwaV08,939
|
|
27
27
|
sqlframe/bigquery/catalog.py,sha256=8d36IzT5GPWd1FdxJ9vEljOdbIDepHnFOBjwP0bX6FE,11625
|
|
28
28
|
sqlframe/bigquery/column.py,sha256=E1tUa62Y5HajkhgFuebU9zohrGyieudcHzTT8gfalio,40
|
|
29
|
-
sqlframe/bigquery/dataframe.py,sha256=
|
|
29
|
+
sqlframe/bigquery/dataframe.py,sha256=2qlnwTOpfpHQxr9MCxeZWxKiQoL6txEgGNE8JQsalUQ,2599
|
|
30
30
|
sqlframe/bigquery/functions.py,sha256=MYLs6-sXXqe5o6ghJHHtEpFJlYMeyKzx9-rT3wwXlc4,426
|
|
31
31
|
sqlframe/bigquery/functions.pyi,sha256=KXgV46eZFNIXwXIhPuSJ08BG18iLQzDCQjyI3REBEXg,11925
|
|
32
32
|
sqlframe/bigquery/group.py,sha256=UVBNBRTo8OqS-_cS5YwvTeJYgYxeG-d6R3kfyHmlFqw,391
|
|
@@ -50,7 +50,7 @@ sqlframe/databricks/window.py,sha256=6GKPzuxeSapJakBaKBeT9VpED1ACdjggDv9JRILDyV0
|
|
|
50
50
|
sqlframe/duckdb/__init__.py,sha256=KAw_uZEhFMwi3D9Wj6AgHAKqLNk-EAx2uDIYu56oL44,872
|
|
51
51
|
sqlframe/duckdb/catalog.py,sha256=YYYVmetLUaJOdObKw4AJ7L0P-msshkta4xHlcZQ9zEA,4795
|
|
52
52
|
sqlframe/duckdb/column.py,sha256=E1tUa62Y5HajkhgFuebU9zohrGyieudcHzTT8gfalio,40
|
|
53
|
-
sqlframe/duckdb/dataframe.py,sha256=
|
|
53
|
+
sqlframe/duckdb/dataframe.py,sha256=Z8_K69UQGZVeBfVGXVwIJP8OMuIvNBB3DPKTP3Lfu4w,1908
|
|
54
54
|
sqlframe/duckdb/functions.py,sha256=ix2efGGD4HLaY1rtCtEd3IrsicGEVGiBAeKOo5OD8rA,424
|
|
55
55
|
sqlframe/duckdb/functions.pyi,sha256=P0ky6k-J7LdCDrQ0OjfRC3ARIYNHPmAmmaB_jBEO5L0,12383
|
|
56
56
|
sqlframe/duckdb/group.py,sha256=IkhbW42Ng1U5YT3FkIdiB4zBqRkW4QyTb-1detY1e_4,383
|
|
@@ -85,7 +85,7 @@ sqlframe/redshift/window.py,sha256=6GKPzuxeSapJakBaKBeT9VpED1ACdjggDv9JRILDyV0,3
|
|
|
85
85
|
sqlframe/snowflake/__init__.py,sha256=msYAxOnPyjuBSTbpb5s9P5o0pr2N82UUGPxUtv0TNNw,966
|
|
86
86
|
sqlframe/snowflake/catalog.py,sha256=Tp_B9oMTInnqLTiZNsT0UNc-a-aKXu3zFThlCwLeKCA,6507
|
|
87
87
|
sqlframe/snowflake/column.py,sha256=E1tUa62Y5HajkhgFuebU9zohrGyieudcHzTT8gfalio,40
|
|
88
|
-
sqlframe/snowflake/dataframe.py,sha256=
|
|
88
|
+
sqlframe/snowflake/dataframe.py,sha256=TosBO9tnnqAQ9Y-abX954vQM8VBLYRmN_P50iusMFgQ,2185
|
|
89
89
|
sqlframe/snowflake/functions.py,sha256=g3ELesLGvN7tyRyiEAnPneVyL0rQhSSOxYFvBFuOiaM,391
|
|
90
90
|
sqlframe/snowflake/functions.pyi,sha256=sEqNdyqQBtgqoKtRViUb70QT5yrvpVoP3ZN7VxHNxbw,12612
|
|
91
91
|
sqlframe/snowflake/group.py,sha256=pPP1l2RRo_LgkXrji8a87n2PKo-63ZRPT-WUtvVcBME,395
|
|
@@ -119,8 +119,8 @@ sqlframe/standalone/udf.py,sha256=azmgtUjHNIPs0WMVNId05SHwiYn41MKVBhKXsQJ5dmY,27
|
|
|
119
119
|
sqlframe/standalone/window.py,sha256=6GKPzuxeSapJakBaKBeT9VpED1ACdjggDv9JRILDyV0,35
|
|
120
120
|
sqlframe/testing/__init__.py,sha256=VVCosQhitU74A3NnE52O4mNtGZONapuEXcc20QmSlnQ,132
|
|
121
121
|
sqlframe/testing/utils.py,sha256=PFsGZpwNUE_4-g_f43_vstTqsK0AQ2lBneb5Eb6NkFo,13008
|
|
122
|
-
sqlframe-3.13.
|
|
123
|
-
sqlframe-3.13.
|
|
124
|
-
sqlframe-3.13.
|
|
125
|
-
sqlframe-3.13.
|
|
126
|
-
sqlframe-3.13.
|
|
122
|
+
sqlframe-3.13.2.dist-info/LICENSE,sha256=VZu79YgW780qxaFJMr0t5ZgbOYEh04xWoxaWOaqIGWk,1068
|
|
123
|
+
sqlframe-3.13.2.dist-info/METADATA,sha256=QHITWgwWxHNUam2uSDUcpJq6Y9zCJQPxQ-EN7YtvBtg,8970
|
|
124
|
+
sqlframe-3.13.2.dist-info/WHEEL,sha256=oiQVh_5PnQM0E3gPdiz09WCNmwiHDMaGer_elqB3coM,92
|
|
125
|
+
sqlframe-3.13.2.dist-info/top_level.txt,sha256=T0_RpoygaZSF6heeWwIDQgaP0varUdSK1pzjeJZRjM8,9
|
|
126
|
+
sqlframe-3.13.2.dist-info/RECORD,,
|
|
File without changes
|
|
File without changes
|