sqlframe 3.13.0__py3-none-any.whl → 3.13.2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
sqlframe/_version.py CHANGED
@@ -12,5 +12,5 @@ __version__: str
12
12
  __version_tuple__: VERSION_TUPLE
13
13
  version_tuple: VERSION_TUPLE
14
14
 
15
- __version__ = version = '3.13.0'
16
- __version_tuple__ = version_tuple = (3, 13, 0)
15
+ __version__ = version = '3.13.2'
16
+ __version_tuple__ = version_tuple = (3, 13, 2)
@@ -202,6 +202,7 @@ class BaseDataFrame(t.Generic[SESSION, WRITER, NA, STAT, GROUP_DATA]):
202
202
  _na: t.Type[NA]
203
203
  _stat: t.Type[STAT]
204
204
  _group_data: t.Type[GROUP_DATA]
205
+ _EXPLAIN_PREFIX = "EXPLAIN"
205
206
 
206
207
  def __init__(
207
208
  self,
@@ -806,6 +807,8 @@ class BaseDataFrame(t.Generic[SESSION, WRITER, NA, STAT, GROUP_DATA]):
806
807
  )
807
808
  else:
808
809
  col = self._ensure_and_normalize_col(column)
810
+ if isinstance(col.expression, exp.Alias):
811
+ col.expression = col.expression.this
809
812
  return self.copy(expression=self.expression.where(col.expression))
810
813
 
811
814
  filter = where
@@ -1018,9 +1021,9 @@ class BaseDataFrame(t.Generic[SESSION, WRITER, NA, STAT, GROUP_DATA]):
1018
1021
  elif not isinstance(ascending, list):
1019
1022
  ascending = [ascending] * len(columns)
1020
1023
  ascending = [bool(x) for i, x in enumerate(ascending)]
1021
- assert len(columns) == len(
1022
- ascending
1023
- ), "The length of items in ascending must equal the number of columns provided"
1024
+ assert len(columns) == len(ascending), (
1025
+ "The length of items in ascending must equal the number of columns provided"
1026
+ )
1024
1027
  col_and_ascending = list(zip(columns, ascending))
1025
1028
  order_by_columns = [
1026
1029
  (
@@ -1142,6 +1145,18 @@ class BaseDataFrame(t.Generic[SESSION, WRITER, NA, STAT, GROUP_DATA]):
1142
1145
  final_df = filtered_df.select(*all_columns)
1143
1146
  return final_df
1144
1147
 
1148
+ def _get_explain_plan_rows(self) -> t.List[Row]:
1149
+ sql_queries = self.sql(
1150
+ pretty=False, optimize=False, as_list=True, dialect=self.session.execution_dialect
1151
+ )
1152
+ if len(sql_queries) > 1:
1153
+ raise ValueError("Cannot explain a DataFrame with multiple queries")
1154
+ sql_query = " ".join([self._EXPLAIN_PREFIX, sql_queries[0]])
1155
+ results = self.session._collect(sql_query)
1156
+ if len(results) != 1:
1157
+ raise ValueError("Got more than one result from explain query")
1158
+ return results
1159
+
1145
1160
  def explain(
1146
1161
  self, extended: t.Optional[t.Union[bool, str]] = None, mode: t.Optional[str] = None
1147
1162
  ) -> None:
@@ -1210,11 +1225,8 @@ class BaseDataFrame(t.Generic[SESSION, WRITER, NA, STAT, GROUP_DATA]):
1210
1225
  ...Statistics...
1211
1226
  ...
1212
1227
  """
1213
- sql_queries = self.sql(pretty=False, optimize=False, as_list=True)
1214
- if len(sql_queries) > 1:
1215
- raise ValueError("Cannot explain a DataFrame with multiple queries")
1216
- sql_query = "EXPLAIN " + sql_queries[0]
1217
- self.session._execute(sql_query)
1228
+ results = self._get_explain_plan_rows()
1229
+ print(results[0][0])
1218
1230
 
1219
1231
  @operation(Operation.FROM)
1220
1232
  def fillna(
@@ -1282,9 +1294,9 @@ class BaseDataFrame(t.Generic[SESSION, WRITER, NA, STAT, GROUP_DATA]):
1282
1294
  new_values = list(to_replace.values())
1283
1295
  elif not old_values and isinstance(to_replace, list):
1284
1296
  assert isinstance(value, list), "value must be a list since the replacements are a list"
1285
- assert len(to_replace) == len(
1286
- value
1287
- ), "the replacements and values must be the same length"
1297
+ assert len(to_replace) == len(value), (
1298
+ "the replacements and values must be the same length"
1299
+ )
1288
1300
  old_values = to_replace
1289
1301
  new_values = value
1290
1302
  else:
@@ -72,3 +72,8 @@ class BigQueryDataFrame(
72
72
  sql = self.session._to_sql(self.expression)
73
73
  query_job = self.session._client.query(sql, job_config=job_config)
74
74
  return [field_to_column(field) for field in query_job.schema]
75
+
76
+ def explain(
77
+ self, extended: t.Optional[t.Union[bool, str]] = None, mode: t.Optional[str] = None
78
+ ) -> None:
79
+ raise NotImplementedError("BigQuery does not support EXPLAIN")
@@ -46,6 +46,12 @@ class DuckDBDataFrame(
46
46
  _stat = DuckDBDataFrameStatFunctions
47
47
  _group_data = DuckDBGroupedData
48
48
 
49
+ def explain(
50
+ self, extended: t.Optional[t.Union[bool, str]] = None, mode: t.Optional[str] = None
51
+ ) -> None:
52
+ results = self._get_explain_plan_rows()
53
+ print(results[0][1])
54
+
49
55
  @t.overload
50
56
  def toArrow(self) -> ArrowTable: ...
51
57
 
@@ -43,6 +43,7 @@ class SnowflakeDataFrame(
43
43
  _na = SnowflakeDataFrameNaFunctions
44
44
  _stat = SnowflakeDataFrameStatFunctions
45
45
  _group_data = SnowflakeGroupedData
46
+ _EXPLAIN_PREFIX = "EXPLAIN USING TEXT"
46
47
 
47
48
  @property
48
49
  def _typed_columns(self) -> t.List[CatalogColumn]:
@@ -1,12 +1,11 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: sqlframe
3
- Version: 3.13.0
3
+ Version: 3.13.2
4
4
  Summary: Turning PySpark Into a Universal DataFrame API
5
5
  Home-page: https://github.com/eakmanrq/sqlframe
6
6
  Author: Ryan Eakman
7
7
  Author-email: eakmanrq@gmail.com
8
8
  License: MIT
9
- Platform: UNKNOWN
10
9
  Classifier: Development Status :: 5 - Production/Stable
11
10
  Classifier: Intended Audience :: Developers
12
11
  Classifier: Intended Audience :: Science/Research
@@ -17,52 +16,52 @@ Classifier: Programming Language :: Python :: 3 :: Only
17
16
  Requires-Python: >=3.9
18
17
  Description-Content-Type: text/markdown
19
18
  License-File: LICENSE
20
- Requires-Dist: prettytable (<4)
21
- Requires-Dist: sqlglot (<26.1,>=24.0.0)
19
+ Requires-Dist: prettytable <4
20
+ Requires-Dist: sqlglot <26.3,>=24.0.0
22
21
  Requires-Dist: typing-extensions
23
22
  Provides-Extra: bigquery
24
- Requires-Dist: google-cloud-bigquery-storage (<3,>=2) ; extra == 'bigquery'
25
- Requires-Dist: google-cloud-bigquery[pandas] (<4,>=3) ; extra == 'bigquery'
23
+ Requires-Dist: google-cloud-bigquery-storage <3,>=2 ; extra == 'bigquery'
24
+ Requires-Dist: google-cloud-bigquery[pandas] <4,>=3 ; extra == 'bigquery'
26
25
  Provides-Extra: databricks
27
- Requires-Dist: databricks-sql-connector (<4,>=3.6) ; extra == 'databricks'
26
+ Requires-Dist: databricks-sql-connector <4,>=3.6 ; extra == 'databricks'
28
27
  Provides-Extra: dev
29
- Requires-Dist: duckdb (<1.2,>=0.9) ; extra == 'dev'
30
- Requires-Dist: findspark (<3,>=2) ; extra == 'dev'
31
- Requires-Dist: mypy (<1.15,>=1.10.0) ; extra == 'dev'
32
- Requires-Dist: openai (<2,>=1.30) ; extra == 'dev'
33
- Requires-Dist: pandas-stubs (<3,>=2) ; extra == 'dev'
34
- Requires-Dist: pandas (<3,>=2) ; extra == 'dev'
35
- Requires-Dist: pre-commit (<5,>=3.7) ; extra == 'dev'
36
- Requires-Dist: psycopg (<4,>=3.1) ; extra == 'dev'
37
- Requires-Dist: pyarrow (<19,>=10) ; extra == 'dev'
38
- Requires-Dist: pyspark (<3.6,>=2) ; extra == 'dev'
28
+ Requires-Dist: duckdb <1.2,>=0.9 ; extra == 'dev'
29
+ Requires-Dist: findspark <3,>=2 ; extra == 'dev'
30
+ Requires-Dist: mypy <1.15,>=1.10.0 ; extra == 'dev'
31
+ Requires-Dist: openai <2,>=1.30 ; extra == 'dev'
32
+ Requires-Dist: pandas-stubs <3,>=2 ; extra == 'dev'
33
+ Requires-Dist: pandas <3,>=2 ; extra == 'dev'
34
+ Requires-Dist: pre-commit <5,>=3.7 ; extra == 'dev'
35
+ Requires-Dist: psycopg <4,>=3.1 ; extra == 'dev'
36
+ Requires-Dist: pyarrow <20,>=10 ; extra == 'dev'
37
+ Requires-Dist: pyspark <3.6,>=2 ; extra == 'dev'
39
38
  Requires-Dist: pytest-forked ; extra == 'dev'
40
- Requires-Dist: pytest-postgresql (<7,>=6) ; extra == 'dev'
41
- Requires-Dist: pytest-xdist (<3.7,>=3.6) ; extra == 'dev'
42
- Requires-Dist: pytest (<8.4,>=8.2.0) ; extra == 'dev'
43
- Requires-Dist: ruff (<0.9,>=0.4.4) ; extra == 'dev'
44
- Requires-Dist: types-psycopg2 (<3,>=2.9) ; extra == 'dev'
39
+ Requires-Dist: pytest-postgresql <7,>=6 ; extra == 'dev'
40
+ Requires-Dist: pytest-xdist <3.7,>=3.6 ; extra == 'dev'
41
+ Requires-Dist: pytest <8.4,>=8.2.0 ; extra == 'dev'
42
+ Requires-Dist: ruff <0.10,>=0.4.4 ; extra == 'dev'
43
+ Requires-Dist: types-psycopg2 <3,>=2.9 ; extra == 'dev'
45
44
  Provides-Extra: docs
46
- Requires-Dist: mkdocs-include-markdown-plugin (==6.0.6) ; extra == 'docs'
47
- Requires-Dist: mkdocs-material-extensions (==1.1.1) ; extra == 'docs'
48
- Requires-Dist: mkdocs-material (==9.0.5) ; extra == 'docs'
49
- Requires-Dist: mkdocs (==1.4.2) ; extra == 'docs'
45
+ Requires-Dist: mkdocs-include-markdown-plugin ==6.0.6 ; extra == 'docs'
46
+ Requires-Dist: mkdocs-material-extensions ==1.1.1 ; extra == 'docs'
47
+ Requires-Dist: mkdocs-material ==9.0.5 ; extra == 'docs'
48
+ Requires-Dist: mkdocs ==1.4.2 ; extra == 'docs'
50
49
  Requires-Dist: pymdown-extensions ; extra == 'docs'
51
50
  Provides-Extra: duckdb
52
- Requires-Dist: duckdb (<1.2,>=0.9) ; extra == 'duckdb'
53
- Requires-Dist: pandas (<3,>=2) ; extra == 'duckdb'
51
+ Requires-Dist: duckdb <1.2,>=0.9 ; extra == 'duckdb'
52
+ Requires-Dist: pandas <3,>=2 ; extra == 'duckdb'
54
53
  Provides-Extra: openai
55
- Requires-Dist: openai (<2,>=1.30) ; extra == 'openai'
54
+ Requires-Dist: openai <2,>=1.30 ; extra == 'openai'
56
55
  Provides-Extra: pandas
57
- Requires-Dist: pandas (<3,>=2) ; extra == 'pandas'
56
+ Requires-Dist: pandas <3,>=2 ; extra == 'pandas'
58
57
  Provides-Extra: postgres
59
- Requires-Dist: psycopg2 (<3,>=2.8) ; extra == 'postgres'
58
+ Requires-Dist: psycopg2 <3,>=2.8 ; extra == 'postgres'
60
59
  Provides-Extra: redshift
61
- Requires-Dist: redshift-connector (<2.2.0,>=2.1.1) ; extra == 'redshift'
60
+ Requires-Dist: redshift-connector <2.2.0,>=2.1.1 ; extra == 'redshift'
62
61
  Provides-Extra: snowflake
63
- Requires-Dist: snowflake-connector-python[secure-local-storage] (<3.13,>=3.10.0) ; extra == 'snowflake'
62
+ Requires-Dist: snowflake-connector-python[secure-local-storage] <3.13,>=3.10.0 ; extra == 'snowflake'
64
63
  Provides-Extra: spark
65
- Requires-Dist: pyspark (<3.6,>=2) ; extra == 'spark'
64
+ Requires-Dist: pyspark <3.6,>=2 ; extra == 'spark'
66
65
 
67
66
  <div align="center">
68
67
  <img src="https://sqlframe.readthedocs.io/en/stable/docs/images/sqlframe_logo.png" alt="SQLFrame Logo" width="400"/>
@@ -227,5 +226,3 @@ LIMIT 5
227
226
  | 1975 | 868,985 | 10.92 |
228
227
  +------+---------------------------+----------------+
229
228
  ```
230
-
231
-
@@ -1,10 +1,10 @@
1
1
  sqlframe/__init__.py,sha256=wfqm98eLoLid9oV_FzzpG5loKC6LxOhj2lXpfN7SARo,3138
2
- sqlframe/_version.py,sha256=3fJaN4m_eO3OOhIj24x2tSFiMOpH1Uw0GgL-P7s9_M0,413
2
+ sqlframe/_version.py,sha256=efGc9qGpdvsN2KEWLmdYgdokJecNkK44Rg-Lf6L0IvM,413
3
3
  sqlframe/base/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
4
4
  sqlframe/base/_typing.py,sha256=b2clI5HI1zEZKB_3Msx3FeAJQyft44ubUifJwQRVXyQ,1298
5
5
  sqlframe/base/catalog.py,sha256=SzFQalTWdhWzxUY-4ut1f9TfOECp_JmJEgNPfrRKCe0,38457
6
6
  sqlframe/base/column.py,sha256=wRghgieYAA51aw4WuFQWOvl0TFOToZbBhBuIamEzxx4,18011
7
- sqlframe/base/dataframe.py,sha256=c27sJq8kb0AHBGwJJyDofayw58sOdJMePktpjqB2gJk,74452
7
+ sqlframe/base/dataframe.py,sha256=bnF8SYIDhSFPYKchGakRG_oWqgZ-66jKZsdcqUSqCDE,74940
8
8
  sqlframe/base/decorators.py,sha256=P56cgs8DANxGRIwVs5uOMnDy-BlXZZYMbf4fdnkpWPI,1889
9
9
  sqlframe/base/exceptions.py,sha256=9Uwvqn2eAkDpqm4BrRgbL61qM-GMCbJEMAW8otxO46s,370
10
10
  sqlframe/base/function_alternatives.py,sha256=8kDCh1cOXtdCcBPYBQ8byXxRAZvphS9N8GDs4txBzGg,52544
@@ -26,7 +26,7 @@ sqlframe/base/mixins/readwriter_mixins.py,sha256=ap8j_g7PoUGHaHKCPMnRPbXofOsUhUz
26
26
  sqlframe/bigquery/__init__.py,sha256=kbaomhYAANPdxeDQhajv8IHfMg_ENKivtYK-rPwaV08,939
27
27
  sqlframe/bigquery/catalog.py,sha256=8d36IzT5GPWd1FdxJ9vEljOdbIDepHnFOBjwP0bX6FE,11625
28
28
  sqlframe/bigquery/column.py,sha256=E1tUa62Y5HajkhgFuebU9zohrGyieudcHzTT8gfalio,40
29
- sqlframe/bigquery/dataframe.py,sha256=O7qkwVRuuyqdesfwjXLBMgScQqUugPIYklboQ2vgRyE,2403
29
+ sqlframe/bigquery/dataframe.py,sha256=2qlnwTOpfpHQxr9MCxeZWxKiQoL6txEgGNE8JQsalUQ,2599
30
30
  sqlframe/bigquery/functions.py,sha256=MYLs6-sXXqe5o6ghJHHtEpFJlYMeyKzx9-rT3wwXlc4,426
31
31
  sqlframe/bigquery/functions.pyi,sha256=KXgV46eZFNIXwXIhPuSJ08BG18iLQzDCQjyI3REBEXg,11925
32
32
  sqlframe/bigquery/group.py,sha256=UVBNBRTo8OqS-_cS5YwvTeJYgYxeG-d6R3kfyHmlFqw,391
@@ -50,7 +50,7 @@ sqlframe/databricks/window.py,sha256=6GKPzuxeSapJakBaKBeT9VpED1ACdjggDv9JRILDyV0
50
50
  sqlframe/duckdb/__init__.py,sha256=KAw_uZEhFMwi3D9Wj6AgHAKqLNk-EAx2uDIYu56oL44,872
51
51
  sqlframe/duckdb/catalog.py,sha256=YYYVmetLUaJOdObKw4AJ7L0P-msshkta4xHlcZQ9zEA,4795
52
52
  sqlframe/duckdb/column.py,sha256=E1tUa62Y5HajkhgFuebU9zohrGyieudcHzTT8gfalio,40
53
- sqlframe/duckdb/dataframe.py,sha256=OgU4zySAKqz7XhwOhNJuUkwkflU67UvyqV3IbvaFVo4,1706
53
+ sqlframe/duckdb/dataframe.py,sha256=Z8_K69UQGZVeBfVGXVwIJP8OMuIvNBB3DPKTP3Lfu4w,1908
54
54
  sqlframe/duckdb/functions.py,sha256=ix2efGGD4HLaY1rtCtEd3IrsicGEVGiBAeKOo5OD8rA,424
55
55
  sqlframe/duckdb/functions.pyi,sha256=P0ky6k-J7LdCDrQ0OjfRC3ARIYNHPmAmmaB_jBEO5L0,12383
56
56
  sqlframe/duckdb/group.py,sha256=IkhbW42Ng1U5YT3FkIdiB4zBqRkW4QyTb-1detY1e_4,383
@@ -85,7 +85,7 @@ sqlframe/redshift/window.py,sha256=6GKPzuxeSapJakBaKBeT9VpED1ACdjggDv9JRILDyV0,3
85
85
  sqlframe/snowflake/__init__.py,sha256=msYAxOnPyjuBSTbpb5s9P5o0pr2N82UUGPxUtv0TNNw,966
86
86
  sqlframe/snowflake/catalog.py,sha256=Tp_B9oMTInnqLTiZNsT0UNc-a-aKXu3zFThlCwLeKCA,6507
87
87
  sqlframe/snowflake/column.py,sha256=E1tUa62Y5HajkhgFuebU9zohrGyieudcHzTT8gfalio,40
88
- sqlframe/snowflake/dataframe.py,sha256=X3FOasXh12OPFGF5-YYy1ThxIEdDwqc1xf3hdmuViN0,2142
88
+ sqlframe/snowflake/dataframe.py,sha256=TosBO9tnnqAQ9Y-abX954vQM8VBLYRmN_P50iusMFgQ,2185
89
89
  sqlframe/snowflake/functions.py,sha256=g3ELesLGvN7tyRyiEAnPneVyL0rQhSSOxYFvBFuOiaM,391
90
90
  sqlframe/snowflake/functions.pyi,sha256=sEqNdyqQBtgqoKtRViUb70QT5yrvpVoP3ZN7VxHNxbw,12612
91
91
  sqlframe/snowflake/group.py,sha256=pPP1l2RRo_LgkXrji8a87n2PKo-63ZRPT-WUtvVcBME,395
@@ -119,8 +119,8 @@ sqlframe/standalone/udf.py,sha256=azmgtUjHNIPs0WMVNId05SHwiYn41MKVBhKXsQJ5dmY,27
119
119
  sqlframe/standalone/window.py,sha256=6GKPzuxeSapJakBaKBeT9VpED1ACdjggDv9JRILDyV0,35
120
120
  sqlframe/testing/__init__.py,sha256=VVCosQhitU74A3NnE52O4mNtGZONapuEXcc20QmSlnQ,132
121
121
  sqlframe/testing/utils.py,sha256=PFsGZpwNUE_4-g_f43_vstTqsK0AQ2lBneb5Eb6NkFo,13008
122
- sqlframe-3.13.0.dist-info/LICENSE,sha256=VZu79YgW780qxaFJMr0t5ZgbOYEh04xWoxaWOaqIGWk,1068
123
- sqlframe-3.13.0.dist-info/METADATA,sha256=ojHxGxwoZc-kduIGwSOuWHIMGtAqea0IKU6LXSNwdkM,9053
124
- sqlframe-3.13.0.dist-info/WHEEL,sha256=G16H4A3IeoQmnOrYV4ueZGKSjhipXx8zc8nu9FGlvMA,92
125
- sqlframe-3.13.0.dist-info/top_level.txt,sha256=T0_RpoygaZSF6heeWwIDQgaP0varUdSK1pzjeJZRjM8,9
126
- sqlframe-3.13.0.dist-info/RECORD,,
122
+ sqlframe-3.13.2.dist-info/LICENSE,sha256=VZu79YgW780qxaFJMr0t5ZgbOYEh04xWoxaWOaqIGWk,1068
123
+ sqlframe-3.13.2.dist-info/METADATA,sha256=QHITWgwWxHNUam2uSDUcpJq6Y9zCJQPxQ-EN7YtvBtg,8970
124
+ sqlframe-3.13.2.dist-info/WHEEL,sha256=oiQVh_5PnQM0E3gPdiz09WCNmwiHDMaGer_elqB3coM,92
125
+ sqlframe-3.13.2.dist-info/top_level.txt,sha256=T0_RpoygaZSF6heeWwIDQgaP0varUdSK1pzjeJZRjM8,9
126
+ sqlframe-3.13.2.dist-info/RECORD,,
@@ -1,5 +1,5 @@
1
1
  Wheel-Version: 1.0
2
- Generator: bdist_wheel (0.37.1)
2
+ Generator: bdist_wheel (0.42.0)
3
3
  Root-Is-Purelib: true
4
4
  Tag: py3-none-any
5
5