dagster-duckdb-pyspark 0.22.6__py3-none-any.whl → 0.28.6__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- dagster_duckdb_pyspark/__init__.py +3 -3
- dagster_duckdb_pyspark/duckdb_pyspark_type_handler.py +9 -12
- dagster_duckdb_pyspark/version.py +1 -1
- {dagster_duckdb_pyspark-0.22.6.dist-info → dagster_duckdb_pyspark-0.28.6.dist-info}/METADATA +16 -9
- dagster_duckdb_pyspark-0.28.6.dist-info/RECORD +9 -0
- {dagster_duckdb_pyspark-0.22.6.dist-info → dagster_duckdb_pyspark-0.28.6.dist-info}/WHEEL +1 -1
- {dagster_duckdb_pyspark-0.22.6.dist-info → dagster_duckdb_pyspark-0.28.6.dist-info/licenses}/LICENSE +1 -1
- dagster_duckdb_pyspark-0.22.6.dist-info/RECORD +0 -9
- {dagster_duckdb_pyspark-0.22.6.dist-info → dagster_duckdb_pyspark-0.28.6.dist-info}/top_level.txt +0 -0
|
@@ -1,10 +1,10 @@
|
|
|
1
|
-
from
|
|
1
|
+
from dagster_shared.libraries import DagsterLibraryRegistry
|
|
2
2
|
|
|
3
|
-
from .duckdb_pyspark_type_handler import (
|
|
3
|
+
from dagster_duckdb_pyspark.duckdb_pyspark_type_handler import (
|
|
4
4
|
DuckDBPySparkIOManager as DuckDBPySparkIOManager,
|
|
5
5
|
DuckDBPySparkTypeHandler as DuckDBPySparkTypeHandler,
|
|
6
6
|
duckdb_pyspark_io_manager as duckdb_pyspark_io_manager,
|
|
7
7
|
)
|
|
8
|
-
from .version import __version__
|
|
8
|
+
from dagster_duckdb_pyspark.version import __version__
|
|
9
9
|
|
|
10
10
|
DagsterLibraryRegistry.register("dagster-duckdb-pyspark", __version__)
|
|
@@ -1,15 +1,12 @@
|
|
|
1
|
-
from
|
|
1
|
+
from collections.abc import Sequence
|
|
2
|
+
from typing import Optional
|
|
2
3
|
|
|
3
4
|
import pyarrow as pa
|
|
4
5
|
import pyspark
|
|
5
6
|
import pyspark.sql
|
|
6
7
|
from dagster import InputContext, MetadataValue, OutputContext, TableColumn, TableSchema
|
|
7
8
|
from dagster._core.storage.db_io_manager import DbTypeHandler, TableSlice
|
|
8
|
-
from dagster_duckdb.io_manager import
|
|
9
|
-
DuckDbClient,
|
|
10
|
-
DuckDBIOManager,
|
|
11
|
-
build_duckdb_io_manager,
|
|
12
|
-
)
|
|
9
|
+
from dagster_duckdb.io_manager import DuckDbClient, DuckDBIOManager, build_duckdb_io_manager
|
|
13
10
|
from pyspark.sql import SparkSession
|
|
14
11
|
from pyspark.sql.types import StructType
|
|
15
12
|
|
|
@@ -43,7 +40,7 @@ class DuckDBPySparkTypeHandler(DbTypeHandler[pyspark.sql.DataFrame]):
|
|
|
43
40
|
def my_table() -> pyspark.sql.DataFrame: # the name of the asset will be the table name
|
|
44
41
|
...
|
|
45
42
|
|
|
46
|
-
|
|
43
|
+
Definitions(
|
|
47
44
|
assets=[my_table],
|
|
48
45
|
resources={"io_manager": MyDuckDBIOManager(database="my_db.duckdb")}
|
|
49
46
|
)
|
|
@@ -120,7 +117,7 @@ Examples:
|
|
|
120
117
|
def my_table() -> pyspark.sql.DataFrame: # the name of the asset will be the table name
|
|
121
118
|
...
|
|
122
119
|
|
|
123
|
-
|
|
120
|
+
Definitions(
|
|
124
121
|
assets=[my_table],
|
|
125
122
|
resources={"io_manager": duckdb_pyspark_io_manager.configured({"database": "my_db.duckdb"})}
|
|
126
123
|
)
|
|
@@ -130,7 +127,7 @@ Examples:
|
|
|
130
127
|
|
|
131
128
|
.. code-block:: python
|
|
132
129
|
|
|
133
|
-
|
|
130
|
+
Definitions(
|
|
134
131
|
assets=[my_table],
|
|
135
132
|
resources={"io_manager": duckdb_pyspark_io_manager.configured({"database": "my_db.duckdb", "schema": "my_schema"})}
|
|
136
133
|
)
|
|
@@ -199,7 +196,7 @@ class DuckDBPySparkIOManager(DuckDBIOManager):
|
|
|
199
196
|
def my_table() -> pyspark.sql.DataFrame: # the name of the asset will be the table name
|
|
200
197
|
...
|
|
201
198
|
|
|
202
|
-
|
|
199
|
+
Definitions(
|
|
203
200
|
assets=[my_table],
|
|
204
201
|
resources={"io_manager": DuckDBPySparkIOManager(database="my_db.duckdb")}
|
|
205
202
|
)
|
|
@@ -209,7 +206,7 @@ class DuckDBPySparkIOManager(DuckDBIOManager):
|
|
|
209
206
|
|
|
210
207
|
.. code-block:: python
|
|
211
208
|
|
|
212
|
-
|
|
209
|
+
Definitions(
|
|
213
210
|
assets=[my_table],
|
|
214
211
|
resources={"io_manager": DuckDBPySparkIOManager(database="my_db.duckdb", schema="my_schema")}
|
|
215
212
|
)
|
|
@@ -267,5 +264,5 @@ class DuckDBPySparkIOManager(DuckDBIOManager):
|
|
|
267
264
|
return [DuckDBPySparkTypeHandler()]
|
|
268
265
|
|
|
269
266
|
@staticmethod
|
|
270
|
-
def default_load_type() -> Optional[Type]:
|
|
267
|
+
def default_load_type() -> Optional[type]:
|
|
271
268
|
return pyspark.sql.DataFrame
|
|
@@ -1 +1 @@
|
|
|
1
|
-
__version__ = "0.22.6"
|
|
1
|
+
__version__ = "0.28.6"
|
{dagster_duckdb_pyspark-0.22.6.dist-info → dagster_duckdb_pyspark-0.28.6.dist-info}/METADATA
RENAMED
|
@@ -1,20 +1,27 @@
|
|
|
1
|
-
Metadata-Version: 2.
|
|
1
|
+
Metadata-Version: 2.4
|
|
2
2
|
Name: dagster-duckdb-pyspark
|
|
3
|
-
Version: 0.22.6
|
|
3
|
+
Version: 0.28.6
|
|
4
4
|
Summary: Package for storing PySpark DataFrames in DuckDB.
|
|
5
5
|
Home-page: https://github.com/dagster-io/dagster/tree/master/python_modules/libraries/dagster-duckb-pyspark
|
|
6
6
|
Author: Dagster Labs
|
|
7
7
|
Author-email: hello@dagsterlabs.com
|
|
8
8
|
License: Apache-2.0
|
|
9
|
-
Classifier: Programming Language :: Python :: 3.8
|
|
10
|
-
Classifier: Programming Language :: Python :: 3.9
|
|
11
9
|
Classifier: Programming Language :: Python :: 3.10
|
|
12
10
|
Classifier: License :: OSI Approved :: Apache Software License
|
|
13
11
|
Classifier: Operating System :: OS Independent
|
|
12
|
+
Requires-Python: >=3.10,<3.14
|
|
14
13
|
License-File: LICENSE
|
|
15
|
-
Requires-Dist: dagster
|
|
16
|
-
Requires-Dist: dagster-duckdb
|
|
17
|
-
Requires-Dist: pyspark
|
|
18
|
-
Requires-Dist: pandas
|
|
14
|
+
Requires-Dist: dagster==1.12.6
|
|
15
|
+
Requires-Dist: dagster-duckdb==0.28.6
|
|
16
|
+
Requires-Dist: pyspark<4,>=3
|
|
17
|
+
Requires-Dist: pandas
|
|
19
18
|
Requires-Dist: pyarrow
|
|
20
|
-
|
|
19
|
+
Dynamic: author
|
|
20
|
+
Dynamic: author-email
|
|
21
|
+
Dynamic: classifier
|
|
22
|
+
Dynamic: home-page
|
|
23
|
+
Dynamic: license
|
|
24
|
+
Dynamic: license-file
|
|
25
|
+
Dynamic: requires-dist
|
|
26
|
+
Dynamic: requires-python
|
|
27
|
+
Dynamic: summary
|
|
@@ -0,0 +1,9 @@
|
|
|
1
|
+
dagster_duckdb_pyspark/__init__.py,sha256=Xq5fF8XBDLE8iB4SptQEOd40CKuKN3EzxGBDR29npIs,427
|
|
2
|
+
dagster_duckdb_pyspark/duckdb_pyspark_type_handler.py,sha256=NHTzVmpC2uMLtvLgwWCyOKdnNmhT3PR3er9b5p556X4,9557
|
|
3
|
+
dagster_duckdb_pyspark/py.typed,sha256=mDShSrm8qg9qjacQc2F-rI8ATllqP6EdgHuEYxuCXZ0,7
|
|
4
|
+
dagster_duckdb_pyspark/version.py,sha256=b5kdBWIZTaI8Q8AFU25gXvG6Pk4-ffI6MZboEwGcgSI,23
|
|
5
|
+
dagster_duckdb_pyspark-0.28.6.dist-info/licenses/LICENSE,sha256=4lsMW-RCvfVD4_F57wrmpe3vX1xwUk_OAKKmV_XT7Z0,11348
|
|
6
|
+
dagster_duckdb_pyspark-0.28.6.dist-info/METADATA,sha256=iUSYWTtigghtx6CCHxnwbq3v3XrWi05YYM_yw0hVnfQ,848
|
|
7
|
+
dagster_duckdb_pyspark-0.28.6.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
|
|
8
|
+
dagster_duckdb_pyspark-0.28.6.dist-info/top_level.txt,sha256=UYh0E2YiAlK01-DAkx0eikRaH-TIk0n9jijQK2joJBs,23
|
|
9
|
+
dagster_duckdb_pyspark-0.28.6.dist-info/RECORD,,
|
{dagster_duckdb_pyspark-0.22.6.dist-info → dagster_duckdb_pyspark-0.28.6.dist-info/licenses}/LICENSE
RENAMED
|
@@ -186,7 +186,7 @@
|
|
|
186
186
|
same "printed page" as the copyright notice for easier
|
|
187
187
|
identification within third-party archives.
|
|
188
188
|
|
|
189
|
-
Copyright
|
|
189
|
+
Copyright 2025 Dagster Labs, Inc.
|
|
190
190
|
|
|
191
191
|
Licensed under the Apache License, Version 2.0 (the "License");
|
|
192
192
|
you may not use this file except in compliance with the License.
|
|
@@ -1,9 +0,0 @@
|
|
|
1
|
-
dagster_duckdb_pyspark/__init__.py,sha256=KjwD42HKQJslK2WPFg2F7mvHe1hPyrp02xSWM0Az39Y,382
|
|
2
|
-
dagster_duckdb_pyspark/duckdb_pyspark_type_handler.py,sha256=Tqo9McLXY_dmzgszA3nK5X7Hbws7jd8WuXMSXWfMDaQ,9588
|
|
3
|
-
dagster_duckdb_pyspark/py.typed,sha256=mDShSrm8qg9qjacQc2F-rI8ATllqP6EdgHuEYxuCXZ0,7
|
|
4
|
-
dagster_duckdb_pyspark/version.py,sha256=mo2N8Hr5LBKhIiNjttqZHNVcCox72DrgMlDVDK6CNjo,23
|
|
5
|
-
dagster_duckdb_pyspark-0.22.6.dist-info/LICENSE,sha256=TMatHW4_G9ldRdodEAp-l2Xa2WvsdeOh60E3v1R2jis,11349
|
|
6
|
-
dagster_duckdb_pyspark-0.22.6.dist-info/METADATA,sha256=6K5JLeLqL6cSgfkwC_ZmWmwkJgBlPwxJ8UmHDmgAUEg,742
|
|
7
|
-
dagster_duckdb_pyspark-0.22.6.dist-info/WHEEL,sha256=yQN5g4mg4AybRjkgi-9yy4iQEFibGQmlz78Pik5Or-A,92
|
|
8
|
-
dagster_duckdb_pyspark-0.22.6.dist-info/top_level.txt,sha256=UYh0E2YiAlK01-DAkx0eikRaH-TIk0n9jijQK2joJBs,23
|
|
9
|
-
dagster_duckdb_pyspark-0.22.6.dist-info/RECORD,,
|
{dagster_duckdb_pyspark-0.22.6.dist-info → dagster_duckdb_pyspark-0.28.6.dist-info}/top_level.txt
RENAMED
|
File without changes
|