sws-spark-dissemination-helper 0.0.95__tar.gz → 0.0.96__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {sws_spark_dissemination_helper-0.0.95 → sws_spark_dissemination_helper-0.0.96}/PKG-INFO +1 -1
- {sws_spark_dissemination_helper-0.0.95 → sws_spark_dissemination_helper-0.0.96}/pyproject.toml +1 -1
- {sws_spark_dissemination_helper-0.0.95 → sws_spark_dissemination_helper-0.0.96}/src/sws_spark_dissemination_helper/SWSBronzeIcebergSparkHelper.py +29 -2
- {sws_spark_dissemination_helper-0.0.95 → sws_spark_dissemination_helper-0.0.96}/.gitignore +0 -0
- {sws_spark_dissemination_helper-0.0.95 → sws_spark_dissemination_helper-0.0.96}/LICENSE +0 -0
- {sws_spark_dissemination_helper-0.0.95 → sws_spark_dissemination_helper-0.0.96}/README.md +0 -0
- {sws_spark_dissemination_helper-0.0.95 → sws_spark_dissemination_helper-0.0.96}/old_requirements.txt +0 -0
- {sws_spark_dissemination_helper-0.0.95 → sws_spark_dissemination_helper-0.0.96}/requirements.txt +0 -0
- {sws_spark_dissemination_helper-0.0.95 → sws_spark_dissemination_helper-0.0.96}/src/sws_spark_dissemination_helper/SWSGoldIcebergSparkHelper.py +0 -0
- {sws_spark_dissemination_helper-0.0.95 → sws_spark_dissemination_helper-0.0.96}/src/sws_spark_dissemination_helper/SWSPostgresSparkReader.py +0 -0
- {sws_spark_dissemination_helper-0.0.95 → sws_spark_dissemination_helper-0.0.96}/src/sws_spark_dissemination_helper/SWSSilverIcebergSparkHelper.py +0 -0
- {sws_spark_dissemination_helper-0.0.95 → sws_spark_dissemination_helper-0.0.96}/src/sws_spark_dissemination_helper/__init__.py +0 -0
- {sws_spark_dissemination_helper-0.0.95 → sws_spark_dissemination_helper-0.0.96}/src/sws_spark_dissemination_helper/constants.py +0 -0
- {sws_spark_dissemination_helper-0.0.95 → sws_spark_dissemination_helper-0.0.96}/src/sws_spark_dissemination_helper/utils.py +0 -0
- {sws_spark_dissemination_helper-0.0.95 → sws_spark_dissemination_helper-0.0.96}/tests/__init__.py +0 -0
- {sws_spark_dissemination_helper-0.0.95 → sws_spark_dissemination_helper-0.0.96}/tests/test.py +0 -0
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: sws-spark-dissemination-helper
|
|
3
|
-
Version: 0.0.95
|
|
3
|
+
Version: 0.0.96
|
|
4
4
|
Summary: A Python helper package providing streamlined Spark functions for efficient data dissemination processes
|
|
5
5
|
Project-URL: Repository, https://bitbucket.org/cioapps/sws-it-python-spark-dissemination-helper
|
|
6
6
|
Author-email: Daniele Mansillo <danielemansillo@gmail.com>
|
|
@@ -1,4 +1,5 @@
|
|
|
1
1
|
import logging
|
|
2
|
+
import time
|
|
2
3
|
from copy import copy
|
|
3
4
|
from typing import Dict, List, Tuple
|
|
4
5
|
|
|
@@ -389,6 +390,15 @@ class SWSBronzeIcebergSparkHelper:
|
|
|
389
390
|
self.spark.sql(
|
|
390
391
|
f"ALTER TABLE {self.iceberg_tables.BRONZE.iceberg_id} CREATE TAG `{self.tag_name}`"
|
|
391
392
|
)
|
|
393
|
+
while (
|
|
394
|
+
self.spark.sql(
|
|
395
|
+
f"SELECT * FROM {self.iceberg_tables.BRONZE.iceberg_id}.refs"
|
|
396
|
+
)
|
|
397
|
+
.filter((col("type") == lit("TAG")) & (col("name") == lit(self.tag_name)))
|
|
398
|
+
.count()
|
|
399
|
+
) == 0:
|
|
400
|
+
logging.info(f"Waiting for the tag {self.tag_name} to be created")
|
|
401
|
+
time.sleep(2)
|
|
392
402
|
|
|
393
403
|
logging.info(f"bronze tag '{self.tag_name}' created")
|
|
394
404
|
|
|
@@ -447,14 +457,31 @@ class SWSBronzeIcebergSparkHelper:
|
|
|
447
457
|
def write_bronze_disseminated_tag_data_to_iceberg_and_csv(
|
|
448
458
|
self, dimensions: Dict[str, List[str]]
|
|
449
459
|
) -> DataFrame:
|
|
450
|
-
|
|
451
|
-
refs = self.spark.sql(
|
|
460
|
+
|
|
461
|
+
refs = self.spark.sql(
|
|
462
|
+
f"SELECT * FROM {self.iceberg_tables.BRONZE.iceberg_id}.refs"
|
|
463
|
+
).collect()
|
|
452
464
|
logging.info(f"bronze refs: {refs}")
|
|
453
465
|
|
|
454
466
|
create_branch_query = f"ALTER TABLE {self.iceberg_tables.BRONZE.iceberg_id}.`tag_{self.tag_name}` CREATE OR REPLACE BRANCH `diss_tag_{self.tag_name}`" # AS OF VERSION `{tag_name}`
|
|
455
467
|
logging.info(f"create_branch_query: {create_branch_query}")
|
|
456
468
|
create_branch_query_result = self.spark.sql(create_branch_query).collect()
|
|
457
469
|
|
|
470
|
+
while (
|
|
471
|
+
self.spark.sql(
|
|
472
|
+
f"SELECT * FROM {self.iceberg_tables.BRONZE.iceberg_id}.refs"
|
|
473
|
+
)
|
|
474
|
+
.filter(
|
|
475
|
+
(col("type") == lit("BRANCH"))
|
|
476
|
+
& (col("name") == lit(f"diss_tag_{self.tag_name}"))
|
|
477
|
+
)
|
|
478
|
+
.count()
|
|
479
|
+
) == 0:
|
|
480
|
+
logging.info(
|
|
481
|
+
f"Waiting for the branch {self.tag_name} diss_tag_{self.tag_name} to be created"
|
|
482
|
+
)
|
|
483
|
+
time.sleep(2)
|
|
484
|
+
|
|
458
485
|
logging.info(f"result of create_branch_query: {create_branch_query_result}")
|
|
459
486
|
|
|
460
487
|
self.disseminated_tag_df = self.spark.read.option(
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{sws_spark_dissemination_helper-0.0.95 → sws_spark_dissemination_helper-0.0.96}/old_requirements.txt
RENAMED
|
File without changes
|
{sws_spark_dissemination_helper-0.0.95 → sws_spark_dissemination_helper-0.0.96}/requirements.txt
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{sws_spark_dissemination_helper-0.0.95 → sws_spark_dissemination_helper-0.0.96}/tests/__init__.py
RENAMED
|
File without changes
|
{sws_spark_dissemination_helper-0.0.95 → sws_spark_dissemination_helper-0.0.96}/tests/test.py
RENAMED
|
File without changes
|